// Copyright 2018 Mozilla // // Licensed under the Apache License, Version 2.0 (the "License"); you may not use // this file except in compliance with the License. You may obtain a copy of the // License at http://www.apache.org/licenses/LICENSE-2.0 // Unless required by applicable law or agreed to in writing, software distributed // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR // CONDITIONS OF ANY KIND, either express or implied. See the License for the // specific language governing permissions and limitations under the License. use core_traits::{ValueType, ValueTypeSet}; use edn::query::{Aggregate, QueryFunction, Variable}; use mentat_query_algebrizer::{ColumnName, ConjoiningClauses, VariableColumn}; use mentat_query_sql::{ColumnOrExpression, Expression, Name, ProjectedColumn}; use errors::{ProjectorErrorKind, Result}; #[derive(Clone, Copy, Debug, Eq, PartialEq)] pub enum SimpleAggregationOp { Avg, Count, Max, Min, Sum, } impl SimpleAggregationOp { pub fn to_sql(&self) -> &'static str { use self::SimpleAggregationOp::*; match self { &Avg => "avg", &Count => "count", &Max => "max", &Min => "min", &Sum => "sum", } } fn for_function(function: &QueryFunction) -> Option { match function.0.name() { "avg" => Some(SimpleAggregationOp::Avg), "count" => Some(SimpleAggregationOp::Count), "max" => Some(SimpleAggregationOp::Max), "min" => Some(SimpleAggregationOp::Min), "sum" => Some(SimpleAggregationOp::Sum), _ => None, } } /// With knowledge of the types to which a variable might be bound, /// return a `Result` to determine whether this aggregation is suitable. /// For example, it's valid to take the `Avg` of `{Double, Long}`, invalid /// to take `Sum` of `{Instant}`, valid to take (lexicographic) `Max` of `{String}`, /// but invalid to take `Max` of `{Uuid, String}`. /// /// The returned type is the type of the result of the aggregation. pub fn is_applicable_to_types(&self, possibilities: ValueTypeSet) -> Result { use self::SimpleAggregationOp::*; if possibilities.is_empty() { bail!(ProjectorErrorKind::CannotProjectImpossibleBinding(*self)) } match self { // One can always count results. &Count => Ok(ValueType::Long), // Only numeric types can be averaged or summed. &Avg => { if possibilities.is_only_numeric() { // The mean of a set of numeric values will always, for our purposes, be a double. Ok(ValueType::Double) } else { bail!(ProjectorErrorKind::CannotApplyAggregateOperationToTypes( *self, possibilities )) } } &Sum => { if possibilities.is_only_numeric() { if possibilities.contains(ValueType::Double) { Ok(ValueType::Double) } else { // TODO: BigInt. Ok(ValueType::Long) } } else { bail!(ProjectorErrorKind::CannotApplyAggregateOperationToTypes( *self, possibilities )) } } &Max | &Min => { if possibilities.is_unit() { use self::ValueType::*; let the_type = possibilities.exemplar().expect("a type"); match the_type { // These types are numerically ordered. Double | Long | Instant => Ok(the_type), // Boolean: false < true. Boolean => Ok(the_type), // String: lexicographic order. String => Ok(the_type), // These types are unordered. Keyword | Ref | Uuid => { bail!(ProjectorErrorKind::CannotApplyAggregateOperationToTypes( *self, possibilities )) } } } else { // It cannot be empty -- we checked. // The only types that are valid to compare cross-type are numbers. if possibilities.is_only_numeric() { // Note that if the max/min is a Long, it will be returned as a Double! if possibilities.contains(ValueType::Double) { Ok(ValueType::Double) } else { // TODO: BigInt. Ok(ValueType::Long) } } else { bail!(ProjectorErrorKind::CannotApplyAggregateOperationToTypes( *self, possibilities )) } } } } } } pub struct SimpleAggregate { pub op: SimpleAggregationOp, pub var: Variable, } impl SimpleAggregate { pub fn column_name(&self) -> Name { format!("({} {})", self.op.to_sql(), self.var.name()) } pub fn use_static_value(&self) -> bool { use self::SimpleAggregationOp::*; match self.op { Avg | Max | Min => true, Count | Sum => false, } } /// Return `true` if this aggregate can be `NULL` over 0 rows. pub fn is_nullable(&self) -> bool { use self::SimpleAggregationOp::*; match self.op { Avg | Max | Min => true, Count | Sum => false, } } } pub trait SimpleAggregation { fn to_simple(&self) -> Option; } impl SimpleAggregation for Aggregate { fn to_simple(&self) -> Option { if self.args.len() != 1 { return None; } self.args[0].as_variable().and_then(|v| { SimpleAggregationOp::for_function(&self.func) .map(|op| SimpleAggregate { op, var: v.clone() }) }) } } /// Returns two values: /// - The `ColumnOrExpression` to use in the query. This will always refer to other /// variables by name; never to a datoms column. /// - The known type of that value. pub fn projected_column_for_simple_aggregate( simple: &SimpleAggregate, cc: &ConjoiningClauses, ) -> Result<(ProjectedColumn, ValueType)> { let known_types = cc.known_type_set(&simple.var); let return_type = simple.op.is_applicable_to_types(known_types)?; let projected_column_or_expression = if let Some(value) = cc.bound_value(&simple.var) { // Oh, we already know the value! if simple.use_static_value() { // We can statically compute the aggregate result for some operators -- not count or // sum, but avg/max/min are OK. ColumnOrExpression::Value(value) } else { let expression = Expression::Unary { sql_op: simple.op.to_sql(), arg: ColumnOrExpression::Value(value), }; if simple.is_nullable() { ColumnOrExpression::NullableAggregate(Box::new(expression), return_type) } else { ColumnOrExpression::Expression(Box::new(expression), return_type) } } } else { // The common case: the values are bound during execution. let name = VariableColumn::Variable(simple.var.clone()).column_name(); let expression = Expression::Unary { sql_op: simple.op.to_sql(), arg: ColumnOrExpression::ExistingColumn(name), }; if simple.is_nullable() { ColumnOrExpression::NullableAggregate(Box::new(expression), return_type) } else { ColumnOrExpression::Expression(Box::new(expression), return_type) } }; Ok(( ProjectedColumn(projected_column_or_expression, simple.column_name()), return_type, )) }