// Copyright 2016 Mozilla // // Licensed under the Apache License, Version 2.0 (the "License"); you may not use // this file except in compliance with the License. You may obtain a copy of the // License at http://www.apache.org/licenses/LICENSE-2.0 // Unless required by applicable law or agreed to in writing, software distributed // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR // CONDITIONS OF ANY KIND, either express or implied. See the License for the // specific language governing permissions and limitations under the License. #[macro_use] extern crate error_chain; #[cfg(test)] #[macro_use] extern crate maplit; extern crate mentat_core; extern crate mentat_query; use std::collections::BTreeSet; use std::ops::Sub; use std::rc::Rc; mod errors; mod types; mod validate; mod clauses; use mentat_core::{ Schema, TypedValue, ValueType, }; use mentat_core::counter::RcCounter; use mentat_query::{ FindQuery, FindSpec, Limit, Order, SrcVar, Variable, }; pub use errors::{ BindingError, Error, ErrorKind, Result, }; pub use clauses::{ QueryInputs, }; pub use types::{ EmptyBecause, }; #[derive(Debug)] pub struct AlgebraicQuery { default_source: SrcVar, pub find_spec: Rc, has_aggregates: bool, pub with: BTreeSet, pub order: Option>, pub limit: Limit, pub cc: clauses::ConjoiningClauses, } impl AlgebraicQuery { #[inline] pub fn is_known_empty(&self) -> bool { self.cc.is_known_empty() } /// Return a set of the input variables mentioned in the `:in` clause that have not yet been /// bound. We do this by looking at the CC. pub fn unbound_variables(&self) -> BTreeSet { self.cc.input_variables.sub(&self.cc.value_bound_variable_set()) } } pub fn algebrize_with_counter(schema: &Schema, parsed: FindQuery, counter: usize) -> Result { algebrize_with_inputs(schema, parsed, counter, QueryInputs::default()) } pub fn algebrize(schema: &Schema, parsed: FindQuery) -> Result { algebrize_with_inputs(schema, parsed, 0, QueryInputs::default()) } /// Take an ordering list. Any variables that aren't fixed by the query are used to produce /// a vector of `OrderBy` instances, including type comparisons if necessary. This function also /// returns a set of variables that should be added to the `with` clause to make the ordering /// clauses possible. fn validate_and_simplify_order(cc: &ConjoiningClauses, order: Option>) -> Result<(Option>, BTreeSet)> { match order { None => Ok((None, BTreeSet::default())), Some(order) => { let mut order_bys: Vec = Vec::with_capacity(order.len() * 2); // Space for tags. let mut vars: BTreeSet = BTreeSet::default(); for Order(direction, var) in order.into_iter() { // Eliminate any ordering clauses that are bound to fixed values. if cc.bound_value(&var).is_some() { continue; } // Fail if the var isn't bound by the query. if !cc.column_bindings.contains_key(&var) { bail!(ErrorKind::UnboundVariable(var.name())); } // Otherwise, determine if we also need to order by type… if cc.known_type(&var).is_none() { order_bys.push(OrderBy(direction.clone(), VariableColumn::VariableTypeTag(var.clone()))); } order_bys.push(OrderBy(direction, VariableColumn::Variable(var.clone()))); vars.insert(var.clone()); } Ok((if order_bys.is_empty() { None } else { Some(order_bys) }, vars)) } } } fn simplify_limit(mut query: AlgebraicQuery) -> Result { // Unpack any limit variables in place. let refined_limit = match query.limit { Limit::Variable(ref v) => { match query.cc.bound_value(v) { Some(TypedValue::Long(n)) => { if n <= 0 { // User-specified limits should always be natural numbers (> 0). bail!(ErrorKind::InvalidLimit(n.to_string(), ValueType::Long)); } else { Some(Limit::Fixed(n as u64)) } }, Some(val) => { // Same. bail!(ErrorKind::InvalidLimit(format!("{:?}", val), val.value_type())); }, None => { // We know that the limit variable is mentioned in `:in`. // That it's not bound here implies that we haven't got all the variables // we'll need to run the query yet. // (We should never hit this in `q_once`.) // Simply pass the `Limit` through to `SelectQuery` untouched. None }, } }, Limit::None => None, Limit::Fixed(_) => None, }; if let Some(lim) = refined_limit { query.limit = lim; } Ok(query) } pub fn algebrize_with_inputs(schema: &Schema, parsed: FindQuery, counter: usize, inputs: QueryInputs) -> Result { let alias_counter = RcCounter::with_initial(counter); let mut cc = ConjoiningClauses::with_inputs_and_alias_counter(parsed.in_vars, inputs, alias_counter); // Do we have a variable limit? If so, tell the CC that the var must be numeric. if let &Limit::Variable(ref var) = &parsed.limit { cc.constrain_var_to_long(var.clone()); } // TODO: integrate default source into pattern processing. // TODO: flesh out the rest of find-into-context. cc.apply_clauses(schema, parsed.where_clauses)?; cc.expand_column_bindings(); cc.prune_extracted_types(); cc.process_required_types()?; let (order, extra_vars) = validate_and_simplify_order(&cc, parsed.order)?; let with: BTreeSet = parsed.with.into_iter().chain(extra_vars.into_iter()).collect(); // This might leave us with an unused `:in` variable. let limit = if parsed.find_spec.is_unit_limited() { Limit::Fixed(1) } else { parsed.limit }; let q = AlgebraicQuery { default_source: parsed.default_source, find_spec: Rc::new(parsed.find_spec), has_aggregates: false, // TODO: we don't parse them yet. with: with, order: order, limit: limit, cc: cc, }; // Substitute in any fixed values and fail if they're out of range. simplify_limit(q) } pub use clauses::{ ConjoiningClauses, }; pub use types::{ Column, ColumnAlternation, ColumnConstraint, ColumnConstraintOrAlternation, ColumnIntersection, ColumnName, ComputedTable, DatomsColumn, DatomsTable, FulltextColumn, OrderBy, QualifiedAlias, QueryValue, SourceAlias, TableAlias, VariableColumn, };