19fc7cddf1
* Part 1: define ValueTypeSet. We're going to use this instead of `HashSet<ValueType>` so that we can clearly express the empty set and the set of all types, and also to encapsulate a switch to `EnumSet`." * Part 2: use ValueTypeSet. * Part 3: fix type expansion. * Part 4: add a test for type extraction from nested `or`. * Review comments. * Review comments: simplify ValueTypeSet.
222 lines
7.1 KiB
Rust
222 lines
7.1 KiB
Rust
// Copyright 2016 Mozilla
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use
|
|
// this file except in compliance with the License. You may obtain a copy of the
|
|
// License at http://www.apache.org/licenses/LICENSE-2.0
|
|
// Unless required by applicable law or agreed to in writing, software distributed
|
|
// under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
|
|
// CONDITIONS OF ANY KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations under the License.
|
|
|
|
extern crate enum_set;
|
|
|
|
#[macro_use]
|
|
extern crate error_chain;
|
|
|
|
extern crate mentat_core;
|
|
extern crate mentat_query;
|
|
|
|
use std::collections::BTreeSet;
|
|
use std::ops::Sub;
|
|
|
|
mod errors;
|
|
mod types;
|
|
mod validate;
|
|
mod clauses;
|
|
|
|
use mentat_core::{
|
|
Schema,
|
|
TypedValue,
|
|
ValueType,
|
|
};
|
|
|
|
use mentat_core::counter::RcCounter;
|
|
|
|
use mentat_query::{
|
|
FindQuery,
|
|
FindSpec,
|
|
Limit,
|
|
Order,
|
|
SrcVar,
|
|
Variable,
|
|
};
|
|
|
|
pub use errors::{
|
|
Error,
|
|
ErrorKind,
|
|
Result,
|
|
};
|
|
|
|
pub use clauses::{
|
|
QueryInputs,
|
|
};
|
|
|
|
#[allow(dead_code)]
|
|
pub struct AlgebraicQuery {
|
|
default_source: SrcVar,
|
|
pub find_spec: FindSpec,
|
|
has_aggregates: bool,
|
|
pub with: BTreeSet<Variable>,
|
|
pub order: Option<Vec<OrderBy>>,
|
|
pub limit: Limit,
|
|
pub cc: clauses::ConjoiningClauses,
|
|
}
|
|
|
|
impl AlgebraicQuery {
|
|
#[inline]
|
|
pub fn is_known_empty(&self) -> bool {
|
|
self.cc.is_known_empty()
|
|
}
|
|
|
|
/// Return a set of the input variables mentioned in the `:in` clause that have not yet been
|
|
/// bound. We do this by looking at the CC.
|
|
pub fn unbound_variables(&self) -> BTreeSet<Variable> {
|
|
self.cc.input_variables.sub(&self.cc.value_bound_variables())
|
|
}
|
|
}
|
|
|
|
pub fn algebrize_with_counter(schema: &Schema, parsed: FindQuery, counter: usize) -> Result<AlgebraicQuery> {
|
|
algebrize_with_inputs(schema, parsed, counter, QueryInputs::default())
|
|
}
|
|
|
|
pub fn algebrize(schema: &Schema, parsed: FindQuery) -> Result<AlgebraicQuery> {
|
|
algebrize_with_inputs(schema, parsed, 0, QueryInputs::default())
|
|
}
|
|
|
|
/// Take an ordering list. Any variables that aren't fixed by the query are used to produce
|
|
/// a vector of `OrderBy` instances, including type comparisons if necessary. This function also
|
|
/// returns a set of variables that should be added to the `with` clause to make the ordering
|
|
/// clauses possible.
|
|
fn validate_and_simplify_order(cc: &ConjoiningClauses, order: Option<Vec<Order>>)
|
|
-> Result<(Option<Vec<OrderBy>>, BTreeSet<Variable>)> {
|
|
match order {
|
|
None => Ok((None, BTreeSet::default())),
|
|
Some(order) => {
|
|
let mut order_bys: Vec<OrderBy> = Vec::with_capacity(order.len() * 2); // Space for tags.
|
|
let mut vars: BTreeSet<Variable> = BTreeSet::default();
|
|
|
|
for Order(direction, var) in order.into_iter() {
|
|
// Eliminate any ordering clauses that are bound to fixed values.
|
|
if cc.bound_value(&var).is_some() {
|
|
continue;
|
|
}
|
|
|
|
// Fail if the var isn't bound by the query.
|
|
if !cc.column_bindings.contains_key(&var) {
|
|
bail!(ErrorKind::UnboundVariable(var.name()));
|
|
}
|
|
|
|
// Otherwise, determine if we also need to order by type…
|
|
if cc.known_type(&var).is_none() {
|
|
order_bys.push(OrderBy(direction.clone(), VariableColumn::VariableTypeTag(var.clone())));
|
|
}
|
|
order_bys.push(OrderBy(direction, VariableColumn::Variable(var.clone())));
|
|
vars.insert(var.clone());
|
|
}
|
|
|
|
Ok((if order_bys.is_empty() { None } else { Some(order_bys) }, vars))
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
fn simplify_limit(mut query: AlgebraicQuery) -> Result<AlgebraicQuery> {
|
|
// Unpack any limit variables in place.
|
|
let refined_limit =
|
|
match query.limit {
|
|
Limit::Variable(ref v) => {
|
|
match query.cc.bound_value(v) {
|
|
Some(TypedValue::Long(n)) => {
|
|
if n <= 0 {
|
|
// User-specified limits should always be natural numbers (> 0).
|
|
bail!(ErrorKind::InvalidLimit(n.to_string(), ValueType::Long));
|
|
} else {
|
|
Some(Limit::Fixed(n as u64))
|
|
}
|
|
},
|
|
Some(val) => {
|
|
// Same.
|
|
bail!(ErrorKind::InvalidLimit(format!("{:?}", val), val.value_type()));
|
|
},
|
|
None => {
|
|
// We know that the limit variable is mentioned in `:in`.
|
|
// That it's not bound here implies that we haven't got all the variables
|
|
// we'll need to run the query yet.
|
|
// (We should never hit this in `q_once`.)
|
|
// Simply pass the `Limit` through to `SelectQuery` untouched.
|
|
None
|
|
},
|
|
}
|
|
},
|
|
Limit::None => None,
|
|
Limit::Fixed(_) => None,
|
|
};
|
|
|
|
if let Some(lim) = refined_limit {
|
|
query.limit = lim;
|
|
}
|
|
Ok(query)
|
|
}
|
|
|
|
pub fn algebrize_with_inputs(schema: &Schema,
|
|
parsed: FindQuery,
|
|
counter: usize,
|
|
inputs: QueryInputs) -> Result<AlgebraicQuery> {
|
|
let alias_counter = RcCounter::with_initial(counter);
|
|
let mut cc = ConjoiningClauses::with_inputs_and_alias_counter(parsed.in_vars, inputs, alias_counter);
|
|
|
|
// Do we have a variable limit? If so, tell the CC that the var must be numeric.
|
|
if let &Limit::Variable(ref var) = &parsed.limit {
|
|
cc.constrain_var_to_long(var.clone());
|
|
}
|
|
|
|
// TODO: integrate default source into pattern processing.
|
|
// TODO: flesh out the rest of find-into-context.
|
|
let where_clauses = parsed.where_clauses;
|
|
for where_clause in where_clauses {
|
|
cc.apply_clause(schema, where_clause)?;
|
|
}
|
|
cc.expand_column_bindings();
|
|
cc.prune_extracted_types();
|
|
|
|
let (order, extra_vars) = validate_and_simplify_order(&cc, parsed.order)?;
|
|
let with: BTreeSet<Variable> = parsed.with.into_iter().chain(extra_vars.into_iter()).collect();
|
|
|
|
// This might leave us with an unused `:in` variable.
|
|
let limit = if parsed.find_spec.is_unit_limited() { Limit::Fixed(1) } else { parsed.limit };
|
|
let q = AlgebraicQuery {
|
|
default_source: parsed.default_source,
|
|
find_spec: parsed.find_spec,
|
|
has_aggregates: false, // TODO: we don't parse them yet.
|
|
with: with,
|
|
order: order,
|
|
limit: limit,
|
|
cc: cc,
|
|
};
|
|
|
|
// Substitute in any fixed values and fail if they're out of range.
|
|
simplify_limit(q)
|
|
}
|
|
|
|
pub use clauses::{
|
|
ConjoiningClauses,
|
|
};
|
|
|
|
pub use types::{
|
|
Column,
|
|
ColumnAlternation,
|
|
ColumnConstraint,
|
|
ColumnConstraintOrAlternation,
|
|
ColumnIntersection,
|
|
ColumnName,
|
|
ComputedTable,
|
|
DatomsColumn,
|
|
DatomsTable,
|
|
OrderBy,
|
|
QualifiedAlias,
|
|
QueryValue,
|
|
SourceAlias,
|
|
TableAlias,
|
|
VariableColumn,
|
|
};
|
|
|