2023-06-30 16:51:03 +00:00
|
|
|
use crate::ctx::Context;
|
2023-06-19 18:41:13 +00:00
|
|
|
use crate::dbs::{Options, Transaction};
|
|
|
|
use crate::err::Error;
|
2023-09-12 15:43:32 +00:00
|
|
|
use crate::idx::planner::plan::{IndexOperator, IndexOption};
|
2023-06-21 18:31:15 +00:00
|
|
|
use crate::sql::index::Index;
|
2023-06-19 18:41:13 +00:00
|
|
|
use crate::sql::statements::DefineIndexStatement;
|
2023-10-25 10:24:04 +00:00
|
|
|
use crate::sql::{Array, Cond, Expression, Idiom, Operator, Part, Subquery, Table, Value, With};
|
2023-06-19 18:41:13 +00:00
|
|
|
use async_recursion::async_recursion;
|
2023-06-23 20:26:19 +00:00
|
|
|
use std::collections::HashMap;
|
2023-06-19 18:41:13 +00:00
|
|
|
use std::sync::Arc;
|
|
|
|
|
2023-06-21 18:31:15 +00:00
|
|
|
/// Stateless entry point of the planner tree: it owns no data and only
/// exposes the associated `build` function.
pub(super) struct Tree {}
|
2023-06-19 18:41:13 +00:00
|
|
|
|
2023-10-26 21:34:28 +00:00
|
|
|
/// Side of a binary expression on which the indexed idiom appears.
#[derive(Clone, Copy)]
enum IdiomPosition {
    /// The idiom is the left operand (`idiom <op> value`).
    Left,
    /// The idiom is the right operand (`value <op> idiom`).
    Right,
}
|
|
|
|
|
|
|
|
impl IdiomPosition {
|
|
|
|
// Reverses the operator for non commutative operators
|
|
|
|
fn transform(&self, op: &Operator) -> Operator {
|
|
|
|
match self {
|
|
|
|
IdiomPosition::Left => op.clone(),
|
|
|
|
IdiomPosition::Right => match op {
|
|
|
|
Operator::LessThan => Operator::MoreThan,
|
|
|
|
Operator::LessThanOrEqual => Operator::MoreThanOrEqual,
|
|
|
|
Operator::MoreThan => Operator::LessThan,
|
|
|
|
Operator::MoreThanOrEqual => Operator::LessThanOrEqual,
|
|
|
|
_ => op.clone(),
|
|
|
|
},
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-19 18:41:13 +00:00
|
|
|
impl Tree {
|
2023-09-12 15:43:32 +00:00
|
|
|
/// Traverse all the conditions and extract every expression
|
2023-06-23 20:26:19 +00:00
|
|
|
/// that can be resolved by an index.
|
2023-06-19 18:41:13 +00:00
|
|
|
pub(super) async fn build<'a>(
|
2023-06-30 16:51:03 +00:00
|
|
|
ctx: &'a Context<'_>,
|
2023-06-19 18:41:13 +00:00
|
|
|
opt: &'a Options,
|
|
|
|
txn: &'a Transaction,
|
|
|
|
table: &'a Table,
|
2023-07-21 18:41:36 +00:00
|
|
|
cond: &'a Option<Cond>,
|
2023-09-12 15:43:32 +00:00
|
|
|
with: &'a Option<With>,
|
|
|
|
) -> Result<Option<(Node, IndexMap, Vec<IndexRef>)>, Error> {
|
|
|
|
let with_indexes = match with {
|
|
|
|
Some(With::Index(ixs)) => Vec::with_capacity(ixs.len()),
|
|
|
|
_ => vec![],
|
|
|
|
};
|
2023-06-19 18:41:13 +00:00
|
|
|
let mut b = TreeBuilder {
|
2023-06-30 16:51:03 +00:00
|
|
|
ctx,
|
2023-06-19 18:41:13 +00:00
|
|
|
opt,
|
|
|
|
txn,
|
|
|
|
table,
|
2023-09-12 15:43:32 +00:00
|
|
|
with,
|
2023-06-19 18:41:13 +00:00
|
|
|
indexes: None,
|
2023-09-12 15:43:32 +00:00
|
|
|
index_lookup: Default::default(),
|
2023-06-19 18:41:13 +00:00
|
|
|
index_map: IndexMap::default(),
|
2023-09-12 15:43:32 +00:00
|
|
|
with_indexes,
|
2023-06-19 18:41:13 +00:00
|
|
|
};
|
|
|
|
let mut res = None;
|
|
|
|
if let Some(cond) = cond {
|
2023-09-12 15:43:32 +00:00
|
|
|
res = Some((b.eval_value(&cond.0).await?, b.index_map, b.with_indexes));
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
Ok(res)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
struct TreeBuilder<'a> {
|
2023-06-30 16:51:03 +00:00
|
|
|
ctx: &'a Context<'a>,
|
2023-06-19 18:41:13 +00:00
|
|
|
opt: &'a Options,
|
|
|
|
txn: &'a Transaction,
|
|
|
|
table: &'a Table,
|
2023-09-12 15:43:32 +00:00
|
|
|
with: &'a Option<With>,
|
2023-06-19 18:41:13 +00:00
|
|
|
indexes: Option<Arc<[DefineIndexStatement]>>,
|
2023-09-12 16:36:43 +00:00
|
|
|
index_lookup: HashMap<Idiom, Option<Arc<Vec<IndexRef>>>>,
|
2023-06-19 18:41:13 +00:00
|
|
|
index_map: IndexMap,
|
2023-09-12 15:43:32 +00:00
|
|
|
with_indexes: Vec<IndexRef>,
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
impl<'a> TreeBuilder<'a> {
|
2023-09-12 16:36:43 +00:00
|
|
|
async fn find_indexes(&mut self, i: &Idiom) -> Result<Option<Arc<Vec<IndexRef>>>, Error> {
|
|
|
|
if let Some(irs) = self.index_lookup.get(i) {
|
|
|
|
return Ok(irs.clone());
|
2023-09-12 15:43:32 +00:00
|
|
|
}
|
2023-06-19 18:41:13 +00:00
|
|
|
if self.indexes.is_none() {
|
|
|
|
let indexes = self
|
|
|
|
.txn
|
|
|
|
.clone()
|
|
|
|
.lock()
|
|
|
|
.await
|
2023-09-01 11:52:02 +00:00
|
|
|
.all_tb_indexes(self.opt.ns(), self.opt.db(), &self.table.0)
|
2023-06-19 18:41:13 +00:00
|
|
|
.await?;
|
|
|
|
self.indexes = Some(indexes);
|
|
|
|
}
|
2023-09-12 16:36:43 +00:00
|
|
|
let mut irs = Vec::new();
|
2023-06-19 18:41:13 +00:00
|
|
|
if let Some(indexes) = &self.indexes {
|
|
|
|
for ix in indexes.as_ref() {
|
|
|
|
if ix.cols.len() == 1 && ix.cols[0].eq(i) {
|
2023-09-12 16:36:43 +00:00
|
|
|
let ir = self.index_map.definitions.len() as IndexRef;
|
2023-09-12 15:43:32 +00:00
|
|
|
if let Some(With::Index(ixs)) = self.with {
|
|
|
|
if ixs.contains(&ix.name.0) {
|
|
|
|
self.with_indexes.push(ir);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
self.index_map.definitions.insert(ir, ix.clone());
|
2023-09-12 16:36:43 +00:00
|
|
|
irs.push(ir);
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2023-09-12 16:36:43 +00:00
|
|
|
let irs = if irs.is_empty() {
|
|
|
|
None
|
|
|
|
} else {
|
|
|
|
Some(Arc::new(irs))
|
|
|
|
};
|
|
|
|
self.index_lookup.insert(i.clone(), irs.clone());
|
|
|
|
Ok(irs)
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg_attr(not(target_arch = "wasm32"), async_recursion)]
|
|
|
|
#[cfg_attr(target_arch = "wasm32", async_recursion(?Send))]
|
|
|
|
async fn eval_value(&mut self, v: &Value) -> Result<Node, Error> {
|
2023-09-07 23:36:39 +00:00
|
|
|
match v {
|
|
|
|
Value::Expression(e) => self.eval_expression(e).await,
|
|
|
|
Value::Idiom(i) => self.eval_idiom(i).await,
|
2023-09-12 20:26:03 +00:00
|
|
|
Value::Strand(_) | Value::Number(_) | Value::Bool(_) | Value::Thing(_) => {
|
2023-10-26 21:34:28 +00:00
|
|
|
Ok(Node::Computed(v.to_owned()))
|
2023-09-12 20:26:03 +00:00
|
|
|
}
|
2023-10-26 21:34:28 +00:00
|
|
|
Value::Array(a) => self.eval_array(a).await,
|
2023-09-07 23:36:39 +00:00
|
|
|
Value::Subquery(s) => self.eval_subquery(s).await,
|
2023-06-30 16:51:03 +00:00
|
|
|
Value::Param(p) => {
|
2023-07-06 14:57:42 +00:00
|
|
|
let v = p.compute(self.ctx, self.opt, self.txn, None).await?;
|
2023-09-07 23:36:39 +00:00
|
|
|
self.eval_value(&v).await
|
2023-06-30 16:51:03 +00:00
|
|
|
}
|
2023-09-07 23:36:39 +00:00
|
|
|
_ => Ok(Node::Unsupported(format!("Unsupported value: {}", v))),
|
|
|
|
}
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
|
2023-10-26 21:34:28 +00:00
|
|
|
async fn eval_array(&mut self, a: &Array) -> Result<Node, Error> {
|
|
|
|
let mut values = Vec::with_capacity(a.len());
|
2023-09-12 20:26:03 +00:00
|
|
|
for v in &a.0 {
|
2023-10-26 21:34:28 +00:00
|
|
|
values.push(v.compute(self.ctx, self.opt, self.txn, None).await?);
|
2023-09-12 20:26:03 +00:00
|
|
|
}
|
2023-10-26 21:34:28 +00:00
|
|
|
Ok(Node::Computed(Value::Array(Array::from(values))))
|
2023-09-12 20:26:03 +00:00
|
|
|
}
|
|
|
|
|
2023-06-19 18:41:13 +00:00
|
|
|
async fn eval_idiom(&mut self, i: &Idiom) -> Result<Node, Error> {
|
2023-10-25 10:24:04 +00:00
|
|
|
// Compute the idiom value if it is a param
|
|
|
|
if let Some(Part::Start(x)) = i.0.first() {
|
|
|
|
if x.is_param() {
|
|
|
|
let v = i.compute(self.ctx, self.opt, self.txn, None).await?;
|
|
|
|
return self.eval_value(&v).await;
|
|
|
|
}
|
|
|
|
}
|
2023-09-12 16:36:43 +00:00
|
|
|
if let Some(irs) = self.find_indexes(i).await? {
|
|
|
|
if !irs.is_empty() {
|
|
|
|
return Ok(Node::IndexedField(i.to_owned(), irs));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(Node::NonIndexedField)
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
async fn eval_expression(&mut self, e: &Expression) -> Result<Node, Error> {
|
2023-06-20 23:31:23 +00:00
|
|
|
match e {
|
|
|
|
Expression::Unary {
|
|
|
|
..
|
2023-09-07 23:36:39 +00:00
|
|
|
} => Ok(Node::Unsupported("unary expressions not supported".to_string())),
|
2023-06-20 23:31:23 +00:00
|
|
|
Expression::Binary {
|
|
|
|
l,
|
|
|
|
o,
|
|
|
|
r,
|
|
|
|
} => {
|
|
|
|
let left = self.eval_value(l).await?;
|
|
|
|
let right = self.eval_value(r).await?;
|
2023-09-12 15:43:32 +00:00
|
|
|
if let Some(io) = self.index_map.options.get(e) {
|
2023-06-23 20:26:19 +00:00
|
|
|
return Ok(Node::Expression {
|
|
|
|
io: Some(io.clone()),
|
|
|
|
left: Box::new(left),
|
|
|
|
right: Box::new(right),
|
2023-09-12 15:43:32 +00:00
|
|
|
exp: Arc::new(e.clone()),
|
2023-06-23 20:26:19 +00:00
|
|
|
});
|
|
|
|
}
|
|
|
|
let mut io = None;
|
2023-09-12 16:36:43 +00:00
|
|
|
if let Some((id, irs)) = left.is_indexed_field() {
|
2023-10-26 21:34:28 +00:00
|
|
|
io = self.lookup_index_option(
|
|
|
|
irs.as_slice(),
|
|
|
|
o,
|
|
|
|
id,
|
|
|
|
&right,
|
|
|
|
e,
|
|
|
|
IdiomPosition::Left,
|
|
|
|
);
|
2023-09-12 16:36:43 +00:00
|
|
|
} else if let Some((id, irs)) = right.is_indexed_field() {
|
2023-10-26 21:34:28 +00:00
|
|
|
io = self.lookup_index_option(
|
|
|
|
irs.as_slice(),
|
|
|
|
o,
|
|
|
|
id,
|
|
|
|
&left,
|
|
|
|
e,
|
|
|
|
IdiomPosition::Right,
|
|
|
|
);
|
2023-06-21 18:31:15 +00:00
|
|
|
};
|
2023-06-20 23:31:23 +00:00
|
|
|
Ok(Node::Expression {
|
2023-06-23 20:26:19 +00:00
|
|
|
io,
|
2023-06-20 23:31:23 +00:00
|
|
|
left: Box::new(left),
|
|
|
|
right: Box::new(right),
|
2023-09-12 15:43:32 +00:00
|
|
|
exp: Arc::new(e.clone()),
|
2023-06-20 23:31:23 +00:00
|
|
|
})
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-21 18:31:15 +00:00
|
|
|
fn lookup_index_option(
|
|
|
|
&mut self,
|
2023-09-12 16:36:43 +00:00
|
|
|
irs: &[IndexRef],
|
2023-06-21 18:31:15 +00:00
|
|
|
op: &Operator,
|
|
|
|
id: &Idiom,
|
2023-09-12 20:26:03 +00:00
|
|
|
n: &Node,
|
2023-06-23 20:26:19 +00:00
|
|
|
e: &Expression,
|
2023-10-26 21:34:28 +00:00
|
|
|
p: IdiomPosition,
|
2023-06-21 18:31:15 +00:00
|
|
|
) -> Option<IndexOption> {
|
2023-09-12 20:26:03 +00:00
|
|
|
for ir in irs {
|
|
|
|
if let Some(ix) = self.index_map.definitions.get(ir) {
|
|
|
|
let op = match &ix.index {
|
2023-10-26 21:34:28 +00:00
|
|
|
Index::Idx => Self::eval_index_operator(op, n, p),
|
|
|
|
Index::Uniq => Self::eval_index_operator(op, n, p),
|
2023-09-12 20:26:03 +00:00
|
|
|
Index::Search {
|
|
|
|
..
|
2023-10-26 21:34:28 +00:00
|
|
|
} => Self::eval_matches_operator(op, n),
|
|
|
|
Index::MTree(_) => Self::eval_knn_operator(op, n),
|
2023-09-12 20:26:03 +00:00
|
|
|
};
|
|
|
|
if let Some(op) = op {
|
|
|
|
let io = IndexOption::new(*ir, id.clone(), op);
|
|
|
|
self.index_map.options.insert(Arc::new(e.clone()), io.clone());
|
|
|
|
return Some(io);
|
2023-06-21 18:31:15 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
None
|
|
|
|
}
|
2023-10-26 21:34:28 +00:00
|
|
|
fn eval_matches_operator(op: &Operator, n: &Node) -> Option<IndexOperator> {
|
|
|
|
if let Some(v) = n.is_computed() {
|
|
|
|
if let Operator::Matches(mr) = op {
|
|
|
|
return Some(IndexOperator::Matches(v.clone().to_raw_string(), *mr));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
None
|
|
|
|
}
|
2023-06-21 18:31:15 +00:00
|
|
|
|
2023-10-26 21:34:28 +00:00
|
|
|
fn eval_knn_operator(op: &Operator, n: &Node) -> Option<IndexOperator> {
|
|
|
|
if let Operator::Knn(k) = op {
|
|
|
|
if let Node::Computed(Value::Array(a)) = n {
|
|
|
|
return Some(IndexOperator::Knn(a.clone(), *k));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
None
|
|
|
|
}
|
|
|
|
|
|
|
|
fn eval_index_operator(op: &Operator, n: &Node, p: IdiomPosition) -> Option<IndexOperator> {
|
|
|
|
if let Some(v) = n.is_computed() {
|
|
|
|
match (op, v, p) {
|
|
|
|
(Operator::Equal, v, _) => Some(IndexOperator::Equality(v.clone())),
|
|
|
|
(Operator::Contain, v, IdiomPosition::Left) => {
|
|
|
|
Some(IndexOperator::Equality(v.clone()))
|
|
|
|
}
|
|
|
|
(Operator::ContainAny, Value::Array(a), IdiomPosition::Left) => {
|
|
|
|
Some(IndexOperator::Union(a.clone()))
|
|
|
|
}
|
|
|
|
(Operator::ContainAll, Value::Array(a), IdiomPosition::Left) => {
|
|
|
|
Some(IndexOperator::Union(a.clone()))
|
|
|
|
}
|
|
|
|
(
|
|
|
|
Operator::LessThan
|
|
|
|
| Operator::LessThanOrEqual
|
|
|
|
| Operator::MoreThan
|
|
|
|
| Operator::MoreThanOrEqual,
|
|
|
|
v,
|
|
|
|
p,
|
|
|
|
) => Some(IndexOperator::RangePart(p.transform(op), v.clone())),
|
2023-09-12 20:26:03 +00:00
|
|
|
_ => None,
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
None
|
2023-09-12 15:43:32 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-06-19 18:41:13 +00:00
|
|
|
async fn eval_subquery(&mut self, s: &Subquery) -> Result<Node, Error> {
|
2023-09-07 23:36:39 +00:00
|
|
|
match s {
|
|
|
|
Subquery::Value(v) => self.eval_value(v).await,
|
|
|
|
_ => Ok(Node::Unsupported(format!("Unsupported subquery: {}", s))),
|
|
|
|
}
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-12 15:43:32 +00:00
|
|
|
/// Numeric handle of an index definition; it is the key type of
/// `IndexMap::definitions`.
pub(super) type IndexRef = u16;
|
|
|
|
|
2023-06-23 20:26:19 +00:00
|
|
|
/// For each expression the a possible index option
|
|
|
|
#[derive(Default)]
|
2023-09-12 15:43:32 +00:00
|
|
|
pub(super) struct IndexMap {
|
|
|
|
pub(super) options: HashMap<Arc<Expression>, IndexOption>,
|
|
|
|
pub(super) definitions: HashMap<IndexRef, DefineIndexStatement>,
|
2023-06-23 20:26:19 +00:00
|
|
|
}
|
|
|
|
|
2023-06-19 18:41:13 +00:00
|
|
|
#[derive(Debug, Clone, Eq, PartialEq, Hash)]
|
|
|
|
pub(super) enum Node {
|
|
|
|
Expression {
|
2023-06-23 20:26:19 +00:00
|
|
|
io: Option<IndexOption>,
|
2023-06-19 18:41:13 +00:00
|
|
|
left: Box<Node>,
|
|
|
|
right: Box<Node>,
|
2023-09-12 15:43:32 +00:00
|
|
|
exp: Arc<Expression>,
|
2023-06-19 18:41:13 +00:00
|
|
|
},
|
2023-09-12 16:36:43 +00:00
|
|
|
IndexedField(Idiom, Arc<Vec<IndexRef>>),
|
2023-06-19 18:41:13 +00:00
|
|
|
NonIndexedField,
|
2023-10-26 21:34:28 +00:00
|
|
|
Computed(Value),
|
2023-09-07 23:36:39 +00:00
|
|
|
Unsupported(String),
|
2023-06-19 18:41:13 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
impl Node {
|
2023-10-26 21:34:28 +00:00
|
|
|
pub(super) fn is_computed(&self) -> Option<&Value> {
|
|
|
|
if let Node::Computed(v) = self {
|
2023-06-19 18:41:13 +00:00
|
|
|
Some(v)
|
|
|
|
} else {
|
|
|
|
None
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-12 16:36:43 +00:00
|
|
|
pub(super) fn is_indexed_field(&self) -> Option<(&Idiom, Arc<Vec<IndexRef>>)> {
|
|
|
|
if let Node::IndexedField(id, irs) = self {
|
|
|
|
Some((id, irs.clone()))
|
2023-06-19 18:41:13 +00:00
|
|
|
} else {
|
|
|
|
None
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|