surrealpatch/lib/src/dbs/iterator.rs

515 lines
13 KiB
Rust
Raw Normal View History

use crate::ctx::Canceller;
use crate::ctx::Context;
use crate::dbs::Options;
use crate::dbs::Statement;
use crate::dbs::Transaction;
2022-07-19 08:28:24 +00:00
use crate::dbs::LOG;
use crate::doc::Document;
2021-03-29 15:43:37 +00:00
use crate::err::Error;
2022-03-25 18:43:22 +00:00
use crate::sql::array::Array;
use crate::sql::edges::Edges;
2022-03-25 18:43:22 +00:00
use crate::sql::field::Field;
use crate::sql::range::Range;
use crate::sql::table::Table;
use crate::sql::thing::Thing;
use crate::sql::value::Value;
use async_recursion::async_recursion;
2022-03-23 11:56:39 +00:00
use std::cmp::Ordering;
2022-03-25 18:43:22 +00:00
use std::collections::BTreeMap;
use std::mem;
2022-05-30 15:32:26 +00:00
pub enum Iterable {
Value(Value),
Table(Table),
Thing(Thing),
Range(Range),
Edges(Edges),
2022-05-30 15:32:26 +00:00
Mergeable(Thing, Value),
Relatable(Thing, Thing, Thing),
}
pub enum Operable {
Value(Value),
Mergeable(Value, Value),
Relatable(Thing, Value, Thing),
}
pub enum Workable {
Normal,
Insert(Value),
Relate(Thing, Thing),
}
#[derive(Default)]
2022-02-26 23:30:19 +00:00
pub struct Iterator {
// Iterator status
run: Canceller,
// Iterator limit value
limit: Option<usize>,
// Iterator start value
start: Option<usize>,
// Iterator runtime error
error: Option<Error>,
// Iterator output results
results: Vec<Value>,
2022-05-30 15:32:26 +00:00
// Iterator input values
entries: Vec<Iterable>,
}
impl Iterator {
// Creates a new iterator
pub fn new() -> Self {
Self::default()
}
// Prepares a value for processing
2022-05-30 15:32:26 +00:00
pub fn ingest(&mut self, val: Iterable) {
self.entries.push(val)
}
// Process the records and output
pub async fn output(
&mut self,
ctx: &Context<'_>,
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
) -> Result<Value, Error> {
// Log the statement
2022-07-19 08:28:24 +00:00
trace!(target: LOG, "Iterating: {}", stm);
// Enable context override
let mut run = Context::new(ctx);
self.run = run.add_cancel();
// Process the query LIMIT clause
self.setup_limit(&run, opt, txn, stm).await?;
// Process the query START clause
self.setup_start(&run, opt, txn, stm).await?;
// Process prepared values
self.iterate(&run, opt, txn, stm).await?;
// Return any document errors
if let Some(e) = self.error.take() {
return Err(e);
}
// Process any SPLIT clause
self.output_split(ctx, opt, txn, stm).await?;
// Process any GROUP clause
self.output_group(ctx, opt, txn, stm).await?;
// Process any ORDER clause
self.output_order(ctx, opt, txn, stm).await?;
// Process any START clause
self.output_start(ctx, opt, txn, stm).await?;
// Process any LIMIT clause
self.output_limit(ctx, opt, txn, stm).await?;
2022-03-23 14:01:28 +00:00
// Process any FETCH clause
self.output_fetch(ctx, opt, txn, stm).await?;
// Output the results
Ok(mem::take(&mut self.results).into())
}
#[inline]
async fn setup_limit(
&mut self,
ctx: &Context<'_>,
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
) -> Result<(), Error> {
if let Some(v) = stm.limit() {
self.limit = Some(v.process(ctx, opt, txn, None).await?);
}
Ok(())
}
#[inline]
async fn setup_start(
&mut self,
ctx: &Context<'_>,
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
) -> Result<(), Error> {
if let Some(v) = stm.start() {
self.start = Some(v.process(ctx, opt, txn, None).await?);
}
Ok(())
}
#[inline]
2022-03-21 21:23:47 +00:00
async fn output_split(
&mut self,
ctx: &Context<'_>,
2022-03-21 21:23:47 +00:00
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
2022-03-21 21:23:47 +00:00
) -> Result<(), Error> {
if let Some(splits) = stm.split() {
2022-03-25 18:43:22 +00:00
// Loop over each split clause
for split in splits.iter() {
2022-03-21 21:23:47 +00:00
// Get the query result
let res = mem::take(&mut self.results);
// Loop over each value
for obj in &res {
// Get the value at the path
let val = obj.pick(split);
2022-03-21 21:23:47 +00:00
// Set the value at the path
match val {
Value::Array(v) => {
for val in v {
2022-03-21 21:23:47 +00:00
// Make a copy of object
let mut obj = obj.clone();
// Set the value at the path
obj.set(ctx, opt, txn, split, val).await?;
2022-03-21 21:23:47 +00:00
// Add the object to the results
self.results.push(obj);
}
}
_ => {
// Make a copy of object
let mut obj = obj.clone();
// Set the value at the path
obj.set(ctx, opt, txn, split, val).await?;
2022-03-21 21:23:47 +00:00
// Add the object to the results
self.results.push(obj);
}
}
}
}
}
2022-03-21 21:23:47 +00:00
Ok(())
}
#[inline]
2022-03-21 21:23:47 +00:00
async fn output_group(
&mut self,
ctx: &Context<'_>,
2022-03-25 18:43:22 +00:00
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
2022-03-21 21:23:47 +00:00
) -> Result<(), Error> {
if let Some(fields) = stm.expr() {
if let Some(groups) = stm.group() {
2022-03-25 18:43:22 +00:00
// Create the new grouped collection
let mut grp: BTreeMap<Array, Array> = BTreeMap::new();
// Get the query result
let res = mem::take(&mut self.results);
// Loop over each value
for obj in res {
// Create a new column set
let mut arr = Array::with_capacity(groups.len());
// Loop over each group clause
for group in groups.iter() {
// Get the value at the path
let val = obj.pick(group);
2022-03-25 18:43:22 +00:00
// Set the value at the path
arr.push(val);
2022-03-25 18:43:22 +00:00
}
// Add to grouped collection
match grp.get_mut(&arr) {
Some(v) => v.push(obj),
2022-03-25 18:43:22 +00:00
None => {
grp.insert(arr, Array::from(obj));
}
}
}
// Loop over each grouped collection
for (_, vals) in grp {
// Create a new value
let mut obj = Value::base();
// Save the collected values
let vals = Value::from(vals);
// Loop over each group clause
for field in fields.other() {
// Process it if it is a normal field
if let Field::Alone(v) = field {
match v {
Value::Function(f) if f.is_aggregate() => {
let x = vals
.all()
2022-03-25 18:43:22 +00:00
.get(ctx, opt, txn, v.to_idiom().as_ref())
.await?;
let x = f.aggregate(x).compute(ctx, opt, txn, None).await?;
obj.set(ctx, opt, txn, v.to_idiom().as_ref(), x).await?;
}
_ => {
let x = vals.first();
2022-03-25 18:43:22 +00:00
let x = v.compute(ctx, opt, txn, Some(&x)).await?;
obj.set(ctx, opt, txn, v.to_idiom().as_ref(), x).await?;
}
}
}
// Process it if it is a aliased field
if let Field::Alias(v, i) = field {
match v {
Value::Function(f) if f.is_aggregate() => {
let x = vals
.all()
.get(ctx, opt, txn, v.to_idiom().as_ref())
.await?;
2022-03-25 18:43:22 +00:00
let x = f.aggregate(x).compute(ctx, opt, txn, None).await?;
obj.set(ctx, opt, txn, i, x).await?;
}
_ => {
let x = vals.first();
let x = i.compute(ctx, opt, txn, Some(&x)).await?;
2022-03-25 18:43:22 +00:00
obj.set(ctx, opt, txn, i, x).await?;
}
}
}
}
// Add the object to the results
self.results.push(obj);
}
}
}
2022-03-21 21:23:47 +00:00
Ok(())
}
#[inline]
2022-03-21 21:23:47 +00:00
async fn output_order(
&mut self,
_ctx: &Context<'_>,
2022-03-21 21:23:47 +00:00
_opt: &Options,
_txn: &Transaction,
stm: &Statement<'_>,
2022-03-21 21:23:47 +00:00
) -> Result<(), Error> {
if let Some(orders) = stm.order() {
2022-03-25 18:43:22 +00:00
// Sort the full result set
2022-03-23 11:56:39 +00:00
self.results.sort_by(|a, b| {
2022-03-25 18:43:22 +00:00
// Loop over each order clause
for order in orders.iter() {
// Reverse the ordering if DESC
let o = match order.random {
true => {
let a = rand::random::<f64>();
let b = rand::random::<f64>();
a.partial_cmp(&b)
}
false => match order.direction {
2022-05-05 11:27:08 +00:00
true => a.compare(b, order, order.collate, order.numeric),
false => b.compare(a, order, order.collate, order.numeric),
},
2022-03-23 11:56:39 +00:00
};
//
2022-03-23 11:56:39 +00:00
match o {
Some(Ordering::Greater) => return Ordering::Greater,
Some(Ordering::Equal) => continue,
Some(Ordering::Less) => return Ordering::Less,
None => continue,
}
}
Ordering::Equal
})
}
2022-03-21 21:23:47 +00:00
Ok(())
}
2022-03-23 14:01:28 +00:00
#[inline]
async fn output_start(
&mut self,
_ctx: &Context<'_>,
2022-03-23 14:01:28 +00:00
_opt: &Options,
_txn: &Transaction,
_stm: &Statement<'_>,
2022-03-23 14:01:28 +00:00
) -> Result<(), Error> {
if let Some(v) = self.start {
self.results = mem::take(&mut self.results).into_iter().skip(v).collect();
2022-03-23 14:01:28 +00:00
}
Ok(())
}
#[inline]
async fn output_limit(
&mut self,
_ctx: &Context<'_>,
2022-03-23 14:01:28 +00:00
_opt: &Options,
_txn: &Transaction,
_stm: &Statement<'_>,
2022-03-23 14:01:28 +00:00
) -> Result<(), Error> {
if let Some(v) = self.limit {
self.results = mem::take(&mut self.results).into_iter().take(v).collect();
2022-03-23 14:01:28 +00:00
}
Ok(())
}
#[inline]
async fn output_fetch(
&mut self,
ctx: &Context<'_>,
2022-03-23 14:01:28 +00:00
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
2022-03-23 14:01:28 +00:00
) -> Result<(), Error> {
if let Some(fetchs) = stm.fetch() {
for fetch in fetchs.iter() {
// Loop over each result value
2022-03-23 14:01:28 +00:00
for obj in &mut self.results {
// Fetch the value at the path
obj.fetch(ctx, opt, txn, fetch).await?;
2022-03-23 14:01:28 +00:00
}
}
}
Ok(())
}
#[cfg(any(target_arch = "wasm32", not(feature = "parallel")))]
#[cfg_attr(feature = "parallel", async_recursion)]
#[cfg_attr(not(feature = "parallel"), async_recursion(?Send))]
async fn iterate(
&mut self,
ctx: &Context<'_>,
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
) -> Result<(), Error> {
// Prevent deep recursion
let opt = &opt.dive(4)?;
// Process all prepared values
2022-05-30 15:32:26 +00:00
for v in mem::take(&mut self.entries) {
v.iterate(ctx, opt, txn, stm, self).await?;
}
// Everything processed ok
Ok(())
}
#[cfg(all(feature = "parallel", not(target_arch = "wasm32")))]
#[cfg_attr(feature = "parallel", async_recursion)]
#[cfg_attr(not(feature = "parallel"), async_recursion(?Send))]
async fn iterate(
&mut self,
ctx: &Context<'_>,
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
) -> Result<(), Error> {
// Prevent deep recursion
let opt = &opt.dive(4)?;
// Check if iterating in parallel
match stm.parallel() {
// Run statements sequentially
false => {
// Process all prepared values
2022-05-30 15:32:26 +00:00
for v in mem::take(&mut self.entries) {
v.iterate(ctx, opt, txn, stm, self).await?;
}
// Everything processed ok
Ok(())
}
// Run statements in parallel
true => {
// Create a new executor
let exe = executor::Executor::new();
// Take all of the iterator values
2022-05-30 15:32:26 +00:00
let vals = mem::take(&mut self.entries);
// Create a channel to shutdown
let (end, exit) = channel::bounded::<()>(1);
// Create an unbounded channel
let (chn, docs) = channel::bounded(crate::cnf::MAX_CONCURRENT_TASKS);
// Create an async closure for prepared values
let adocs = async {
2022-02-23 13:56:09 +00:00
// Process all prepared values
for v in vals {
exe.spawn(v.channel(ctx, opt, txn, stm, chn.clone()))
// Ensure we detach the spawned task
.detach();
2022-02-23 13:56:09 +00:00
}
// Drop the uncloned channel instance
drop(chn);
2022-02-26 23:30:19 +00:00
};
// Create an unbounded channel
let (chn, vals) = channel::bounded(crate::cnf::MAX_CONCURRENT_TASKS);
// Create an async closure for received values
let avals = async {
2022-02-26 23:30:19 +00:00
// Process all received values
while let Ok((k, v)) = docs.recv().await {
exe.spawn(Document::compute(ctx, opt, txn, stm, chn.clone(), k, v))
// Ensure we detach the spawned task
.detach();
}
// Drop the uncloned channel instance
drop(chn);
2022-02-23 13:56:09 +00:00
};
// Create an async closure to process results
let aproc = async {
// Process all processed values
while let Ok(r) = vals.recv().await {
self.result(r, stm);
}
// Shutdown the executor
let _ = end.send(()).await;
};
// Run all executor tasks
let fut = exe.run(exit.recv());
// Wait for all closures
let res = futures::join!(adocs, avals, aproc, fut);
// Consume executor error
let _ = res.3;
// Everything processed ok
Ok(())
}
}
}
2022-02-23 13:56:09 +00:00
// Process a new record Thing and Value
pub async fn process(
&mut self,
ctx: &Context<'_>,
opt: &Options,
txn: &Transaction,
stm: &Statement<'_>,
thg: Option<Thing>,
2022-05-30 15:32:26 +00:00
val: Operable,
) {
// Check current context
if ctx.is_done() {
return;
}
2022-05-30 15:32:26 +00:00
// Setup a new workable
let val = match val {
Operable::Value(v) => (v, Workable::Normal),
Operable::Mergeable(v, o) => (v, Workable::Insert(o)),
Operable::Relatable(f, v, w) => (v, Workable::Relate(f, w)),
};
// Setup a new document
2022-05-30 15:32:26 +00:00
let mut doc = Document::new(thg, &val.0, val.1);
// Process the document
let res = match stm {
Statement::Select(_) => doc.select(ctx, opt, txn, stm).await,
Statement::Create(_) => doc.create(ctx, opt, txn, stm).await,
Statement::Update(_) => doc.update(ctx, opt, txn, stm).await,
Statement::Relate(_) => doc.relate(ctx, opt, txn, stm).await,
Statement::Delete(_) => doc.delete(ctx, opt, txn, stm).await,
Statement::Insert(_) => doc.insert(ctx, opt, txn, stm).await,
};
2022-02-23 13:56:09 +00:00
// Process the result
self.result(res, stm);
2022-02-23 13:56:09 +00:00
}
2022-02-23 13:56:09 +00:00
// Accept a processed record result
fn result(&mut self, res: Result<Value, Error>, stm: &Statement<'_>) {
// Process the result
match res {
Err(Error::Ignore) => {
return;
}
Err(e) => {
self.error = Some(e);
self.run.cancel();
return;
}
Ok(v) => self.results.push(v),
}
// Check if we can exit
if stm.group().is_none() && stm.order().is_none() {
if let Some(l) = self.limit {
if let Some(s) = self.start {
if self.results.len() == l + s {
self.run.cancel()
}
} else if self.results.len() == l {
self.run.cancel()
}
}
}
2021-03-29 15:43:37 +00:00
}
}