2023-12-12 13:51:43 +00:00
|
|
|
use crate::ctx::Context;
|
|
|
|
use crate::dbs::{Options, Transaction};
|
|
|
|
use crate::doc::CursorDoc;
|
|
|
|
use crate::err::Error;
|
|
|
|
use crate::sql::value::Value;
|
2023-11-18 13:56:13 +00:00
|
|
|
use derive::Store;
|
|
|
|
use revision::revisioned;
|
|
|
|
use serde::{Deserialize, Serialize};
|
|
|
|
use std::fmt;
|
2022-05-30 15:05:05 +00:00
|
|
|
|
2024-02-09 19:31:16 +00:00
|
|
|
#[cfg(any(feature = "ml", feature = "ml2"))]
|
2023-12-12 13:51:43 +00:00
|
|
|
use crate::iam::Action;
|
2024-02-09 19:31:16 +00:00
|
|
|
#[cfg(any(feature = "ml", feature = "ml2"))]
|
|
|
|
use crate::ml::execution::compute::ModelComputation;
|
|
|
|
#[cfg(any(feature = "ml", feature = "ml2"))]
|
|
|
|
use crate::ml::storage::surml_file::SurMlFile;
|
|
|
|
#[cfg(any(feature = "ml", feature = "ml2"))]
|
2023-12-12 13:51:43 +00:00
|
|
|
use crate::sql::Permission;
|
2024-02-09 19:31:16 +00:00
|
|
|
#[cfg(any(feature = "ml", feature = "ml2"))]
|
2023-12-12 13:51:43 +00:00
|
|
|
use futures::future::try_join_all;
|
2024-02-09 19:31:16 +00:00
|
|
|
#[cfg(any(feature = "ml", feature = "ml2"))]
|
2023-12-12 13:51:43 +00:00
|
|
|
use std::collections::HashMap;
|
|
|
|
|
2024-02-09 19:31:16 +00:00
|
|
|
#[cfg(any(feature = "ml", feature = "ml2"))]
|
2023-12-12 13:51:43 +00:00
|
|
|
/// Message attached to every `Error::InvalidArguments` raised by `Model::compute`
/// when the call does not supply exactly one number, object, or array argument.
const ARGUMENTS: &str = "The model expects 1 argument. The argument can be either a number, an object, or an array of numbers.";
|
|
|
|
|
2023-09-13 06:06:28 +00:00
|
|
|
#[derive(Clone, Debug, Default, PartialEq, PartialOrd, Serialize, Deserialize, Store, Hash)]
|
2024-01-09 15:34:52 +00:00
|
|
|
#[cfg_attr(feature = "arbitrary", derive(arbitrary::Arbitrary))]
|
2023-08-17 18:03:46 +00:00
|
|
|
#[revisioned(revision = 1)]
|
2023-09-13 06:06:28 +00:00
|
|
|
pub struct Model {
|
|
|
|
pub name: String,
|
|
|
|
pub version: String,
|
2023-10-25 11:38:03 +00:00
|
|
|
pub args: Vec<Value>,
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
|
2023-09-13 06:06:28 +00:00
|
|
|
impl fmt::Display for Model {
|
|
|
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
2023-10-25 11:38:03 +00:00
|
|
|
write!(f, "ml::{}<{}>(", self.name, self.version)?;
|
|
|
|
for (idx, p) in self.args.iter().enumerate() {
|
|
|
|
if idx != 0 {
|
|
|
|
write!(f, ",")?;
|
|
|
|
}
|
|
|
|
write!(f, "{}", p)?;
|
|
|
|
}
|
|
|
|
write!(f, ")")
|
2022-05-30 15:05:05 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-13 06:06:28 +00:00
|
|
|
impl Model {
|
2024-02-09 19:31:16 +00:00
|
|
|
#[cfg(any(feature = "ml", feature = "ml2"))]
|
2023-12-12 13:51:43 +00:00
|
|
|
pub(crate) async fn compute(
|
|
|
|
&self,
|
|
|
|
ctx: &Context<'_>,
|
|
|
|
opt: &Options,
|
|
|
|
txn: &Transaction,
|
|
|
|
doc: Option<&CursorDoc<'_>>,
|
|
|
|
) -> Result<Value, Error> {
|
|
|
|
// Ensure futures are run
|
|
|
|
let opt = &opt.new_with_futures(true);
|
|
|
|
// Get the full name of this model
|
|
|
|
let name = format!("ml::{}", self.name);
|
|
|
|
// Check this function is allowed
|
|
|
|
ctx.check_allowed_function(name.as_str())?;
|
|
|
|
// Get the model definition
|
|
|
|
let val = {
|
|
|
|
// Claim transaction
|
|
|
|
let mut run = txn.lock().await;
|
|
|
|
// Get the function definition
|
|
|
|
run.get_and_cache_db_model(opt.ns(), opt.db(), &self.name, &self.version).await?
|
|
|
|
};
|
|
|
|
// Calculate the model path
|
|
|
|
let path = format!(
|
|
|
|
"ml/{}/{}/{}-{}-{}.surml",
|
|
|
|
opt.ns(),
|
|
|
|
opt.db(),
|
|
|
|
self.name,
|
|
|
|
self.version,
|
|
|
|
val.hash
|
|
|
|
);
|
|
|
|
// Check permissions
|
|
|
|
if opt.check_perms(Action::View) {
|
|
|
|
match &val.permissions {
|
|
|
|
Permission::Full => (),
|
|
|
|
Permission::None => {
|
|
|
|
return Err(Error::FunctionPermissions {
|
|
|
|
name: self.name.to_owned(),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
Permission::Specific(e) => {
|
|
|
|
// Disable permissions
|
|
|
|
let opt = &opt.new_with_perms(false);
|
|
|
|
// Process the PERMISSION clause
|
|
|
|
if !e.compute(ctx, opt, txn, doc).await?.is_truthy() {
|
|
|
|
return Err(Error::FunctionPermissions {
|
|
|
|
name: self.name.to_owned(),
|
|
|
|
});
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Compute the function arguments
|
|
|
|
let mut args =
|
|
|
|
try_join_all(self.args.iter().map(|v| v.compute(ctx, opt, txn, doc))).await?;
|
|
|
|
// Check the minimum argument length
|
|
|
|
if args.len() != 1 {
|
|
|
|
return Err(Error::InvalidArguments {
|
|
|
|
name: format!("ml::{}<{}>", self.name, self.version),
|
|
|
|
message: ARGUMENTS.into(),
|
|
|
|
});
|
|
|
|
}
|
|
|
|
// Take the first and only specified argument
|
|
|
|
match args.swap_remove(0) {
|
|
|
|
// Perform bufferered compute
|
|
|
|
Value::Object(v) => {
|
|
|
|
// Compute the model function arguments
|
|
|
|
let mut args = v
|
|
|
|
.into_iter()
|
|
|
|
.map(|(k, v)| Ok((k, Value::try_into(v)?)))
|
|
|
|
.collect::<Result<HashMap<String, f32>, Error>>()
|
|
|
|
.map_err(|_| Error::InvalidArguments {
|
|
|
|
name: format!("ml::{}<{}>", self.name, self.version),
|
|
|
|
message: ARGUMENTS.into(),
|
|
|
|
})?;
|
|
|
|
// Get the model file as bytes
|
|
|
|
let bytes = crate::obs::get(&path).await?;
|
|
|
|
// Run the compute in a blocking task
|
|
|
|
let outcome = tokio::task::spawn_blocking(move || {
|
|
|
|
let mut file = SurMlFile::from_bytes(bytes).unwrap();
|
|
|
|
let compute_unit = ModelComputation {
|
|
|
|
surml_file: &mut file,
|
|
|
|
};
|
|
|
|
compute_unit.buffered_compute(&mut args).map_err(Error::ModelComputation)
|
|
|
|
})
|
|
|
|
.await
|
|
|
|
.unwrap()?;
|
|
|
|
// Convert the output to a value
|
|
|
|
Ok(outcome[0].into())
|
|
|
|
}
|
|
|
|
// Perform raw compute
|
|
|
|
Value::Number(v) => {
|
|
|
|
// Compute the model function arguments
|
|
|
|
let args: f32 = v.try_into().map_err(|_| Error::InvalidArguments {
|
|
|
|
name: format!("ml::{}<{}>", self.name, self.version),
|
|
|
|
message: ARGUMENTS.into(),
|
|
|
|
})?;
|
|
|
|
// Get the model file as bytes
|
|
|
|
let bytes = crate::obs::get(&path).await?;
|
|
|
|
// Convert the argument to a tensor
|
|
|
|
let tensor = ndarray::arr1::<f32>(&[args]).into_dyn();
|
|
|
|
// Run the compute in a blocking task
|
|
|
|
let outcome = tokio::task::spawn_blocking(move || {
|
|
|
|
let mut file = SurMlFile::from_bytes(bytes).unwrap();
|
|
|
|
let compute_unit = ModelComputation {
|
|
|
|
surml_file: &mut file,
|
|
|
|
};
|
|
|
|
compute_unit.raw_compute(tensor, None).map_err(Error::ModelComputation)
|
|
|
|
})
|
|
|
|
.await
|
|
|
|
.unwrap()?;
|
|
|
|
// Convert the output to a value
|
|
|
|
Ok(outcome[0].into())
|
|
|
|
}
|
|
|
|
// Perform raw compute
|
|
|
|
Value::Array(v) => {
|
|
|
|
// Compute the model function arguments
|
|
|
|
let args = v
|
|
|
|
.into_iter()
|
|
|
|
.map(Value::try_into)
|
|
|
|
.collect::<Result<Vec<f32>, Error>>()
|
|
|
|
.map_err(|_| Error::InvalidArguments {
|
|
|
|
name: format!("ml::{}<{}>", self.name, self.version),
|
|
|
|
message: ARGUMENTS.into(),
|
|
|
|
})?;
|
|
|
|
// Get the model file as bytes
|
|
|
|
let bytes = crate::obs::get(&path).await?;
|
|
|
|
// Convert the argument to a tensor
|
|
|
|
let tensor = ndarray::arr1::<f32>(&args).into_dyn();
|
|
|
|
// Run the compute in a blocking task
|
|
|
|
let outcome = tokio::task::spawn_blocking(move || {
|
|
|
|
let mut file = SurMlFile::from_bytes(bytes).unwrap();
|
|
|
|
let compute_unit = ModelComputation {
|
|
|
|
surml_file: &mut file,
|
|
|
|
};
|
|
|
|
compute_unit.raw_compute(tensor, None).map_err(Error::ModelComputation)
|
|
|
|
})
|
|
|
|
.await
|
|
|
|
.unwrap()?;
|
|
|
|
// Convert the output to a value
|
|
|
|
Ok(outcome[0].into())
|
|
|
|
}
|
|
|
|
//
|
|
|
|
_ => Err(Error::InvalidArguments {
|
|
|
|
name: format!("ml::{}<{}>", self.name, self.version),
|
|
|
|
message: ARGUMENTS.into(),
|
|
|
|
}),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-02-09 19:31:16 +00:00
|
|
|
#[cfg(not(any(feature = "ml", feature = "ml2")))]
|
2023-09-13 06:06:28 +00:00
|
|
|
pub(crate) async fn compute(
|
|
|
|
&self,
|
|
|
|
_ctx: &Context<'_>,
|
|
|
|
_opt: &Options,
|
|
|
|
_txn: &Transaction,
|
2023-12-12 13:51:43 +00:00
|
|
|
_doc: Option<&CursorDoc<'_>>,
|
2023-09-13 06:06:28 +00:00
|
|
|
) -> Result<Value, Error> {
|
2023-12-12 13:51:43 +00:00
|
|
|
Err(Error::InvalidModel {
|
|
|
|
message: String::from("Machine learning computation is not enabled."),
|
|
|
|
})
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
}
|