2022-01-16 20:31:50 +00:00
|
|
|
use crate::sql::error::IResult;
|
2021-05-22 18:13:53 +00:00
|
|
|
use nom::bytes::complete::escaped;
|
2020-06-29 15:36:01 +00:00
|
|
|
use nom::bytes::complete::is_not;
|
2022-09-24 08:11:38 +00:00
|
|
|
use nom::character::complete::anychar;
|
2022-03-16 23:52:25 +00:00
|
|
|
use nom::character::complete::char;
|
2023-04-23 11:55:18 +00:00
|
|
|
use serde::{
|
|
|
|
de::{self, Visitor},
|
|
|
|
Deserialize, Deserializer, Serialize, Serializer,
|
|
|
|
};
|
|
|
|
use std::cmp::Ordering;
|
|
|
|
use std::fmt::Debug;
|
|
|
|
use std::fmt::{self, Display, Formatter};
|
|
|
|
use std::hash::{Hash, Hasher};
|
2020-06-29 15:36:01 +00:00
|
|
|
use std::str;
|
2023-04-23 11:55:18 +00:00
|
|
|
use std::str::FromStr;
|
2020-06-29 15:36:01 +00:00
|
|
|
|
2023-03-30 10:41:44 +00:00
|
|
|
/// Struct name handed to `Serializer::serialize_newtype_struct` when a
/// [`Regex`] is serialized in this file.
pub(crate) const TOKEN: &str = "$surrealdb::private::sql::Regex";
|
|
|
|
|
2023-04-23 11:55:18 +00:00
|
|
|
/// A regular expression value wrapping a compiled `regex::Regex`.
///
/// Equality, ordering and hashing in this file are all defined on the
/// pattern's source string (`as_str()`), and `Display` renders the pattern
/// surrounded by `/` delimiters.
#[derive(Clone)]
|
|
|
|
pub struct Regex(pub(super) regex::Regex);
|
2020-06-29 15:36:01 +00:00
|
|
|
|
2023-04-23 11:55:18 +00:00
|
|
|
impl Regex {
|
|
|
|
// Deref would expose `regex::Regex::as_str` which wouldn't have the '/' delimiters.
|
|
|
|
pub fn regex(&self) -> ®ex::Regex {
|
|
|
|
&self.0
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-04-23 11:55:18 +00:00
|
|
|
impl FromStr for Regex {
|
|
|
|
type Err = <regex::Regex as FromStr>::Err;
|
|
|
|
|
|
|
|
fn from_str(s: &str) -> Result<Self, Self::Err> {
|
2023-05-09 17:48:14 +00:00
|
|
|
if s.contains('\0') {
|
|
|
|
Err(regex::Error::Syntax("regex contained NUL byte".to_owned()))
|
|
|
|
} else {
|
|
|
|
regex::Regex::new(&s.replace("\\/", "/")).map(Self)
|
|
|
|
}
|
2021-03-29 15:43:37 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-04-23 11:55:18 +00:00
|
|
|
impl PartialEq for Regex {
|
|
|
|
fn eq(&self, other: &Self) -> bool {
|
|
|
|
self.0.as_str().eq(other.0.as_str())
|
2021-03-29 15:43:37 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-04-23 11:55:18 +00:00
|
|
|
// Marker impl: equality for `Regex` is plain string equality on the pattern
// source, so it is a full equivalence relation.
impl Eq for Regex {}
|
|
|
|
|
|
|
|
impl Ord for Regex {
|
|
|
|
fn cmp(&self, other: &Self) -> Ordering {
|
|
|
|
self.0.as_str().cmp(other.0.as_str())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl PartialOrd for Regex {
|
|
|
|
fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
|
|
|
|
Some(self.cmp(other))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Hash for Regex {
|
|
|
|
fn hash<H: Hasher>(&self, state: &mut H) {
|
|
|
|
self.0.as_str().hash(state);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Debug for Regex {
|
|
|
|
fn fmt(&self, f: &mut Formatter) -> fmt::Result {
|
|
|
|
Display::fmt(self, f)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Display for Regex {
|
|
|
|
fn fmt(&self, f: &mut Formatter) -> fmt::Result {
|
|
|
|
write!(f, "/{}/", &self.0)
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-03-30 10:41:44 +00:00
|
|
|
impl Serialize for Regex {
|
|
|
|
fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
|
|
|
|
where
|
2023-04-23 11:55:18 +00:00
|
|
|
S: Serializer,
|
2023-03-30 10:41:44 +00:00
|
|
|
{
|
2023-04-29 15:58:22 +00:00
|
|
|
serializer.serialize_newtype_struct(TOKEN, self.0.as_str())
|
2023-03-30 10:41:44 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-04-23 11:55:18 +00:00
|
|
|
impl<'de> Deserialize<'de> for Regex {
|
|
|
|
fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
|
|
|
|
where
|
|
|
|
D: Deserializer<'de>,
|
|
|
|
{
|
|
|
|
struct RegexVisitor;
|
|
|
|
|
|
|
|
impl<'de> Visitor<'de> for RegexVisitor {
|
|
|
|
type Value = Regex;
|
|
|
|
|
|
|
|
fn expecting(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
|
|
|
|
formatter.write_str("a regex str")
|
|
|
|
}
|
|
|
|
|
|
|
|
fn visit_str<E>(self, value: &str) -> Result<Self::Value, E>
|
|
|
|
where
|
|
|
|
E: de::Error,
|
|
|
|
{
|
|
|
|
Regex::from_str(value).map_err(|_| de::Error::custom("invalid regex"))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
deserializer.deserialize_str(RegexVisitor)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-29 15:36:01 +00:00
|
|
|
pub fn regex(i: &str) -> IResult<&str, Regex> {
|
2022-03-16 23:52:25 +00:00
|
|
|
let (i, _) = char('/')(i)?;
|
2022-09-24 08:11:38 +00:00
|
|
|
let (i, v) = escaped(is_not("\\/"), '\\', anychar)(i)?;
|
2022-03-16 23:52:25 +00:00
|
|
|
let (i, _) = char('/')(i)?;
|
2023-04-23 11:55:18 +00:00
|
|
|
let regex = v.parse().map_err(|_| nom::Err::Error(crate::sql::Error::Parser(v)))?;
|
|
|
|
Ok((i, regex))
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(test)]
mod tests {

    use super::*;

    /// A plain literal parses, displays with delimiters, and equals the
    /// regex obtained by parsing the bare pattern.
    #[test]
    fn regex_simple() {
        let parsed = regex("/test/");
        assert!(parsed.is_ok());
        let (_, out) = parsed.unwrap();
        assert_eq!("/test/", out.to_string());
        assert_eq!(out, "test".parse().unwrap());
    }

    /// Escaped slashes inside the literal are unescaped in the stored
    /// pattern, while other escapes are kept.
    #[test]
    fn regex_complex() {
        let parsed = regex(r"/(?i)test\/[a-z]+\/\s\d\w{1}.*/");
        assert!(parsed.is_ok());
        let (_, out) = parsed.unwrap();
        assert_eq!(r"/(?i)test/[a-z]+/\s\d\w{1}.*/", out.to_string());
        assert_eq!(out, r"(?i)test/[a-z]+/\s\d\w{1}.*".parse().unwrap());
    }
}
|