2022-01-16 20:31:50 +00:00
|
|
|
use crate::sql::error::IResult;
|
2022-05-15 08:34:29 +00:00
|
|
|
use crate::sql::escape::escape_strand;
|
2022-05-21 00:35:59 +00:00
|
|
|
use crate::sql::serde::is_internal_serialization;
|
2020-06-29 15:36:01 +00:00
|
|
|
use nom::branch::alt;
|
2022-09-26 00:23:57 +00:00
|
|
|
use nom::bytes::complete::escaped_transform;
|
2020-06-29 15:36:01 +00:00
|
|
|
use nom::bytes::complete::is_not;
|
2022-09-26 00:23:57 +00:00
|
|
|
use nom::bytes::complete::take_while_m_n;
|
|
|
|
use nom::character::complete::char;
|
|
|
|
use nom::combinator::value;
|
2020-06-29 15:36:01 +00:00
|
|
|
use serde::{Deserialize, Serialize};
|
|
|
|
use std::fmt;
|
2022-01-13 17:36:41 +00:00
|
|
|
use std::ops;
|
2022-05-05 04:30:32 +00:00
|
|
|
use std::ops::Deref;
|
2020-06-29 15:36:01 +00:00
|
|
|
use std::str;
|
|
|
|
|
2022-09-26 00:23:57 +00:00
|
|
|
// Quote characters which delimit a strand.

/// The single-quote character that opens and closes a single-quoted strand.
const SINGLE: char = '\'';

/// The double-quote character that opens and closes a double-quoted strand.
const DOUBLE: char = '"';

// Character sets handed to `is_not` while reading the body of a strand.

/// The backslash and the single quote: either one ends a run of plain text
/// inside a single-quoted strand.
const SINGLE_ESC: &str = r#"\'"#;

/// The backslash and the double quote: either one ends a run of plain text
/// inside a double-quoted strand.
const DOUBLE_ESC: &str = r#"\""#;
|
|
|
|
|
2021-03-29 15:43:37 +00:00
|
|
|
#[derive(Clone, Debug, Default, Eq, PartialEq, PartialOrd, Deserialize)]
|
2022-05-05 04:30:32 +00:00
|
|
|
pub struct Strand(pub String);
|
2020-06-29 15:36:01 +00:00
|
|
|
|
2021-03-29 15:43:37 +00:00
|
|
|
impl From<String> for Strand {
|
|
|
|
fn from(s: String) -> Self {
|
2022-05-05 04:30:32 +00:00
|
|
|
Strand(s)
|
2021-03-29 15:43:37 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-05-25 09:42:10 +00:00
|
|
|
impl From<&str> for Strand {
|
2020-06-29 15:36:01 +00:00
|
|
|
fn from(s: &str) -> Self {
|
2022-05-05 04:30:32 +00:00
|
|
|
Strand(String::from(s))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Deref for Strand {
|
|
|
|
type Target = String;
|
|
|
|
fn deref(&self) -> &Self::Target {
|
|
|
|
&self.0
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-01-13 17:36:41 +00:00
|
|
|
impl Strand {
|
|
|
|
pub fn as_str(&self) -> &str {
|
2022-05-05 04:30:32 +00:00
|
|
|
self.0.as_str()
|
|
|
|
}
|
|
|
|
pub fn as_string(self) -> String {
|
|
|
|
self.0
|
2022-01-13 17:36:41 +00:00
|
|
|
}
|
2022-07-04 01:03:26 +00:00
|
|
|
pub fn to_raw(self) -> String {
|
|
|
|
self.0
|
|
|
|
}
|
2022-01-13 17:36:41 +00:00
|
|
|
}
|
|
|
|
|
2020-06-29 15:36:01 +00:00
|
|
|
impl fmt::Display for Strand {
|
|
|
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
2022-05-15 08:34:29 +00:00
|
|
|
write!(f, "{}", escape_strand(&self.0))
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-29 15:43:37 +00:00
|
|
|
impl Serialize for Strand {
|
|
|
|
fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
|
|
|
|
where
|
|
|
|
S: serde::Serializer,
|
|
|
|
{
|
2022-05-21 00:35:59 +00:00
|
|
|
if is_internal_serialization() {
|
2022-05-05 04:30:32 +00:00
|
|
|
serializer.serialize_newtype_struct("Strand", &self.0)
|
2022-05-21 00:35:59 +00:00
|
|
|
} else {
|
|
|
|
serializer.serialize_some(&self.0)
|
2021-03-29 15:43:37 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-01-13 17:36:41 +00:00
|
|
|
impl ops::Add for Strand {
|
|
|
|
type Output = Self;
|
|
|
|
fn add(self, other: Self) -> Self {
|
2022-05-05 04:30:32 +00:00
|
|
|
Strand::from(self.0 + &other.0)
|
2022-01-13 17:36:41 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-29 15:36:01 +00:00
|
|
|
pub fn strand(i: &str) -> IResult<&str, Strand> {
|
|
|
|
let (i, v) = strand_raw(i)?;
|
2022-05-05 04:30:32 +00:00
|
|
|
Ok((i, Strand(v)))
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
|
2021-05-24 08:18:58 +00:00
|
|
|
pub fn strand_raw(i: &str) -> IResult<&str, String> {
|
2022-09-26 00:23:57 +00:00
|
|
|
alt((strand_blank, strand_single, strand_double))(i)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn strand_blank(i: &str) -> IResult<&str, String> {
|
|
|
|
alt((
|
|
|
|
|i| {
|
|
|
|
let (i, _) = char(SINGLE)(i)?;
|
|
|
|
let (i, _) = char(SINGLE)(i)?;
|
|
|
|
Ok((i, String::new()))
|
|
|
|
},
|
|
|
|
|i| {
|
|
|
|
let (i, _) = char(DOUBLE)(i)?;
|
|
|
|
let (i, _) = char(DOUBLE)(i)?;
|
|
|
|
Ok((i, String::new()))
|
|
|
|
},
|
|
|
|
))(i)
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
|
2021-05-24 08:18:58 +00:00
|
|
|
fn strand_single(i: &str) -> IResult<&str, String> {
|
2022-09-26 00:23:57 +00:00
|
|
|
let (i, _) = char(SINGLE)(i)?;
|
|
|
|
let (i, v) = escaped_transform(
|
|
|
|
is_not(SINGLE_ESC),
|
|
|
|
'\\',
|
|
|
|
alt((
|
|
|
|
strand_unicode,
|
|
|
|
value('\u{1c}', char('\\')),
|
|
|
|
value('\u{27}', char('\'')),
|
|
|
|
value('\u{2f}', char('/')),
|
|
|
|
value('\u{08}', char('b')),
|
|
|
|
value('\u{0c}', char('f')),
|
|
|
|
value('\u{0a}', char('n')),
|
|
|
|
value('\u{0d}', char('r')),
|
|
|
|
value('\u{09}', char('t')),
|
|
|
|
)),
|
|
|
|
)(i)?;
|
|
|
|
let (i, _) = char(SINGLE)(i)?;
|
|
|
|
Ok((i, v))
|
2021-05-24 08:18:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fn strand_double(i: &str) -> IResult<&str, String> {
|
2022-09-26 00:23:57 +00:00
|
|
|
let (i, _) = char(DOUBLE)(i)?;
|
|
|
|
let (i, v) = escaped_transform(
|
|
|
|
is_not(DOUBLE_ESC),
|
|
|
|
'\\',
|
|
|
|
alt((
|
|
|
|
strand_unicode,
|
|
|
|
value('\u{1c}', char('\\')),
|
|
|
|
value('\u{22}', char('\"')),
|
|
|
|
value('\u{2f}', char('/')),
|
|
|
|
value('\u{08}', char('b')),
|
|
|
|
value('\u{0c}', char('f')),
|
|
|
|
value('\u{0a}', char('n')),
|
|
|
|
value('\u{0d}', char('r')),
|
|
|
|
value('\u{09}', char('t')),
|
|
|
|
)),
|
|
|
|
)(i)?;
|
|
|
|
let (i, _) = char(DOUBLE)(i)?;
|
|
|
|
Ok((i, v))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn strand_unicode(i: &str) -> IResult<&str, char> {
|
|
|
|
// Read the \u character
|
|
|
|
let (i, _) = char('u')(i)?;
|
|
|
|
// Let's read the next 4 ascii hexadecimal characters
|
|
|
|
let (i, v) = take_while_m_n(1, 4, |c: char| c.is_ascii_hexdigit())(i)?;
|
|
|
|
// We can convert this to u32 as we only have 4 chars
|
|
|
|
let v = u32::from_str_radix(v, 16).unwrap();
|
|
|
|
// We can convert this to char as we know it is valid
|
|
|
|
let v = std::char::from_u32(v).unwrap();
|
|
|
|
// Return the unicode char
|
|
|
|
Ok((i, v))
|
2020-06-29 15:36:01 +00:00
|
|
|
}
|
|
|
|
|
2021-05-24 08:18:58 +00:00
|
|
|
#[cfg(test)]
mod tests {

    use super::*;

    /// Parses `sql` with `strand`, asserts that parsing succeeded and
    /// returns the parsed value.
    fn parse_ok(sql: &str) -> Strand {
        let res = strand(sql);
        assert!(res.is_ok());
        let (_, out) = res.unwrap();
        out
    }

    #[test]
    fn strand_empty() {
        let out = parse_ok(r#""""#);
        assert_eq!(r#""""#, out.to_string());
        assert_eq!(out, Strand::from(""));
    }

    #[test]
    fn strand_single() {
        let out = parse_ok(r#"'test'"#);
        assert_eq!(r#""test""#, out.to_string());
        assert_eq!(out, Strand::from("test"));
    }

    #[test]
    fn strand_double() {
        let out = parse_ok(r#""test""#);
        assert_eq!(r#""test""#, out.to_string());
        assert_eq!(out, Strand::from("test"));
    }

    #[test]
    fn strand_quoted_single() {
        let out = parse_ok(r#"'te\'st'"#);
        assert_eq!(r#""te'st""#, out.to_string());
        assert_eq!(out, Strand::from(r#"te'st"#));
    }

    #[test]
    fn strand_quoted_double() {
        let out = parse_ok(r#""te\"st""#);
        assert_eq!(r#""te"st""#, out.to_string());
        assert_eq!(out, Strand::from(r#"te"st"#));
    }

    #[test]
    fn strand_quoted_escaped() {
        let out = parse_ok(r#""te\"st\n\tand\bsome\u05d9""#);
        assert_eq!("\"te\"st\n\tand\u{08}some\u{05d9}\"", out.to_string());
        assert_eq!(out, Strand::from("te\"st\n\tand\u{08}some\u{05d9}"));
    }
}
|