Bugfix - make string::slice properly handle UTF-8 and reallocate less. (#1854)
This commit is contained in:
parent
c7633414b5
commit
df07bb32f5
1 changed files with 52 additions and 12 deletions
|
@ -52,21 +52,33 @@ pub fn reverse((string,): (String,)) -> Result<Value, Error> {
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn slice((val, beg, lim): (String, Option<isize>, Option<isize>)) -> Result<Value, Error> {
|
pub fn slice((val, beg, lim): (String, Option<isize>, Option<isize>)) -> Result<Value, Error> {
|
||||||
let val = match beg {
|
// Only count the chars if we need to and only do it once.
|
||||||
Some(v) if v < 0 => {
|
let mut char_count = usize::MAX;
|
||||||
val.chars().skip(val.len().saturating_sub(v.unsigned_abs())).collect::<String>()
|
let mut count_chars = || {
|
||||||
|
if char_count == usize::MAX {
|
||||||
|
char_count = val.chars().count();
|
||||||
}
|
}
|
||||||
Some(v) => val.chars().skip(v as usize).collect::<String>(),
|
char_count
|
||||||
None => val,
|
|
||||||
};
|
};
|
||||||
let val = match lim {
|
|
||||||
Some(v) if v < 0 => {
|
let skip = match beg {
|
||||||
val.chars().take(val.len().saturating_sub(v.unsigned_abs())).collect::<String>()
|
Some(v) if v < 0 => count_chars().saturating_sub(v.unsigned_abs()),
|
||||||
}
|
Some(v) => v as usize,
|
||||||
Some(v) => val.chars().take(v as usize).collect::<String>(),
|
None => 0,
|
||||||
None => val,
|
|
||||||
};
|
};
|
||||||
Ok(val.into())
|
|
||||||
|
let take = match lim {
|
||||||
|
Some(v) if v < 0 => count_chars().saturating_sub(skip).saturating_sub(v.unsigned_abs()),
|
||||||
|
Some(v) => v as usize,
|
||||||
|
None => usize::MAX,
|
||||||
|
};
|
||||||
|
|
||||||
|
Ok(if skip > 0 || take < usize::MAX {
|
||||||
|
val.chars().skip(skip).take(take).collect::<String>()
|
||||||
|
} else {
|
||||||
|
val
|
||||||
|
}
|
||||||
|
.into())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn slug((string,): (String,)) -> Result<Value, Error> {
|
pub fn slug((string,): (String,)) -> Result<Value, Error> {
|
||||||
|
@ -92,3 +104,31 @@ pub fn uppercase((string,): (String,)) -> Result<Value, Error> {
|
||||||
pub fn words((string,): (String,)) -> Result<Value, Error> {
|
pub fn words((string,): (String,)) -> Result<Value, Error> {
|
||||||
Ok(string.split_whitespace().collect::<Vec<&str>>().into())
|
Ok(string.split_whitespace().collect::<Vec<&str>>().into())
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[cfg(test)]
|
||||||
|
mod tests {
|
||||||
|
use super::slice;
|
||||||
|
use crate::sql::Value;
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn string_slice() {
|
||||||
|
fn test(initial: &str, beg: Option<isize>, end: Option<isize>, expected: &str) {
|
||||||
|
assert_eq!(slice((initial.to_owned(), beg, end)).unwrap(), Value::from(expected));
|
||||||
|
}
|
||||||
|
|
||||||
|
let string = "abcdefg";
|
||||||
|
test(string, None, None, string);
|
||||||
|
test(string, Some(2), None, &string[2..]);
|
||||||
|
test(string, Some(2), Some(3), &string[2..5]);
|
||||||
|
test(string, Some(2), Some(-1), "cdef");
|
||||||
|
test(string, Some(-2), None, "fg");
|
||||||
|
test(string, Some(-4), Some(2), "de");
|
||||||
|
test(string, Some(-4), Some(-1), "def");
|
||||||
|
|
||||||
|
let string = "你好世界";
|
||||||
|
test(string, None, None, string);
|
||||||
|
test(string, Some(1), None, "好世界");
|
||||||
|
test(string, Some(-1), None, "界");
|
||||||
|
test(string, Some(-2), Some(1), "世");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
Loading…
Reference in a new issue