use std::char::decode_utf16;
use std::collections::BTreeMap;
use std::fmt;
use std::iter::{once, repeat};
use std::str::Chars;
use crate::error::{Error, ErrorKind};
use crate::value::{StringType, Value, ValueIter, ValueKind, ValueRepr};
use crate::Output;
pub struct SealedMarker;
pub fn memchr(haystack: &[u8], needle: u8) -> Option<usize> {
haystack.iter().position(|&x| x == needle)
}
pub fn memstr(haystack: &[u8], needle: &[u8]) -> Option<usize> {
haystack
.windows(needle.len())
.position(|window| window == needle)
}
#[inline(always)]
pub(crate) fn untrusted_size_hint(value: usize) -> usize {
value.min(1024)
}
fn write_with_html_escaping(out: &mut Output, value: &Value) -> fmt::Result {
if matches!(
value.kind(),
ValueKind::Undefined | ValueKind::None | ValueKind::Bool | ValueKind::Number
) {
write!(out, "{value}")
} else if let Some(s) = value.as_str() {
write!(out, "{}", HtmlEscape(s))
} else {
write!(out, "{}", HtmlEscape(&value.to_string()))
}
}
fn invalid_autoescape(name: &str) -> Result<(), Error> {
Err(Error::new(
ErrorKind::InvalidOperation,
format!("Default formatter does not know how to format to custom format '{name}'"),
))
}
#[inline(always)]
pub fn write_escaped(
out: &mut Output,
auto_escape: AutoEscape,
value: &Value,
) -> Result<(), Error> {
if let ValueRepr::String(ref s, ty) = value.0 {
if matches!(ty, StringType::Safe) || matches!(auto_escape, AutoEscape::None) {
return out.write_str(s).map_err(Error::from);
}
}
match auto_escape {
AutoEscape::None => write!(out, "{value}").map_err(Error::from),
AutoEscape::Html => write_with_html_escaping(out, value).map_err(Error::from),
#[cfg(feature = "json")]
AutoEscape::Json => {
let value = ok!(serde_json::to_string(&value).map_err(|err| {
Error::new(ErrorKind::BadSerialization, "unable to format to JSON").with_source(err)
}));
write!(out, "{value}").map_err(Error::from)
}
AutoEscape::Custom(name) => invalid_autoescape(name),
}
}
#[derive(Debug, Copy, Clone, PartialEq, Eq)]
#[non_exhaustive]
pub enum AutoEscape {
None,
Html,
#[cfg(feature = "json")]
#[cfg_attr(docsrs, doc(cfg(feature = "json")))]
Json,
Custom(&'static str),
}
#[derive(Debug, Copy, Clone, PartialEq, Eq, Default)]
#[non_exhaustive]
pub enum UndefinedBehavior {
#[default]
Lenient,
Chainable,
Strict,
}
impl UndefinedBehavior {
pub(crate) fn handle_undefined(self, parent_was_undefined: bool) -> Result<Value, Error> {
match (self, parent_was_undefined) {
(UndefinedBehavior::Lenient, false)
| (UndefinedBehavior::Strict, false)
| (UndefinedBehavior::Chainable, _) => Ok(Value::UNDEFINED),
(UndefinedBehavior::Lenient, true) | (UndefinedBehavior::Strict, true) => {
Err(Error::from(ErrorKind::UndefinedError))
}
}
}
#[inline]
pub(crate) fn is_true(self, value: &Value) -> Result<bool, Error> {
if matches!(self, UndefinedBehavior::Strict) && value.is_undefined() {
Err(Error::from(ErrorKind::UndefinedError))
} else {
Ok(value.is_true())
}
}
#[inline]
pub(crate) fn try_iter(self, value: Value) -> Result<ValueIter, Error> {
self.assert_iterable(&value).and_then(|_| value.try_iter())
}
#[inline]
pub(crate) fn assert_iterable(self, value: &Value) -> Result<(), Error> {
if matches!(self, UndefinedBehavior::Strict) && value.is_undefined() {
Err(Error::from(ErrorKind::UndefinedError))
} else {
Ok(())
}
}
}
pub struct HtmlEscape<'a>(pub &'a str);
impl<'a> fmt::Display for HtmlEscape<'a> {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
#[cfg(feature = "v_htmlescape")]
{
fmt::Display::fmt(&v_htmlescape::escape(self.0), f)
}
#[cfg(not(feature = "v_htmlescape"))]
{
let bytes = self.0.as_bytes();
let mut start = 0;
for (i, b) in bytes.iter().enumerate() {
macro_rules! escaping_body {
($quote:expr) => {{
if start < i {
ok!(f.write_str(unsafe {
std::str::from_utf8_unchecked(&bytes[start..i])
}));
}
ok!(f.write_str($quote));
start = i + 1;
}};
}
if b.wrapping_sub(b'"') <= b'>' - b'"' {
match *b {
b'<' => escaping_body!("<"),
b'>' => escaping_body!(">"),
b'&' => escaping_body!("&"),
b'"' => escaping_body!("""),
b'\'' => escaping_body!("'"),
b'/' => escaping_body!("/"),
_ => (),
}
}
}
if start < bytes.len() {
f.write_str(unsafe { std::str::from_utf8_unchecked(&bytes[start..]) })
} else {
Ok(())
}
}
}
}
struct Unescaper {
out: String,
pending_surrogate: u16,
}
impl Unescaper {
fn unescape(mut self, s: &str) -> Result<String, Error> {
let mut char_iter = s.chars();
while let Some(c) = char_iter.next() {
if c == '\\' {
match char_iter.next() {
None => return Err(ErrorKind::BadEscape.into()),
Some(d) => match d {
'"' | '\\' | '/' | '\'' => ok!(self.push_char(d)),
'b' => ok!(self.push_char('\x08')),
'f' => ok!(self.push_char('\x0C')),
'n' => ok!(self.push_char('\n')),
'r' => ok!(self.push_char('\r')),
't' => ok!(self.push_char('\t')),
'u' => {
let val = ok!(self.parse_u16(&mut char_iter));
ok!(self.push_u16(val));
}
_ => return Err(ErrorKind::BadEscape.into()),
},
}
} else {
ok!(self.push_char(c));
}
}
if self.pending_surrogate != 0 {
Err(ErrorKind::BadEscape.into())
} else {
Ok(self.out)
}
}
fn parse_u16(&self, chars: &mut Chars) -> Result<u16, Error> {
let hexnum = chars.chain(repeat('\0')).take(4).collect::<String>();
u16::from_str_radix(&hexnum, 16).map_err(|_| ErrorKind::BadEscape.into())
}
fn push_u16(&mut self, c: u16) -> Result<(), Error> {
match (self.pending_surrogate, (0xD800..=0xDFFF).contains(&c)) {
(0, false) => match decode_utf16(once(c)).next() {
Some(Ok(c)) => self.out.push(c),
_ => return Err(ErrorKind::BadEscape.into()),
},
(_, false) => return Err(ErrorKind::BadEscape.into()),
(0, true) => self.pending_surrogate = c,
(prev, true) => match decode_utf16(once(prev).chain(once(c))).next() {
Some(Ok(c)) => {
self.out.push(c);
self.pending_surrogate = 0;
}
_ => return Err(ErrorKind::BadEscape.into()),
},
}
Ok(())
}
fn push_char(&mut self, c: char) -> Result<(), Error> {
if self.pending_surrogate != 0 {
Err(ErrorKind::BadEscape.into())
} else {
self.out.push(c);
Ok(())
}
}
}
pub fn unescape(s: &str) -> Result<String, Error> {
Unescaper {
out: String::new(),
pending_surrogate: 0,
}
.unescape(s)
}
pub struct BTreeMapKeysDebug<'a, K: fmt::Debug, V>(pub &'a BTreeMap<K, V>);
impl<'a, K: fmt::Debug, V> fmt::Debug for BTreeMapKeysDebug<'a, K, V> {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
f.debug_list().entries(self.0.iter().map(|x| x.0)).finish()
}
}
pub struct OnDrop<F: FnOnce()>(Option<F>);
impl<F: FnOnce()> OnDrop<F> {
pub fn new(f: F) -> Self {
Self(Some(f))
}
}
impl<F: FnOnce()> Drop for OnDrop<F> {
fn drop(&mut self) {
self.0.take().unwrap()();
}
}
#[cfg(feature = "builtins")]
pub fn splitn_whitespace(s: &str, maxsplits: usize) -> impl Iterator<Item = &str> + '_ {
let mut splits = 1;
let mut skip_ws = true;
let mut split_start = None;
let mut last_split_end = 0;
let mut chars = s.char_indices();
std::iter::from_fn(move || {
for (idx, c) in chars.by_ref() {
if splits >= maxsplits && !skip_ws {
continue;
} else if c.is_whitespace() {
if let Some(old) = split_start {
let rv = &s[old..idx];
split_start = None;
last_split_end = idx;
splits += 1;
skip_ws = true;
return Some(rv);
}
} else {
skip_ws = false;
if split_start.is_none() {
split_start = Some(idx);
last_split_end = idx;
}
}
}
let rest = &s[last_split_end..];
if !rest.is_empty() {
last_split_end = s.len();
Some(rest)
} else {
None
}
})
}
#[cfg(test)]
mod tests {
use super::*;
use similar_asserts::assert_eq;
#[test]
fn test_html_escape() {
let input = "<>&\"'/";
let output = HtmlEscape(input).to_string();
assert_eq!(output, "<>&"'/");
}
#[test]
fn test_unescape() {
assert_eq!(unescape(r"foo\u2603bar").unwrap(), "foo\u{2603}bar");
assert_eq!(unescape(r"\t\b\f\r\n\\\/").unwrap(), "\t\x08\x0c\r\n\\/");
assert_eq!(unescape("foobarbaz").unwrap(), "foobarbaz");
assert_eq!(unescape(r"\ud83d\udca9").unwrap(), "💩");
}
#[test]
#[cfg(feature = "builtins")]
fn test_splitn_whitespace() {
fn s(s: &str, n: usize) -> Vec<&str> {
splitn_whitespace(s, n).collect::<Vec<_>>()
}
assert_eq!(s("a b c", 1), vec!["a b c"]);
assert_eq!(s("a b c", 2), vec!["a", "b c"]);
assert_eq!(s("a b c", 2), vec!["a", "b c"]);
assert_eq!(s("a b c ", 2), vec!["a", "b c "]);
assert_eq!(s("a b c", 3), vec!["a", "b", "c"]);
assert_eq!(s("a b c", 4), vec!["a", "b", "c"]);
assert_eq!(s(" a b c", 3), vec!["a", "b", "c"]);
assert_eq!(s(" a b c", 4), vec!["a", "b", "c"]);
}
}