yaml_rust2/
yaml.rs

1//! YAML objects manipulation utilities.
2
3#![allow(clippy::module_name_repetitions)]
4
5use std::borrow::Cow;
6use std::ops::ControlFlow;
7use std::{collections::BTreeMap, convert::TryFrom, mem, ops::Index, ops::IndexMut};
8
9#[cfg(feature = "encoding")]
10use encoding_rs::{Decoder, DecoderResult, Encoding};
11use hashlink::LinkedHashMap;
12
13use crate::parser::{Event, MarkedEventReceiver, Parser, Tag};
14use crate::scanner::{Marker, ScanError, TScalarStyle};
15
16/// A YAML node is stored as this `Yaml` enumeration, which provides an easy way to
17/// access your YAML document.
18///
19/// # Examples
20///
21/// ```
22/// use yaml_rust2::Yaml;
23/// let foo = Yaml::from_str("-123"); // convert the string to the appropriate YAML type
24/// assert_eq!(foo.as_i64().unwrap(), -123);
25///
26/// // iterate over an Array
27/// let vec = Yaml::Array(vec![Yaml::Integer(1), Yaml::Integer(2)]);
28/// for v in vec.as_vec().unwrap() {
29///     assert!(v.as_i64().is_some());
30/// }
31/// ```
32#[derive(Clone, PartialEq, PartialOrd, Debug, Eq, Ord, Hash)]
33pub enum Yaml {
34    /// Float types are stored as String and parsed on demand.
35    /// Note that `f64` does NOT implement Eq trait and can NOT be stored in `BTreeMap`.
36    Real(String),
37    /// YAML int is stored as i64.
38    Integer(i64),
39    /// YAML scalar.
40    String(String),
41    /// YAML bool, e.g. `true` or `false`.
42    Boolean(bool),
43    /// YAML array, can be accessed as a [`Vec`].
44    Array(Array),
45    /// YAML hash, can be accessed as a [`LinkedHashMap`].
46    ///
47    /// Insertion order will match the order of insertion into the map.
48    Hash(Hash),
49    /// Alias, not fully supported yet.
50    Alias(usize),
51    /// YAML null, e.g. `null` or `~`.
52    Null,
53    /// Accessing a nonexistent node via the Index trait returns `BadValue`. This
54    /// simplifies error handling in the calling code. Invalid type conversion also
55    /// returns `BadValue`.
56    BadValue,
57}
58
59/// The type contained in the `Yaml::Array` variant. This corresponds to YAML sequences.
60pub type Array = Vec<Yaml>;
61/// The type contained in the `Yaml::Hash` variant. This corresponds to YAML mappings.
62pub type Hash = LinkedHashMap<Yaml, Yaml>;
63
64// parse f64 as Core schema
65// See: https://github.com/chyh1990/yaml-rust/issues/51
66fn parse_f64(v: &str) -> Option<f64> {
67    match v {
68        ".inf" | ".Inf" | ".INF" | "+.inf" | "+.Inf" | "+.INF" => Some(f64::INFINITY),
69        "-.inf" | "-.Inf" | "-.INF" => Some(f64::NEG_INFINITY),
70        ".nan" | ".NaN" | ".NAN" => Some(f64::NAN),
71        _ => v.parse::<f64>().ok(),
72    }
73}
74
75/// Main structure for quickly parsing YAML.
76///
77/// See [`YamlLoader::load_from_str`].
78#[derive(Default)]
79pub struct YamlLoader {
80    /// The different YAML documents that are loaded.
81    docs: Vec<Yaml>,
82    // states
83    // (current node, anchor_id) tuple
84    doc_stack: Vec<(Yaml, usize)>,
85    key_stack: Vec<Yaml>,
86    anchor_map: BTreeMap<usize, Yaml>,
87    /// An error, if one was encountered.
88    error: Option<ScanError>,
89}
90
91impl MarkedEventReceiver for YamlLoader {
92    fn on_event(&mut self, ev: Event, mark: Marker) {
93        if self.error.is_some() {
94            return;
95        }
96        if let Err(e) = self.on_event_impl(ev, mark) {
97            self.error = Some(e);
98        }
99    }
100}
101
102/// An error that happened when loading a YAML document.
103#[derive(Debug)]
104pub enum LoadError {
105    /// An I/O error.
106    IO(std::io::Error),
107    /// An error within the scanner. This indicates a malformed YAML input.
108    Scan(ScanError),
109    /// A decoding error (e.g.: Invalid UTF-8).
110    Decode(std::borrow::Cow<'static, str>),
111}
112
113impl From<std::io::Error> for LoadError {
114    fn from(error: std::io::Error) -> Self {
115        LoadError::IO(error)
116    }
117}
118
119impl YamlLoader {
120    fn on_event_impl(&mut self, ev: Event, mark: Marker) -> Result<(), ScanError> {
121        // println!("EV {:?}", ev);
122        match ev {
123            Event::DocumentStart | Event::Nothing | Event::StreamStart | Event::StreamEnd => {
124                // do nothing
125            }
126            Event::DocumentEnd => {
127                match self.doc_stack.len() {
128                    // empty document
129                    0 => self.docs.push(Yaml::BadValue),
130                    1 => self.docs.push(self.doc_stack.pop().unwrap().0),
131                    _ => unreachable!(),
132                }
133            }
134            Event::SequenceStart(aid, _) => {
135                self.doc_stack.push((Yaml::Array(Vec::new()), aid));
136            }
137            Event::SequenceEnd => {
138                let node = self.doc_stack.pop().unwrap();
139                self.insert_new_node(node, mark)?;
140            }
141            Event::MappingStart(aid, _) => {
142                self.doc_stack.push((Yaml::Hash(Hash::new()), aid));
143                self.key_stack.push(Yaml::BadValue);
144            }
145            Event::MappingEnd => {
146                self.key_stack.pop().unwrap();
147                let node = self.doc_stack.pop().unwrap();
148                self.insert_new_node(node, mark)?;
149            }
150            Event::Scalar(v, style, aid, tag) => {
151                let node = if style != TScalarStyle::Plain {
152                    Yaml::String(v)
153                } else if let Some(Tag {
154                    ref handle,
155                    ref suffix,
156                }) = tag
157                {
158                    if handle == "tag:yaml.org,2002:" {
159                        match suffix.as_ref() {
160                            "bool" => {
161                                // "true" or "false"
162                                match v.parse::<bool>() {
163                                    Err(_) => Yaml::BadValue,
164                                    Ok(v) => Yaml::Boolean(v),
165                                }
166                            }
167                            "int" => match v.parse::<i64>() {
168                                Err(_) => Yaml::BadValue,
169                                Ok(v) => Yaml::Integer(v),
170                            },
171                            "float" => match parse_f64(&v) {
172                                Some(_) => Yaml::Real(v),
173                                None => Yaml::BadValue,
174                            },
175                            "null" => match v.as_ref() {
176                                "~" | "null" => Yaml::Null,
177                                _ => Yaml::BadValue,
178                            },
179                            _ => Yaml::String(v),
180                        }
181                    } else {
182                        Yaml::String(v)
183                    }
184                } else {
185                    // Datatype is not specified, or unrecognized
186                    Yaml::from_str(&v)
187                };
188
189                self.insert_new_node((node, aid), mark)?;
190            }
191            Event::Alias(id) => {
192                let n = match self.anchor_map.get(&id) {
193                    Some(v) => v.clone(),
194                    None => Yaml::BadValue,
195                };
196                self.insert_new_node((n, 0), mark)?;
197            }
198        }
199        // println!("DOC {:?}", self.doc_stack);
200        Ok(())
201    }
202
203    fn insert_new_node(&mut self, node: (Yaml, usize), mark: Marker) -> Result<(), ScanError> {
204        // valid anchor id starts from 1
205        if node.1 > 0 {
206            self.anchor_map.insert(node.1, node.0.clone());
207        }
208        if self.doc_stack.is_empty() {
209            self.doc_stack.push(node);
210        } else {
211            let parent = self.doc_stack.last_mut().unwrap();
212            match *parent {
213                (Yaml::Array(ref mut v), _) => v.push(node.0),
214                (Yaml::Hash(ref mut h), _) => {
215                    let cur_key = self.key_stack.last_mut().unwrap();
216                    // current node is a key
217                    if cur_key.is_badvalue() {
218                        *cur_key = node.0;
219                    // current node is a value
220                    } else {
221                        let mut newkey = Yaml::BadValue;
222                        mem::swap(&mut newkey, cur_key);
223                        if h.insert(newkey, node.0).is_some() {
224                            let inserted_key = h.back().unwrap().0;
225                            return Err(ScanError::new_string(
226                                mark,
227                                format!("{inserted_key:?}: duplicated key in mapping"),
228                            ));
229                        }
230                    }
231                }
232                _ => unreachable!(),
233            }
234        }
235        Ok(())
236    }
237
238    /// Load the given string as a set of YAML documents.
239    ///
240    /// The `source` is interpreted as YAML documents and is parsed. Parsing succeeds if and only
241    /// if all documents are parsed successfully. An error in a latter document prevents the former
242    /// from being returned.
243    /// # Errors
244    /// Returns `ScanError` when loading fails.
245    pub fn load_from_str(source: &str) -> Result<Vec<Yaml>, ScanError> {
246        Self::load_from_iter(source.chars())
247    }
248
249    /// Load the contents of the given iterator as a set of YAML documents.
250    ///
251    /// The `source` is interpreted as YAML documents and is parsed. Parsing succeeds if and only
252    /// if all documents are parsed successfully. An error in a latter document prevents the former
253    /// from being returned.
254    /// # Errors
255    /// Returns `ScanError` when loading fails.
256    pub fn load_from_iter<I: Iterator<Item = char>>(source: I) -> Result<Vec<Yaml>, ScanError> {
257        let mut parser = Parser::new(source);
258        Self::load_from_parser(&mut parser)
259    }
260
261    /// Load the contents from the specified Parser as a set of YAML documents.
262    ///
263    /// Parsing succeeds if and only if all documents are parsed successfully.
264    /// An error in a latter document prevents the former from being returned.
265    /// # Errors
266    /// Returns `ScanError` when loading fails.
267    pub fn load_from_parser<I: Iterator<Item = char>>(
268        parser: &mut Parser<I>,
269    ) -> Result<Vec<Yaml>, ScanError> {
270        let mut loader = YamlLoader::default();
271        parser.load(&mut loader, true)?;
272        if let Some(e) = loader.error {
273            Err(e)
274        } else {
275            Ok(loader.docs)
276        }
277    }
278
279    /// Return a reference to the parsed Yaml documents.
280    #[must_use]
281    pub fn documents(&self) -> &[Yaml] {
282        &self.docs
283    }
284}
285
286/// The signature of the function to call when using [`YAMLDecodingTrap::Call`].
287///
288/// The arguments are as follows:
289///  * `malformation_length`: The length of the sequence the decoder failed to decode.
290///  * `bytes_read_after_malformation`: The number of lookahead bytes the decoder consumed after
291///    the malformation.
292///  * `input_at_malformation`: What the input buffer is at the malformation.
293///    This is the buffer starting at the malformation. The first `malformation_length` bytes are
294///    the problematic sequence. The following `bytes_read_after_malformation` are already stored
295///    in the decoder and will not be re-fed.
296///  * `output`: The output string.
297///
298/// The function must modify `output` as it feels is best. For instance, one could recreate the
299/// behavior of [`YAMLDecodingTrap::Ignore`] with an empty function, [`YAMLDecodingTrap::Replace`]
300/// by pushing a `\u{FFFD}` into `output` and [`YAMLDecodingTrap::Strict`] by returning
301/// [`ControlFlow::Break`].
302///
303/// # Returns
304/// The function must return [`ControlFlow::Continue`] if decoding may continue or
305/// [`ControlFlow::Break`] if decoding must be aborted. An optional error string may be supplied.
306#[cfg(feature = "encoding")]
307pub type YAMLDecodingTrapFn = fn(
308    malformation_length: u8,
309    bytes_read_after_malformation: u8,
310    input_at_malformation: &[u8],
311    output: &mut String,
312) -> ControlFlow<Cow<'static, str>>;
313
314/// The behavior [`YamlDecoder`] must have when an decoding error occurs.
315#[cfg(feature = "encoding")]
316#[derive(Copy, Clone, PartialEq, Eq)]
317pub enum YAMLDecodingTrap {
318    /// Ignore the offending bytes, remove them from the output.
319    Ignore,
320    /// Error out.
321    Strict,
322    /// Replace them with the Unicode REPLACEMENT CHARACTER.
323    Replace,
324    /// Call the user-supplied function upon decoding malformation.
325    Call(YAMLDecodingTrapFn),
326}
327
328/// `YamlDecoder` is a `YamlLoader` builder that allows you to supply your own encoding error trap.
329/// For example, to read a YAML file while ignoring Unicode decoding errors you can set the
330/// `encoding_trap` to `encoding::DecoderTrap::Ignore`.
331/// ```rust
332/// use yaml_rust2::yaml::{YamlDecoder, YAMLDecodingTrap};
333///
334/// let string = b"---
335/// a\xa9: 1
336/// b: 2.2
337/// c: [1, 2]
338/// ";
339/// let out = YamlDecoder::read(string as &[u8])
340///     .encoding_trap(YAMLDecodingTrap::Ignore)
341///     .decode()
342///     .unwrap();
343/// ```
344#[cfg(feature = "encoding")]
345pub struct YamlDecoder<T: std::io::Read> {
346    source: T,
347    trap: YAMLDecodingTrap,
348}
349
350#[cfg(feature = "encoding")]
351impl<T: std::io::Read> YamlDecoder<T> {
352    /// Create a `YamlDecoder` decoding the given source.
353    pub fn read(source: T) -> YamlDecoder<T> {
354        YamlDecoder {
355            source,
356            trap: YAMLDecodingTrap::Strict,
357        }
358    }
359
360    /// Set the behavior of the decoder when the encoding is invalid.
361    pub fn encoding_trap(&mut self, trap: YAMLDecodingTrap) -> &mut Self {
362        self.trap = trap;
363        self
364    }
365
366    /// Run the decode operation with the source and trap the `YamlDecoder` was built with.
367    ///
368    /// # Errors
369    /// Returns `LoadError` when decoding fails.
370    pub fn decode(&mut self) -> Result<Vec<Yaml>, LoadError> {
371        let mut buffer = Vec::new();
372        self.source.read_to_end(&mut buffer)?;
373
374        // Check if the `encoding` library can detect encoding from the BOM, otherwise use
375        // `detect_utf16_endianness`.
376        let (encoding, _) =
377            Encoding::for_bom(&buffer).unwrap_or_else(|| (detect_utf16_endianness(&buffer), 2));
378        let mut decoder = encoding.new_decoder();
379        let mut output = String::new();
380
381        // Decode the input buffer.
382        decode_loop(&buffer, &mut output, &mut decoder, self.trap)?;
383
384        YamlLoader::load_from_str(&output).map_err(LoadError::Scan)
385    }
386}
387
388/// Perform a loop of [`Decoder::decode_to_string`], reallocating `output` if needed.
389#[cfg(feature = "encoding")]
390fn decode_loop(
391    input: &[u8],
392    output: &mut String,
393    decoder: &mut Decoder,
394    trap: YAMLDecodingTrap,
395) -> Result<(), LoadError> {
396    output.reserve(input.len());
397    let mut total_bytes_read = 0;
398
399    loop {
400        match decoder.decode_to_string_without_replacement(&input[total_bytes_read..], output, true)
401        {
402            // If the input is empty, we processed the whole input.
403            (DecoderResult::InputEmpty, _) => break Ok(()),
404            // If the output is full, we must reallocate.
405            (DecoderResult::OutputFull, bytes_read) => {
406                total_bytes_read += bytes_read;
407                // The output is already reserved to the size of the input. We slowly resize. Here,
408                // we're expecting that 10% of bytes will double in size when converting to UTF-8.
409                output.reserve(input.len() / 10);
410            }
411            (DecoderResult::Malformed(malformed_len, bytes_after_malformed), bytes_read) => {
412                total_bytes_read += bytes_read;
413                match trap {
414                    // Ignore (skip over) malformed character.
415                    YAMLDecodingTrap::Ignore => {}
416                    // Replace them with the Unicode REPLACEMENT CHARACTER.
417                    YAMLDecodingTrap::Replace => {
418                        output.push('\u{FFFD}');
419                    }
420                    // Otherwise error, getting as much context as possible.
421                    YAMLDecodingTrap::Strict => {
422                        let malformed_len = malformed_len as usize;
423                        let bytes_after_malformed = bytes_after_malformed as usize;
424                        let byte_idx = total_bytes_read - (malformed_len + bytes_after_malformed);
425                        let malformed_sequence = &input[byte_idx..byte_idx + malformed_len];
426
427                        break Err(LoadError::Decode(Cow::Owned(format!(
428                            "Invalid character sequence at {byte_idx}: {malformed_sequence:?}",
429                        ))));
430                    }
431                    YAMLDecodingTrap::Call(callback) => {
432                        let byte_idx =
433                            total_bytes_read - ((malformed_len + bytes_after_malformed) as usize);
434                        let malformed_sequence =
435                            &input[byte_idx..byte_idx + malformed_len as usize];
436                        if let ControlFlow::Break(error) = callback(
437                            malformed_len,
438                            bytes_after_malformed,
439                            &input[byte_idx..],
440                            output,
441                        ) {
442                            if error.is_empty() {
443                                break Err(LoadError::Decode(Cow::Owned(format!(
444                                    "Invalid character sequence at {byte_idx}: {malformed_sequence:?}",
445                                ))));
446                            }
447                            break Err(LoadError::Decode(error));
448                        }
449                    }
450                }
451            }
452        }
453    }
454}
455
456/// The encoding crate knows how to tell apart UTF-8 from UTF-16LE and utf-16BE, when the
457/// bytestream starts with BOM codepoint.
458/// However, it doesn't even attempt to guess the UTF-16 endianness of the input bytestream since
459/// in the general case the bytestream could start with a codepoint that uses both bytes.
460///
461/// The YAML-1.2 spec mandates that the first character of a YAML document is an ASCII character.
462/// This allows the encoding to be deduced by the pattern of null (#x00) characters.
463//
464/// See spec at <https://yaml.org/spec/1.2/spec.html#id2771184>
465#[cfg(feature = "encoding")]
466fn detect_utf16_endianness(b: &[u8]) -> &'static Encoding {
467    if b.len() > 1 && (b[0] != b[1]) {
468        if b[0] == 0 {
469            return encoding_rs::UTF_16BE;
470        } else if b[1] == 0 {
471            return encoding_rs::UTF_16LE;
472        }
473    }
474    encoding_rs::UTF_8
475}
476
477macro_rules! define_as (
478    ($name:ident, $t:ident, $yt:ident) => (
479/// Get a copy of the inner object in the YAML enum if it is a `$t`.
480///
481/// # Return
482/// If the variant of `self` is `Yaml::$yt`, return `Some($t)` with a copy of the `$t` contained.
483/// Otherwise, return `None`.
484#[must_use]
485pub fn $name(&self) -> Option<$t> {
486    match *self {
487        Yaml::$yt(v) => Some(v),
488        _ => None
489    }
490}
491    );
492);
493
494macro_rules! define_as_ref (
495    ($name:ident, $t:ty, $yt:ident) => (
496/// Get a reference to the inner object in the YAML enum if it is a `$t`.
497///
498/// # Return
499/// If the variant of `self` is `Yaml::$yt`, return `Some(&$t)` with the `$t` contained. Otherwise,
500/// return `None`.
501#[must_use]
502pub fn $name(&self) -> Option<$t> {
503    match *self {
504        Yaml::$yt(ref v) => Some(v),
505        _ => None
506    }
507}
508    );
509);
510
511macro_rules! define_as_mut_ref (
512    ($name:ident, $t:ty, $yt:ident) => (
513/// Get a mutable reference to the inner object in the YAML enum if it is a `$t`.
514///
515/// # Return
516/// If the variant of `self` is `Yaml::$yt`, return `Some(&mut $t)` with the `$t` contained.
517/// Otherwise, return `None`.
518#[must_use]
519pub fn $name(&mut self) -> Option<$t> {
520    match *self {
521        Yaml::$yt(ref mut v) => Some(v),
522        _ => None
523    }
524}
525    );
526);
527
528macro_rules! define_into (
529    ($name:ident, $t:ty, $yt:ident) => (
530/// Get the inner object in the YAML enum if it is a `$t`.
531///
532/// # Return
533/// If the variant of `self` is `Yaml::$yt`, return `Some($t)` with the `$t` contained. Otherwise,
534/// return `None`.
535#[must_use]
536pub fn $name(self) -> Option<$t> {
537    match self {
538        Yaml::$yt(v) => Some(v),
539        _ => None
540    }
541}
542    );
543);
544
545impl Yaml {
546    define_as!(as_bool, bool, Boolean);
547    define_as!(as_i64, i64, Integer);
548
549    define_as_ref!(as_str, &str, String);
550    define_as_ref!(as_hash, &Hash, Hash);
551    define_as_ref!(as_vec, &Array, Array);
552
553    define_as_mut_ref!(as_mut_hash, &mut Hash, Hash);
554    define_as_mut_ref!(as_mut_vec, &mut Array, Array);
555
556    define_into!(into_bool, bool, Boolean);
557    define_into!(into_i64, i64, Integer);
558    define_into!(into_string, String, String);
559    define_into!(into_hash, Hash, Hash);
560    define_into!(into_vec, Array, Array);
561
562    /// Return whether `self` is a [`Yaml::Null`] node.
563    #[must_use]
564    pub fn is_null(&self) -> bool {
565        matches!(*self, Yaml::Null)
566    }
567
568    /// Return whether `self` is a [`Yaml::BadValue`] node.
569    #[must_use]
570    pub fn is_badvalue(&self) -> bool {
571        matches!(*self, Yaml::BadValue)
572    }
573
574    /// Return whether `self` is a [`Yaml::Array`] node.
575    #[must_use]
576    pub fn is_array(&self) -> bool {
577        matches!(*self, Yaml::Array(_))
578    }
579
580    /// Return whether `self` is a [`Yaml::Hash`] node.
581    #[must_use]
582    pub fn is_hash(&self) -> bool {
583        matches!(*self, Yaml::Hash(_))
584    }
585
586    /// Return the `f64` value contained in this YAML node.
587    ///
588    /// If the node is not a [`Yaml::Real`] YAML node or its contents is not a valid `f64` string,
589    /// `None` is returned.
590    #[must_use]
591    pub fn as_f64(&self) -> Option<f64> {
592        if let Yaml::Real(ref v) = self {
593            parse_f64(v)
594        } else {
595            None
596        }
597    }
598
599    /// Return the `f64` value contained in this YAML node.
600    ///
601    /// If the node is not a [`Yaml::Real`] YAML node or its contents is not a valid `f64` string,
602    /// `None` is returned.
603    #[must_use]
604    pub fn into_f64(self) -> Option<f64> {
605        self.as_f64()
606    }
607
608    /// If a value is null or otherwise bad (see variants), consume it and
609    /// replace it with a given value `other`. Otherwise, return self unchanged.
610    ///
611    /// ```
612    /// use yaml_rust2::yaml::Yaml;
613    ///
614    /// assert_eq!(Yaml::BadValue.or(Yaml::Integer(3)),  Yaml::Integer(3));
615    /// assert_eq!(Yaml::Integer(3).or(Yaml::BadValue),  Yaml::Integer(3));
616    /// ```
617    #[must_use]
618    pub fn or(self, other: Self) -> Self {
619        match self {
620            Yaml::BadValue | Yaml::Null => other,
621            this => this,
622        }
623    }
624
625    /// See `or` for behavior. This performs the same operations, but with
626    /// borrowed values for less linear pipelines.
627    #[must_use]
628    pub fn borrowed_or<'a>(&'a self, other: &'a Self) -> &'a Self {
629        match self {
630            Yaml::BadValue | Yaml::Null => other,
631            this => this,
632        }
633    }
634}
635
636#[allow(clippy::should_implement_trait)]
637impl Yaml {
638    /// Convert a string to a [`Yaml`] node.
639    ///
640    /// [`Yaml`] does not implement [`std::str::FromStr`] since conversion may not fail. This
641    /// function falls back to [`Yaml::String`] if nothing else matches.
642    ///
643    /// # Examples
644    /// ```
645    /// # use yaml_rust2::yaml::Yaml;
646    /// assert!(matches!(Yaml::from_str("42"), Yaml::Integer(42)));
647    /// assert!(matches!(Yaml::from_str("0x2A"), Yaml::Integer(42)));
648    /// assert!(matches!(Yaml::from_str("0o52"), Yaml::Integer(42)));
649    /// assert!(matches!(Yaml::from_str("~"), Yaml::Null));
650    /// assert!(matches!(Yaml::from_str("null"), Yaml::Null));
651    /// assert!(matches!(Yaml::from_str("true"), Yaml::Boolean(true)));
652    /// assert!(matches!(Yaml::from_str("3.14"), Yaml::Real(_)));
653    /// assert!(matches!(Yaml::from_str("foo"), Yaml::String(_)));
654    /// ```
655    #[must_use]
656    pub fn from_str(v: &str) -> Yaml {
657        if let Some(number) = v.strip_prefix("0x") {
658            if let Ok(i) = i64::from_str_radix(number, 16) {
659                return Yaml::Integer(i);
660            }
661        } else if let Some(number) = v.strip_prefix("0o") {
662            if let Ok(i) = i64::from_str_radix(number, 8) {
663                return Yaml::Integer(i);
664            }
665        } else if let Some(number) = v.strip_prefix('+') {
666            if let Ok(i) = number.parse::<i64>() {
667                return Yaml::Integer(i);
668            }
669        }
670        match v {
671            "" | "~" | "null" => Yaml::Null,
672            "true" => Yaml::Boolean(true),
673            "false" => Yaml::Boolean(false),
674            _ => {
675                if let Ok(integer) = v.parse::<i64>() {
676                    Yaml::Integer(integer)
677                } else if parse_f64(v).is_some() {
678                    Yaml::Real(v.to_owned())
679                } else {
680                    Yaml::String(v.to_owned())
681                }
682            }
683        }
684    }
685}
686
687static BAD_VALUE: Yaml = Yaml::BadValue;
688impl<'a> Index<&'a str> for Yaml {
689    type Output = Yaml;
690
691    /// Perform indexing if `self` is a mapping.
692    ///
693    /// # Return
694    /// If `self` is a [`Yaml::Hash`], returns an immutable borrow to the value associated to the
695    /// given key in the hash.
696    ///
697    /// This function returns a [`Yaml::BadValue`] if the underlying [`type@Hash`] does not contain
698    /// [`Yaml::String`]`{idx}` as a key.
699    ///
700    /// This function also returns a [`Yaml::BadValue`] if `self` is not a [`Yaml::Hash`].
701    fn index(&self, idx: &'a str) -> &Yaml {
702        let key = Yaml::String(idx.to_owned());
703        match self.as_hash() {
704            Some(h) => h.get(&key).unwrap_or(&BAD_VALUE),
705            None => &BAD_VALUE,
706        }
707    }
708}
709
710impl<'a> IndexMut<&'a str> for Yaml {
711    /// Perform indexing if `self` is a mapping.
712    ///
713    /// Since we cannot return a mutable borrow to a static [`Yaml::BadValue`] as we return an
714    /// immutable one in [`Index<&'a str>`], this function panics on out of bounds.
715    ///
716    /// # Panics
717    /// This function panics if the given key is not contained in `self` (as per [`IndexMut`]).
718    ///
719    /// This function also panics if `self` is not a [`Yaml::Hash`].
720    fn index_mut(&mut self, idx: &'a str) -> &mut Yaml {
721        let key = Yaml::String(idx.to_owned());
722        match self.as_mut_hash() {
723            Some(h) => h.get_mut(&key).unwrap(),
724            None => panic!("Not a hash type"),
725        }
726    }
727}
728
729impl Index<usize> for Yaml {
730    type Output = Yaml;
731
732    /// Perform indexing if `self` is a sequence or a mapping.
733    ///
734    /// # Return
735    /// If `self` is a [`Yaml::Array`], returns an immutable borrow to the value located at the
736    /// given index in the array.
737    ///
738    /// Otherwise, if `self` is a [`Yaml::Hash`], returns a borrow to the value whose key is
739    /// [`Yaml::Integer`]`(idx)` (this would not work if the key is [`Yaml::String`]`("1")`.
740    ///
741    /// This function returns a [`Yaml::BadValue`] if the index given is out of range. If `self` is
742    /// a [`Yaml::Array`], this is when the index is bigger or equal to the length of the
743    /// underlying `Vec`. If `self` is a [`Yaml::Hash`], this is when the mapping sequence does not
744    /// contain [`Yaml::Integer`]`(idx)` as a key.
745    ///
746    /// This function also returns a [`Yaml::BadValue`] if `self` is not a [`Yaml::Array`] nor a
747    /// [`Yaml::Hash`].
748    fn index(&self, idx: usize) -> &Yaml {
749        if let Some(v) = self.as_vec() {
750            v.get(idx).unwrap_or(&BAD_VALUE)
751        } else if let Some(v) = self.as_hash() {
752            let key = Yaml::Integer(i64::try_from(idx).unwrap());
753            v.get(&key).unwrap_or(&BAD_VALUE)
754        } else {
755            &BAD_VALUE
756        }
757    }
758}
759
760impl IndexMut<usize> for Yaml {
761    /// Perform indexing if `self` is a sequence or a mapping.
762    ///
763    /// Since we cannot return a mutable borrow to a static [`Yaml::BadValue`] as we return an
764    /// immutable one in [`Index<usize>`], this function panics on out of bounds.
765    ///
766    /// # Panics
767    /// This function panics if the index given is out of range (as per [`IndexMut`]). If `self` is
768    /// a [`Yaml::Array`], this is when the index is bigger or equal to the length of the
769    /// underlying `Vec`. If `self` is a [`Yaml::Hash`], this is when the mapping sequence does not
770    /// contain [`Yaml::Integer`]`(idx)` as a key.
771    ///
772    /// This function also panics if `self` is not a [`Yaml::Array`] nor a [`Yaml::Hash`].
773    fn index_mut(&mut self, idx: usize) -> &mut Yaml {
774        match self {
775            Yaml::Array(sequence) => sequence.index_mut(idx),
776            Yaml::Hash(mapping) => {
777                let key = Yaml::Integer(i64::try_from(idx).unwrap());
778                mapping.get_mut(&key).unwrap()
779            }
780            _ => panic!("Attempting to index but `self` is not a sequence nor a mapping"),
781        }
782    }
783}
784
785impl IntoIterator for Yaml {
786    type Item = Yaml;
787    type IntoIter = YamlIter;
788
789    /// Extract the [`Array`] from `self` and iterate over it.
790    ///
791    /// If `self` is **not** of the [`Yaml::Array`] variant, this function will not panic or return
792    /// an error (as per the [`IntoIterator`] trait it cannot) but will instead return an iterator
793    /// over an empty [`Array`]. Callers have to ensure (using [`Yaml::is_array`], [`matches`] or
794    /// something similar) that the [`Yaml`] object is a [`Yaml::Array`] if they want to do error
795    /// handling.
796    ///
797    /// # Examples
798    /// ```
799    /// # use yaml_rust2::{Yaml, YamlLoader};
800    ///
801    /// // An array of 2 integers, 1 and 2.
802    /// let arr = &YamlLoader::load_from_str("- 1\n- 2").unwrap()[0];
803    ///
804    /// assert_eq!(arr.clone().into_iter().count(), 2);
805    /// assert_eq!(arr.clone().into_iter().next(), Some(Yaml::Integer(1)));
806    /// assert_eq!(arr.clone().into_iter().nth(1), Some(Yaml::Integer(2)));
807    ///
808    /// // An empty array returns an empty iterator.
809    /// let empty = Yaml::Array(vec![]);
810    /// assert_eq!(empty.into_iter().count(), 0);
811    ///
812    /// // A hash with 2 key-value pairs, `(a, b)` and `(c, d)`.
813    /// let hash = YamlLoader::load_from_str("a: b\nc: d").unwrap().remove(0);
814    /// // The hash has 2 elements.
815    /// assert_eq!(hash.as_hash().unwrap().iter().count(), 2);
816    /// // But since `into_iter` can't be used with a `Yaml::Hash`, `into_iter` returns an empty
817    /// // iterator.
818    /// assert_eq!(hash.into_iter().count(), 0);
819    /// ```
820    fn into_iter(self) -> Self::IntoIter {
821        YamlIter {
822            yaml: self.into_vec().unwrap_or_default().into_iter(),
823        }
824    }
825}
826
827/// An iterator over a [`Yaml`] node.
828pub struct YamlIter {
829    yaml: std::vec::IntoIter<Yaml>,
830}
831
832impl Iterator for YamlIter {
833    type Item = Yaml;
834
835    fn next(&mut self) -> Option<Yaml> {
836        self.yaml.next()
837    }
838}
839
840#[cfg(test)]
841mod test {
842    use super::{YAMLDecodingTrap, Yaml, YamlDecoder};
843
844    #[test]
845    fn test_read_bom() {
846        let s = b"\xef\xbb\xbf---
847a: 1
848b: 2.2
849c: [1, 2]
850";
851        let out = YamlDecoder::read(s as &[u8]).decode().unwrap();
852        let doc = &out[0];
853        assert_eq!(doc["a"].as_i64().unwrap(), 1i64);
854        assert!((doc["b"].as_f64().unwrap() - 2.2f64).abs() <= f64::EPSILON);
855        assert_eq!(doc["c"][1].as_i64().unwrap(), 2i64);
856        assert!(doc["d"][0].is_badvalue());
857    }
858
859    #[test]
860    fn test_read_utf16le() {
861        let s = b"\xff\xfe-\x00-\x00-\x00
862\x00a\x00:\x00 \x001\x00
863\x00b\x00:\x00 \x002\x00.\x002\x00
864\x00c\x00:\x00 \x00[\x001\x00,\x00 \x002\x00]\x00
865\x00";
866        let out = YamlDecoder::read(s as &[u8]).decode().unwrap();
867        let doc = &out[0];
868        println!("GOT: {doc:?}");
869        assert_eq!(doc["a"].as_i64().unwrap(), 1i64);
870        assert!((doc["b"].as_f64().unwrap() - 2.2f64) <= f64::EPSILON);
871        assert_eq!(doc["c"][1].as_i64().unwrap(), 2i64);
872        assert!(doc["d"][0].is_badvalue());
873    }
874
875    #[test]
876    fn test_read_utf16be() {
877        let s = b"\xfe\xff\x00-\x00-\x00-\x00
878\x00a\x00:\x00 \x001\x00
879\x00b\x00:\x00 \x002\x00.\x002\x00
880\x00c\x00:\x00 \x00[\x001\x00,\x00 \x002\x00]\x00
881";
882        let out = YamlDecoder::read(s as &[u8]).decode().unwrap();
883        let doc = &out[0];
884        println!("GOT: {doc:?}");
885        assert_eq!(doc["a"].as_i64().unwrap(), 1i64);
886        assert!((doc["b"].as_f64().unwrap() - 2.2f64).abs() <= f64::EPSILON);
887        assert_eq!(doc["c"][1].as_i64().unwrap(), 2i64);
888        assert!(doc["d"][0].is_badvalue());
889    }
890
891    #[test]
892    fn test_read_utf16le_nobom() {
893        let s = b"-\x00-\x00-\x00
894\x00a\x00:\x00 \x001\x00
895\x00b\x00:\x00 \x002\x00.\x002\x00
896\x00c\x00:\x00 \x00[\x001\x00,\x00 \x002\x00]\x00
897\x00";
898        let out = YamlDecoder::read(s as &[u8]).decode().unwrap();
899        let doc = &out[0];
900        println!("GOT: {doc:?}");
901        assert_eq!(doc["a"].as_i64().unwrap(), 1i64);
902        assert!((doc["b"].as_f64().unwrap() - 2.2f64).abs() <= f64::EPSILON);
903        assert_eq!(doc["c"][1].as_i64().unwrap(), 2i64);
904        assert!(doc["d"][0].is_badvalue());
905    }
906
907    #[test]
908    fn test_read_trap() {
909        let s = b"---
910a\xa9: 1
911b: 2.2
912c: [1, 2]
913";
914        let out = YamlDecoder::read(s as &[u8])
915            .encoding_trap(YAMLDecodingTrap::Ignore)
916            .decode()
917            .unwrap();
918        let doc = &out[0];
919        println!("GOT: {doc:?}");
920        assert_eq!(doc["a"].as_i64().unwrap(), 1i64);
921        assert!((doc["b"].as_f64().unwrap() - 2.2f64).abs() <= f64::EPSILON);
922        assert_eq!(doc["c"][1].as_i64().unwrap(), 2i64);
923        assert!(doc["d"][0].is_badvalue());
924    }
925
926    #[test]
927    fn test_or() {
928        assert_eq!(Yaml::Null.or(Yaml::Integer(3)), Yaml::Integer(3));
929        assert_eq!(Yaml::Integer(3).or(Yaml::Integer(7)), Yaml::Integer(3));
930    }
931}