vparser/
lib.rs

// Copyright 2023-2024 Hugo Osvaldo Barrera
//
// SPDX-License-Identifier: ISC

//! See [`Parser`] as the main entry point to this library.
#![no_std]
#![deny(clippy::pedantic)]

extern crate alloc;

use core::{
    iter::{Enumerate, FusedIterator, Peekable},
    str::Bytes,
};

use alloc::{
    borrow::{Cow, ToOwned},
    string::ToString,
};

/// A single content line, borrowed from the input data.
///
/// A content line may be folded: split across several physical lines, where each break is a
/// CRLF immediately followed by a single linear white-space character (i.e., SPACE or HTAB).
/// The fields below keep any such folds verbatim; the accessor methods unfold them on demand.
#[derive(Debug, PartialEq, Clone)]
pub struct ContentLine<'input> {
    // TODO: use indices instead; they're half the size and slightly simpler.
    /// The entire raw line, unaltered (without the CRLF that terminates it).
    raw: &'input str,
    /// Everything before the first colon or semicolon (the whole line if it has neither).
    name: &'input str,
    /// Everything after the first semicolon and before the first unquoted colon.
    ///
    /// Empty when the line has no semicolon before its first colon.
    params: &'input str,
    /// Everything after the first unquoted colon; empty when there is none.
    value: &'input str,
}

impl<'input> ContentLine<'input> {
    /// Return the raw line without any unfolding.
    #[must_use]
    pub fn raw(&self) -> &'input str {
        self.raw
    }

    /// Return this line's name, with continuation lines unfolded.
    ///
    /// Borrows from the input when the name contains no folds, and allocates otherwise.
    #[must_use]
    pub fn name(&self) -> Cow<'input, str> {
        unfold_lines(self.name)
    }

    /// Return this line's parameter(s), with continuation lines unfolded.
    ///
    /// Borrows from the input when the parameters contain no folds, and allocates otherwise.
    #[must_use]
    pub fn params(&self) -> Cow<'input, str> {
        unfold_lines(self.params)
    }

    /// Return this line's value, with continuation lines unfolded.
    ///
    /// Borrows from the input when the value contains no folds, and allocates otherwise.
    #[must_use]
    pub fn value(&self) -> Cow<'input, str> {
        unfold_lines(self.value)
    }

    /// Return the entire line unfolded.
    ///
    /// Note that the line may exceed the maximum length, making it technically invalid. It is,
    /// however, suitable for comparing two lines for equality.
    #[must_use]
    pub fn unfolded(&self) -> Cow<'input, str> {
        unfold_lines(self.raw)
    }

    /// Return this content line with normalised folds.
    ///
    /// The returned line shall be semantically equivalent to the input line. Existing folds that
    /// are not needed are removed and new folds are inserted, so that each physical line is as
    /// long as possible while holding fewer than 75 octets (not counting the CRLF line break).
    /// Folds are only ever placed between characters, never inside a multi-byte character.
    ///
    /// Returns a borrowed string when no fold had to be added or removed, and allocates
    /// otherwise.
    #[must_use]
    // INVARIANT: content lines only have valid continuation lines.
    // The assertion below fires if `raw` contains a CRLF that is not followed by SPACE or HTAB;
    // the missing "Panics" section is allowed on the assumption that this never happens.
    #[allow(clippy::missing_panics_doc)]
    pub fn normalise_folds(&self) -> Cow<'input, str> {
        let mut result = Cow::Borrowed(self.raw);
        // Index where current portion begins.
        // Everything in `raw` before `cur` has already been copied into `result` (once it is
        // owned).
        let mut cur = 0;
        // Not strictly where the line started; this is also shifted to compensate for unfolds.
        // `i - line_start` is the number of octets already on the current output line.
        let mut line_start = 0;

        let mut chars = self.raw.char_indices().peekable();
        while let Some((i, c)) = chars.next() {
            if c == '\r' && matches!(chars.peek(), Some((_, '\n'))) {
                chars.next(); // Advance the peeked LF.

                assert!(
                    matches!(chars.next(), Some((_, ' ' | '\t'))),
                    "continuation line must start with a space or tab",
                );

                // Size of the first character after the fold; counted as a single octet when
                // the fold is the last thing in the line.
                let next = chars.peek().map_or(1, |(_, c)| c.len_utf8());
                if i - line_start + next >= 75 {
                    // In this case we don't need to mutate anything; the whole line and CRLF
                    // stay the same.

                    // Note that the space already counts towards the following line.
                    line_start = i + 2;
                } else {
                    // The next character still fits on this line: drop the fold by copying
                    // everything up to the CR and skipping the three fold octets.
                    let portion = &self.raw[cur..i];
                    match result {
                        Cow::Borrowed(_) => {
                            result = Cow::Owned(portion.to_owned());
                        }
                        Cow::Owned(ref mut s) => {
                            s.push_str(portion);
                        }
                    }
                    // Shift by three to avoid counting CRLF<SPACE>.
                    line_start += 3;
                    cur = i + 3;
                }
            } else if (i - line_start) + c.len_utf8() >= 75 {
                // This character would reach the limit: insert a fold right before it.
                let portion = &self.raw[cur..i];
                match result {
                    Cow::Borrowed(_) => {
                        result = Cow::Owned(portion.to_string() + "\r\n " + &c.to_string());
                    }
                    Cow::Owned(ref mut s) => {
                        s.push_str(portion);
                        s.push_str("\r\n ");
                        s.push(c);
                    }
                }
                // `c` has already been written out, so the next portion starts after it.
                cur = i + c.len_utf8();
                line_start = i - 1; // -1 to account for the inserted space.
            }
        }

        // Flush the tail; a still-borrowed result already is the complete raw line.
        if let Cow::Owned(ref mut s) = result {
            let portion = &self.raw[cur..];
            s.push_str(portion);
        }

        result
    }
}

/// A flexible parser for icalendar/vcard.
///
/// This parser is designed to gracefully handle bogus data. The semantics of names, parameters,
/// and values are not validated. For example, a "date" may be an arbitrary string. Users of this
/// library should validate any data with the usual considerations for handling input data.
///
/// This parser itself is zero-copy. Accessor methods return unfolded names, values and
/// parameters. These accessors return a [`Cow`], and will allocate in case of folded lines.
///
/// It should be used via its [`Iterator`] implementation which iterates over [`ContentLine`]
/// instances.
///
/// # Known issues
///
/// - A trailing empty line is lost.
///
/// # See also
///
/// - [`Parser::next`]
pub struct Parser<'data> {
    /// The complete input; content lines are slices of this string.
    data: &'data str,
    /// Cursor over the bytes of `data`; each item is `(byte offset, byte)`.
    characters: Peekable<Enumerate<Bytes<'data>>>,
}

impl<'data> Parser<'data> {
    /// Create a new parser with the given input data.
    ///
    /// The input data MAY contain folded lines (continuation lines); they are kept verbatim and
    /// only unfolded by the accessors of the returned content lines.
    #[must_use]
    pub fn new(data: &'data str) -> Parser<'data> {
        Parser {
            data,
            characters: data.bytes().enumerate().peekable(),
        }
    }

    /// Returns the unparsed portion of the input data.
    ///
    /// Does not advance the position of this iterator. The returned slice borrows from the
    /// input data rather than from the parser, so it may be kept while parsing continues.
    #[must_use]
    pub fn remainder(&mut self) -> &'data str {
        // Copy the reference out first so the result carries the `'data` lifetime instead of
        // the lifetime of the `&mut self` borrow.
        let data = self.data;
        // An exhausted cursor means nothing is left: slice from the end of the input.
        let offset = self
            .characters
            .peek()
            .map_or(data.len(), |&(index, _)| index);
        &data[offset..]
    }
}

impl<'data> Parser<'data> {
    /// Decide whether the CR that was just consumed terminates the current content line.
    ///
    /// - A CR that is not followed by LF is ordinary data: nothing is consumed and `false` is
    ///   returned.
    /// - A CRLF followed by SPACE or HTAB is a fold: the LF is consumed, the white-space is left
    ///   in place (the caller consumes it as ordinary data) and `false` is returned.
    /// - Any other CRLF, including one at the very end of the input, ends the line: the LF is
    ///   consumed and `true` is returned.
    fn consume_line_break(&mut self) -> bool {
        if !matches!(self.characters.peek(), Some((_, b'\n'))) {
            return false; // Not CRLF.
        }
        self.characters.next(); // Advance the peeked LF.
        !matches!(self.characters.peek(), Some((_, b' ' | b'\t')))
    }
}

impl<'data> Iterator for Parser<'data> {
    type Item = ContentLine<'data>;

    /// Returns the next content line from the input data.
    ///
    /// This method is no-copy; a [`ContentLine`] contains only pointers to the original input
    /// data.
    ///
    /// The line is scanned in up to three stages: name (until the first `;` or `:`), parameters
    /// (after a `;`, until the first `:` outside double quotes) and value (after that `:`). A
    /// line ends at EOF or at a CRLF which is not followed by SPACE or HTAB. This also holds
    /// inside a quoted parameter value: a quote left open at the end of a line does not swallow
    /// the following lines.
    ///
    /// Returns `None` after the last line has been returned. Returns `None` if called after the
    /// iterator has been exhausted.
    // Each stage has its own termination cases, which are spelled out explicitly.
    #[allow(clippy::too_many_lines)]
    fn next(&mut self) -> Option<ContentLine<'data>> {
        let (start, _) = *self.characters.peek()?;
        let data = self.data;
        loop {
            match self.characters.next() {
                // Begin parameters.
                Some((semicolon, b';')) => loop {
                    match self.characters.next() {
                        // Begin value (after parameters).
                        Some((colon, b':')) => loop {
                            match self.characters.next() {
                                Some((cr, b'\r')) => {
                                    if self.consume_line_break() {
                                        return Some(ContentLine {
                                            raw: &data[start..cr],
                                            name: &data[start..semicolon],
                                            params: &data[semicolon + 1..colon],
                                            value: &data[colon + 1..cr],
                                        });
                                    }
                                }
                                Some(_) => {}
                                None => {
                                    return Some(ContentLine {
                                        raw: &data[start..],
                                        name: &data[start..semicolon],
                                        params: &data[semicolon + 1..colon],
                                        value: &data[colon + 1..],
                                    });
                                }
                            }
                        },
                        // Quoted parameter value: `:` and `;` inside of it are plain data.
                        Some((_, b'"')) => loop {
                            match self.characters.next() {
                                Some((_, b'"')) => break,
                                Some((cr, b'\r')) => {
                                    if self.consume_line_break() {
                                        // WARN: reached end of line, expected closing quote.
                                        // The line must end here; otherwise it would contain a
                                        // CRLF which is not a fold and cannot be unfolded.
                                        return Some(ContentLine {
                                            raw: &data[start..cr],
                                            name: &data[start..semicolon],
                                            params: &data[semicolon + 1..cr],
                                            value: &data[semicolon..semicolon],
                                        });
                                    }
                                }
                                Some(_) => {}
                                None => {
                                    // WARN: reached EOF, expected closing quote
                                    return Some(ContentLine {
                                        raw: &data[start..],
                                        name: &data[start..semicolon],
                                        params: &data[semicolon + 1..],
                                        value: &data[semicolon..semicolon],
                                    });
                                }
                            }
                        },
                        // Line with parameters but without a value.
                        Some((cr, b'\r')) => {
                            if self.consume_line_break() {
                                return Some(ContentLine {
                                    raw: &data[start..cr],
                                    name: &data[start..semicolon],
                                    params: &data[semicolon + 1..cr],
                                    value: &data[semicolon..semicolon],
                                });
                            }
                        }
                        Some(_) => {}
                        None => {
                            return Some(ContentLine {
                                raw: &data[start..],
                                name: &data[start..semicolon],
                                params: &data[semicolon + 1..],
                                value: &data[semicolon..semicolon],
                            });
                        }
                    }
                },
                // Begin value (no parameters).
                Some((colon, b':')) => loop {
                    match self.characters.next() {
                        Some((cr, b'\r')) => {
                            if self.consume_line_break() {
                                return Some(ContentLine {
                                    raw: &data[start..cr],
                                    name: &data[start..colon],
                                    params: &data[colon..colon],
                                    value: &data[colon + 1..cr],
                                });
                            }
                        }
                        Some(_) => {}
                        None => {
                            return Some(ContentLine {
                                raw: &data[start..],
                                name: &data[start..colon],
                                params: &data[colon..colon],
                                value: &data[colon + 1..],
                            });
                        }
                    }
                },
                // Line consisting only of a name.
                Some((cr, b'\r')) => {
                    if self.consume_line_break() {
                        return Some(ContentLine {
                            raw: &data[start..cr],
                            name: &data[start..cr],
                            params: &data[start..start],
                            value: &data[start..start],
                        });
                    }
                }
                Some(_) => {}
                None => {
                    return Some(ContentLine {
                        raw: &data[start..],
                        name: &data[start..],
                        params: &data[start..start],
                        value: &data[start..start],
                    });
                }
            }
        }
    }
}

// `next` returns `None` whenever peeking at the byte cursor yields nothing, which is the case
// once the input has been consumed.
impl<'data> FusedIterator for Parser<'data> {}

/// Join a folded content line (or a part of one) back into a single line.
///
/// Every fold, i.e. a CRLF followed by one SPACE or HTAB, is removed. A CR which is not followed
/// by LF is kept as regular data. Input without any fold is returned borrowed; otherwise a new
/// string is allocated.
///
/// # Panics
///
/// If the input string has multiple non-continuation lines, that is, if it contains a CRLF
/// which is not immediately followed by SPACE or HTAB.
fn unfold_lines(lines: &str) -> Cow<str> {
    let mut unfolded = Cow::Borrowed(lines);
    // Offset of the first input byte which has not been handled yet.
    let mut pending = 0;

    while let Some(offset) = lines[pending..].find("\r\n") {
        let fold = pending + offset;
        let marker = lines.as_bytes().get(fold + 2).copied();
        assert!(
            matches!(marker, Some(b' ' | b'\t')),
            "continuation line is not a continuation line",
        );

        // Keep the text in front of the fold and skip CR, LF and the white-space marker.
        let segment = &lines[pending..fold];
        match unfolded {
            Cow::Owned(ref mut buffer) => buffer.push_str(segment),
            Cow::Borrowed(_) => unfolded = Cow::Owned(segment.to_owned()),
        }
        pending = fold + 3;
    }

    match unfolded {
        Cow::Owned(mut buffer) => {
            buffer.push_str(&lines[pending..]);
            Cow::Owned(buffer)
        }
        // No fold was found: hand back the input untouched.
        borrowed @ Cow::Borrowed(_) => borrowed,
    }
}

#[cfg(test)]
#[allow(clippy::too_many_lines)]
mod test {
    use crate::{unfold_lines, ContentLine, Parser};
    use alloc::borrow::Cow;

    #[test]
    fn test_complete_example() {
        let data = [
            "BEGIN:VCALENDAR",
            "VERSION:2.0",
            "PRODID:nl.whynothugo.todoman",
            "BEGIN:VTODO",
            "DTSTAMP:20231126T095923Z",
            "DUE;TZID=Asia/Shanghai:20231128T090000",
            "SUMMARY:dummy todo for parser tests",
            "UID:565f48cb5b424815a2ba5e56555e2832@destiny.whynothugo.nl",
            "END:VTODO",
            "END:VCALENDAR",
            // Note: this calendar is not entirely semantically valid;
            // it is missing the timezone which is referred to in DUE.
        ]
        .join("\r\n");

        let mut parser = Parser::new(&data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "BEGIN:VCALENDAR",
                name: "BEGIN",
                params: "",
                value: "VCALENDAR"
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "VERSION:2.0",
                name: "VERSION",
                params: "",
                value: "2.0",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "PRODID:nl.whynothugo.todoman",
                name: "PRODID",
                params: "",
                value: "nl.whynothugo.todoman",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "BEGIN:VTODO",
                name: "BEGIN",
                params: "",
                value: "VTODO",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "DTSTAMP:20231126T095923Z",
                name: "DTSTAMP",
                params: "",
                value: "20231126T095923Z",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "DUE;TZID=Asia/Shanghai:20231128T090000",
                name: "DUE",
                params: "TZID=Asia/Shanghai",
                value: "20231128T090000",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "SUMMARY:dummy todo for parser tests",
                name: "SUMMARY",
                params: "",
                value: "dummy todo for parser tests",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "UID:565f48cb5b424815a2ba5e56555e2832@destiny.whynothugo.nl",
                name: "UID",
                params: "",
                value: "565f48cb5b424815a2ba5e56555e2832@destiny.whynothugo.nl",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "END:VTODO",
                name: "END",
                params: "",
                value: "VTODO",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "END:VCALENDAR",
                name: "END",
                params: "",
                value: "VCALENDAR",
            })
        );
        assert_eq!(parser.next(), None);
    }

    #[test]
    fn test_empty_data() {
        let data = "";
        let mut parser = Parser::new(data);
        assert_eq!(parser.next(), None);
    }

    #[test]
    fn test_empty_lines() {
        // A line followed by CRLF is a different code-path than a line followed by EOF.
        let data = "\r\n";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(
            line,
            ContentLine {
                raw: "",
                name: "",
                params: "",
                value: "",
            }
        );
        assert_eq!(line.raw(), "");
        assert_eq!(line.name(), "");
        assert_eq!(line.params(), "");
        assert_eq!(line.value(), "");
        // FIXME: trailing empty lines are swallowed.
        // assert_eq!(
        //     parser.next(),
        //     Some(ContentLine {
        //         raw: "",
        //         name: "",
        //         params: "",
        //         value: "",
        //     })
        // );
        assert_eq!(parser.next(), None);
    }

    /// Lines with a single parameter are split into name, parameters and value.
    #[test]
    fn test_line_with_params() {
        // The same line is parsed twice: a line ending in CRLF takes a different code path than
        // a line ending at EOF.
        let data = [
            "DTSTART;TZID=America/New_York:19970902T090000",
            "DTSTART;TZID=America/New_York:19970902T090000",
        ]
        .join("\r\n");
        let mut parser = Parser::new(&data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "DTSTART;TZID=America/New_York:19970902T090000",
                name: "DTSTART",
                params: "TZID=America/New_York",
                value: "19970902T090000",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "DTSTART;TZID=America/New_York:19970902T090000",
                name: "DTSTART",
                params: "TZID=America/New_York",
                value: "19970902T090000",
            })
        );
        assert_eq!(parser.next(), None);
    }

    /// Double quotes are plain data inside a value, while a quoted parameter value may contain
    /// semicolons without ending the parameters.
    #[test]
    fn test_line_with_dquote() {
        // The first line ends in CRLF and the second one at EOF; these are different code paths.
        let data = [
            "SUMMARY:This has \"some quotes\"",
            "DTSTART;TZID=\"local;VALUE=DATE-TIME\":20150304T184500",
        ]
        .join("\r\n");
        let mut parser = Parser::new(&data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "SUMMARY:This has \"some quotes\"",
                name: "SUMMARY",
                params: "",
                value: "This has \"some quotes\"",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "DTSTART;TZID=\"local;VALUE=DATE-TIME\":20150304T184500",
                name: "DTSTART",
                params: "TZID=\"local;VALUE=DATE-TIME\"",
                value: "20150304T184500",
            })
        );
        assert_eq!(parser.next(), None);
    }

    /// A fold inside the parameters does not end the line; the fields keep the fold verbatim.
    #[test]
    fn test_continuation_line() {
        // The same folded line is parsed twice: a line ending in CRLF takes a different code
        // path than a line ending at EOF.
        let data = [
            "X-JMAP-LOCATION;VALUE=TEXT;X-JMAP-GEO=\"geo:52.123456,4.123456\";",
            " X-JMAP-ID=03453afa-71fc-4893-ba70-a7436bb6d56c:Name of place",
            "X-JMAP-LOCATION;VALUE=TEXT;X-JMAP-GEO=\"geo:52.123456,4.123456\";",
            " X-JMAP-ID=03453afa-71fc-4893-ba70-a7436bb6d56c:Name of place",
        ]
        .join("\r\n");
        let mut parser = Parser::new(&data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: &[
                    "X-JMAP-LOCATION;VALUE=TEXT;X-JMAP-GEO=\"geo:52.123456,4.123456\";",
                    " X-JMAP-ID=03453afa-71fc-4893-ba70-a7436bb6d56c:Name of place",
                ]
                .join("\r\n"),
                name: "X-JMAP-LOCATION",
                params: "VALUE=TEXT;X-JMAP-GEO=\"geo:52.123456,4.123456\";\r\n X-JMAP-ID=03453afa-71fc-4893-ba70-a7436bb6d56c",
                value: "Name of place",
            })
        );
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: &[
                    "X-JMAP-LOCATION;VALUE=TEXT;X-JMAP-GEO=\"geo:52.123456,4.123456\";",
                    " X-JMAP-ID=03453afa-71fc-4893-ba70-a7436bb6d56c:Name of place",
                ]
                .join("\r\n"),
                name: "X-JMAP-LOCATION",
                params: "VALUE=TEXT;X-JMAP-GEO=\"geo:52.123456,4.123456\";\r\n X-JMAP-ID=03453afa-71fc-4893-ba70-a7436bb6d56c",
                value: "Name of place",
            })
        );
        assert_eq!(parser.next(), None);
    }

    #[test]
    fn test_invalid_lone_name() {
        let data = "BEGIN";
        let mut parser = Parser::new(data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "BEGIN",
                name: "BEGIN",
                params: "",
                value: "",
            })
        );
        assert_eq!(parser.next(), None);
    }

    #[test]
    fn test_invalid_name_with_params() {
        let data = "DTSTART;TZID=America/New_York";
        let mut parser = Parser::new(data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "DTSTART;TZID=America/New_York",
                name: "DTSTART",
                params: "TZID=America/New_York",
                value: "",
            })
        );
        assert_eq!(parser.next(), None);
    }

    #[test]
    fn test_invalid_name_with_trailing_semicolon() {
        let data = "DTSTART;";
        let mut parser = Parser::new(data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "DTSTART;",
                name: "DTSTART",
                params: "",
                value: "",
            })
        );
        assert_eq!(parser.next(), None);
    }

    #[test]
    fn test_invalid_name_with_trailing_colon() {
        let data = "DTSTART:";
        let mut parser = Parser::new(data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "DTSTART:",
                name: "DTSTART",
                params: "",
                value: "",
            })
        );
        assert_eq!(parser.next(), None);
    }

    #[test]
    fn test_remainder() {
        let data = ["BEGIN:VTODO", "SUMMARY:Do the thing"].join("\r\n");
        let mut parser = Parser::new(&data);
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "BEGIN:VTODO",
                name: "BEGIN",
                params: "",
                value: "VTODO",
            })
        );
        assert_eq!(parser.remainder(), "SUMMARY:Do the thing");
        assert_eq!(
            parser.next(),
            Some(ContentLine {
                raw: "SUMMARY:Do the thing",
                name: "SUMMARY",
                params: "",
                value: "Do the thing",
            })
        );
        assert_eq!(parser.next(), None);
    }

    /// Despite its name, this exercises `unfold_lines`: every CRLF followed by a space is
    /// removed, including a fold at the very end of the input.
    #[test]
    fn test_fold_multiline() {
        assert_eq!(
            unfold_lines("UID:horrible-\r\n example"),
            "UID:horrible-example"
        );
        assert_eq!(unfold_lines("UID:X\r\n Y"), "UID:XY");
        // A trailing fold with nothing after the white-space.
        assert_eq!(unfold_lines("UID:X\r\n "), "UID:X");
        assert_eq!(
            unfold_lines("UID:quite\r\n a\r\n few\r\n lines"),
            "UID:quiteafewlines"
        );
    }

    #[test]
    #[should_panic(expected = "continuation line is not a continuation line")]
    fn test_fold_multiline_missing_whitespace() {
        unfold_lines("UID:two\r\nlines");
    }

    #[test]
    fn test_normalise_folds_short() {
        let data = "SUMMARY:Hello there";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(parser.next(), None);

        assert_eq!(line.normalise_folds(), data);
        assert!(matches!(line.normalise_folds(), Cow::Borrowed(_)));
    }

    #[test]
    fn test_normalise_folds_with_carrige_returns() {
        let data = "SUMMARY:Hello \rthere";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(parser.next(), None);

        assert_eq!(line.normalise_folds(), data);
        assert!(matches!(line.normalise_folds(), Cow::Borrowed(_)));
    }

    #[test]
    fn test_normalise_folds_with_newlines() {
        let data = "SUMMARY:Hello \nthere";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(parser.next(), None);

        assert_eq!(line.normalise_folds(), data);
        assert!(matches!(line.normalise_folds(), Cow::Borrowed(_)));
    }

    #[test]
    fn test_normalise_folds_too_many_folds() {
        let data = "SUMMARY:Hello \r\n \r\n there";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(parser.next(), None);

        let expected = "SUMMARY:Hello there";
        assert_eq!(line.normalise_folds(), expected);
    }

    #[test]
    fn test_normalise_folds_long() {
        let data = [
            "SUMMARY:Some really long text that nobody ",
            " cares about, but is wrapped in two lines.",
        ]
        .join("\r\n");
        let mut parser = Parser::new(&data);
        let line = parser.next().unwrap();
        assert_eq!(parser.next(), None);

        let expected = [
            "SUMMARY:Some really long text that nobody cares about, but is wrapped in t",
            " wo lines.",
        ]
        .join("\r\n");
        assert_eq!(line.normalise_folds(), expected);
    }

    #[test]
    fn test_normalise_folds_multibyte() {
        // This is 59 characters, 161 octets
        let data = "SUMMARY:動千首看院波未假遠子到花，白六到星害，馬吃牠說衣欠去皮香收司意，青個話化汁喜視娘以男雪青土已升斤法兌。";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(parser.next(), None);

        let expected = [
            // Keep in mind that CR counts, but LF does not.
            "SUMMARY:動千首看院波未假遠子到花，白六到星害，馬吃牠", // 74
            " 說衣欠去皮香收司意，青個話化汁喜視娘以男雪青土已",    // 73
            " 升斤法兌。",                                          // 16
        ]
        .join("\r\n");
        assert_eq!(line.normalise_folds(), expected);
    }

    #[test]
    fn test_normalise_folds_multibyte_noop() {
        // This is 59 characters, 161 octets
        let data = [
            // Keep in mind that CR counts, but LF does not.
            "SUMMARY:動千首看院波未假遠子到花，白六到星害，馬吃牠", // 74
            " 說衣欠去皮香收司意，青個話化汁喜視娘以男雪青土已",    // 73
            " 升斤法兌。",                                          // 16
        ]
        .join("\r\n");
        let mut parser = Parser::new(&data);
        let line = parser.next().unwrap();
        assert_eq!(parser.next(), None);

        assert_eq!(line.normalise_folds(), data);
        assert!(matches!(line.normalise_folds(), Cow::Borrowed(_)));
    }

    #[test]
    fn test_unfold_params_with_trailing_crlf() {
        let data = ";\r\n";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(line.raw(), ";");
        assert_eq!(line.name(), "");
        assert_eq!(line.params(), "");
        assert_eq!(line.value(), "");
    }

    #[test]
    fn test_unfold_name_with_trailing_crlf() {
        let data = "\r\n";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(line.raw(), "");
        assert_eq!(line.name(), "");
        assert_eq!(line.params(), "");
        assert_eq!(line.value(), "");
    }

    #[test]
    fn test_unfold_value_with_trailing_crlf() {
        let data = ";:\r\n";
        let mut parser = Parser::new(data);
        let line = parser.next().unwrap();
        assert_eq!(line.raw(), ";:");
        assert_eq!(line.name(), "");
        assert_eq!(line.params(), "");
        assert_eq!(line.value(), "");
    }
}
vparser/lib.rs

vparser/
lib.rs