Change-Id: If05fa3d0f41d45e3574e0c5ddff406cb33dc52f4 Reviewed-on: https://cl.tvl.fyi/c/depot/+/11470 Tested-by: BuildkiteCI Reviewed-by: Connor Brewster <cbrewster@hey.com> Autosubmit: flokli <flokli@flokli.de>
125 lines
4.2 KiB
Rust
125 lines
4.2 KiB
Rust
//! This module implements parsing code for some basic building blocks
|
|
//! of the [ATerm][] format, which is used by C++ Nix to serialize Derivations.
|
|
//!
|
|
//! [ATerm]: http://program-transformation.org/Tools/ATermFormat.html
|
|
use bstr::BString;
|
|
use nom::branch::alt;
|
|
use nom::bytes::complete::{escaped_transform, is_not, tag};
|
|
use nom::character::complete::char as nomchar;
|
|
use nom::combinator::{map, value};
|
|
use nom::multi::separated_list0;
|
|
use nom::sequence::delimited;
|
|
use nom::IResult;
|
|
|
|
/// Parse a bstr and undo any escaping.
|
|
fn parse_escaped_bstr(i: &[u8]) -> IResult<&[u8], BString> {
|
|
escaped_transform(
|
|
is_not("\"\\"),
|
|
'\\',
|
|
alt((
|
|
value("\\".as_bytes(), nomchar('\\')),
|
|
value("\n".as_bytes(), nomchar('n')),
|
|
value("\t".as_bytes(), nomchar('t')),
|
|
value("\r".as_bytes(), nomchar('r')),
|
|
value("\"".as_bytes(), nomchar('\"')),
|
|
)),
|
|
)(i)
|
|
.map(|(i, v)| (i, BString::new(v)))
|
|
}
|
|
|
|
/// Parse a field in double quotes, undo any escaping, and return the unquoted
|
|
/// and decoded `Vec<u8>`.
|
|
pub(crate) fn parse_bstr_field(i: &[u8]) -> IResult<&[u8], BString> {
|
|
// inside double quotes…
|
|
delimited(
|
|
nomchar('\"'),
|
|
// There is
|
|
alt((
|
|
// …either is a bstr after unescaping
|
|
parse_escaped_bstr,
|
|
// …or an empty string.
|
|
map(tag(b""), |_| BString::default()),
|
|
)),
|
|
nomchar('\"'),
|
|
)(i)
|
|
}
|
|
|
|
/// Parse a field in double quotes, undo any escaping, and return the unquoted
|
|
/// and decoded string, if it's a valid string. Or fail parsing if the bytes are
|
|
/// no valid UTF-8.
|
|
pub(crate) fn parse_string_field(i: &[u8]) -> IResult<&[u8], String> {
|
|
// inside double quotes…
|
|
delimited(
|
|
nomchar('\"'),
|
|
// There is
|
|
alt((
|
|
// either is a String after unescaping
|
|
nom::combinator::map_opt(parse_escaped_bstr, |escaped_bstr| {
|
|
String::from_utf8(escaped_bstr.into()).ok()
|
|
}),
|
|
// or an empty string.
|
|
map(tag(b""), |_| String::new()),
|
|
)),
|
|
nomchar('\"'),
|
|
)(i)
|
|
}
|
|
|
|
/// Parse a list of of string fields (enclosed in brackets)
|
|
pub(crate) fn parse_str_list(i: &[u8]) -> IResult<&[u8], Vec<String>> {
|
|
// inside brackets
|
|
delimited(
|
|
nomchar('['),
|
|
separated_list0(nomchar(','), parse_string_field),
|
|
nomchar(']'),
|
|
)(i)
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod tests {
|
|
use rstest::rstest;
|
|
|
|
#[rstest]
|
|
#[case::empty(br#""""#, b"", b"")]
|
|
#[case::hello_world(br#""Hello World""#, b"Hello World", b"")]
|
|
#[case::doublequote(br#""\"""#, br#"""#, b"")]
|
|
#[case::colon(br#"":""#, b":", b"")]
|
|
#[case::doublequote_rest(br#""\""Rest"#, br#"""#, b"Rest")]
|
|
fn test_parse_bstr_field(
|
|
#[case] input: &[u8],
|
|
#[case] expected: &[u8],
|
|
#[case] exp_rest: &[u8],
|
|
) {
|
|
let (rest, parsed) = super::parse_bstr_field(input).expect("must parse");
|
|
assert_eq!(exp_rest, rest, "expected remainder");
|
|
assert_eq!(expected, parsed);
|
|
}
|
|
|
|
#[rstest]
|
|
#[case::empty(br#""""#, "", b"")]
|
|
#[case::hello_world(br#""Hello World""#, "Hello World", b"")]
|
|
#[case::doublequote(br#""\"""#, r#"""#, b"")]
|
|
#[case::colon(br#"":""#, ":", b"")]
|
|
#[case::doublequote_rest(br#""\""Rest"#, r#"""#, b"Rest")]
|
|
fn parse_string_field(#[case] input: &[u8], #[case] expected: &str, #[case] exp_rest: &[u8]) {
|
|
let (rest, parsed) = super::parse_string_field(input).expect("must parse");
|
|
assert_eq!(exp_rest, rest, "expected remainder");
|
|
assert_eq!(expected, &parsed);
|
|
}
|
|
|
|
#[test]
|
|
fn parse_string_field_invalid_encoding_fail() {
|
|
let input: Vec<_> = vec![b'"', 0xc5, 0xc4, 0xd6, b'"'];
|
|
|
|
super::parse_string_field(&input).expect_err("must fail");
|
|
}
|
|
|
|
#[rstest]
|
|
#[case::single_foo(br#"["foo"]"#, vec!["foo".to_string()], b"")]
|
|
#[case::empty_list(b"[]", vec![], b"")]
|
|
#[case::empty_list_with_rest(b"[]blub", vec![], b"blub")]
|
|
fn parse_list(#[case] input: &[u8], #[case] expected: Vec<String>, #[case] exp_rest: &[u8]) {
|
|
let (rest, parsed) = super::parse_str_list(input).expect("must parse");
|
|
assert_eq!(exp_rest, rest, "expected remainder");
|
|
assert_eq!(expected, parsed);
|
|
}
|
|
}
|