From 437687034b11c901027aaf03af0b0d311ec7eb9b Mon Sep 17 00:00:00 2001 From: Samuel Colvin Date: Fri, 26 Jan 2024 07:51:12 +0000 Subject: [PATCH] more tests --- tests/main.rs | 14 ++++++++++++++ 1 file changed, 14 insertions(+) diff --git a/tests/main.rs b/tests/main.rs index 15bbf2c2..feed42f8 100644 --- a/tests/main.rs +++ b/tests/main.rs @@ -324,6 +324,8 @@ string_test_errors! { u4_unclosed: r#""\uxx"# => "EofWhileParsingString @ 5 - 1:5"; u4_unclosed2: r#""\udBdd"# => "EofWhileParsingString @ 7 - 1:7"; line_leading_surrogate: r#""\uddBd""# => "LoneLeadingSurrogateInHexEscape @ 6 - 1:7"; + // needs the long tail so SIMD is used to parse the string + line_leading_surrogate_tail: r#""\uddBd" "# => "LoneLeadingSurrogateInHexEscape @ 6 - 1:7"; unexpected_hex_escape1: r#""\udBd8x"# => "UnexpectedEndOfHexEscape @ 7 - 1:8"; unexpected_hex_escape2: r#""\udBd8xx"# => "UnexpectedEndOfHexEscape @ 7 - 1:8"; unexpected_hex_escape3: "\"un\\uDBBB\0" => "UnexpectedEndOfHexEscape @ 9 - 1:10"; @@ -562,6 +564,18 @@ fn bad_high_order_string() { assert_eq!(e.description(&bytes), "invalid unicode code point at line 1 column 5") } +#[test] +fn bad_high_order_string_tail() { + // needs the long tail so SIMD is used to parse the string + let mut bytes: Vec = vec![34, 32, 32, 210, 34]; + bytes.extend(vec![b' '; 100]); + // dbg!(json.iter().map(|b| *b as char).collect::>()); + let e = JsonValue::parse(&bytes, false).unwrap_err(); + assert_eq!(e.error_type, JsonErrorType::InvalidUnicodeCodePoint); + assert_eq!(e.index, 4); + assert_eq!(e.description(&bytes), "invalid unicode code point at line 1 column 5") +} + #[test] fn udb_string() { let bytes: Vec = vec![34, 92, 117, 100, 66, 100, 100, 92, 117, 100, 70, 100, 100, 34];