From 789f504ccafe8b1a60d781e4e13f01d64d9d3100 Mon Sep 17 00:00:00 2001 From: CAD97 Date: Tue, 21 Sep 2021 14:51:53 -0500 Subject: [PATCH 1/2] Rewrite env filter parsing to be stricter --- tracing-subscriber/Cargo.toml | 4 +- .../src/filter/env/directive.rs | 123 +--- tracing-subscriber/src/filter/env/mod.rs | 40 +- tracing-subscriber/src/filter/env/parsing.rs | 642 ++++++++++++++++++ 4 files changed, 691 insertions(+), 118 deletions(-) create mode 100644 tracing-subscriber/src/filter/env/parsing.rs diff --git a/tracing-subscriber/Cargo.toml b/tracing-subscriber/Cargo.toml index db9bf35797..0dc23793e7 100644 --- a/tracing-subscriber/Cargo.toml +++ b/tracing-subscriber/Cargo.toml @@ -24,7 +24,7 @@ keywords = ["logging", "tracing", "metrics", "subscriber"] [features] default = ["env-filter", "smallvec", "fmt", "ansi", "chrono", "tracing-log", "json"] -env-filter = ["matchers", "regex", "lazy_static", "tracing"] +env-filter = ["matchers", "tracing"] fmt = ["registry"] ansi = ["fmt", "ansi_term"] registry = ["sharded-slab", "thread_local"] @@ -36,9 +36,7 @@ tracing-core = { path = "../tracing-core", version = "0.2" } # only required by the filter feature tracing = { optional = true, path = "../tracing", version = "0.2", default-features = false, features = ["std"] } matchers = { optional = true, version = "0.1.0" } -regex = { optional = true, version = "1", default-features = false, features = ["std"] } smallvec = { optional = true, version = "1" } -lazy_static = { optional = true, version = "1" } # fmt tracing-log = { path = "../tracing-log", version = "0.2", optional = true, default-features = false, features = ["log-tracer", "std"] } diff --git a/tracing-subscriber/src/filter/env/directive.rs b/tracing-subscriber/src/filter/env/directive.rs index 1bd97cc42d..582db5f80a 100644 --- a/tracing-subscriber/src/filter/env/directive.rs +++ b/tracing-subscriber/src/filter/env/directive.rs @@ -1,7 +1,9 @@ use super::super::level::{self, LevelFilter}; -use super::{field, FieldMap, FilterVec}; -use lazy_static::lazy_static; -use regex::Regex; +use super::{ + field, + parsing::{parse_one_directive, ParseErrorKind}, + FieldMap, FilterVec, +}; use std::{cmp::Ordering, error::Error, fmt, iter::FromIterator, str::FromStr}; use tracing_core::{span, Level, Metadata}; @@ -10,8 +12,8 @@ use tracing_core::{span, Level, Metadata}; #[derive(Debug, Eq, PartialEq)] #[cfg_attr(docsrs, doc(cfg(feature = "env-filter")))] pub struct Directive { - in_span: Option, - fields: FilterVec, + pub(super) in_span: Option, + pub(super) fields: FilterVec, pub(crate) target: Option, pub(crate) level: LevelFilter, } @@ -58,13 +60,6 @@ pub struct ParseError { kind: ParseErrorKind, } -#[derive(Debug)] -enum ParseErrorKind { - Field(Box), - Level(level::ParseError), - Other, -} - impl Directive { pub(super) fn has_name(&self) -> bool { self.in_span.is_some() @@ -176,94 +171,12 @@ impl Match for Directive { impl FromStr for Directive { type Err = ParseError; fn from_str(from: &str) -> Result { - lazy_static! { - static ref DIRECTIVE_RE: Regex = Regex::new( - r"(?x) - ^(?P(?i:trace|debug|info|warn|error|off|[0-5]))$ | - # ^^^. - # `note: we match log level names case-insensitively - ^ - (?: # target name or span name - (?P[\w:-]+)|(?P\[[^\]]*\]) - ){1,2} - (?: # level or nothing - =(?P(?i:trace|debug|info|warn|error|off|[0-5]))? - # ^^^. - # `note: we match log level names case-insensitively - )? - $ - " - ) - .unwrap(); - static ref SPAN_PART_RE: Regex = - Regex::new(r#"(?P[^\]\{]+)?(?:\{(?P[^\}]*)\})?"#).unwrap(); - static ref FIELD_FILTER_RE: Regex = - // TODO(eliza): this doesn't _currently_ handle value matchers that include comma - // characters. We should fix that. - Regex::new(r#"(?x) - ( - # field name - [[:word:]][[[:word:]]\.]* - # value part (optional) - (?:=[^,]+)? - ) - # trailing comma or EOS - (?:,\s?|$) - "#).unwrap(); - } - - let caps = DIRECTIVE_RE.captures(from).ok_or_else(ParseError::new)?; - - if let Some(level) = caps - .name("global_level") - .and_then(|s| s.as_str().parse().ok()) - { - return Ok(Directive { - level, - ..Default::default() - }); + let (parsed, after) = parse_one_directive(from); + if after != from.len() { + Err(ParseError::new()) + } else { + Ok(parsed?) } - - let target = caps.name("target").and_then(|c| { - let s = c.as_str(); - if s.parse::().is_ok() { - None - } else { - Some(s.to_owned()) - } - }); - - let (in_span, fields) = caps - .name("span") - .and_then(|cap| { - let cap = cap.as_str().trim_matches(|c| c == '[' || c == ']'); - let caps = SPAN_PART_RE.captures(cap)?; - let span = caps.name("name").map(|c| c.as_str().to_owned()); - let fields = caps - .name("fields") - .map(|c| { - FIELD_FILTER_RE - .find_iter(c.as_str()) - .map(|c| c.as_str().parse()) - .collect::, _>>() - }) - .unwrap_or_else(|| Ok(FilterVec::new())); - Some((span, fields)) - }) - .unwrap_or_else(|| (None, Ok(FilterVec::new()))); - - let level = caps - .name("level") - .and_then(|l| l.as_str().parse().ok()) - // Setting the target without the level enables every level for that target - .unwrap_or(LevelFilter::TRACE); - - Ok(Directive { - level, - target, - in_span, - fields: fields?, - }) } } @@ -643,6 +556,9 @@ impl fmt::Display for ParseError { ParseErrorKind::Other => f.pad("invalid filter directive"), ParseErrorKind::Level(ref l) => l.fmt(f), ParseErrorKind::Field(ref e) => write!(f, "invalid field filter: {}", e), + ParseErrorKind::UnexpectedSyntax(ref c) => { + write!(f, "unexpected semantic character: {}", c) + } } } } @@ -657,6 +573,7 @@ impl Error for ParseError { ParseErrorKind::Other => None, ParseErrorKind::Level(ref l) => Some(l), ParseErrorKind::Field(ref n) => Some(n.as_ref()), + ParseErrorKind::UnexpectedSyntax(_) => None, } } } @@ -677,6 +594,12 @@ impl From for ParseError { } } +impl From for ParseError { + fn from(kind: ParseErrorKind) -> Self { + Self { kind } + } +} + // ===== impl DynamicMatch ===== impl CallsiteMatcher { @@ -1106,7 +1029,7 @@ mod test { #[test] fn parse_directives_with_special_characters_in_span_name() { - let span_name = "!\"#$%&'()*+-./:;<=>?@^_`|~[}"; + let span_name = r##"!#$%&'()*+-.:;<>?@^_`|~"##; // forbidden: "/[]{}= let dirs = parse_directives(format!("target[{}]=info", span_name)); assert_eq!(dirs.len(), 1, "\nparsed: {:#?}", dirs); diff --git a/tracing-subscriber/src/filter/env/mod.rs b/tracing-subscriber/src/filter/env/mod.rs index f983418059..2b45ebecb8 100644 --- a/tracing-subscriber/src/filter/env/mod.rs +++ b/tracing-subscriber/src/filter/env/mod.rs @@ -10,13 +10,14 @@ pub use self::{ }; mod directive; mod field; +mod parsing; use crate::{ filter::LevelFilter, subscribe::{Context, Subscribe}, sync::RwLock, }; -use std::{cell::RefCell, collections::HashMap, env, error::Error, fmt, str::FromStr}; +use std::{cell::RefCell, collections::HashMap, env, error::Error, fmt, iter, str::FromStr}; use tracing_core::{ callsite, collect::{Collect, Interest}, @@ -151,24 +152,32 @@ impl EnvFilter { /// Returns a new `EnvFilter` from the directives in the given string, /// ignoring any that are invalid. pub fn new>(dirs: S) -> Self { - let directives = dirs.as_ref().split(',').filter_map(|s| match s.parse() { - Ok(d) => Some(d), - Err(err) => { - eprintln!("ignoring `{}`: {}", s, err); - None + let mut dirs = dirs.as_ref(); + let directives = iter::from_fn(move || { + if dirs.is_empty() { + return None; } - }); + let (parsed, after) = parsing::parse_one_directive(dirs); + dirs = &dirs[after..]; + Some(parsed) + }) + .filter_map(Result::ok); Self::from_directives(directives) } /// Returns a new `EnvFilter` from the directives in the given string, /// or an error if any are invalid. pub fn try_new>(dirs: S) -> Result { - let directives = dirs - .as_ref() - .split(',') - .map(|s| s.parse()) - .collect::, _>>()?; + let mut dirs = dirs.as_ref(); + let directives = iter::from_fn(move || { + if dirs.is_empty() { + return None; + } + let (parsed, after) = parsing::parse_one_directive(dirs); + dirs = &dirs[after..]; + Some(parsed) + }) + .collect::, _>>()?; Ok(Self::from_directives(directives)) } @@ -679,7 +688,8 @@ mod tests { #[test] fn callsite_enabled_includes_span_directive_multiple_fields() { - let filter = EnvFilter::new("app[mySpan{field=\"value\",field2=2}]=debug") + let filter = EnvFilter::try_new(r#"app[mySpan{field="value",field2=2}]=debug"#) + .unwrap() .with_collector(NoCollector); static META: &Metadata<'static> = &Metadata::new( "mySpan", @@ -693,13 +703,13 @@ mod tests { ); let interest = filter.register_callsite(META); - assert!(interest.is_never()); + assert!(interest.is_sometimes()); } #[test] fn roundtrip() { let f1: EnvFilter = - "[span1{foo=1}]=error,[span2{bar=2 baz=false}],crate2[{quux=\"quuux\"}]=debug" + "[span1{foo=1}]=error,[span2{bar=2, baz=false}],crate2[{quux=\"quuux\"}]=debug" .parse() .unwrap(); let f2: EnvFilter = format!("{}", f1).parse().unwrap(); diff --git a/tracing-subscriber/src/filter/env/parsing.rs b/tracing-subscriber/src/filter/env/parsing.rs new file mode 100644 index 0000000000..10f6d81c98 --- /dev/null +++ b/tracing-subscriber/src/filter/env/parsing.rs @@ -0,0 +1,642 @@ +use super::{ + super::level::{self, LevelFilter}, + field::{Match, ValueMatch}, + Directive, FilterVec, +}; +use std::{borrow::Cow, error::Error, str::FromStr}; + +fn parse_level_filter(s: &str) -> Result::Err> { + if s.is_empty() { + Ok(LevelFilter::TRACE) + } else { + s.parse() + } +} + +/// Macro to select execution path with the index of the first occurance of +/// some given reserved syntax character, or EOI if no characters present. +/// +/// # Example +/// +/// ```rust,ignore +/// let source: &str; +/// # source = ""; +/// switch_syntax!(source => |i| { +/// '(' | ')' => println!("paren at index {}", i), +/// '[' | ']' => println!("brack at index {}", i), +/// '{' | '}' => println!("brace at index {}", i), +/// _ => println!("EOI at index {}", i), +/// }); +/// ``` +macro_rules! switch_syntax { + ($haystack:expr => |$ix:ident| { + $($($needle:tt)|+ => $expr:expr),* $(,)? + }) => {{ + let haystack: &str = &$haystack; + match find_syntax(haystack) { + $((ix, $(switch_syntax!(@syntax $needle))|+) => { + #[allow(unused_variables)] + let $ix = ix; + $expr + })* + } + }}; + + (@syntax '[') => (Some(Syntax::LBrack)); + (@syntax ']') => (Some(Syntax::RBrack)); + (@syntax '{') => (Some(Syntax::LBrace)); + (@syntax '}') => (Some(Syntax::RBrace)); + (@syntax '=') => (Some(Syntax::Equal)); + (@syntax ',') => (Some(Syntax::Comma)); + (@syntax '"') => (Some(Syntax::Quote)); + (@syntax '/') => (Some(Syntax::Slash)); + (@syntax _) => (None); + (@syntax $other:literal) => (compile_error!(concat!("unknown syntax character `", $other, "`"))); +} + +#[repr(u8)] +#[derive(Clone, Copy, PartialEq, Eq)] +enum Syntax { + LBrack = b'[', + RBrack = b']', + LBrace = b'{', + RBrace = b'}', + Equal = b'=', + Comma = b',', + Quote = b'"', + Slash = b'/', +} + +fn find_syntax(haystack: &str) -> (usize, Option) { + use Syntax::*; + haystack + .bytes() + .enumerate() + .find_map(|(i, b)| match b { + b'[' => Some((i, LBrack)), + b']' => Some((i, RBrack)), + b'{' => Some((i, LBrace)), + b'}' => Some((i, RBrace)), + b'=' => Some((i, Equal)), + b',' => Some((i, Comma)), + b'"' => Some((i, Quote)), + b'/' => Some((i, Slash)), + _ => None, + }) + .map_or_else(|| (haystack.len(), None), |(i, c)| (i, Some(c))) +} + +#[derive(Debug)] +pub(super) enum ParseErrorKind { + Field(Box), + Level(level::ParseError), + UnexpectedSyntax(char), + Other, +} + +/// Parse a single directive off the front of the source string. +/// +/// Returns the parsed directive or a parse error, along with the index of +/// the start of the next directive, making an attempt at error recovery +/// in the face of reasonably recoverable parser errors. +/// +/// # Syntax +/// +/// ```text +/// target[span{field=value}]=level +/// ``` +/// +/// All of the directive fields are optional, and multiple `field=value` pairs +/// may be provided, so the following are also valid directives: +/// +/// ```text +/// target +/// =level +/// [{}] +/// [{field=value,field=value}] +/// ``` +#[allow(unused)] +pub(super) fn parse_one_directive(source: &str) -> (Result, usize) { + fn try_recover_with(source: &str, at: usize, syntax: Syntax) -> usize { + let (i, next_syntax) = find_syntax(&source[at..]); + if next_syntax == Some(syntax) { + at + i + 1 + } else { + source.len() + } + } + + fn parse_at_span( + source: &str, + target: Option, + ) -> (Result, usize) { + assert_eq!(source.as_bytes()[0], b'['); + + if source[1..].starts_with('"') { + return match parse_one_quote_string(&source[1..]) { + (None, _) => (Err(ParseErrorKind::Other), source.len()), + (Some(quoted), after_quoted) => match source.as_bytes().get(1 + after_quoted) { + None => (Err(ParseErrorKind::Other), source.len()), + Some(&syntax @ (b'/' | b'[' | b'}' | b'"' | b',' | b'=')) => ( + Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), + source.len(), + ), + Some(b']') => { + let (parsed, after_parsed) = parse_at_level( + &source[1 + after_quoted + 1..], + Some(quoted.into()), + FilterVec::new(), + target, + ); + (parsed, 1 + after_parsed + 1) + } + Some(b'{') => { + let (fields, after_fields) = parse_at_fields(&source[1 + after_quoted..]); + match fields { + Err(e) => (Err(e), source.len()), + Ok(fields) => { + let (parsed, after_parsed) = parse_at_level( + &source[1 + after_quoted + after_fields..], + Some(quoted.into()), + FilterVec::new(), + target, + ); + (parsed, 1 + after_quoted + after_fields + after_parsed) + } + } + } + _ => ( + Err(ParseErrorKind::Other), + try_recover_with(source, 1 + after_quoted, Syntax::Comma), + ), + }, + }; + } + + switch_syntax!(&source[1..] => |i| { + '/' => (Err(ParseErrorKind::UnexpectedSyntax('/')), source.len()), + '[' => (Err(ParseErrorKind::UnexpectedSyntax('[')), source.len()), + '}' => (Err(ParseErrorKind::UnexpectedSyntax('}')), source.len()), + '"' => (Err(ParseErrorKind::UnexpectedSyntax('"')), source.len()), + ',' => (Err(ParseErrorKind::UnexpectedSyntax(',')), source.len()), + '=' => (Err(ParseErrorKind::UnexpectedSyntax('=')), source.len()), + ']' => { + let (parsed, after_parsed) = parse_at_level( + &source[1 + i + 1..], + Some(source[1..1 + i].trim()).filter(|s| !s.is_empty()).map(Into::into), + FilterVec::new(), + target, + ); + (parsed, 1 + i + 1 + after_parsed) + }, + '{' => { + let (fields, after_fields) = parse_at_fields(&source[1 + i..]); + match fields { + Err(e) => (Err(e), source.len()), + Ok(fields) => { + let (parsed, after_parsed) = parse_at_level( + &source[1 + i + after_fields..], + Some(source[1..1 + i].trim()).filter(|s| !s.is_empty()).map(Into::into), + fields, + target, + ); + (parsed, 1 + i + after_fields + after_parsed) + } + } + }, + _ => (Err(ParseErrorKind::Other), source.len()), + }) + } + + // NB: includes parsing the comma, if present + fn parse_at_field(source: &str) -> (Result, usize) { + let mut cursor = 0; + + let name = if source.starts_with('"') { + match parse_one_quote_string(source) { + (None, _) => return (Err(ParseErrorKind::Other), source.len()), + (Some(quoted), after_quoted) => { + cursor = after_quoted; + quoted.into() + } + } + } else { + let (syntax_at, _) = find_syntax(source); + cursor = syntax_at; + source[..cursor].trim().into() + }; + + match source.as_bytes().get(cursor) { + None => (Err(ParseErrorKind::Other), source.len()), + Some(b',') => (Ok(Match { name, value: None }), cursor + 1), + Some(b'}') => (Ok(Match { name, value: None }), cursor), + Some(b'=') => { + cursor += 1; + if source[cursor..].starts_with('"') { + match parse_one_quote_string(&source[cursor..]) { + (None, _) => (Err(ParseErrorKind::Other), source.len()), + (Some(quoted), after_quoted) => { + // Prefer env filter syntax error + cursor += after_quoted; + match source.as_bytes().get(cursor) { + None => (Err(ParseErrorKind::Other), source.len()), + Some(b',') => ( + Ok(Match { name, value: None }).and_then(|mut m| { + m.value = Some( + quoted + .parse::() + .map_err(|e| ParseErrorKind::Field(e.into()))?, + ); + Ok(m) + }), + cursor + 1, + ), + Some(b'}') => ( + Ok(Match { name, value: None }).and_then(|mut m| { + m.value = Some( + quoted + .parse::() + .map_err(|e| ParseErrorKind::Field(e.into()))?, + ); + Ok(m) + }), + cursor, + ), + _ => (Err(ParseErrorKind::Other), source.len()), + } + } + } + } else { + switch_syntax!(&source[cursor..] => |i| { + '/' => (Err(ParseErrorKind::UnexpectedSyntax('/')), source.len()), + '[' => (Err(ParseErrorKind::UnexpectedSyntax('[')), source.len()), + '"' => (Err(ParseErrorKind::UnexpectedSyntax('"')), source.len()), + '{' => (Err(ParseErrorKind::UnexpectedSyntax('{')), source.len()), + '=' => (Err(ParseErrorKind::UnexpectedSyntax('=')), source.len()), + ']' => (Err(ParseErrorKind::UnexpectedSyntax(']')), source.len()), + '}' => match source[cursor..][..i].trim().parse() { + Ok(value) => (Ok(Match { name, value: Some(value) }), cursor + i), + Err(e) => (Err(ParseErrorKind::Field(e.into())), source.len()), + }, + ',' => match source[cursor..][..i].trim().parse() { + Ok(value) => (Ok(Match { name, value: Some(value) }), cursor + i + 1), + Err(e) => (Err(ParseErrorKind::Field(e.into())), source.len()), + }, + _ => (Err(ParseErrorKind::Other), source.len()), + }) + } + } + _ => (Err(ParseErrorKind::Other), source.len()), + } + } + + // NB: includes parsing the rbrack, if present + fn parse_at_fields(source: &str) -> (Result, ParseErrorKind>, usize) { + assert_eq!(source.as_bytes()[0], b'{'); + + let mut fields = FilterVec::new(); + let mut cursor = 1; + while source.as_bytes().get(cursor) != Some(&b'}') { + let (parsed, after_parsed) = parse_at_field(&source[cursor..]); + match parsed { + Err(e) => { + return ( + Err(e), + try_recover_with(source, cursor + after_parsed, Syntax::RBrace), + ) + } + Ok(field) => { + fields.push(field); + cursor += after_parsed; + } + } + } + if source.as_bytes().get(cursor + 1) == Some(&b']') { + (Ok(fields), cursor + 1 + 1) + } else { + (Err(ParseErrorKind::Other), source.len()) + } + } + + fn parse_at_level( + source: &str, + in_span: Option, + fields: FilterVec, + target: Option, + ) -> (Result, usize) { + if !source.starts_with('=') { + // NB: parse_at_comma handles syntax/comma after the level + return ( + Ok(Directive { + in_span, + fields, + target, + level: LevelFilter::TRACE, + }), + 0, + ); + } + + if source[1..].starts_with('"') { + return match parse_one_quote_string(&source[1..]) { + (None, _) => (Err(ParseErrorKind::Other), source.len()), + (Some(quoted), after_quoted) => match parse_level_filter("ed) { + // NB: parse_at_comma handles syntax/comma after the level + Ok(level) => ( + Ok(Directive { + in_span, + fields, + target, + level, + }), + 1 + after_quoted, + ), + Err(err) => (Err(ParseErrorKind::Level(err)), 1 + after_quoted), + }, + }; + } + + switch_syntax!(&source[1..] => |i| { + // Prefer syntax error over potential level parse error + '/' => (Err(ParseErrorKind::UnexpectedSyntax('/')), source.len()), + '[' => (Err(ParseErrorKind::UnexpectedSyntax('[')), source.len()), + '"' => (Err(ParseErrorKind::UnexpectedSyntax('"')), source.len()), + '{' => (Err(ParseErrorKind::UnexpectedSyntax('{')), source.len()), + '}' => (Err(ParseErrorKind::UnexpectedSyntax('}')), 1 + i), + '=' => (Err(ParseErrorKind::UnexpectedSyntax('=')), 1 + i), + ']' => (Err(ParseErrorKind::UnexpectedSyntax(']')), 1 + i), + ',' | _ => match parse_level_filter(&source[1..1 + i]) { + Ok(level) => ( + Ok(Directive { + in_span, + fields, + target, + level, + }), + 1 + i, + ), + Err(err) => (Err(ParseErrorKind::Level(err)), 1 + i), + }, + }) + } + + fn parse_at_comma( + source: &str, + i: usize, + directive: Result, + ) -> (Result, usize) { + match source[i..].as_bytes().get(0) { + None => (directive, i), + Some(b',') => (directive, i + 1), + Some(&syntax @ (b'[' | b'{' | b'"' | b'/')) => ( + Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), + source.len(), + ), + Some(&syntax @ (b']' | b'}' | b'=')) => ( + Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), + try_recover_with(source, i + 1, Syntax::Comma), + ), + _ => ( + Err(ParseErrorKind::Other), + try_recover_with(source, i, Syntax::Comma), + ), + } + } + + if source.starts_with('"') { + return match parse_one_quote_string(source) { + (None, after) => (Err(ParseErrorKind::Other), after), + (Some(quoted), after_quoted) => match source.as_bytes().get(after_quoted) { + None => ( + Ok(Directive { + in_span: None, + fields: FilterVec::new(), + target: Some(quoted.to_string()), + level: LevelFilter::TRACE, + }), + after_quoted, + ), + Some(b',') => ( + Ok(Directive { + in_span: None, + fields: FilterVec::new(), + target: Some(quoted.to_string()), + level: LevelFilter::TRACE, + }), + after_quoted + 1, + ), + Some(&syntax @ (b'/' | b'{')) => ( + Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), + source.len(), + ), + Some(&syntax @ (b']' | b'}')) => ( + Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), + try_recover_with(source, after_quoted + 1, Syntax::Comma), + ), + Some(b'[') => { + let (parsed, after_parsed) = + parse_at_span(&source[after_quoted..], Some(quoted.into())); + parse_at_comma(source, after_parsed, parsed) + } + Some(b'=') => { + let (parsed, after_parsed) = parse_at_level( + &source[after_quoted..], + None, + FilterVec::new(), + Some(quoted.into()), + ); + parse_at_comma(source, after_parsed, parsed) + } + Some(b'"') => (Err(ParseErrorKind::UnexpectedSyntax('"')), source.len()), + _ => ( + Err(ParseErrorKind::Other), + try_recover_with(source, after_quoted, Syntax::Comma), + ), + }, + }; + } + + switch_syntax!(source => |i| { + '/' => (Err(ParseErrorKind::UnexpectedSyntax('/')), source.len()), + '"' => (Err(ParseErrorKind::UnexpectedSyntax('}')), source.len()), + '{' => (Err(ParseErrorKind::UnexpectedSyntax('{')), source.len()), + '}' => (Err(ParseErrorKind::UnexpectedSyntax('}')), try_recover_with(source, i + 1, Syntax::Comma)), + ']' => (Err(ParseErrorKind::UnexpectedSyntax(']')), try_recover_with(source, i + 1, Syntax::Comma)), + ',' => (parse_one_directive(&source[..i]).0, i + 1), + '[' => { + let (parsed, after_parsed) = parse_at_span( + &source[i..], + Some(source[..i].trim()).filter(|s| !s.is_empty()).map(Into::into), + ); + parse_at_comma(source, i + after_parsed, parsed) + }, + '=' => { + let (parsed, after_parsed) = parse_at_level( + &source[i..], + None, + FilterVec::new(), + Some(source[..i].trim()).filter(|s| !s.is_empty()).map(Into::into), + ); + parse_at_comma(source, i + after_parsed, parsed) + }, + _ => match parse_level_filter(source.trim()) { + Ok(level) => (Ok(Directive { + in_span: None, + fields: FilterVec::new(), + target: None, + level, + }), source.len()), + Err(_) => (Ok(Directive { + in_span: None, + fields: FilterVec::new(), + target: Some(source.trim().to_string()), + level: LevelFilter::TRACE, + }), source.len()), + } + }) +} + +/// Parse a single quote string off the front of the source string. +/// +/// Returns the unquoted string, if terminated, as well as the index after the +/// parsed string. +/// +/// Currently has no escape syntax. +fn parse_one_quote_string(source: &str) -> (Option>, usize) { + assert!(source.starts_with('"')); + match source[1..].find('"') { + None => (None, source.len()), + Some(i) => (Some(source[1..1 + i].into()), 1 + i + 1), + } +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn test_quote_parsing() { + macro_rules! check { + ($source:expr => $expected:expr, $expected_after:expr) => {{ + let source: &str = $source; + let expected: Option<&str> = $expected; + let expected_after: &str = $expected_after; + let (parsed, parsed_len) = parse_one_quote_string(source); + assert_eq!( + (parsed, &source[parsed_len..]), + (expected.map(Into::into), expected_after), + "\nexpected {:?} to parse", + source, + ); + }}; + } + + check!(r#""hello""# => Some("hello"), ""); + check!(r#""hello"world"# => Some("hello"), "world"); + check!(r#""hello"# => None, ""); + } + + #[test] + fn test_directive_parsing() { + macro_rules! check_pass { + ($source:expr => $expected:expr, $expected_after:expr) => {{ + let source: &str = $source; + let expected: Directive = $expected; + let expected_after: &str = $expected_after; + let (parsed, parsed_len) = parse_one_directive(source); + let parsed = parsed.unwrap_or_else(|e| { + panic!("Failed to parse directive {:?} with err {:?}", source, e) + }); + assert_eq!( + (parsed, &source[parsed_len..]), + (expected, expected_after), + "\nexpected {:?} to parse", + source, + ); + }}; + } + + macro_rules! collect { + [$($expr:expr),* $(,)?] => { + IntoIterator::into_iter([$($expr),*]).collect() + } + } + + check_pass!("hello" => Directive { + in_span: None, + fields: collect![], + target: Some("hello".into()), + level: LevelFilter::TRACE + }, ""); + + check_pass!("info" => Directive { + in_span: None, + fields: collect![], + target: None, + level: LevelFilter::INFO + }, ""); + + check_pass!("INFO" => Directive { + in_span: None, + fields: collect![], + target: None, + level: LevelFilter::INFO + }, ""); + + check_pass!("hello=debug" => Directive { + in_span: None, + fields: collect![], + target: Some("hello".into()), + level: LevelFilter::DEBUG + }, ""); + + check_pass!("hello,std::option" => Directive { + in_span: None, + fields: collect![], + target: Some("hello".into()), + level: LevelFilter::TRACE + }, "std::option"); + + check_pass!("error,hello=warn" => Directive { + in_span: None, + fields: collect![], + target: None, + level: LevelFilter::ERROR + }, "hello=warn"); + + check_pass!("tokio::net=info" => Directive { + in_span: None, + fields: collect![], + target: Some("tokio::net".into()), + level: LevelFilter::INFO + }, ""); + + check_pass!("my_crate[span_a]=trace" => Directive { + in_span: Some("span_a".into()), + fields: collect![], + target: Some("my_crate".into()), + level: LevelFilter::TRACE + }, ""); + + check_pass!("[span_b{name}]" => Directive { + in_span: Some("span_b".into()), + fields: collect![Match { name: "name".into(), value: None }], + target: None, + level: LevelFilter::TRACE + }, ""); + + check_pass!(r#"[span_b{name=bob}]"# => Directive { + in_span: Some("span_b".into()), + fields: collect![Match { name: "name".into(), value: Some("bob".parse().unwrap()) }], + target: None, + level: LevelFilter::TRACE + }, ""); + + check_pass!(r#"[span_b{name="bob"}]"# => Directive { + in_span: Some("span_b".into()), + fields: collect![Match { name: "name".into(), value: Some("bob".parse().unwrap()) }], + target: None, + level: LevelFilter::TRACE + }, ""); + } +} From 7f97a853e08c04c03cb736821dae5ecd0e9b4e8b Mon Sep 17 00:00:00 2001 From: CAD97 Date: Sat, 25 Sep 2021 18:33:51 -0500 Subject: [PATCH 2/2] Remove use of nested-or-patterns --- tracing-subscriber/src/filter/env/parsing.rs | 42 +++++++++++++------- 1 file changed, 27 insertions(+), 15 deletions(-) diff --git a/tracing-subscriber/src/filter/env/parsing.rs b/tracing-subscriber/src/filter/env/parsing.rs index 10f6d81c98..0c394349d5 100644 --- a/tracing-subscriber/src/filter/env/parsing.rs +++ b/tracing-subscriber/src/filter/env/parsing.rs @@ -34,7 +34,7 @@ macro_rules! switch_syntax { }) => {{ let haystack: &str = &$haystack; match find_syntax(haystack) { - $((ix, $(switch_syntax!(@syntax $needle))|+) => { + $($((ix, switch_syntax!(@syntax $needle)))|+ => { #[allow(unused_variables)] let $ix = ix; $expr @@ -137,10 +137,12 @@ pub(super) fn parse_one_directive(source: &str) -> (Result (Err(ParseErrorKind::Other), source.len()), (Some(quoted), after_quoted) => match source.as_bytes().get(1 + after_quoted) { None => (Err(ParseErrorKind::Other), source.len()), - Some(&syntax @ (b'/' | b'[' | b'}' | b'"' | b',' | b'=')) => ( - Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), - source.len(), - ), + Some(b'/') => (Err(ParseErrorKind::UnexpectedSyntax('/')), source.len()), + Some(b'[') => (Err(ParseErrorKind::UnexpectedSyntax('[')), source.len()), + Some(b'}') => (Err(ParseErrorKind::UnexpectedSyntax('}')), source.len()), + Some(b'"') => (Err(ParseErrorKind::UnexpectedSyntax('"')), source.len()), + Some(b',') => (Err(ParseErrorKind::UnexpectedSyntax(',')), source.len()), + Some(b'=') => (Err(ParseErrorKind::UnexpectedSyntax('=')), source.len()), Some(b']') => { let (parsed, after_parsed) = parse_at_level( &source[1 + after_quoted + 1..], @@ -388,12 +390,20 @@ pub(super) fn parse_one_directive(source: &str) -> (Result (directive, i), Some(b',') => (directive, i + 1), - Some(&syntax @ (b'[' | b'{' | b'"' | b'/')) => ( - Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), - source.len(), + Some(b'[') => (Err(ParseErrorKind::UnexpectedSyntax('[')), source.len()), + Some(b'{') => (Err(ParseErrorKind::UnexpectedSyntax('{')), source.len()), + Some(b'"') => (Err(ParseErrorKind::UnexpectedSyntax('"')), source.len()), + Some(b'/') => (Err(ParseErrorKind::UnexpectedSyntax('/')), source.len()), + Some(b']') => ( + Err(ParseErrorKind::UnexpectedSyntax(']')), + try_recover_with(source, i + 1, Syntax::Comma), ), - Some(&syntax @ (b']' | b'}' | b'=')) => ( - Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), + Some(b'}') => ( + Err(ParseErrorKind::UnexpectedSyntax('}')), + try_recover_with(source, i + 1, Syntax::Comma), + ), + Some(b'=') => ( + Err(ParseErrorKind::UnexpectedSyntax('=')), try_recover_with(source, i + 1, Syntax::Comma), ), _ => ( @@ -425,12 +435,14 @@ pub(super) fn parse_one_directive(source: &str) -> (Result ( - Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), - source.len(), + Some(b'/') => (Err(ParseErrorKind::UnexpectedSyntax('/')), source.len()), + Some(b'{') => (Err(ParseErrorKind::UnexpectedSyntax('{')), source.len()), + Some(b']') => ( + Err(ParseErrorKind::UnexpectedSyntax(']')), + try_recover_with(source, after_quoted + 1, Syntax::Comma), ), - Some(&syntax @ (b']' | b'}')) => ( - Err(ParseErrorKind::UnexpectedSyntax(syntax as char)), + Some(b'}') => ( + Err(ParseErrorKind::UnexpectedSyntax('}')), try_recover_with(source, after_quoted + 1, Syntax::Comma), ), Some(b'[') => {