use std::{collections::btree_map, fmt::Write as _, iter, slice, sync::LazyLock};
use regex::Regex;
use serde::{Serialize, Serializer};
use vrl::path::PathPrefix;
use crate::event::{KeyString, ObjectMap, Value};
static IS_VALID_PATH_SEGMENT: LazyLock<Regex> =
LazyLock::new(|| Regex::new(r"^[a-zA-Z0-9_]+$").unwrap());
pub fn all_fields(fields: &ObjectMap) -> FieldsIter {
FieldsIter::new(None, fields, true)
}
pub fn all_fields_unquoted(fields: &ObjectMap) -> FieldsIter {
FieldsIter::new(None, fields, false)
}
pub fn all_metadata_fields(fields: &ObjectMap) -> FieldsIter {
FieldsIter::new(Some(PathPrefix::Metadata), fields, true)
}
pub fn all_fields_non_object_root(value: &Value) -> FieldsIter {
FieldsIter::non_object(value)
}
pub fn all_fields_skip_array_elements(fields: &ObjectMap) -> FieldsIter {
FieldsIter::new_with_skip_array_elements(fields)
}
#[derive(Clone, Debug)]
enum LeafIter<'a> {
Root((&'a Value, bool)),
Map(btree_map::Iter<'a, KeyString, Value>),
Array(iter::Enumerate<slice::Iter<'a, Value>>),
}
#[derive(Clone, Copy, Debug)]
enum PathComponent<'a> {
Key(&'a KeyString),
Index(usize),
}
#[derive(Clone)]
pub struct FieldsIter<'a> {
path_prefix: Option<PathPrefix>,
stack: Vec<LeafIter<'a>>,
path: Vec<PathComponent<'a>>,
skip_array_elements: bool,
quote_invalid_fields: bool,
}
impl<'a> FieldsIter<'a> {
fn new(
path_prefix: Option<PathPrefix>,
fields: &'a ObjectMap,
quote_invalid_fields: bool,
) -> FieldsIter<'a> {
FieldsIter {
path_prefix,
stack: vec![LeafIter::Map(fields.iter())],
path: vec![],
skip_array_elements: false,
quote_invalid_fields,
}
}
fn non_object(value: &'a Value) -> FieldsIter<'a> {
FieldsIter {
path_prefix: None,
stack: vec![LeafIter::Root((value, false))],
path: vec![],
skip_array_elements: false,
quote_invalid_fields: true,
}
}
fn new_with_skip_array_elements(fields: &'a ObjectMap) -> FieldsIter<'a> {
FieldsIter {
path_prefix: None,
stack: vec![LeafIter::Map(fields.iter())],
path: vec![],
skip_array_elements: true,
quote_invalid_fields: true,
}
}
fn push(&mut self, value: &'a Value, component: PathComponent<'a>) -> Option<&'a Value> {
match value {
Value::Object(map) if !map.is_empty() => {
self.stack.push(LeafIter::Map(map.iter()));
self.path.push(component);
None
}
Value::Array(array) if !array.is_empty() => {
if self.skip_array_elements {
Some(value)
} else {
self.stack.push(LeafIter::Array(array.iter().enumerate()));
self.path.push(component);
None
}
}
_ => Some(value),
}
}
fn pop(&mut self) {
self.stack.pop();
self.path.pop();
}
fn make_path(&mut self, component: PathComponent<'a>) -> KeyString {
let mut res = match self.path_prefix {
None => String::new(),
Some(prefix) => match prefix {
PathPrefix::Event => String::from("."),
PathPrefix::Metadata => String::from("%"),
},
};
let mut path_iter = self.path.iter().chain(iter::once(&component)).peekable();
loop {
match path_iter.next() {
None => break res.into(),
Some(PathComponent::Key(key)) => {
if self.quote_invalid_fields && !IS_VALID_PATH_SEGMENT.is_match(key) {
res.push_str(&format!("\"{key}\""));
} else {
res.push_str(key);
}
}
Some(PathComponent::Index(index)) => {
write!(res, "[{index}]").expect("write to String never fails");
}
}
if let Some(PathComponent::Key(_)) = path_iter.peek() {
res.push('.');
}
}
}
}
impl<'a> Iterator for FieldsIter<'a> {
type Item = (KeyString, &'a Value);
fn next(&mut self) -> Option<Self::Item> {
loop {
match self.stack.last_mut() {
None => return None,
Some(LeafIter::Map(map_iter)) => match map_iter.next() {
None => self.pop(),
Some((key, value)) => {
if let Some(scalar_value) = self.push(value, PathComponent::Key(key)) {
return Some((self.make_path(PathComponent::Key(key)), scalar_value));
}
}
},
Some(LeafIter::Array(array_iter)) => match array_iter.next() {
None => self.pop(),
Some((index, value)) => {
if let Some(scalar_value) = self.push(value, PathComponent::Index(index)) {
return Some((
self.make_path(PathComponent::Index(index)),
scalar_value,
));
}
}
},
Some(LeafIter::Root((value, visited))) => {
let result = (!*visited).then(|| ("message".into(), *value));
*visited = true;
break result;
}
};
}
}
}
impl Serialize for FieldsIter<'_> {
fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where
S: Serializer,
{
serializer.collect_map(self.clone())
}
}
#[cfg(test)]
mod test {
use serde_json::json;
use similar_asserts::assert_eq;
use super::{super::test::fields_from_json, *};
#[test]
fn keys_simple() {
let fields = fields_from_json(json!({
"field2": 3,
"field1": 4,
"field3": 5
}));
let expected: Vec<_> = vec![
("field1", &Value::Integer(4)),
("field2", &Value::Integer(3)),
("field3", &Value::Integer(5)),
]
.into_iter()
.map(|(k, v)| (k.into(), v))
.collect();
let collected: Vec<_> = all_fields(&fields).collect();
assert_eq!(collected, expected);
}
fn special_fields() -> ObjectMap {
fields_from_json(json!({
"a-b": 1,
"a*b": 2,
"a b": 3,
".a .b*": 4,
"\"a\"": 5,
}))
}
#[test]
fn keys_special_quoted() {
let fields = special_fields();
let mut collected: Vec<_> = all_fields(&fields).collect();
collected.sort_by(|(a, _), (b, _)| a.cmp(b));
let mut expected: Vec<(KeyString, &Value)> = vec![
("\"a-b\"", &Value::Integer(1)),
("\"a*b\"", &Value::Integer(2)),
("\"a b\"", &Value::Integer(3)),
("\".a .b*\"", &Value::Integer(4)),
("\"\"a\"\"", &Value::Integer(5)),
]
.into_iter()
.map(|(k, v)| (k.into(), v))
.collect();
expected.sort_by(|(a, _), (b, _)| a[1..].cmp(&b[1..]));
assert_eq!(collected, expected);
}
#[test]
fn keys_special_unquoted() {
let fields = special_fields();
let mut collected: Vec<_> = all_fields_unquoted(&fields).collect();
collected.sort_by(|(a, _), (b, _)| a.cmp(b));
let mut expected: Vec<(KeyString, &Value)> = vec![
("a-b", &Value::Integer(1)),
("a*b", &Value::Integer(2)),
("a b", &Value::Integer(3)),
(".a .b*", &Value::Integer(4)),
("\"a\"", &Value::Integer(5)),
]
.into_iter()
.map(|(k, v)| (k.into(), v))
.collect();
expected.sort_by(|(a, _), (b, _)| a.cmp(b));
assert_eq!(collected, expected);
}
#[test]
fn metadata_keys_simple() {
let fields = fields_from_json(json!({
"field_1": 1,
"field_0": 0,
"field_2": 2
}));
let expected: Vec<_> = vec![
("%field_0", &Value::Integer(0)),
("%field_1", &Value::Integer(1)),
("%field_2", &Value::Integer(2)),
]
.into_iter()
.map(|(k, v)| (k.into(), v))
.collect();
let collected: Vec<_> = all_metadata_fields(&fields).collect();
assert_eq!(collected, expected);
}
fn nested_fields() -> ObjectMap {
fields_from_json(json!({
"a": {
"b": {
"c": 5
},
"a": 4,
"array": [null, 3, {
"x": 1
}, [2]]
},
"a.b.c": 6,
"d": {},
"e": [],
}))
}
#[test]
fn keys_nested_quoted() {
let fields = nested_fields();
let expected: Vec<_> = vec![
("a.a", Value::Integer(4)),
("a.array[0]", Value::Null),
("a.array[1]", Value::Integer(3)),
("a.array[2].x", Value::Integer(1)),
("a.array[3][0]", Value::Integer(2)),
("a.b.c", Value::Integer(5)),
("\"a.b.c\"", Value::Integer(6)),
("d", Value::Object(ObjectMap::new())),
("e", Value::Array(Vec::new())),
]
.into_iter()
.map(|(k, v)| (k.into(), v))
.collect();
let collected: Vec<_> = all_fields(&fields).map(|(k, v)| (k, v.clone())).collect();
assert_eq!(collected, expected);
}
#[test]
fn keys_nested_unquoted() {
let fields = nested_fields();
let expected: Vec<_> = vec![
("a.a", Value::Integer(4)),
("a.array[0]", Value::Null),
("a.array[1]", Value::Integer(3)),
("a.array[2].x", Value::Integer(1)),
("a.array[3][0]", Value::Integer(2)),
("a.b.c", Value::Integer(5)),
("a.b.c", Value::Integer(6)),
("d", Value::Object(ObjectMap::new())),
("e", Value::Array(Vec::new())),
]
.into_iter()
.map(|(k, v)| (k.into(), v))
.collect();
let collected: Vec<_> = all_fields_unquoted(&fields)
.map(|(k, v)| (k, v.clone()))
.collect();
assert_eq!(collected, expected);
}
#[test]
fn test_non_object_root() {
let value = Value::Integer(3);
let collected: Vec<_> = all_fields_non_object_root(&value)
.map(|(k, v)| (k.into(), v.clone()))
.collect();
assert_eq!(collected, vec![("message".to_owned(), value)]);
}
}