use faststr::FastStr;
use crate::{
error::Result,
input::{JsonInput, JsonSlice},
lazyvalue::LazyValue,
parser::{Parser, DEFAULT_KEY_BUF_CAPACITY},
reader::{Read, Reader},
};
/// Lazy iterator over the entries of a JSON object.
///
/// Each step yields `Result<(FastStr, LazyValue<'de>)>`: the entry's key and
/// its value as a sub-slice of the input. Instances are created by
/// `to_object_iter` and `to_object_iter_unchecked`.
pub struct ObjectJsonIter<'de> {
/// The JSON input being iterated; yielded values are carved out of it with `slice_ref`.
json: JsonSlice<'de>,
/// Parser over `json`. Starts as `None` and is built on the first call to `next_entry_impl`.
parser: Option<Parser<Read<'de>>>,
/// Scratch buffer handed to `parse_entry_lazy` on every step; allocated once with
/// `DEFAULT_KEY_BUF_CAPACITY` (presumably used while decoding keys — confirm in `Parser`).
strbuf: Vec<u8>,
/// Starts as `true` and is passed by `&mut` to the parser, which maintains it
/// (presumably "no entry has been parsed yet" — confirm in `Parser`).
first: bool,
/// Set once the object is exhausted or a parse error was reported; afterwards the
/// iterator only returns `None`.
ending: bool,
/// Flag forwarded to `Read::new` and `parse_entry_lazy`: `true` for `to_object_iter`,
/// `false` for `to_object_iter_unchecked`.
check: bool,
}
/// Lazy iterator over the elements of a JSON array.
///
/// Each step yields `Result<LazyValue<'de>>`, the element as a sub-slice of the
/// input. Instances are created by `to_array_iter` and `to_array_iter_unchecked`.
pub struct ArrayJsonIter<'de> {
/// The JSON input being iterated; yielded values are carved out of it with `slice_ref`.
json: JsonSlice<'de>,
/// Parser over `json`. Starts as `None` and is built on the first call to `next_elem_impl`.
parser: Option<Parser<Read<'de>>>,
/// Starts as `true` and is passed by `&mut` to the parser, which maintains it
/// (presumably "no element has been parsed yet" — confirm in `Parser`).
first: bool,
/// Set once the array is exhausted or a parse error was reported; afterwards the
/// iterator only returns `None`.
ending: bool,
/// Flag forwarded to `Read::new` and `parse_array_elem_lazy`: `true` for `to_array_iter`,
/// `false` for `to_array_iter_unchecked`.
check: bool,
}
impl<'de> ObjectJsonIter<'de> {
    /// Creates an iterator over the entries of the JSON object in `json`.
    ///
    /// Nothing is parsed here: the parser is built on the first call to
    /// [`Self::next_entry_impl`]. `check` is stored so the `Iterator` impl can
    /// forward it on every step.
    fn new(json: JsonSlice<'de>, check: bool) -> Self {
        Self {
            json,
            parser: None,
            strbuf: Vec::with_capacity(DEFAULT_KEY_BUF_CAPACITY),
            first: true,
            ending: false,
            check,
        }
    }

    /// Parses and returns the next `(key, value)` entry.
    ///
    /// Returns `None` once the object is exhausted or after an error has been
    /// reported. Returns `Some(Err(_))` when the initial UTF-8 check or the
    /// parse of the next entry fails; either failure marks the iterator as
    /// finished. `check` is forwarded to `Read::new` and `parse_entry_lazy`.
    fn next_entry_impl(&mut self, check: bool) -> Option<Result<(FastStr, LazyValue<'de>)>> {
        if self.ending {
            return None;
        }

        // Build the parser lazily on the first call. Matching on the option
        // directly avoids the `is_none()` + `unwrap_unchecked()` pair and the
        // `unsafe` block that came with it.
        let parser = match self.parser {
            Some(ref mut parser) => parser,
            None => {
                let bytes = self.json.as_ref();
                // SAFETY: pointer and length come straight from a live `&[u8]`, so the
                // slice is valid when created. The call only detaches the borrow from
                // `&self` so the parser can be stored next to `self.json`.
                // NOTE(review): soundness relies on the reader being re-pointed via
                // `update_slice` below before every use — confirm.
                let bytes = unsafe { std::slice::from_raw_parts(bytes.as_ptr(), bytes.len()) };
                let parser = Parser::new(Read::new(bytes, check));
                // Report invalid UTF-8 up front, before any entry is yielded.
                if let Err(err) = parser.read.check_utf8_final() {
                    self.ending = true;
                    return Some(Err(err));
                }
                self.parser.insert(parser)
            }
        };

        // SAFETY: passes the current base pointer of `self.json`.
        // NOTE(review): presumably this re-anchors the reader in case the backing
        // bytes moved together with `self` since the last call — confirm against
        // `Read::update_slice`.
        unsafe { parser.read.update_slice(self.json.as_ref().as_ptr()) };

        match parser.parse_entry_lazy(&mut self.strbuf, &mut self.first, check) {
            Ok(Some((key, val, has_escaped))) => {
                let val = self.json.slice_ref(val);
                // NOTE(review): an `Err` from `LazyValue::new` is passed through
                // without setting `ending`, unlike the other error paths — confirm
                // this is intended.
                Some(LazyValue::new(val, has_escaped).map(|v| (key, v)))
            }
            Ok(None) => {
                self.ending = true;
                None
            }
            Err(err) => {
                self.ending = true;
                Some(Err(err))
            }
        }
    }
}
impl<'de> ArrayJsonIter<'de> {
    /// Creates an iterator over the elements of the JSON array in `json`.
    ///
    /// Nothing is parsed here: the parser is built on the first call to
    /// [`Self::next_elem_impl`]. `check` is stored so the `Iterator` impl can
    /// forward it on every step.
    fn new(json: JsonSlice<'de>, check: bool) -> Self {
        Self {
            json,
            parser: None,
            first: true,
            ending: false,
            check,
        }
    }

    /// Parses and returns the next array element.
    ///
    /// Returns `None` once the array is exhausted or after an error has been
    /// reported. Returns `Some(Err(_))` when the initial UTF-8 check or the
    /// parse of the next element fails; either failure marks the iterator as
    /// finished. `check` is forwarded to `Read::new` and
    /// `parse_array_elem_lazy`.
    fn next_elem_impl(&mut self, check: bool) -> Option<Result<LazyValue<'de>>> {
        if self.ending {
            return None;
        }

        // Build the parser lazily on the first call. Matching on the option
        // directly removes the `is_none()` + `unwrap()` pair and its panic path.
        let parser = match self.parser {
            Some(ref mut parser) => parser,
            None => {
                let bytes = self.json.as_ref();
                // SAFETY: pointer and length come straight from a live `&[u8]`, so the
                // slice is valid when created. The call only detaches the borrow from
                // `&self` so the parser can be stored next to `self.json`.
                // NOTE(review): soundness relies on the reader being re-pointed via
                // `update_slice` below before every use — confirm.
                let bytes = unsafe { std::slice::from_raw_parts(bytes.as_ptr(), bytes.len()) };
                let parser = Parser::new(Read::new(bytes, check));
                // Report invalid UTF-8 up front, before any element is yielded.
                if let Err(err) = parser.read.check_utf8_final() {
                    self.ending = true;
                    return Some(Err(err));
                }
                self.parser.insert(parser)
            }
        };

        // SAFETY: passes the current base pointer of `self.json`.
        // NOTE(review): presumably this re-anchors the reader in case the backing
        // bytes moved together with `self` since the last call — confirm against
        // `Read::update_slice`.
        unsafe { parser.read.update_slice(self.json.as_ref().as_ptr()) };

        match parser.parse_array_elem_lazy(&mut self.first, check) {
            Ok(Some((raw, has_escaped))) => {
                let val = self.json.slice_ref(raw);
                // NOTE(review): an `Err` from `LazyValue::new` is passed through
                // without setting `ending`, unlike the other error paths — confirm
                // this is intended.
                Some(LazyValue::new(val, has_escaped))
            }
            Ok(None) => {
                self.ending = true;
                None
            }
            Err(err) => {
                self.ending = true;
                Some(Err(err))
            }
        }
    }
}
/// Builds an [`ObjectJsonIter`] over `json` with checking enabled.
///
/// The input is converted with `to_json_slice` and the iterator is created
/// with its `check` flag set to `true`. Nothing is parsed until the iterator
/// is advanced; each step then yields `Result<(FastStr, LazyValue)>`.
pub fn to_object_iter<'de, I: JsonInput<'de>>(json: I) -> ObjectJsonIter<'de> {
    let slice = json.to_json_slice();
    ObjectJsonIter::new(slice, true)
}
/// Builds an [`ArrayJsonIter`] over `json` with checking enabled.
///
/// The input is converted with `to_json_slice` and the iterator is created
/// with its `check` flag set to `true`. Nothing is parsed until the iterator
/// is advanced; each step then yields `Result<LazyValue>`.
pub fn to_array_iter<'de, I: JsonInput<'de>>(json: I) -> ArrayJsonIter<'de> {
    let slice = json.to_json_slice();
    ArrayJsonIter::new(slice, true)
}
/// Builds an [`ObjectJsonIter`] over `json` with checking disabled.
///
/// Identical to `to_object_iter` except that the iterator's `check` flag is
/// `false`.
///
/// # Safety
///
/// The `false` flag is forwarded to the reader and to every parse call made
/// by the iterator. NOTE(review): presumably the caller must guarantee that
/// `json` is well-formed, valid UTF-8 JSON — confirm the exact contract
/// against `Read` and `Parser`.
pub unsafe fn to_object_iter_unchecked<'de, I: JsonInput<'de>>(json: I) -> ObjectJsonIter<'de> {
    let slice = json.to_json_slice();
    ObjectJsonIter::new(slice, false)
}
/// Builds an [`ArrayJsonIter`] over `json` with checking disabled.
///
/// Identical to `to_array_iter` except that the iterator's `check` flag is
/// `false`.
///
/// # Safety
///
/// The `false` flag is forwarded to the reader and to every parse call made
/// by the iterator. NOTE(review): presumably the caller must guarantee that
/// `json` is well-formed, valid UTF-8 JSON — confirm the exact contract
/// against `Read` and `Parser`.
pub unsafe fn to_array_iter_unchecked<'de, I: JsonInput<'de>>(json: I) -> ArrayJsonIter<'de> {
    let slice = json.to_json_slice();
    ArrayJsonIter::new(slice, false)
}
impl<'de> Iterator for ObjectJsonIter<'de> {
    /// One object entry: the key and its lazily-held value, or the error hit
    /// while producing it.
    type Item = Result<(FastStr, LazyValue<'de>)>;

    /// Advances to the next entry, using the `check` flag chosen at construction.
    fn next(&mut self) -> Option<Self::Item> {
        let check = self.check;
        self.next_entry_impl(check)
    }
}
impl<'de> Iterator for ArrayJsonIter<'de> {
    /// One array element held lazily, or the error hit while producing it.
    type Item = Result<LazyValue<'de>>;

    /// Advances to the next element, using the `check` flag chosen at construction.
    fn next(&mut self) -> Option<Self::Item> {
        let check = self.check;
        self.next_elem_impl(check)
    }
}
// Unit tests for the lazy object/array iterators.
#[cfg(test)]
mod test {
use bytes::Bytes;
use super::*;
use crate::{value::JsonValueTrait, JsonType};
// Walks one object with the checked and the unchecked iterator in lockstep and
// compares key, raw value text and value type for every entry; then covers
// exhaustion, the empty object and a malformed object.
#[test]
fn test_object_iter() {
let json = Bytes::from(
r#"{
"string": "Hello, world!",
"number": 42,
"boolean": true,
"null": null,
"array": ["foo","bar","baz"],
"object": {"name": "Alice"},
"empty": {},
"": [],
"escaped\"": "\"\"",
"\t": "\n",
"\u0000": "\u0001"
}"#,
);
// Sanity check: the fixture itself must be accepted by serde_json.
let _v: serde_json::Value = serde_json::from_slice(json.as_ref()).unwrap();
let mut iter = to_object_iter(&json);
let mut iter_unchecked = unsafe { to_object_iter_unchecked(&json) };
// Pulls the next entry from both iterators and checks each against the
// expected key, raw value text and JSON type.
let mut test_ok = |key: &str, val: &str, typ: JsonType| {
let ret = iter.next().unwrap().unwrap();
assert_eq!(ret.0.as_str(), key);
assert_eq!(
ret.1.as_raw_str().as_bytes(),
val.as_bytes(),
"key is {} ",
key
);
assert_eq!(ret.1.get_type(), typ);
let ret = iter_unchecked.next().unwrap().unwrap();
assert_eq!(ret.0.as_str(), key);
assert_eq!(
ret.1.as_raw_str().as_bytes(),
val.as_bytes(),
"key is {} ",
key
);
assert_eq!(ret.1.get_type(), typ);
};
// Keys are expected in decoded form, while values are compared as raw JSON
// text with their escapes intact.
test_ok("string", r#""Hello, world!""#, JsonType::String);
test_ok("number", "42", JsonType::Number);
test_ok("boolean", "true", JsonType::Boolean);
test_ok("null", "null", JsonType::Null);
test_ok("array", r#"["foo","bar","baz"]"#, JsonType::Array);
test_ok("object", r#"{"name": "Alice"}"#, JsonType::Object);
test_ok("empty", r#"{}"#, JsonType::Object);
test_ok("", r#"[]"#, JsonType::Array);
test_ok("escaped\"", r#""\"\"""#, JsonType::String);
test_ok("\t", r#""\n""#, JsonType::String);
test_ok("\x00", r#""\u0001""#, JsonType::String);
// Once exhausted, the iterator keeps returning `None`.
assert!(iter.next().is_none());
assert!(iter.next().is_none());
// An empty object yields nothing, however often it is polled.
let json = Bytes::from("{}");
let mut iter = to_object_iter(&json);
assert!(iter.next().is_none());
assert!(iter.next().is_none());
assert!(iter.next().is_none());
// A malformed object reports exactly one error and then ends.
let json = Bytes::from("{xxxxxx");
let mut iter = to_object_iter(&json);
assert!(iter.next().unwrap().is_err());
assert!(iter.next().is_none());
}
// Walks one array with the checked and the unchecked iterator in lockstep and
// compares raw text and value type for every element; then covers exhaustion,
// the empty array and a malformed array.
#[test]
fn test_array_iter() {
let json = Bytes::from(
r#"[
"",
"\\\"\"",
"{\"a\":null}",
"Hello, world!",
0,
1,
11,
1000,
42,
42.0,
42e-1,
4.2e+1,
2333.2e+1,
0.0000000999e8,
true,
null,
["foo","bar","baz"],
{"name": "Alice"},
[],
{}
]"#,
);
let mut iter = to_array_iter(&json);
let mut iter_unchecked = unsafe { to_array_iter_unchecked(&json) };
// Pulls the next element from both iterators and checks each against the
// expected raw text and JSON type.
let mut test_ok = |val: &str, typ: JsonType| {
let ret: LazyValue<'_> = iter.next().unwrap().unwrap();
assert_eq!(ret.as_raw_str(), val);
assert_eq!(ret.get_type(), typ);
let ret = iter_unchecked.next().unwrap().unwrap();
assert_eq!(ret.as_raw_str().as_bytes(), val.as_bytes());
assert_eq!(ret.get_type(), typ);
};
test_ok(r#""""#, JsonType::String);
test_ok(r#""\\\"\"""#, JsonType::String);
test_ok(r#""{\"a\":null}""#, JsonType::String);
test_ok(r#""Hello, world!""#, JsonType::String);
test_ok("0", JsonType::Number);
test_ok("1", JsonType::Number);
test_ok("11", JsonType::Number);
test_ok("1000", JsonType::Number);
test_ok("42", JsonType::Number);
test_ok("42.0", JsonType::Number);
test_ok("42e-1", JsonType::Number);
test_ok("4.2e+1", JsonType::Number);
test_ok("2333.2e+1", JsonType::Number);
test_ok("0.0000000999e8", JsonType::Number);
test_ok("true", JsonType::Boolean);
test_ok("null", JsonType::Null);
test_ok(r#"["foo","bar","baz"]"#, JsonType::Array);
test_ok(r#"{"name": "Alice"}"#, JsonType::Object);
test_ok(r#"[]"#, JsonType::Array);
test_ok(r#"{}"#, JsonType::Object);
// Once exhausted, the iterator keeps returning `None`.
assert!(iter.next().is_none());
assert!(iter.next().is_none());
// An empty array yields nothing, however often it is polled.
let json = Bytes::from("[]");
let mut iter = to_array_iter(&json);
assert!(iter.next().is_none());
assert!(iter.next().is_none());
assert!(iter.next().is_none());
// A malformed array reports exactly one error and then ends.
let json = Bytes::from("[xxxxxx");
let mut iter = to_array_iter(&json);
assert!(iter.next().unwrap().is_err());
assert!(iter.next().is_none());
}
// Feeds iterator output into further processing: deserializing each element,
// and collecting element types.
#[test]
fn test_iter_deserialize() {
let json = Bytes::from(r#"[1, 2, 3, 4, 5, 6]"#);
let iter = to_array_iter(&json);
// `flatten` drops any `Err` items; each remaining element is parsed as `u8`,
// falling back to the default value on failure.
let out: Vec<u8> = iter
.flatten()
.map(|e| crate::from_str::<u8>(e.as_raw_str()).unwrap_or_default())
.collect();
assert_eq!(out.as_slice(), &[1, 2, 3, 4, 5, 6]);
let json = Bytes::from(r#"[1, true, "hello", null, 5, 6]"#);
let iter = to_array_iter(&json);
// The collected types are only printed, not asserted.
let out: Vec<JsonType> = iter.map(|e| e.get_type()).collect();
println!("array elem type is {:?}", out);
}
// Every element of an array containing a negative exponent-form number must
// come back as `Ok`; the raw text is only printed.
#[test]
fn test_num_iter() {
for i in to_array_iter("[6,-9E6]") {
println!("{:?}", i.unwrap().as_raw_str());
}
}
// Inputs whose string contains the invalid UTF-8 bytes 0x80 0x90 must produce
// the exact error message below. The assertion only runs for items the
// iterator actually yields.
#[test]
fn test_json_iter_for_utf8() {
let data = [b'[', b'"', 0, 0, 0, 0x80, 0x90, b'"', b']'];
let iter = to_array_iter(&data[..]);
for item in iter {
assert_eq!(
item.err().unwrap().to_string(),
"Invalid UTF-8 characters in json at line 1 column \
5\n\n\t[\"\0\0\0��\"]\n\t.....^...\n"
);
}
// Same check for an object whose key carries the invalid bytes.
let data = [
b'{', b'"', 0, 0, 0, 0x80, 0x90, b'"', b':', b'"', b'"', b'}',
];
let iter = to_object_iter(&data[..]);
for item in iter {
assert_eq!(
item.err().unwrap().to_string(),
"Invalid UTF-8 characters in json at line 1 column \
5\n\n\t{\"\0\0\0��\":\"\"}\n\t.....^......\n"
);
}
}
}