High performance xml pull reader/writer.
Syntax is inspired by xml-rs.
[dependencies]
quick-xml = "0.1.9"
extern crate quick_xml;
use quick_xml::{XmlReader, Event};
let xml = r#"<tag1 att1 = "test">
<tag2><!--Test comment-->Test</tag2>
<tag2>
Test 2
</tag2>
</tag1>"#;
let reader = XmlReader::from(xml).trim_text(true);
// if you want to use namespaces, you just need to convert the `XmlReader`
// to an `XmlnsReader`:
// let reader_ns = reader.namespaced();
let mut count = 0;
let mut txt = Vec::new();
for r in reader {
// namespaced: the `for` loop moves the reader
// => use `while let` so you can have access to `reader_ns.resolve` for attributes
// while let Some(r) = reader.next() {
match r {
Ok(Event::Start(ref e)) => {
// for namespaced:
// Ok((ref namespace_value, Event::Start(ref e)))
match e.name() {
b"tag1" => println!("attributes values: {:?}",
e.attributes().map(|a| a.unwrap().1)
// namespaced: use `reader_ns.resolve`
// e.attributes().map(|a| a.map(|(k, _)| reader_ns.resolve(k))) ...
.collect::<Vec<_>>()),
b"tag2" => count += 1,
_ => (),
}
},
Ok(Event::Text(e)) => txt.push(e.into_string()),
Err((e, pos)) => panic!("{:?} at position {}", e, pos),
_ => (),
}
}
use quick_xml::{AsStr, Element, Event, XmlReader, XmlWriter};
use quick_xml::Event::*;
use std::io::Cursor;
use std::iter;
let xml = r#"<this_tag k1="v1" k2="v2"><child>text</child></this_tag>"#;
let reader = XmlReader::from(xml).trim_text(true);
let mut writer = XmlWriter::new(Cursor::new(Vec::new()));
for r in reader {
match r {
Ok(Event::Start(ref e)) if e.name() == b"this_tag" => {
// collect existing attributes
let mut attrs = e.attributes().map(|attr| attr.unwrap()).collect::<Vec<_>>();
// copy existing attributes, adds a new my-key="some value" attribute
let mut elem = Element::new("my_elem").with_attributes(attrs);
elem.push_attribute(b"my-key", "some value");
// writes the event to the writer
assert!(writer.write(Start(elem)).is_ok());
},
Ok(Event::End(ref e)) if e.name() == b"this_tag" => {
assert!(writer.write(End(Element::new("my_elem"))).is_ok());
},
Ok(e) => assert!(writer.write(e).is_ok()),
Err((e, pos)) => panic!("{:?} at position {}", e, pos),
}
}
let result = writer.into_inner().into_inner();
let expected = r#"<my_elem k1="v1" k2="v2" my-key="some value"><child>text</child></my_elem>"#;
assert_eq!(result, expected.as_bytes());
You can benchmark with other libraries using features:
cargo bench --features bench-xml-rs
cargo bench --features bench-rusty-xml
Results:
test bench_quick_xml ... bench: 610,970 ns/iter (+/- 40,766)
test bench_quick_xml_escaped ... bench: 721,361 ns/iter (+/- 21,095)
test bench_quick_xml_namespaced ... bench: 820,220 ns/iter (+/- 11,309)
test bench_xml_rs ... bench: 14,012,890 ns/iter (+/- 12,378,389)
test bench_rusty_xml ... bench: 5,543,993 ns/iter (+/- 326,792)
- namespaces
- non-utf8
- most methods return
&u[u8]
- escaped characters are properly managed
- what else?
- most methods return
- parse xml declaration
- benchmarks
- escape characters
- more checks
- ... ?
- attribute values with
>
character will likely result in parsing error
Any PR is welcomed!
MIT