Skip to content

Commit

Permalink
Merge pull request tafia#662 from Mingun/followup-580
Browse files Browse the repository at this point in the history
Fix incorrect test for 580 and get rid of allocations in hot path
  • Loading branch information
Mingun authored Oct 9, 2023
2 parents c79ad58 + 9e8158c commit ca1c09a
Show file tree
Hide file tree
Showing 6 changed files with 109 additions and 95 deletions.
2 changes: 2 additions & 0 deletions Changelog.md
Original file line number Diff line number Diff line change
Expand Up @@ -37,6 +37,7 @@ MSRV bumped to 1.56! Crate now uses Rust 2021 edition.
- [#649]: Make features linkable and reference them in the docs.
- [#619]: Allow to raise application errors in `ElementWriter::write_inner_content`
(and newly added `ElementWriter::write_inner_content_async` of course).
- [#662]: Get rid of some allocations during serde deserialization.

[#545]: https://github.com/tafia/quick-xml/pull/545
[#580]: https://github.com/tafia/quick-xml/issues/580
Expand All @@ -47,6 +48,7 @@ MSRV bumped to 1.56! Crate now uses Rust 2021 edition.
[#651]: https://github.com/tafia/quick-xml/pull/651
[#660]: https://github.com/tafia/quick-xml/pull/660
[#661]: https://github.com/tafia/quick-xml/pull/661
[#662]: https://github.com/tafia/quick-xml/pull/662


## 0.30.0 -- 2023-07-23
Expand Down
102 changes: 51 additions & 51 deletions src/de/map.rs
Original file line number Diff line number Diff line change
Expand Up @@ -12,13 +12,13 @@ use crate::{
name::QName,
};
use serde::de::value::BorrowedStrDeserializer;
use serde::de::{self, DeserializeSeed, SeqAccess, Visitor};
use serde::de::{self, DeserializeSeed, MapAccess, SeqAccess, Visitor};
use serde::serde_if_integer128;
use std::borrow::Cow;
use std::ops::Range;

/// Defines a source that should be used to deserialize a value in the next call
/// to [`next_value_seed()`](de::MapAccess::next_value_seed)
/// to [`next_value_seed()`](MapAccess::next_value_seed)
#[derive(Debug, PartialEq)]
enum ValueSource {
/// Source are not specified, because [`next_key_seed()`] not yet called.
Expand All @@ -28,8 +28,8 @@ enum ValueSource {
/// Attempt to call [`next_value_seed()`] while accessor in this state would
/// return a [`DeError::KeyNotRead`] error.
///
/// [`next_key_seed()`]: de::MapAccess::next_key_seed
/// [`next_value_seed()`]: de::MapAccess::next_value_seed
/// [`next_key_seed()`]: MapAccess::next_key_seed
/// [`next_value_seed()`]: MapAccess::next_value_seed
Unknown,
/// Next value should be deserialized from an attribute value; value is located
/// at specified span.
Expand Down Expand Up @@ -62,7 +62,7 @@ enum ValueSource {
/// When in this state, next event, returned by [`next()`], will be a [`Start`],
/// which represents both a key, and a value. Value would be deserialized from
/// the whole element and how is will be done determined by the value deserializer.
/// The [`MapAccess`] do not consume any events in that state.
/// The [`ElementMapAccess`] do not consume any events in that state.
///
/// Because in that state any encountered `<tag>` is mapped to the [`VALUE_KEY`]
/// field, it is possible to use tag name as an enum discriminator, so `enum`s
Expand Down Expand Up @@ -105,7 +105,7 @@ enum ValueSource {
/// [`next()`]: Deserializer::next()
/// [`name()`]: BytesStart::name()
/// [`Text`]: Self::Text
/// [list of known fields]: MapAccess::fields
/// [list of known fields]: ElementMapAccess::fields
Content,
/// Next value should be deserialized from an element with a dedicated name.
/// If deserialized type is a sequence, then that sequence will collect all
Expand All @@ -118,7 +118,7 @@ enum ValueSource {
/// When in this state, next event, returned by [`next()`], will be a [`Start`],
/// which represents both a key, and a value. Value would be deserialized from
/// the whole element and how is will be done determined by the value deserializer.
/// The [`MapAccess`] do not consume any events in that state.
/// The [`ElementMapAccess`] do not consume any events in that state.
///
/// An illustration below shows, what data is used to deserialize key and value:
/// ```xml
Expand Down Expand Up @@ -164,16 +164,16 @@ enum ValueSource {
/// internal buffer of deserializer (i.e. deserializer itself) or an input
/// (in that case it is possible to approach zero-copy deserialization).
///
/// - `'a` lifetime represents a parent deserializer, which could own the data
/// - `'d` lifetime represents a parent deserializer, which could own the data
/// buffer.
pub(crate) struct MapAccess<'de, 'a, R, E>
pub(crate) struct ElementMapAccess<'de, 'd, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
{
/// Tag -- owner of attributes
start: BytesStart<'de>,
de: &'a mut Deserializer<'de, R, E>,
de: &'d mut Deserializer<'de, R, E>,
/// State of the iterator over attributes. Contains the next position in the
/// inner `start` slice, from which next attribute should be parsed.
iter: IterState,
Expand All @@ -192,18 +192,18 @@ where
has_value_field: bool,
}

impl<'de, 'a, R, E> MapAccess<'de, 'a, R, E>
impl<'de, 'd, R, E> ElementMapAccess<'de, 'd, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
{
/// Create a new MapAccess
/// Create a new ElementMapAccess
pub fn new(
de: &'a mut Deserializer<'de, R, E>,
de: &'d mut Deserializer<'de, R, E>,
start: BytesStart<'de>,
fields: &'static [&'static str],
) -> Result<Self, DeError> {
Ok(MapAccess {
Ok(Self {
de,
iter: IterState::new(start.name().as_ref().len(), false),
start,
Expand All @@ -214,7 +214,7 @@ where
}
}

impl<'de, 'a, R, E> de::MapAccess<'de> for MapAccess<'de, 'a, R, E>
impl<'de, 'd, R, E> MapAccess<'de> for ElementMapAccess<'de, 'd, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
Expand Down Expand Up @@ -289,9 +289,14 @@ where
seed.deserialize(de).map(Some)
}
// Stop iteration after reaching a closing tag
DeEvent::End(e) if e.name() == self.start.name() => Ok(None),
// This is a unmatched closing tag, so the XML is invalid
DeEvent::End(e) => Err(DeError::UnexpectedEnd(e.name().as_ref().to_owned())),
// The matching tag name is guaranteed by the reader if our
// deserializer implementation is correct
DeEvent::End(e) => {
debug_assert_eq!(self.start.name(), e.name());
// Consume End
self.de.next()?;
Ok(None)
}
// We cannot get `Eof` legally, because we always inside of the
// opened tag `self.start`
DeEvent::Eof => Err(DeError::UnexpectedEof),
Expand Down Expand Up @@ -403,7 +408,7 @@ macro_rules! forward {
/// with the same deserializer;
/// - sequences, tuples and tuple structs are deserialized by iterating within the
/// parent tag and deserializing each tag or text content using [`SeqItemDeserializer`];
/// - structs and maps are deserialized using new instance of [`MapAccess`];
/// - structs and maps are deserialized using new instance of [`ElementMapAccess`];
/// - enums:
/// - in case of [`DeEvent::Text`] event the text content is deserialized as
/// a `$text` variant. Enum content is deserialized from the text using
Expand All @@ -419,14 +424,14 @@ macro_rules! forward {
///
/// [`deserialize_tuple`]: #method.deserialize_tuple
/// [`deserialize_struct`]: #method.deserialize_struct
struct MapValueDeserializer<'de, 'a, 'm, R, E>
struct MapValueDeserializer<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
{
/// Access to the map that created this deserializer. Gives access to the
/// context, such as list of fields, that current map known about.
map: &'m mut MapAccess<'de, 'a, R, E>,
map: &'m mut ElementMapAccess<'de, 'd, R, E>,
/// Determines, should [`Deserializer::read_string_impl()`] expand the second
/// level of tags or not.
///
Expand Down Expand Up @@ -504,7 +509,7 @@ where
allow_start: bool,
}

impl<'de, 'a, 'm, R, E> MapValueDeserializer<'de, 'a, 'm, R, E>
impl<'de, 'd, 'm, R, E> MapValueDeserializer<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
Expand All @@ -520,7 +525,7 @@ where
}
}

impl<'de, 'a, 'm, R, E> de::Deserializer<'de> for MapValueDeserializer<'de, 'a, 'm, R, E>
impl<'de, 'd, 'm, R, E> de::Deserializer<'de> for MapValueDeserializer<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
Expand All @@ -543,11 +548,14 @@ where

forward!(deserialize_any);

fn deserialize_option<V>(self, visitor: V) -> Result<V::Value, DeError>
fn deserialize_option<V>(self, visitor: V) -> Result<V::Value, Self::Error>
where
V: Visitor<'de>,
{
deserialize_option!(self.map.de, self, visitor)
match self.map.de.peek()? {
DeEvent::Text(t) if t.is_empty() => visitor.visit_none(),
_ => visitor.visit_some(self),
}
}

/// Forwards deserialization of the inner type. Always calls [`Visitor::visit_newtype_struct`]
Expand Down Expand Up @@ -582,7 +590,7 @@ where
// Clone is cheap if event borrows from the input
DeEvent::Start(e) => TagFilter::Include(e.clone()),
// SAFETY: we use that deserializer with `allow_start == true`
// only from the `MapAccess::next_value_seed` and only when we
// only from the `ElementMapAccess::next_value_seed` and only when we
// peeked `Start` event
_ => unreachable!(),
}
Expand All @@ -597,11 +605,6 @@ where
filter,
})
}

#[inline]
fn is_human_readable(&self) -> bool {
self.map.de.is_human_readable()
}
}

////////////////////////////////////////////////////////////////////////////////////////////////////
Expand Down Expand Up @@ -693,14 +696,14 @@ impl<'de> TagFilter<'de> {
///
/// [`Text`]: crate::events::Event::Text
/// [`CData`]: crate::events::Event::CData
struct MapValueSeqAccess<'de, 'a, 'm, R, E>
struct MapValueSeqAccess<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
{
/// Accessor to a map that creates this accessor and to a deserializer for
/// a sequence items.
map: &'m mut MapAccess<'de, 'a, R, E>,
map: &'m mut ElementMapAccess<'de, 'd, R, E>,
/// Filter that determines whether a tag is a part of this sequence.
///
/// When feature [`overlapped-lists`] is not activated, iteration will stop
Expand All @@ -720,7 +723,7 @@ where
}

#[cfg(feature = "overlapped-lists")]
impl<'de, 'a, 'm, R, E> Drop for MapValueSeqAccess<'de, 'a, 'm, R, E>
impl<'de, 'd, 'm, R, E> Drop for MapValueSeqAccess<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
Expand All @@ -730,7 +733,7 @@ where
}
}

impl<'de, 'a, 'm, R, E> SeqAccess<'de> for MapValueSeqAccess<'de, 'a, 'm, R, E>
impl<'de, 'd, 'm, R, E> SeqAccess<'de> for MapValueSeqAccess<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
Expand Down Expand Up @@ -810,7 +813,7 @@ where
/// contains something else other than text, an error is returned, but if it
/// contains a text and something else (for example, `<item>text<tag/></item>`),
/// then the trail is just ignored;
/// - structs and maps are deserialized using new [`MapAccess`];
/// - structs and maps are deserialized using new [`ElementMapAccess`];
/// - enums:
/// - in case of [`DeEvent::Text`] event the text content is deserialized as
/// a `$text` variant. Enum content is deserialized from the text using
Expand All @@ -826,17 +829,17 @@ where
///
/// [`deserialize_tuple`]: #method.deserialize_tuple
/// [`deserialize_struct`]: #method.deserialize_struct
struct SeqItemDeserializer<'de, 'a, 'm, R, E>
struct SeqItemDeserializer<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
{
/// Access to the map that created this deserializer. Gives access to the
/// context, such as list of fields, that current map known about.
map: &'m mut MapAccess<'de, 'a, R, E>,
map: &'m mut ElementMapAccess<'de, 'd, R, E>,
}

impl<'de, 'a, 'm, R, E> SeqItemDeserializer<'de, 'a, 'm, R, E>
impl<'de, 'd, 'm, R, E> SeqItemDeserializer<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
Expand All @@ -852,7 +855,7 @@ where
}
}

impl<'de, 'a, 'm, R, E> de::Deserializer<'de> for SeqItemDeserializer<'de, 'a, 'm, R, E>
impl<'de, 'd, 'm, R, E> de::Deserializer<'de> for SeqItemDeserializer<'de, 'd, 'm, R, E>
where
R: XmlRead<'de>,
E: EntityResolver,
Expand All @@ -875,25 +878,27 @@ where

forward!(deserialize_any);

fn deserialize_option<V>(self, visitor: V) -> Result<V::Value, DeError>
fn deserialize_option<V>(self, visitor: V) -> Result<V::Value, Self::Error>
where
V: Visitor<'de>,
{
deserialize_option!(self.map.de, self, visitor)
match self.map.de.peek()? {
DeEvent::Text(t) if t.is_empty() => visitor.visit_none(),
_ => visitor.visit_some(self),
}
}

/// Forwards deserialization of the inner type. Always calls [`Visitor::visit_newtype_struct`]
/// with the [`SimpleTypeDeserializer`].
/// with this deserializer.
fn deserialize_newtype_struct<V>(
mut self,
self,
_name: &'static str,
visitor: V,
) -> Result<V::Value, Self::Error>
where
V: Visitor<'de>,
{
let text = self.read_string()?;
visitor.visit_newtype_struct(SimpleTypeDeserializer::from_text(text))
visitor.visit_newtype_struct(self)
}

/// This method deserializes a sequence inside of element that itself is a
Expand All @@ -915,11 +920,6 @@ where
let text = self.read_string()?;
SimpleTypeDeserializer::from_text(text).deserialize_seq(visitor)
}

#[inline]
fn is_human_readable(&self) -> bool {
self.map.de.is_human_readable()
}
}

////////////////////////////////////////////////////////////////////////////////////////////////////
Expand Down
Loading

0 comments on commit ca1c09a

Please sign in to comment.