Source code for icalendar.parser.ical.lazy

"""Special parsing for calendar components."""

from __future__ import annotations

from typing import TYPE_CHECKING, ClassVar

from icalendar.parser.content_line import Contentline

from .component import ComponentIcalParser

if TYPE_CHECKING:
    from icalendar.cal.component import Component


[docs] class LazyCalendarIcalParser(ComponentIcalParser): """A parser for calendar components. Instead of parsing the components, LazyComponents are created. Parsing can happen on demand. A calendar may grow over time, with its subcomponents greatly increasing in number, and requiring more memory and time to fully parse. This optimization lazily parses calendar files without consuming more memory than necessary, reducing the initial time it takes to access meta data. """ parse_instantly: ClassVar[tuple[str, ...]] = ("VCALENDAR",) """Parse these components immediately, instead of lazily. All other components are parsed lazily. """
[docs] def handle_begin_component(self, vals): """Begin a new component. This may be the first component. """ c_name = vals.upper() if ( c_name in self.parse_instantly or not self.component or not self.component.is_lazy() ): # these components are parsed immediately super().handle_begin_component(vals) else: self.handle_lazy_begin_component(c_name)
[docs] def handle_lazy_begin_component(self, component_name: str) -> None: """Begin a new component, but do not parse it yet. Parameters: component_name: The upper case name of the component, for example, ``"VEVENT"``. """ content_lines = [Contentline(f"BEGIN:{component_name}")] for line in self._content_lines_iterator: content_lines.append(line) if ( line[:4].upper() == "END:" and line[4:].strip().upper() == component_name ): break if self.component is None: raise ValueError( f"BEGIN:{component_name} encountered outside of a parent component." ) self.component.add_component( LazySubcomponent( component_name, self.get_subcomponent_parser(content_lines), ) )
[docs] def get_subcomponent_parser( self, content_lines: list[Contentline] ) -> ComponentIcalParser: """Get the parser for a subcomponent. Parameters: content_lines: The content lines of the subcomponent. """ return ComponentIcalParser( content_lines, self._component_factory, self._types_factory )
[docs] def prepare_components(self): """Prepare the lazily parsed components."""
[docs] class LazySubcomponent: """A subcomponent that is evaluated lazily. This class holds the raw data of the subcomponent ready for parsing. """ def __init__(self, name: str, parser: ComponentIcalParser): """Initialize the lazy subcomponent with the raw data.""" self._name = name self._parser = parser self._component: Component | None = None @property def name(self) -> str: """The name of the subcomponent. The name is uppercased, per :rfc:`5545#section-2.1`. """ return self._name
[docs] def is_parsed(self) -> bool: """Return whether the subcomponent is already parsed.""" return self._component is not None
[docs] def parse(self) -> Component: """Parse the raw data and return the component.""" if self._component is None: components = self._parser.parse() if len(components) != 1: raise ValueError( f"Expected exactly one component in the subcomponent, " f"but got {len(components)}." ) self._component = components[0] self._parser = None # free memory return self._component
[docs] def is_lazy(self) -> bool: """Return whether the subcomponents were accessed and parsed lazily. Call :meth:`parse` to get the fully parsed component. """ return True
def __repr__(self) -> str: return f"LazySubcomponent(name={self._name}, parsed={self.is_parsed()})"
[docs] def walk(self, name: str) -> list[Component]: """Walk through this component. This only parses the component if necessary. Parameters: name: The name to match for all components in the calendar, then walk through and parse the resulting matches. """ if not isinstance(name, str): raise TypeError("name must be a string.") if name == self.name or ( self._parser and self._parser.contains_component(name) ): return self.parse().walk(name) return []
[docs] def with_uid(self, uid: str) -> list[Component]: """Return the components containing the given ``uid``. This only parses the component if necessary. Parameters: uid: The UID of the components. """ if self._parser and not self._parser.contains_uid(uid): return [] return self.parse().with_uid(uid)
__all__ = ["LazyCalendarIcalParser", "LazySubcomponent"]