Source code for icalendar.cal.lazy

"""Components for lazy parsing of components."""

from __future__ import annotations

from typing import TYPE_CHECKING, Literal

from icalendar.cal.component_factory import ComponentFactory
from icalendar.parser.ical.lazy import LazyCalendarIcalParser

from .calendar import Calendar

if TYPE_CHECKING:
    from collections.abc import Callable

    from icalendar.parser.ical.component import ComponentIcalParser
    from icalendar.parser.ical.lazy import LazySubcomponent

    from .component import Component


[docs] class ParsedSubcomponentsStrategy: """All the subcomponents are parsed and available as a list.""" def __init__(self): self._components: list[Component] = []
[docs] def get_all_components(self) -> tuple[ParsedSubcomponentsStrategy, list[Component]]: """Get the subcomponents of the calendar.""" return self, self._components
[docs] def set_components( self, components: list[Component] ) -> ParsedSubcomponentsStrategy: """Set the subcomponents of the calendar.""" self._components = components return self
[docs] def add_component(self, component: Component) -> ParsedSubcomponentsStrategy: """Add a component to the calendar.""" self._components.append(component.parse()) return self
[docs] def is_lazy(self) -> Literal[False]: """Returns ``False`` because subcomponents are not lazily parsed.""" return False
[docs] def walk(self, name: str) -> tuple[ParsedSubcomponentsStrategy, list[Component]]: """Get the subcomponents of the calendar with the given name.""" result = [] for component in self._components: result += component.walk(name) return self, result
[docs] def with_uid( self, name: str ) -> tuple[ParsedSubcomponentsStrategy, list[Component]]: """Get the subcomponents of the calendar with the given uid.""" result = [] for component in self._components: result += component.with_uid(name) return self, result
[docs] class LazySubcomponentsStrategy: """Parse subcomponents only when accessed.""" initial_components_to_parse: tuple[str, ...] = ("VTIMEZONE",) """Parse these subcomponents before any others.""" def __init__(self): self._components: list[LazySubcomponent | Component] = [] self._initial_parsed: bool = False @property def as_parsed(self) -> ParsedSubcomponentsStrategy: """Return the parsed components.""" return ParsedSubcomponentsStrategy().set_components( [component.parse() for component in self._components] )
[docs] def get_all_components(self) -> tuple[ParsedSubcomponentsStrategy, list[Component]]: """Get the subcomponents of the calendar. Parse all subcomponents. """ self.parse_initial_components() return self.as_parsed.get_all_components()
[docs] def set_components( self, components: list[Component] ) -> ParsedSubcomponentsStrategy: """Set the subcomponents of the calendar.""" return ParsedSubcomponentsStrategy().set_components(components)
[docs] def add_component( self, component: Component | LazySubcomponent ) -> LazySubcomponentsStrategy: """Add a component to the calendar.""" self._components.append(component) return self
[docs] def is_lazy(self) -> bool: """Return whether the subcomponents may be lazily parsed.""" return True
[docs] def parse_initial_components(self) -> None: """Parse the components that are required by other components. This mainly concerns the timezone components. They are required by other components that have a TZID parameter. """ if self._initial_parsed: return self._initial_parsed = True for component in self._components: if component.name in self.initial_components_to_parse: component.parse()
[docs] def walk( self, name: str | None ) -> tuple[LazySubcomponentsStrategy, list[Component]]: """Get the subcomponents of the calendar with the given name. Parse only the minimal number of subcomponents. """ if name is None: return self.as_parsed.walk(name) self.parse_initial_components() result = [] for component in self._components: result += component.walk(name) return self, result
[docs] def with_uid(self, uid: str) -> tuple[LazySubcomponentsStrategy, list[Component]]: """Get the subcomponents of the calendar with the given ``uid``. Parse only the minimal number of subcomponents. """ self.parse_initial_components() result = [] for component in self._components: result += component.with_uid(uid) return self, result
[docs] class InitialSubcomponentsStrategy: """Initial strategy for the calendar. No subcomponents. """
[docs] def set_components(self, components: list[Component]) -> LazySubcomponentsStrategy: if components: raise ValueError( "Cannot set subcomponents on an uninitialised LazyCalendar. " "Parse it first or add components via add_component()." ) return LazySubcomponentsStrategy()
[docs] class LazyCalendar(Calendar): """A calendar that can handle big files. Subcomponents of this calendar are evaluated lazily, meaning that they are not parsed until they are accessed. This allows the calendar to handle large files without consuming too much memory or time. All properties of the calendar component are parsed immediately. Subcomponents and their properties are parsed lazily. Examples: By accessing the :attr:`~icalendar.cal.calendar.Calendar.events` of the calendar, only :class:`~icalendar.cal.event.Event` and :class:`~icalendar.cal.timezone.Timezone` are immediately parsed. .. code-block:: pycon >>> from icalendar import LazyCalendar >>> calendar = LazyCalendar.example("issue_1050_all_components") >>> len(calendar.events) == 1 True The calendar's subcomponents were not parsed because they were not accessed. The calendar is still lazy. >>> calendar.is_lazy() True When you access all :attr:`subcomponents` of the calendar, for example by getting their count, the entire calendar is parsed and becomes not lazy. >>> len(calendar.subcomponents) 5 >>> calendar.is_lazy() False """ _subcomponents: ( LazySubcomponentsStrategy | ParsedSubcomponentsStrategy | InitialSubcomponentsStrategy ) """The strategy pattern for subcomponents of the calendar.""" def __init__(self, *args, **kwargs): """Initialize the calendar.""" self._subcomponents = InitialSubcomponentsStrategy() super().__init__(*args, **kwargs) @property def subcomponents(self) -> list[Component]: """The subcomponents of the calendar. Parse all subcomponents of the calendar and return them as a list. You can manipulate this list or set it. It has the same behavior as in :class:`~icalendar.cal.calendar.Calendar`. """ self._subcomponents, result = self._subcomponents.get_all_components() return result @subcomponents.setter def subcomponents(self, value: list[Component]) -> None: """Set the subcomponents of the calendar.""" self._subcomponents = self._subcomponents.set_components(value) @classmethod def _get_ical_parser(cls, st: str | bytes) -> ComponentIcalParser: """Get the iCal parser for the given input string.""" return LazyCalendarIcalParser( st, cls._get_component_factory(), cls.types_factory ) @classmethod def _get_component_factory(cls) -> ComponentFactory: """Get the component factory for this calendar.""" factory = ComponentFactory() factory.add_component_class(cls) return factory
[docs] def add_component(self, component: Component) -> None: """Add a component to the calendar. Use this instead of appending to :attr:`~icalendar.cal.lazy.LazyCalendar.subcomponents`, as the latter does not parse the whole calendar. """ self._subcomponents = self._subcomponents.add_component(component)
[docs] def is_lazy(self) -> bool: """Whether the subcomponents will be parsed lazily. .. note:: If you believe that the calendar parses more than it should, please `open an issue <https://github.com/collective/icalendar/issues/new?template=bug_report.md>`_. Returns: ``True`` if subcomponents are deferred and not yet parsed. ``False`` if all subcomponents have been parsed. """ return self._subcomponents.is_lazy()
def _walk( self, name: str | None, select: Callable[[Component], bool] ) -> list[Component]: self._subcomponents, result = self._subcomponents.walk(name) result = [component for component in result if select(component)] if (name is None or self.name == name) and select(self): result.insert(0, self) return result
[docs] def with_uid(self, uid: str) -> list[Component]: self._subcomponents, result = self._subcomponents.with_uid(uid) if self.uid == uid: result.insert(0, self) return result
with_uid.__doc__ = Calendar.with_uid.__doc__
__all__ = ["LazyCalendar"] if __name__ == "__main__": import timeit calendar = Calendar.example("issue_1050_all_components") COUNT = 10000 calendar.subcomponents *= COUNT ics = calendar.to_ical() def _benchmark(cal: type[Calendar]): """Check out how fast this is.""" cal = cal.from_ical(ics) assert len(cal.events) == COUNT for cal in [Calendar, LazyCalendar]: print("Benchmarking:", cal.__name__) # noqa: T201 print(timeit.timeit("_benchmark(cal)", globals=locals(), number=1)) # noqa: T201 # Benchmarking: Calendar # 12.277852076000272 # Benchmarking: LazyCalendar # 5.738950790999297