Source code for pywikibot.time

"""Time handling module.

.. versionadded:: 7.5
"""
#
# (C) Pywikibot team, 2007-2024
#
# Distributed under the terms of the MIT license.
#
from __future__ import annotations

import datetime
import math
import re
import time as _time
import types
from contextlib import suppress
from typing import overload

import pywikibot
from pywikibot.tools import (
    PYTHON_VERSION,
    SPHINX_RUNNING,
    classproperty,
    deprecated,
)


__all__ = (
    'parse_duration',
    'str2timedelta',
    'MW_KEYS',
    'Timestamp',
    'TZoneFixedOffset'
)

#: .. versionadded:: 7.5
MW_KEYS = types.MappingProxyType({
    's': 'seconds',
    'h': 'hours',
    'd': 'days',
    'w': 'weeks',
    'y': 'years',
    # 'months' and 'minutes' were removed because confusion outweighs merit
})


[docs] class Timestamp(datetime.datetime): """Class for handling MediaWiki timestamps. This inherits from :python:`datetime.datetime <library/datetime.html#datetime.datetime>`, so it can use all of the methods and operations of a ``datetime`` object. To ensure that the results of any operation are also a Timestamp object, be sure to use only Timestamp objects (and :python:`datetime.timedelta <library/datetime.html#datetime.timedelta>`) in any operation. Use :meth:`Timestamp.fromISOformat` and :meth:`Timestamp.fromtimestampformat` to create Timestamp objects from MediaWiki string formats. As these constructors are typically used to create objects using data passed provided by site and page methods, some of which return a Timestamp when previously they returned a MediaWiki string representation, these methods also accept a Timestamp object, in which case they return a clone. Alternatively, :meth:`Timestamp.set_timestamp` can create Timestamp objects from :class:`Timestamp`, ``datetime.datetime`` object, or strings compliant with ISO8601, MediaWiki, or POSIX formats. Use :meth:`Site.server_time() <pywikibot.site._apisite.APISite.server_time>` for the current time; this is more reliable than using :meth:`Timestamp.utcnow` or :meth:`Timestamp.nowutc`. .. versionchanged:: 7.5 moved to :mod:`time` module """ mediawikiTSFormat = '%Y%m%d%H%M%S' # noqa: N815 _ISO8601Format_new = '{0:+05d}-{1:02d}-{2:02d}T{3:02d}:{4:02d}:{5:02d}Z'
[docs] @classmethod def set_timestamp( cls, ts: str | datetime.datetime | Timestamp, ) -> Timestamp: """Set Timestamp from input object. ts is converted to a datetime naive object representing UTC time. String shall be compliant with: - Mediwiki timestamp format: ``YYYYMMDDHHMMSS`` - ISO8601 format: ``YYYY-MM-DD[T ]HH:MM:SS[Z|±HH[MM[SS[.ffffff]]]]`` - POSIX format: seconds from Unix epoch ``S{1,13}[.ffffff]]`` .. versionadded:: 7.5 .. versionchanged:: 8.0 raises *TypeError* instead of *ValueError*. :param ts: Timestamp, datetime.datetime or str :return: Timestamp object :raises TypeError: conversion failed """ if isinstance(ts, cls): return ts if isinstance(ts, datetime.datetime): return cls._from_datetime(ts) if isinstance(ts, str): return cls._from_string(ts) raise TypeError( f'Unsupported "ts" type, got "{ts}" ({type(ts).__name__})')
@staticmethod def _from_datetime(dt: datetime.datetime) -> Timestamp: """Convert a datetime.datetime timestamp to a Timestamp object. .. versionadded:: 7.5 """ return Timestamp(dt.year, dt.month, dt.day, dt.hour, dt.minute, dt.second, dt.microsecond, dt.tzinfo) @classmethod def _from_mw(cls, timestr: str) -> Timestamp: """Convert a string in MW format to a Timestamp object. Mediwiki timestamp format: YYYYMMDDHHMMSS .. versionadded:: 7.5 """ RE_MW = r'\d{14}' # noqa: N806 m = re.fullmatch(RE_MW, timestr) if not m: raise ValueError( f'time data {timestr!r} does not match MW format.') return cls.strptime(timestr, cls.mediawikiTSFormat) @classmethod def _from_iso8601(cls, timestr: str) -> Timestamp: """Convert a string in ISO8601 format to a Timestamp object. ISO8601 format: ``YYYY-MM-DD[T ]HH:MM:SS[[.,]ffffff][Z|±HH[MM[SS[.ffffff]]]]`` .. versionadded:: 7.5 """ RE_ISO8601 = (r'(?:\d{4}-\d{2}-\d{2})(?P<sep>[T ])' # noqa: N806 r'(?:\d{2}:\d{2}:\d{2})(?P<u>[.,]\d{1,6})?' r'(?P<tz>Z|[+\-]\d{2}:?\d{,2})?' ) m = re.fullmatch(RE_ISO8601, timestr) if not m: raise ValueError( f'time data {timestr!r} does not match ISO8601 format.') strpfmt = f'%Y-%m-%d{m["sep"]}%H:%M:%S' strpstr = timestr[:19] if m['u']: strpfmt += '.%f' strpstr += m['u'].replace(',', '.') # .ljust(7, '0') if m['tz']: if m['tz'] == 'Z': strpfmt += 'Z' strpstr += 'Z' else: strpfmt += '%z' # strptime wants HHMM, without ':' strpstr += (m['tz'].replace(':', '')).ljust(5, '0') ts = cls.strptime(strpstr, strpfmt) if ts.tzinfo is not None: ts = ts.astimezone(datetime.timezone.utc).replace(tzinfo=None) # why pytest in py35/py37 fails without this? ts = cls._from_datetime(ts) return ts @classmethod def _from_posix(cls, timestr: str) -> Timestamp: """Convert a string in POSIX format to a Timestamp object. POSIX format: ``SECONDS[.ffffff]]`` .. versionadded:: 7.5 """ RE_POSIX = r'(?P<S>-?\d{1,13})(?:\.(?P<u>\d{1,6}))?' # noqa: N806 m = re.fullmatch(RE_POSIX, timestr) if not m: msg = "time data '{timestr}' does not match POSIX format." raise ValueError(msg.format(timestr=timestr)) sec = int(m['S']) usec = m['u'] usec = int(usec.ljust(6, '0')) if usec else 0 if sec < 0 < usec: sec -= 1 usec = 1_000_000 - usec ts = cls(1970, 1, 1) + datetime.timedelta(seconds=sec, microseconds=usec) return ts @classmethod def _from_string(cls, timestr: str) -> Timestamp: """Convert a string to a Timestamp object. .. versionadded:: 7.5 """ handlers = [ cls._from_mw, cls._from_iso8601, cls._from_posix, ] for handler in handlers: with suppress(ValueError): return handler(timestr) raise ValueError(f'time data {timestr!r} does not match any format.')
[docs] @deprecated('replace method', since='8.0.0') # type: ignore[misc] def clone(self) -> Timestamp: """Clone this instance. .. deprecated:: 8.0 Use :meth:`replace` method instead. """ return self.replace()
@classproperty def ISO8601Format(cls) -> str: # noqa: N802 """ISO8601 format string class property for compatibility purpose.""" return cls._ISO8601Format() @classmethod def _ISO8601Format(cls, sep: str = 'T') -> str: # noqa: N802 """ISO8601 format string. :param sep: one-character separator, placed between the date and time :return: ISO8601 format string """ assert len(sep) == 1 return f'%Y-%m-%d{sep}%H:%M:%SZ'
[docs] @classmethod def fromISOformat(cls, # noqa: N802 ts: str | Timestamp, sep: str = 'T') -> Timestamp: """Convert an ISO 8601 timestamp to a Timestamp object. :param ts: ISO 8601 timestamp or a Timestamp object already :param sep: one-character separator, placed between the date and time :return: Timestamp object """ # If inadvertently passed a Timestamp object, use replace() # to create a clone. if isinstance(ts, cls): return ts.replace() if not isinstance(ts, str): raise TypeError( f'ts argument must be a string or a Timestamp object,' f' not {type(ts).__name__}') return cls._from_iso8601(f'{ts[:10]}{sep}{ts[11:]}')
[docs] @classmethod def fromtimestampformat(cls, ts: str | Timestamp, strict: bool = False) -> Timestamp: """Convert a MediaWiki internal timestamp to a Timestamp object. .. versionchanged:: 3.0 create a Timestamp if only year, month and day are given. .. versionchanged:: 8.0 the *strict* parameter was added which discards missing element tolerance. Example ------- >>> Timestamp.fromtimestampformat('20220705082234') Timestamp(2022, 7, 5, 8, 22, 34) >>> Timestamp.fromtimestampformat('20220927') Timestamp(2022, 9, 27, 0, 0) >>> Timestamp.fromtimestampformat('20221109', strict=True) Traceback (most recent call last): ... ValueError: time data '20221109' does not match MW format. :param ts: the timestamp to be converted :param strict: If true, do not ignore missing timestamp elements for hours, minutes or seconds :return: return the *Timestamp* object from given *ts*. :raises ValueError: The timestamp is invalid, e.g. missing or invalid timestamp component. """ # If inadvertently passed a Timestamp object, use replace() # to create a clone. if isinstance(ts, cls): return ts.replace() if not isinstance(ts, str): raise TypeError( f'ts argument must be a string or a Timestamp object,' f' not {type(ts).__name__}') if len(ts) == 8 and not strict: # year, month and day are given only ts += '000000' return cls._from_mw(ts)
[docs] def isoformat(self, sep: str = 'T') -> str: # type: ignore[override] """ Convert object to an ISO 8601 timestamp accepted by MediaWiki. datetime.datetime.isoformat does not postfix the ISO formatted date with a 'Z' unless a timezone is included, which causes MediaWiki ~1.19 and earlier to fail. """ return self.strftime(self._ISO8601Format(sep))
[docs] def totimestampformat(self) -> str: """Convert object to a MediaWiki internal timestamp.""" return self.strftime(self.mediawikiTSFormat)
[docs] def posix_timestamp(self) -> float: """ Convert object to a POSIX timestamp. See Note in datetime.timestamp(). .. versionadded:: 7.5 """ return self.replace(tzinfo=datetime.timezone.utc).timestamp()
[docs] def posix_timestamp_format(self) -> str: """Convert object to a POSIX timestamp format. .. versionadded:: 7.5 """ return f'{self.posix_timestamp():.6f}'
def __repr__(self) -> str: """Unify repr string between CPython and Pypy (T325905). .. versionadded:: 8.0 """ s = super().__repr__() return f'{type(self).__name__}{s[s.find("("):]}' def __str__(self) -> str: """Return a string format recognized by the API.""" return self.isoformat()
[docs] @classmethod def nowutc(cls, *, with_tz: bool = True) -> Timestamp: """Return the current UTC date and time. If *with_tz* is True it returns an aware :class:`Timestamp` object with UTC timezone by calling ``now(datetime.UTC)``. As such this is just a short way to get it. Otherwise the UTC timestamp is returned as a naive Timestamp object with timezone of None. This is equal to the :meth:`Timestamp.utcnow`. .. warning:: Because naive datetime objects are treated by many datetime methods as local times, it is preferred to use aware Timestamps or datetimes to represent times in UTC. As such, it is not recommended to set *with_tz* to False. .. caution:: You cannot compare, add or subtract offset-naive and offset- aware Timestamps/datetimes (i.e. missing or having timezone). A TypeError will be raised in such cases. .. versionadded:: 9.0 .. seealso:: - :python:`datetime.now() <library/datetime.html#datetime.datetime.now>` - :python:`datetime.utcnow() <library/datetime.html#datetime.datetime.utcnow>` - :python:`datetime.UTC<library/datetime.html#datetime.UTC>` :param with_tz: Whether to include UTC timezone or not """ if with_tz: # datetime.UTC can only be used with Python 3.11+ return cls.now(datetime.timezone.utc) ts = _time.time() gmt = _time.gmtime(ts) us = round(ts % 1 * 1e6) return cls(*gmt[:6], us)
[docs] @classmethod def utcnow(cls) -> Timestamp: """Return the current UTC date and time, with `tzinfo` ``None``. This is like :meth:`Timestamp.now`, but returns the current UTC date and time, as a naive :class:`Timestamp` object. An aware current UTC datetime can be obtained by calling :meth:`Timestamp.nowutc`. .. note:: This method is deprecated since Python 3.12 but held here for backward compatibility because ``utcnow`` is widely used inside the framework to compare MediaWiki timestamps which are UTC-based. Neither :python:`datetime.fromisoformat() <library/datetime.html#datetime.datetime.fromisoformat>` implementations of Python < 3.11 nor :class:`Timestamp` specific :meth:`fromISOformat` supports timezone. .. warning:: Because naive datetime objects are treated by many datetime methods as local times, it is preferred to use aware Timestamps or datetimes to represent times in UTC. As such, the recommended way to create an object representing the current time in UTC is by calling :meth:`Timestamp.nowutc`. .. hint:: This method might be deprecated later. .. versionadded:: 9.0 .. seealso:: :python:`datetime.utcnow() <library/datetime.html#datetime.datetime.utcnow>` """ if PYTHON_VERSION < (3, 12): return super().utcnow() return cls.nowutc(with_tz=False)
if PYTHON_VERSION < (3, 8) or SPHINX_RUNNING: # methods which does not upcast the right class but return a # datetime.datetime object in Python 3.7 def __add__(self, other: datetime.timedelta) -> Timestamp: """Perform addition, returning a Timestamp instead of datetime.""" newdt = super().__add__(other) if isinstance(newdt, datetime.datetime): return self._from_datetime(newdt) return newdt @overload # type: ignore[override] def __sub__(self, other: datetime.timedelta) -> Timestamp: ... @overload def __sub__(self, other: datetime.datetime) -> datetime.timedelta: ... def __sub__( self, other: datetime.datetime | datetime.timedelta, ) -> datetime.timedelta | Timestamp: """Perform subtraction, returning Timestamp instead of datetime.""" newdt = super().__sub__(other) # type: ignore[operator] if isinstance(newdt, datetime.datetime): return self._from_datetime(newdt) return newdt
[docs] @classmethod def fromtimestamp(cls, timestamp: int | float, tz=None) -> Timestamp: """Return the local date and time corresponding to the POSIX ts. This class method is for Python 3.7 to upcast the class if a tz is given. .. versionadded:: 9.0 .. seealso:: - :python:`datetime.fromtimestamp() <library/datetime.html#datetime.datetime.fromtimestamp>` """ ts = super().fromtimestamp(timestamp, tz) if tz: ts = cls.set_timestamp(ts) return ts
[docs] @classmethod def now(cls, tz=None) -> Timestamp: """Return the current local date and time. This class method is for Python 3.7 to upcast the class if a *tz* is given. .. versionadded:: 9.0 .. seealso:: - :python:`datetime.now() <library/datetime.html#datetime.datetime.now>` """ ts = super().now(tz) if tz: ts = cls.set_timestamp(ts) return ts
[docs] class TZoneFixedOffset(datetime.tzinfo): """ Class building tzinfo objects for fixed-offset time zones. :param offset: a number indicating fixed offset in minutes east from UTC :param name: a string with name of the timezone """ def __init__(self, offset: int, name: str) -> None: """Initializer.""" self._offset = datetime.timedelta(minutes=offset) self._name = name
[docs] def utcoffset(self, dt: datetime.datetime | None) -> datetime.timedelta: """Return the offset to UTC.""" return self._offset
[docs] def tzname(self, dt: datetime.datetime | None) -> str: """Return the name of the timezone.""" return self._name
[docs] def dst(self, dt: datetime.datetime | None) -> datetime.timedelta: """Return no daylight savings time.""" return datetime.timedelta(0)
def __repr__(self) -> str: """Return the internal representation of the timezone.""" return '{}({}, {})'.format( self.__class__.__name__, self._offset.days * 86400 + self._offset.seconds, self._name )
[docs] def str2timedelta( string: str, timestamp: datetime.datetime | None = None, ) -> datetime.timedelta: """ Return a timedelta for a shorthand duration. :param string: a string defining a time period: Examples:: 300s - 300 seconds 36h - 36 hours 7d - 7 days 2w - 2 weeks (14 days) 1y - 1 year :param timestamp: a timestamp to calculate a more accurate duration offset used by years :type timestamp: datetime.datetime :return: the corresponding timedelta object """ key, duration = parse_duration(string) if key == 'y': # years days = math.ceil(duration * 365.25) duration *= 12 if timestamp: return pywikibot.date.apply_month_delta( timestamp.date(), month_delta=duration) - timestamp.date() return datetime.timedelta(days=days) # days, seconds, hours, weeks return datetime.timedelta(**{MW_KEYS[key]: duration})
[docs] def parse_duration(string: str) -> tuple[str, int]: """ Return the key and duration extracted from the string. :param string: a string defining a time period Examples:: 300s - 300 seconds 36h - 36 hours 7d - 7 days 2w - 2 weeks (14 days) 1y - 1 year :return: key and duration extracted form the string """ if len(string) < 2: raise ValueError('Time period should be a numeric value followed by ' 'its qualifier') key, duration = string[-1], string[:-1] if key not in MW_KEYS: raise ValueError(f'Time period qualifier is unrecognized: {string}') if not duration.isdigit(): raise ValueError(f"Time period's duration should be numeric: {string}") return key, int(duration)