mercurial-scm/hg: mercurial/utils/cborutil.py comparison

comparison mercurial/utils/cborutil.py @ 52693:5e09c6b5b795

typing: add type annotations to most of `mercurial/utils/cborutil.py` These are the easy/obvious/documented ones. We'll leave the harder ones for later.

author	Matt Harbison <matt_harbison@yahoo.com>
date	Sun, 12 Jan 2025 22:05:19 -0500
parents	279e217d6041
children	8a2091a2f974

comparison

equal deleted inserted replaced

-:45dc0f874b8c
+:5e09c6b5b795
 import struct
 import typing
 if typing.TYPE_CHECKING:
 from typing import (
+Iterable,
 Iterator,
 )
 # Very short version of RFC 7049...
 #
 # The break ends an indefinite length item.
 BREAK = b'\xff'
 BREAK_INT = 255
-def encodelength(majortype, length):
+def encodelength(majortype: int, length: int) -> bytes:
 """Obtain a value encoding the major type and its length."""
 if length < 24:
 return ENCODED_LENGTH_1.pack(majortype << 5 | length)
 elif length < 256:
 return ENCODED_LENGTH_2.pack(majortype << 5 | 24, length)
 return ENCODED_LENGTH_4.pack(majortype << 5 | 26, length)
 else:
 return ENCODED_LENGTH_5.pack(majortype << 5 | 27, length)
-def streamencodebytestring(v):
+def streamencodebytestring(v: bytes) -> Iterator[bytes]:
 yield encodelength(MAJOR_TYPE_BYTESTRING, len(v))
 yield v
-def streamencodebytestringfromiter(it):
+def streamencodebytestringfromiter(it: Iterable[bytes]) -> Iterator[bytes]:
 """Convert an iterator of chunks to an indefinite bytestring.
 Given an input that is iterable and each element in the iterator is
 representable as bytes, emit an indefinite length bytestring.
 """
 yield chunk
 yield BREAK
-def streamencodeindefinitebytestring(source, chunksize=65536):
+def streamencodeindefinitebytestring(
+source, chunksize: int = 65536
+) -> Iterator[bytes]:
 """Given a large source buffer, emit as an indefinite length bytestring.
 This is a generator of chunks constituting the encoded CBOR data.
 """
 yield BEGIN_INDEFINITE_BYTESTRING
 break
 yield BREAK
-def streamencodeint(v):
+def streamencodeint(v: int) -> Iterator[bytes]:
 if v >= 18446744073709551616 or v < -18446744073709551616:
 raise ValueError(b'big integers not supported')
 if v >= 0:
 yield encodelength(MAJOR_TYPE_UINT, v)
 def _mixedtypesortkey(v):
 return type(v).__name__, v
-def streamencodeset(s):
+def streamencodeset(s) -> Iterator[bytes]:
 # https://www.iana.org/assignments/cbor-tags/cbor-tags.xhtml defines
 # semantic tag 258 for finite sets.
 yield encodelength(MAJOR_TYPE_SEMANTIC, SEMANTIC_TAG_FINITE_SET)
 yield from streamencodearray(sorted(s, key=_mixedtypesortkey))
-def streamencodemap(d) -> Iterator[bytes]:
+def streamencodemap(d: dict) -> Iterator[bytes]:
 """Encode dictionary to a generator.
 Does not support indefinite length dictionaries.
 """
 yield encodelength(MAJOR_TYPE_MAP, len(d))
 for key, value in sorted(d.items(), key=lambda x: _mixedtypesortkey(x[0])):
 yield from streamencode(key)
 yield from streamencode(value)
-def streamencodemapfromiter(it) -> Iterator[bytes]:
+def streamencodemapfromiter(it: Iterable) -> Iterator[bytes]:
 """Given an iterable of (key, value), encode to an indefinite length map."""
 yield BEGIN_INDEFINITE_MAP
 for key, value in it:
 yield from streamencode(key)
 yield from streamencode(value)
 yield BREAK
-def streamencodebool(b):
+def streamencodebool(b: bool) -> Iterator[bytes]:
 # major type 7, simple value 20 and 21.
 yield b'\xf5' if b else b'\xf4'
-def streamencodenone(v):
+def streamencodenone(v: None) -> Iterator[bytes]:
 # major type 7, simple value 22.
 yield b'\xf6'
 STREAM_ENCODERS = {
 bool: streamencodebool,
 type(None): streamencodenone,
 }
-def streamencode(v):
+def streamencode(v) -> Iterator[bytes]:
 """Encode a value in a streaming manner.
 Given an input object, encode it to CBOR recursively.
 Returns a generator of CBOR encoded bytes. There is no guarantee
 class CBORDecodeError(Exception):
 """Represents an error decoding CBOR."""
-def _elementtointeger(b, i):
+def _elementtointeger(b, i: int) -> int:
 return b[i]
 STRUCT_BIG_UBYTE = struct.Struct('>B')
 STRUCT_BIG_USHORT = struct.Struct(b'>H')
 SPECIAL_START_MAP = 3
 SPECIAL_START_SET = 4
 SPECIAL_INDEFINITE_BREAK = 5
-def decodeitem(b, offset=0):
+def decodeitem(b, offset: int = 0):
 """Decode a new CBOR value from a buffer at offset.
 This function attempts to decode up to one complete CBOR value
 from ``b`` starting at offset ``offset``.
 elif majortype == MAJOR_TYPE_NEGINT:
 # Negative integers are the same as UINT except inverted minus 1.
 complete, value, readcount = decodeuint(subtype, b, offset)
 if complete:
+assert value is not None  # help pytype
 return True, -value - 1, readcount + 1, SPECIAL_NONE
 else:
 return False, None, readcount, SPECIAL_NONE
 elif majortype == MAJOR_TYPE_BYTESTRING:
 raise CBORDecodeError(b'special type %d not allowed' % subtype)
 else:
 assert False
-def decodeuint(subtype, b, offset=0, allowindefinite=False):
+def decodeuint(
+subtype: int, b: bytes, offset: int = 0, allowindefinite: bool = False
+):
 """Decode an unsigned integer.
 ``subtype`` is the lower 5 bits from the initial byte CBOR item
 "header." ``b`` is a buffer containing bytes. ``offset`` points to
 the index of the first byte after the byte that ``subtype`` was
 This behaves like a ``bytes`` but in addition has the ``isfirst``
 and ``islast`` attributes indicating whether this chunk is the first
 or last in an indefinite length bytestring.
 """
-def __new__(cls, v, first=False, last=False):
+isfirst: bool
+islast: bool
+def __new__(cls, v, first: bool = False, last: bool = False):
 self = bytes.__new__(cls, v)
 self.isfirst = first
 self.islast = last
 return self
 _STATE_WANT_ARRAY_VALUE = 3
 _STATE_WANT_SET_VALUE = 4
 _STATE_WANT_BYTESTRING_CHUNK_FIRST = 5
 _STATE_WANT_BYTESTRING_CHUNK_SUBSEQUENT = 6
-def __init__(self):
+def __init__(self) -> None:
 # TODO add support for limiting size of bytestrings
 # TODO add support for limiting number of keys / values in collections
 # TODO add support for limiting size of buffered partial values
 self.decodedbytecount = 0
 # Fully decoded values available for retrieval.
 self._decodedvalues = []
 @property
-def inprogress(self):
+def inprogress(self) -> bool:
 """Whether the decoder has partially decoded a value."""
 return self._state != self._STATE_NONE
-def decode(self, b, offset=0):
+def decode(self, b, offset: int = 0) -> tuple[bool, int, int]:
 """Attempt to decode bytes from an input buffer.
 ``b`` is a collection of bytes and ``offset`` is the byte
 offset within that buffer from which to begin reading data.
 TODO consider adding limits as to the maximum amount of data that can
 be buffered.
 """
-def __init__(self):
+_decoder: sansiodecoder
+_chunks: list
+_wanted: int
+def __init__(self) -> None:
 self._decoder = sansiodecoder()
 self._chunks = []
 self._wanted = 0
-def decode(self, b):
+def decode(self, b) -> tuple[bool, int, int]:
 """Attempt to decode bytes to CBOR values.
 Returns a tuple with the following fields:
 * Bool indicating whether new values are available for retrieval.

Mercurial > public > mercurial-scm > hg

comparison mercurial/utils/cborutil.py @ 52693:5e09c6b5b795