mercurial-scm/hg-stable: mercurial/encoding.py comparison

comparison mercurial/encoding.py @ 43544:2ade00f3b03b

encoding: add comment-based type hints for pytype

Differential Revision: https://phab.mercurial-scm.org/D7275

author	Augie Fackler <augie@google.com>
date	Wed, 06 Nov 2019 14:48:34 -0500
parents	5f2a8dabb0d8
children	313e3a279828

comparison

Legend: equal, deleted, inserted, replaced

-:daade078f1f0
+:2ade00f3b03b
 policy,
 pycompat,
 )
 from .pure import charencode as charencodepure
+if not globals():  # hide this from non-pytype users
+from typing import (
+Any,
+Callable,
+List,
+Text,
+Type,
+TypeVar,
+Union,
+)
+# keep pyflakes happy
+for t in (Any, Callable, List, Text, Type, Union):
+assert t
+_Tlocalstr = TypeVar('_Tlocalstr', bound=localstr)
 charencode = policy.importmod(r'charencode')
 isasciistr = charencode.isasciistr
 asciilower = charencode.asciilower
 # verify the next function will work
 assert all(i.startswith((b"\xe2", b"\xef")) for i in _ignore)
 def hfsignoreclean(s):
+# type: (bytes) -> bytes
 """Remove codepoints ignored by HFS+ from s.
 >>> hfsignoreclean(u'.h\u200cg'.encode('utf-8'))
 '.hg'
 >>> hfsignoreclean(u'.h\ufeffg'.encode('utf-8'))
 class localstr(bytes):
 '''This class allows strings that are unmodified to be
 round-tripped to the local encoding and back'''
 def __new__(cls, u, l):
+# type: (Type[_Tlocalstr], Text, bytes) -> _Tlocalstr
 s = bytes.__new__(cls, l)
 s._utf8 = u
 return s
 def __hash__(self):
 >>> assert safelocalstr(b'\\xc3') in {b'\\xc3': 0}
 """
 def tolocal(s):
+# type: (Text) -> bytes
 """
 Convert a string from internal UTF-8 to local encoding
 All internal strings should be UTF-8 but some repos before the
 implementation of locale support may contain latin1 or possibly
 except LookupError as k:
 raise error.Abort(k, hint=b"please check your locale settings")
 def fromlocal(s):
+# type: (bytes) -> Text
 """
 Convert a string from the local character encoding to UTF-8
 We attempt to decode strings using the encoding mode set by
 HGENCODINGMODE, which defaults to 'strict'. In this mode, unknown
 except LookupError as k:
 raise error.Abort(k, hint=b"please check your locale settings")
 def unitolocal(u):
+# type: (Text) -> bytes
 """Convert a unicode string to a byte string of local encoding"""
 return tolocal(u.encode('utf-8'))
 def unifromlocal(s):
+# type: (bytes) -> Text
 """Convert a byte string of local encoding to a unicode string"""
 return fromlocal(s).decode('utf-8')
 def unimethod(bytesfunc):
+# type: (Callable[[Any], bytes]) -> Callable[[Any], Text]
 """Create a proxy method that forwards __unicode__() and __str__() of
 Python 3 to __bytes__()"""
 def unifunc(obj):
 return unifromlocal(bytesfunc(obj))
 or b"WF"
 )
 def colwidth(s):
+# type: (bytes) -> int
 b"Find the column width of a string for display in the local encoding"
 return ucolwidth(s.decode(_sysstr(encoding), r'replace'))
 def ucolwidth(d):
+# type: (Text) -> int
 b"Find the column width of a Unicode string for display"
 eaw = getattr(unicodedata, 'east_asian_width', None)
 if eaw is not None:
 return sum([eaw(c) in _wide and 2 or 1 for c in d])
 return len(d)
 def getcols(s, start, c):
+# type: (bytes, int, int) -> bytes
 '''Use colwidth to find a c-column substring of s starting at byte
 index start'''
 for x in pycompat.xrange(start + c, len(s)):
 t = s[start:x]
 if colwidth(t) == c:
 return t
 def trim(s, width, ellipsis=b'', leftside=False):
+# type: (bytes, int, bytes, bool) -> bytes
 """Trim string 's' to at most 'width' columns (including 'ellipsis').
 If 'leftside' is True, left side of string 's' is trimmed.
 'ellipsis' is always placed at trimmed side.
 return concat(usub.encode(_sysstr(encoding)))
 return ellipsis  # no enough room for multi-column characters
 def lower(s):
+# type: (bytes) -> bytes
 b"best-effort encoding-aware case-folding of local string s"
 try:
 return asciilower(s)
 except UnicodeDecodeError:
 pass
 except LookupError as k:
 raise error.Abort(k, hint=b"please check your locale settings")
 def upper(s):
+# type: (bytes) -> bytes
 b"best-effort encoding-aware case-folding of local string s"
 try:
 return asciiupper(s)
 except UnicodeDecodeError:
 return upperfallback(s)
 def upperfallback(s):
+# type: (Any) -> Any
 try:
 if isinstance(s, localstr):
 u = s._utf8.decode("utf-8")
 else:
 u = s.decode(_sysstr(encoding), _sysstr(encodingmode))
 upper = 1
 other = 0
 def jsonescape(s, paranoid=False):
+# type: (Any, Any) -> Any
 '''returns a string suitable for JSON
 JSON is problematic for us because it doesn't support non-Unicode
 bytes. To deal with this, we take the following approach:
 _utf8len = [0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 2, 2, 3, 4]
 def getutf8char(s, pos):
+# type: (Any, Any) -> Any
 '''get the next full utf-8 character in the given string, starting at pos
 Raises a UnicodeError if the given location does not start a valid
 utf-8 character.
 '''
 c.decode("utf-8", _utf8strict)
 return c
 def toutf8b(s):
+# type: (Any) -> Any
 '''convert a local, possibly-binary string into UTF-8b
 This is intended as a generic method to preserve data when working
 with schemes like JSON and XML that have no provision for
 arbitrary byte strings. As Mercurial often doesn't know
 r += c
 return r
 def fromutf8b(s):
+# type: (Text) -> bytes
 '''Given a UTF-8b string, return a local, possibly-binary string.
 return the original binary string. This
 is a round-trip process for strings like filenames, but metadata
 that's was passed through tolocal will remain in UTF-8.

Mercurial > public > mercurial-scm > hg-stable

comparison mercurial/encoding.py @ 43544:2ade00f3b03b