mercurial-scm/hg-stable: mercurial/encoding.py comparison

comparison mercurial/encoding.py @ 30033:02dbfaa6df0b

py3: convert encoding name and mode to str. Otherwise, tolocal() and fromlocal() wouldn't work on Python 3. Even so, tolocal() still can't make a valid localstr object because localstr inherits from str, but it can at least return some object without raising exceptions. Since Py3 bytes() behaves much more like bytearray() than like the str() of Py2, we can't simply do s/str/bytes/g. I have no good idea how to handle the str/bytes divergence.

author	Yuya Nishihara <yuya@tcha.org>
date	Wed, 28 Sep 2016 20:39:06 +0900
parents	0f6d6fdd3c2a
children	e4a6b439acc5

comparison

equal deleted inserted replaced

-:2219f4f82ede
+:02dbfaa6df0b
 from . import (
 error,
 pycompat,
 )
+_sysstr = pycompat.sysstr
 if pycompat.ispy3:
 unichr = chr
 # These unicode characters are ignored by HFS+ (Apple Technote 1150,
 # make sure string is actually stored in UTF-8
 u = s.decode('UTF-8')
 if encoding == 'UTF-8':
 # fast path
 return s
-r = u.encode(encoding, "replace")
+r = u.encode(_sysstr(encoding), u"replace")
-if u == r.decode(encoding):
+if u == r.decode(_sysstr(encoding)):
 # r is a safe, non-lossy encoding of s
 return r
 return localstr(s, r)
 except UnicodeDecodeError:
 # we should only get here if we're looking at an ancient changeset
 try:
-u = s.decode(fallbackencoding)
+u = s.decode(_sysstr(fallbackencoding))
-r = u.encode(encoding, "replace")
+r = u.encode(_sysstr(encoding), u"replace")
-if u == r.decode(encoding):
+if u == r.decode(_sysstr(encoding)):
 # r is a safe, non-lossy encoding of s
 return r
 return localstr(u.encode('UTF-8'), r)
 except UnicodeDecodeError:
 u = s.decode("utf-8", "replace") # last ditch
-return u.encode(encoding, "replace") # can't round-trip
+# can't round-trip
+return u.encode(_sysstr(encoding), u"replace")
 except LookupError as k:
 raise error.Abort(k, hint="please check your locale settings")
 def fromlocal(s):
 """
 # can we do a lossless round-trip?
 if isinstance(s, localstr):
 return s._utf8
 try:
-return s.decode(encoding, encodingmode).encode("utf-8")
+u = s.decode(_sysstr(encoding), _sysstr(encodingmode))
+return u.encode("utf-8")
 except UnicodeDecodeError as inst:
 sub = s[max(0, inst.start - 10):inst.start + 10]
 raise error.Abort("decoding near '%s': %s!" % (sub, inst))
 except LookupError as k:
 raise error.Abort(k, hint="please check your locale settings")
 wide = (os.environ.get("HGENCODINGAMBIGUOUS", "narrow") == "wide"
 and "WFA" or "WF")
 def colwidth(s):
 "Find the column width of a string for display in the local encoding"
-return ucolwidth(s.decode(encoding, 'replace'))
+return ucolwidth(s.decode(_sysstr(encoding), u'replace'))
 def ucolwidth(d):
 "Find the column width of a Unicode string for display"
 eaw = getattr(unicodedata, 'east_asian_width', None)
 if eaw is not None:
 +++
 >>> print trim(t, 1, ellipsis=ellipsis)
 +
 """
 try:
-u = s.decode(encoding)
+u = s.decode(_sysstr(encoding))
 except UnicodeDecodeError:
 if len(s) <= width: # trimming is not needed
 return s
 width -= len(ellipsis)
 if width <= 0: # no enough room even for ellipsis
 uslice = lambda i: u[:-i]
 concat = lambda s: s + ellipsis
 for i in xrange(1, len(u)):
 usub = uslice(i)
 if ucolwidth(usub) <= width:
-return concat(usub.encode(encoding))
+return concat(usub.encode(_sysstr(encoding)))
 return ellipsis # no enough room for multi-column characters
 def _asciilower(s):
 '''convert a string to lowercase if ASCII
 pass
 try:
 if isinstance(s, localstr):
 u = s._utf8.decode("utf-8")
 else:
-u = s.decode(encoding, encodingmode)
+u = s.decode(_sysstr(encoding), _sysstr(encodingmode))
 lu = u.lower()
 if u == lu:
 return s # preserve localstring
-return lu.encode(encoding)
+return lu.encode(_sysstr(encoding))
 except UnicodeError:
 return s.lower() # we don't know how to fold this except in ASCII
 except LookupError as k:
 raise error.Abort(k, hint="please check your locale settings")
 def upperfallback(s):
 try:
 if isinstance(s, localstr):
 u = s._utf8.decode("utf-8")
 else:
-u = s.decode(encoding, encodingmode)
+u = s.decode(_sysstr(encoding), _sysstr(encodingmode))
 uu = u.upper()
 if u == uu:
 return s # preserve localstring
-return uu.encode(encoding)
+return uu.encode(_sysstr(encoding))
 except UnicodeError:
 return s.upper() # we don't know how to fold this except in ASCII
 except LookupError as k:
 raise error.Abort(k, hint="please check your locale settings")

Mercurial > public > mercurial-scm > hg-stable

comparison mercurial/encoding.py @ 30033:02dbfaa6df0b