    pygments.lexers.special
    ~~~~~~~~~~~~~~~~~~~~~~~

    Special lexers.

    :copyright: Copyright 2006-2021 by the Pygments team, see AUTHORS.
    :license: BSD, see LICENSE for details.
"""

import re
from io import BytesIO
# ...

        self.compress = get_choice_opt(options, 'compress',
                                       ['', 'none', 'gz', 'bz2'], '')
        Lexer.__init__(self, **options)
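
    # ``text`` may be str or bytes.  With the ``compress`` option set, the
    # input is treated as a gzip- or bz2-compressed byte stream and is
    # decompressed first; latin1 is used for the byte/str conversions
    # because it maps the code points 0-255 to bytes losslessly.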
    def get_tokens(self, text):
        if self.compress:
            if isinstance(text, str):
                text = text.encode('latin1')
            if self.compress == 'gz':
                import gzip
                gzipfile = gzip.GzipFile('', 'rb', 9, BytesIO(text))
                text = gzipfile.read()
            elif self.compress == 'bz2':
                import bz2
                text = bz2.decompress(text)
            text = text.decode('latin1')

        # do not call Lexer.get_tokens() because stripping is not optional.
        text = text.strip('\n') + '\n'
        for i, t, v in self.get_tokens_unprocessed(text):
            yield t, v
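
    # Each line of a raw token stream has the form
    #     Token.Literal.Number<TAB>'repr of the token value'
    # as produced by pygments.formatters.RawTokenFormatter.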
    def get_tokens_unprocessed(self, text):
        length = 0
        for match in line_re.finditer(text):
            try:
                ttypestr, val = match.group().rstrip().split('\t', 1)
            except ValueError:
                val = match.group()
                ttype = Error
            else:
                ttype = _ttype_cache.get(ttypestr)
                if not ttype:
                    # resolve the dotted token name attribute by attribute,
                    # starting from the root Token, and cache the result
                    ttype = Token
                    ttypes = ttypestr.split('.')[1:]
                    for ttype_ in ttypes:
                        if not ttype_ or not ttype_[0].isupper():
                            raise ValueError('malformed token name')
                        ttype = getattr(ttype, ttype_)
                    _ttype_cache[ttypestr] = ttype
                # strip the repr quotes and undo the string escaping
                val = val[1:-1].encode().decode('unicode-escape')
            yield length, ttype, val
            length += len(val)
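

if __name__ == '__main__':
    # A minimal round-trip sketch (an illustration, not part of the original
    # module): RawTokenFormatter emits the tab-separated raw token stream
    # that RawTokenLexer parses back into tokens.
    from pygments import highlight
    from pygments.lexers import PythonLexer
    from pygments.formatters import NullFormatter, RawTokenFormatter

    source = 'print("hi")\n'
    raw = highlight(source, PythonLexer(), RawTokenFormatter())  # bytes
    # Re-lexing the raw stream and joining the token values via NullFormatter
    # should reproduce the original source text.
    restored = highlight(raw.decode('latin1'), RawTokenLexer(), NullFormatter())
    assert restored == source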