about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Terry Jan Reedy <tjreedy@udel.edu> 2014-02-17 23:12:16 -0500
committer: Terry Jan Reedy <tjreedy@udel.edu> 2014-02-17 23:12:16 -0500
commit: 5b8d2c3af76e704926cf5915ad0e6af59a232e61 (patch)
tree: fe41f651e48dad3c4b79e363ebe8b3f51a5d48fc /Lib/tokenize.py
parent: whitespace (diff)
download: cpython-5b8d2c3af76e704926cf5915ad0e6af59a232e61.tar.gz
cpython-5b8d2c3af76e704926cf5915ad0e6af59a232e61.tar.bz2
cpython-5b8d2c3af76e704926cf5915ad0e6af59a232e61.zip
Issue #8478: Untokenizer.compat now processes first token from iterator input.
Patch based on lines from Georg Brandl, Eric Snow, and Gareth Rees.
Diffstat (limited to 'Lib/tokenize.py')
-rw-r--r-- Lib/tokenize.py 24
1 files changed, 11 insertions, 13 deletions
diff --git a/Lib/tokenize.py b/Lib/tokenize.py
index c156450d047..7356a88b217 100644
--- a/Lib/tokenize.py
+++ b/Lib/tokenize.py
@@ -25,12 +25,14 @@ __credits__ = ('GvR, ESR, Tim Peters, Thomas Wouters, Fred Drake, '
'Skip Montanaro, Raymond Hettinger, Trent Nelson, '
'Michael Foord')
import builtins
-import re
-import sys
-from token import *
from codecs import lookup, BOM_UTF8
import collections
from io import TextIOWrapper
+from itertools import chain
+import re
+import sys
+from token import *
+
cookie_re = re.compile(r'^[ \t\f]*#.*coding[:=][ \t]*([-\w.]+)', re.ASCII)
blank_re = re.compile(br'^[ \t\f]*(?:[#\r\n]|$)', re.ASCII)
@@ -237,9 +239,10 @@ class Untokenizer:
self.tokens.append(" " * col_offset)
def untokenize(self, iterable):
- for t in iterable:
+ it = iter(iterable)
+ for t in it:
if len(t) == 2:
- self.compat(t, iterable)
+ self.compat(t, it)
break
tok_type, token, start, end, line = t
if tok_type == ENCODING:
@@ -254,17 +257,12 @@ class Untokenizer:
return "".join(self.tokens)
def compat(self, token, iterable):
- startline = False
indents = []
toks_append = self.tokens.append
- toknum, tokval = token
-
- if toknum in (NAME, NUMBER):
- tokval += ' '
- if toknum in (NEWLINE, NL):
- startline = True
+ startline = token[0] in (NEWLINE, NL)
prevstring = False
- for tok in iterable:
+
+ for tok in chain([token], iterable):
toknum, tokval = tok[:2]
if toknum == ENCODING:
self.encoding = tokval