[pypy-svn] r66519 - in pypy/branch/parser-compiler/pypy/interpreter: pyparser test

benjamin at codespeak.net
Thu Jul 23 00:03:18 CEST 2009


Author: benjamin
Date: Thu Jul 23 00:03:17 2009
New Revision: 66519

Modified:
   pypy/branch/parser-compiler/pypy/interpreter/pyparser/pytokenizer.py
   pypy/branch/parser-compiler/pypy/interpreter/test/test_syntax.py
Log:
make the column of each token the start of the token rather than its end
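
For reference, CPython's stdlib tokenize module reports the column at which
each token starts; with this change the column field of pytokenizer's flat
token tuples follows the same convention. A minimal Python 2 illustration
(not part of this commit; it uses the stdlib tokenize, not pytokenizer):

    import tokenize
    from StringIO import StringIO

    source = "a b c\n"
    # CPython reports (row, col) of where each token *starts*.
    for type_, string, (srow, scol), end, line in \
            tokenize.generate_tokens(StringIO(source).readline):
        print string, scol
    # NAME tokens print: a 0, b 2, c 4 (NEWLINE and ENDMARKER follow)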

Modified: pypy/branch/parser-compiler/pypy/interpreter/pyparser/pytokenizer.py
==============================================================================
--- pypy/branch/parser-compiler/pypy/interpreter/pyparser/pytokenizer.py	(original)
+++ pypy/branch/parser-compiler/pypy/interpreter/pyparser/pytokenizer.py	Thu Jul 23 00:03:17 2009
@@ -96,14 +96,16 @@
             endmatch = endDFA.recognize(line)
             if endmatch >= 0:
                 pos = end = endmatch
-                tok = (tokens.STRING, contstr + line[:end], lnum, pos, line)
+                tok = (tokens.STRING, contstr + line[:end], strstart[0],
+                       strstart[1], line)
                 token_list.append(tok)
                 last_comment = ''
                 contstr, needcont = '', 0
                 contline = None
             elif (needcont and not line.endswith('\\\n') and
                                not line.endswith('\\\r\n')):
-                tok = (tokens.ERRORTOKEN, contstr + line, lnum, pos, line)
+                tok = (tokens.ERRORTOKEN, contstr + line, strstart[0],
+                       strstart[1], line)
                 token_list.append(tok)
                 last_comment = ''
                 contstr = ''
@@ -131,7 +133,7 @@
 
             if column > indents[-1]:           # count indents or dedents
                 indents.append(column)
-                token_list.append((tokens.INDENT, line[:pos], lnum, pos, line))
+                token_list.append((tokens.INDENT, line[:pos], lnum, 0, line))
                 last_comment = ''
             while column < indents[-1]:
                 indents = indents[:-1]
@@ -164,11 +166,11 @@
                 token, initial = line[start:end], line[start]
                 if initial in numchars or \
                    (initial == '.' and token != '.'):      # ordinary number
-                    token_list.append((tokens.NUMBER, token, lnum, pos, line))
+                    token_list.append((tokens.NUMBER, token, lnum, start, line))
                     last_comment = ''
                 elif initial in '\r\n':
                     if parenlev <= 0:
-                        tok = (tokens.NEWLINE, last_comment, lnum, pos, line)
+                        tok = (tokens.NEWLINE, last_comment, lnum, start, line)
                         token_list.append(tok)
                     last_comment = ''
                 elif initial == '#':
@@ -180,10 +182,11 @@
                     if endmatch >= 0:                     # all on one line
                         pos = endmatch
                         token = line[start:pos]
-                        tok = (tokens.STRING, token, lnum, pos, line)
+                        tok = (tokens.STRING, token, lnum, start, line)
                         token_list.append(tok)
                         last_comment = ''
                     else:
+                        strstart = (lnum, start)
                         contstr = line[start:]
                         contline = line
                         break
@@ -191,17 +194,19 @@
                     token[:2] in single_quoted or \
                     token[:3] in single_quoted:
                     if token[-1] == '\n':                  # continued string
+                        strstart = (lnum, start)
                         endDFA = (endDFAs[initial] or endDFAs[token[1]] or
                                    endDFAs[token[2]])
                         contstr, needcont = line[start:], 1
                         contline = line
                         break
                     else:                                  # ordinary string
-                        tok = (tokens.STRING, token, lnum, pos, line)
+                        tok = (tokens.STRING, token, lnum, start, line)
                         token_list.append(tok)
                         last_comment = ''
                 elif initial in namechars:                 # ordinary name
-                    token_list.append((tokens.NAME, token, lnum, pos, line))
+                    print token, start
+                    token_list.append((tokens.NAME, token, lnum, start, line))
                     last_comment = ''
                 elif initial == '\\':                      # continued stmt
                     continued = 1
@@ -217,7 +222,7 @@
                         punct = python_opmap[token]
                     else:
                         punct = tokens.OP
-                    token_list.append((punct, token, lnum, pos, line))
+                    token_list.append((punct, token, lnum, start, line))
                     last_comment = ''
             else:
                 start = whiteSpaceDFA.recognize(line, pos)
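
The strstart bookkeeping added above records the line and column where a
continued string opens, so the eventual STRING (or ERRORTOKEN) is attributed
to its opening quote rather than to the line on which it happens to end.
CPython's tokenize does the same; an illustrative Python 2 snippet (not part
of the commit):

    import tokenize
    from StringIO import StringIO

    src = 'x = """abc\ndef"""\n'
    for type_, string, start, end, line in \
            tokenize.generate_tokens(StringIO(src).readline):
        if type_ == tokenize.STRING:
            # prints (1, 4): the opening triple quote on line 1, column 4
            print start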

Modified: pypy/branch/parser-compiler/pypy/interpreter/test/test_syntax.py
==============================================================================
--- pypy/branch/parser-compiler/pypy/interpreter/test/test_syntax.py	(original)
+++ pypy/branch/parser-compiler/pypy/interpreter/test/test_syntax.py	Thu Jul 23 00:03:17 2009
@@ -640,7 +640,7 @@
         except SyntaxError, e:
             assert e.lineno == 4
             assert e.text.endswith('a b c d e\n')
-            assert e.offset == e.text.index('b') + 1
+            assert e.offset == e.text.index('b')
         else:
             raise Exception("no SyntaxError??")
 

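The test adjustment follows from the tokenizer change: the offset carried by
a SyntaxError on this branch is now the 0-based column at which the offending
token starts, so the "+ 1" is dropped. A hedged sketch of the expectation
(the source string and filename below are hypothetical; the code the test
actually compiles is not shown in this diff):

    try:
        compile("a b c d e\n", "<test>", "exec")
    except SyntaxError, e:
        # offset should be the 0-based start column of the bad token,
        # i.e. where 'b' begins
        assert e.offset == e.text.index('b')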