path: root/Lib
author    Terry Jan Reedy <tjreedy@udel.edu>    2014-02-17 21:45:48 (GMT)
committer Terry Jan Reedy <tjreedy@udel.edu>    2014-02-17 21:45:48 (GMT)
commit 5e6db313686c200da425a54d2e0c95fa40107b1d (patch)
tree   5586a30aaf9f83a3a1e2f7996773487366baa6e1 /Lib
parent cf626032763077bf959937705ed35f9e2b40a862 (diff)
Untokenize: A logically incorrect assert tested user input validity.
Replace it with correct logic that raises ValueError for bad input. Issues #8478 and #12691 reported the incorrect logic. Add an Untokenize test case and an initial test method.
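A minimal sketch (not part of the commit) of the new behavior, using the module-level Untokenizer class that the new test also imports:

from tokenize import Untokenizer

u = Untokenizer()
u.prev_row, u.prev_col = 2, 2      # pretend the previous token ended at (2, 2)
try:
    u.add_whitespace((1, 3))       # a start position that precedes (2, 2)
except ValueError as exc:
    print(exc)                     # start (1,3) precedes previous end (2,2)

The old assert had its comparison inverted, so it could reject valid input while letting out-of-order input through, and it disappeared entirely under python -O; the explicit ValueError check survives -O and names the offending positions.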
Diffstat (limited to 'Lib')
-rw-r--r--    Lib/test/test_tokenize.py    16
-rw-r--r--    Lib/tokenize.py               4
2 files changed, 18 insertions, 2 deletions
diff --git a/Lib/test/test_tokenize.py b/Lib/test/test_tokenize.py
index 6ed8597..df4e165 100644
--- a/Lib/test/test_tokenize.py
+++ b/Lib/test/test_tokenize.py
@@ -638,7 +638,7 @@ Legacy unicode literals:
from test import support
from tokenize import (tokenize, _tokenize, untokenize, NUMBER, NAME, OP,
                      STRING, ENDMARKER, ENCODING, tok_name, detect_encoding,
-                     open as tokenize_open)
+                     open as tokenize_open, Untokenizer)
from io import BytesIO
from unittest import TestCase
import os, sys, glob
@@ -1153,6 +1153,19 @@ class TestTokenize(TestCase):
        # See http://bugs.python.org/issue16152
        self.assertExactTypeEqual('@ ', token.AT)

+class UntokenizeTest(TestCase):
+
+    def test_bad_input_order(self):
+        u = Untokenizer()
+        u.prev_row = 2
+        u.prev_col = 2
+        with self.assertRaises(ValueError) as cm:
+            u.add_whitespace((1,3))
+        self.assertEqual(cm.exception.args[0],
+                'start (1,3) precedes previous end (2,2)')
+        self.assertRaises(ValueError, u.add_whitespace, (2,1))
+
+
__test__ = {"doctests" : doctests, 'decistmt': decistmt}

def test_main():
@@ -1162,6 +1175,7 @@ def test_main():
    support.run_unittest(Test_Tokenize)
    support.run_unittest(TestDetectEncoding)
    support.run_unittest(TestTokenize)
+    support.run_unittest(UntokenizeTest)

if __name__ == "__main__":
    test_main()
diff --git a/Lib/tokenize.py b/Lib/tokenize.py
index 294bf9a..c156450 100644
--- a/Lib/tokenize.py
+++ b/Lib/tokenize.py
@@ -229,7 +229,9 @@ class Untokenizer:
    def add_whitespace(self, start):
        row, col = start
-        assert row <= self.prev_row
+        if row < self.prev_row or row == self.prev_row and col < self.prev_col:
+            raise ValueError("start ({},{}) precedes previous end ({},{})"
+                             .format(row, col, self.prev_row, self.prev_col))
        col_offset = col - self.prev_col
        if col_offset:
            self.tokens.append(" " * col_offset)
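For context, a hedged round-trip sketch (also not part of the commit): a well-ordered token stream still untokenizes as before, and only positions that move backwards hit the new ValueError.

import io, tokenize

src = b"x = 1 + 2\n"
toks = list(tokenize.tokenize(io.BytesIO(src).readline))
assert tokenize.untokenize(toks) == src   # ordered input round-trips unchanged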