summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorTim Peters <tim.peters@gmail.com>2006-06-13 03:30:07 (GMT)
committerTim Peters <tim.peters@gmail.com>2006-06-13 03:30:07 (GMT)
commit7ca6677218e7e31fa6a6629c4fe6d052de22793c (patch)
treebb183c9f32535d1cf62bcebef84c70f007d3e5b3
parent2adc626bb515be2b6c6c0657d5db48933895593a (diff)
downloadcpython-7ca6677218e7e31fa6a6629c4fe6d052de22793c.zip
cpython-7ca6677218e7e31fa6a6629c4fe6d052de22793c.tar.gz
cpython-7ca6677218e7e31fa6a6629c4fe6d052de22793c.tar.bz2
get_matching_blocks(): rewrote code & comments so they match; added
more comments about why it's this way at all; and removed what looked like needless expense (sorting (i, j, k) triples directly should give exactly the same order as sorting (i, (i, j, k)) pairs).
-rw-r--r--Lib/difflib.py28
1 files changed, 14 insertions, 14 deletions
diff --git a/Lib/difflib.py b/Lib/difflib.py
index 39bb2d9..9a90710 100644
--- a/Lib/difflib.py
+++ b/Lib/difflib.py
@@ -474,30 +474,30 @@ class SequenceMatcher:
if self.matching_blocks is not None:
return self.matching_blocks
la, lb = len(self.a), len(self.b)
-
- indexed_blocks = []
+ self.matching_blocks = matching_blocks = []
+
+ # This is most naturally expressed as a recursive algorithm, but
+ # at least one user bumped into extreme use cases that exceeded
+ # the recursion limit on their box. So, now we maintain a list
+ # ('queue`) of blocks we still need to look at, and append partial
+ # results to `matching_blocks` in a loop; the matches are sorted
+ # at the end.
queue = [(0, la, 0, lb)]
while queue:
- # builds list of matching blocks covering a[alo:ahi] and
- # b[blo:bhi], appending them in increasing order to answer
alo, ahi, blo, bhi = queue.pop()
-
+ i, j, k = x = self.find_longest_match(alo, ahi, blo, bhi)
# a[alo:i] vs b[blo:j] unknown
# a[i:i+k] same as b[j:j+k]
# a[i+k:ahi] vs b[j+k:bhi] unknown
- i, j, k = x = self.find_longest_match(alo, ahi, blo, bhi)
-
- if k:
+ if k: # if k is 0, there was no matching block
+ matching_blocks.append(x)
if alo < i and blo < j:
queue.append((alo, i, blo, j))
- indexed_blocks.append((i, x))
if i+k < ahi and j+k < bhi:
queue.append((i+k, ahi, j+k, bhi))
- indexed_blocks.sort()
-
- self.matching_blocks = [elem[1] for elem in indexed_blocks]
- self.matching_blocks.append( (la, lb, 0) )
- return self.matching_blocks
+ matching_blocks.sort()
+ matching_blocks.append( (la, lb, 0) )
+ return matching_blocks
def get_opcodes(self):
"""Return list of 5-tuples describing how to turn a into b.