Hmm! I thought I checked this in before! Oh well.

Added new heapify() function, which transforms an arbitrary list into a heap in linear time; that's a fundamental tool for using heaps in real life <wink>. Added heapyify() test. Added a "less naive" N-best algorithm to the test suite, and noted that this could actually go much faster (building on heapify()) if we had max-heaps instead of min-heaps (the iterative method is appropriate when all the data isn't known in advance, but when it is known in advance the tradeoffs get murkier).
2025-08-31 14:07:50 +00:00 · 2002-08-02 21:48:06 +00:00 · 2002-08-02 21:48:06 +00:00 · 28c25527c2
commit 28c25527c2
parent 940dc922c0
2 changed files with 48 additions and 10 deletions
--- a/Lib/test/test_heapq.py
+++ b/Lib/test/test_heapq.py
@ -2,7 +2,7 @@

 from test.test_support import verify, vereq, verbose, TestFailed

-from heapq import heappush, heappop
+from heapq import heappush, heappop, heapify
 import random

 def check_invariant(heap):
@ -40,6 +40,24 @@ def test_main():
            heappop(heap)
    heap.sort()
    vereq(heap, data_sorted[-10:])
+    # 4) Test heapify.
+    for size in range(30):
+        heap = [random.random() for dummy in range(size)]
+        heapify(heap)
+        check_invariant(heap)
+    # 5) Less-naive "N-best" algorithm, much faster (if len(data) is big
+    #    enough <wink>) than sorting all of data.  However, if we had a max
+    #    heap instead of a min heap, it would go much faster still via
+    #    heapify'ing all of data (linear time), then doing 10 heappops
+    #    (10 log-time steps).
+    heap = data[:10]
+    heapify(heap)
+    for item in data[10:]:
+        if item > heap[0]:  # this gets rarer and rarer the longer we run
+            heappush(heap, item)
+            heappop(heap)
+    heap.sort()
+    vereq(heap, data_sorted[-10:])
    # Make user happy
    if verbose:
        print "All OK"