added heap implementations, experimental scripts, results and plots

5b11ae58 · Maria Hartmann · 08a1489f · 5b11ae58 · 5b11ae58 · 5b11ae58
Commit 5b11ae58 authored 4 years ago by Maria Hartmann
--- a/paper-sorting-subseq-new.py
+++ b/paper-sorting-subseq-new.py
+#!/usr/bin/python3
+from random import shuffle
+import random
+import numpy as np
+import matplotlib.pyplot as plt
+import sys
+import signal
+import copy
+import math
+import csv
+from node import Node
+from pairing_heap import PairingHeap
+from pairing_heap_interface import PairingHeapInterface
+from pairing_heap_standard import PairingHeapStandard
+from variants.pairing_heap_multipass import PairingHeapMultipass
+from variants.pairing_heap_ftb import PairingHeapFTB
+from variants.pairing_heap_btf import PairingHeapBTF
+from variants.pairing_heap_lazy import PairingHeapLazy
+from variants.pairing_heap_standard_stable import PairingHeapStandardStable
+from variants.pairing_heap_ftb_stable import PairingHeapFTBStable
+from variants.pairing_heap_btf_stable import PairingHeapBTFStable
+from variants.pairing_heap_multipass_stable import PairingHeapMultipassStable
+from variants.pairing_heap_lazy_stable import PairingHeapLazyStable
+from pairing_heap_smooth import PairingHeapSmooth
+from variants.pairing_heap_smooth_unstable import PairingHeapSmoothUnstable
+from smooth_heap_corey import SmoothHeapCorey
+COUNT_TYPE_BOTH = 0
+COUNT_TYPE_LINKS = -1
+COUNT_TYPE_COMPS = -2
+MAXSIZE = 17
+NUMBER_TESTS = 20  # number of tests to run
+TEST_SIZES = [j for j in range(MAXSIZE)]  
+LIST_LEN = 10000  # number of elements in test list
+TEST_SIZE = 10000  # number of elements in test list
+STEP_SIZE = 100
+INCREMENT_SUBSEQS = 100
+TYPES = {0: "Pairing", 12: "Smooth"} 
+MAX_TYPE_KEY = max(TYPES.keys())
+COLOURS = {0:'xkcd:fire engine red', 12:'xkcd:green'}
+SHADE_COLOURS = {0:'#fe4d4e', 12:'#58ab8e'}
+def isSorted(list0):
+    return all(list0[i] < list0[i + 1] for i in range(len(list0) - 1))
+def generateContSortedSubseq(llist, sublen):
+    listcopy = copy.copy(llist)
+    shuffle(listcopy)
+    res = []
+    l = 0
+    while l < len(llist):
+        clen = random.randint(1, sublen)
+        sublist = copy.copy(listcopy[l:min(l + clen, len(listcopy))])
+        sublist.sort()
+        res += sublist
+        l += clen
+    return res
+def plot_avg_counts(avgCounts):
+    # colours from https://xkcd.com/color/rgb/
+    MARKERS_COMP = {0:"o", 12:"^"}#https://matplotlib.org/3.1.1/api/markers_api.html
+    MARKERS_LINK = {0:"o", 12:"D"}
+    plt.figure('avg number of operations by heap type')
+    deviations = [fac*INCREMENT_SUBSEQS/200 for fac in range(1, math.ceil((TEST_SIZE/5)/INCREMENT_SUBSEQS), 1)]
+    deviations.reverse()
+    for k in TYPES.keys():
+        print(k)
+        avgComps = [acounts[k] for acounts in avgCounts[0]]
+        maxComps = [acounts[k] for acounts in avgCounts[2]]
+        minComps = [acounts[k] for acounts in avgCounts[4]]
+        plt.plot(deviations, avgComps, color=COLOURS[k], linestyle="-", marker=MARKERS_COMP[k], markerfacecolor=COLOURS[k], markersize=9, markeredgewidth=1, markeredgecolor='black', label=TYPES[k] + " comparisons")
+        plt.fill_between(deviations, minComps, maxComps, color=SHADE_COLOURS[k], alpha=.3)
+        avgLinks = [acounts[k] for acounts in avgCounts[1]]
+        maxLinks = [acounts[k] for acounts in avgCounts[3]]
+        minLinks = [acounts[k] for acounts in avgCounts[5]]
+        plt.plot(deviations, avgLinks, color=COLOURS[k], linestyle="--", marker=MARKERS_LINK[k], markerfacecolor=COLOURS[k], markersize=9, markeredgewidth=1, markeredgecolor='black', label=TYPES[k] + " links")
+        plt.fill_between(deviations, minLinks, maxLinks, color=SHADE_COLOURS[k], alpha=.3)
+    plt.xlabel('Avg. length of sorted blocks, % of size', fontsize=26)
+    plt.ylabel('Avg. number of operations / size', fontsize=26)
+    plt.xticks(fontsize=20)
+    plt.yticks(fontsize=20)
+    plt.rc('legend',fontsize=26) # using a size in points
+    plt.legend()
+    plt.grid(True)
+    plt.gca().invert_xaxis()
+    figure = plt.gcf()  # get current figure
+    figure.set_size_inches(16, 18)  # set figure's size manually to full screen
+    plt.savefig('plots/paper-sorting-subseq-new.svg', bbox_inches='tight')  # bbox_inches removes extra white spaces
+    plt.legend(loc='best')
+    plt.show()
+def export_results(params, results, countType, heapTypes, filename="dijkstra"):
+    #  exports results of simulation as separate .csv files, one for links and one for comparisons, into /data directory
+    #  each row contains randomness parameter value; plus one column containing the number of operations for each heap type
+    if countType == COUNT_TYPE_BOTH:
+        with open("data/" + filename + '-comps.csv', 'w', newline='') as csvfile:
+            csvwriter = csv.writer(csvfile, delimiter=';', quotechar='|', quoting=csv.QUOTE_MINIMAL)
+            csvwriter.writerow(["randomness parameter value"] + [name for name in TYPES.values()])
+            csvwriter.writerow(["randomness parameter value"] + [name for name in TYPES.keys()])
+            for i in range(len(results[0])):
+                row = [params[i]] + [results[0][i][k] for k in TYPES.keys()]
+                csvwriter.writerow(row)
+        with open("data/" + filename + '-links.csv', 'w', newline='') as csvfile:
+            csvwriter = csv.writer(csvfile, delimiter=';', quotechar='|', quoting=csv.QUOTE_MINIMAL)
+            csvwriter.writerow(["randomness parameter value"] + [name for name in TYPES.values()])
+            csvwriter.writerow(["randomness parameter value"] + [name for name in TYPES.keys()])
+            for i in range(len(results[1])):
+                row = [params[i]] + [results[1][i][k] for k in TYPES.keys()]
+                csvwriter.writerow(row)
+    else:
+        fn = "data/" + filename + '-links.csv' if countType == COUNT_TYPE_LINKS else "data/" + filename + '-comps.csv'
+        with open(fn, 'w', newline='') as csvfile:
+            csvwriter = csv.writer(csvfile, delimiter=';', quotechar='|', quoting=csv.QUOTE_MINIMAL)
+            csvwriter.writerow(["randomness parameter value"] + [name for name in TYPES.values()])
+            csvwriter.writerow(["randomness parameter value"] + [name for name in TYPES.keys()])
+            for i in range(len(results)):
+                row = [params[i]] + [results[i][k] for k in TYPES.keys()]
+                csvwriter.writerow(row)
+if __name__ == "__main__":
+    testOutputCount = []
+    avgLinksPerSize = []
+    avgCompsPerSize = []
+    maxLinksPerSize = []
+    maxCompsPerSize = []
+    minLinksPerSize = []
+    minCompsPerSize = []
+    sortedInput = []
+    # testInput = []
+    # ----------continuous sorted subsequences inputs-----
+    # randomness parameter: subsequence lengths
+    params = [fac*INCREMENT_SUBSEQS for fac in range(1, math.ceil((TEST_SIZE/5)/INCREMENT_SUBSEQS), 1)]
+    params.reverse()
+    for x in params:
+        sortedInput = [k for k in range(LIST_LEN)]
+        avgCountsLinks = [0 for _ in range(MAX_TYPE_KEY + 1)]
+        avgCountsComps = [0 for _ in range(MAX_TYPE_KEY + 1)]
+        maxCountsLinks = [0 for _ in range(MAX_TYPE_KEY + 1)]
+        maxCountsComps = [0 for _ in range(MAX_TYPE_KEY + 1)]
+        minCountsLinks = [1000000000000 for _ in range(MAX_TYPE_KEY + 1)]
+        minCountsComps = [1000000000000 for _ in range(MAX_TYPE_KEY + 1)]
+        for zz in range(NUMBER_TESTS):
+            testInput = generateContSortedSubseq(sortedInput, x)
+            #print(len(testInput))
+            for heapType in TYPES.keys():
+                linkCount = 0
+                compCount = 0
+                testOutput = []
+                heap = PairingHeap(heapType, COUNT_TYPE_BOTH)
+                heap.make_heap()
+                for element in testInput:
+                    node = Node(element)
+                    (cc, lc) = heap.insert(node)
+                for i in range(len(testInput)):
+                    (minNode, cc, lc) = heap.delete_min()
+                    testOutput += [minNode.key]
+                    compCount += cc
+                    linkCount += lc
+                if isSorted(testOutput):  # sanity check
+			        #divide by size for visualization
+                    avgCountsLinks[heapType] += (linkCount/LIST_LEN) / NUMBER_TESTS
+                    avgCountsComps[heapType] += (compCount/LIST_LEN) / NUMBER_TESTS
+                    maxCountsLinks[heapType] = max(maxCountsLinks[heapType],linkCount/LIST_LEN)
+                    maxCountsComps[heapType] = max(maxCountsComps[heapType],compCount/LIST_LEN)
+                    minCountsLinks[heapType] = min(minCountsLinks[heapType],linkCount/LIST_LEN)
+                    minCountsComps[heapType] = min(minCountsComps[heapType],compCount/LIST_LEN)
+                else:
+                    raise Exception("Invalid result for {}".format(TYPES[heapType]))
+                print("[{}: {}, {}/{}] \t Links: {} \t Comps: {}".format(
+                    TYPES[heapType], x, zz+1, NUMBER_TESTS, linkCount, compCount))
+        for heapType in TYPES.keys():
+            print("[{}: {}, avg] \t Links: {} \t Comps: {}".format(TYPES[heapType], x, avgCountsLinks[heapType], avgCountsComps[heapType]))
+        avgLinksPerSize += [avgCountsLinks]
+        avgCompsPerSize += [avgCountsComps]
+        maxLinksPerSize += [maxCountsLinks]
+        maxCompsPerSize += [maxCountsComps]
+        minLinksPerSize += [minCountsLinks]
+        minCompsPerSize += [minCountsComps]
+    plot_avg_counts([avgCompsPerSize, avgLinksPerSize, maxCompsPerSize, maxLinksPerSize, minCompsPerSize, minLinksPerSize])
+    export_results(params, [avgCompsPerSize, avgLinksPerSize], COUNT_TYPE_BOTH, TYPES, "sorting-subseq-new")
--- a/plots/paper-dijkstra-new.svg
+++ b/plots/paper-dijkstra-new.svg
--- a/plots/paper-dijkstra2-new.svg
+++ b/plots/paper-dijkstra2-new.svg
--- a/plots/paper-permutation-localized.pdf
+++ b/plots/paper-permutation-localized.pdf
--- a/plots/paper-permutation-localized.svg
+++ b/plots/paper-permutation-localized.svg
--- a/plots/paper-permutation-separable.pdf
+++ b/plots/paper-permutation-separable.pdf
--- a/plots/paper-permutation-separable.svg
+++ b/plots/paper-permutation-separable.svg
--- a/plots/paper-permutation-subseq.pdf
+++ b/plots/paper-permutation-subseq.pdf
--- a/plots/paper-permutation-subseq.svg
+++ b/plots/paper-permutation-subseq.svg
--- a/plots/paper-permutation-uniform.pdf
+++ b/plots/paper-permutation-uniform.pdf
--- a/plots/paper-permutation-uniform.svg
+++ b/plots/paper-permutation-uniform.svg
--- a/plots/paper-sorting-loc-new.pdf
+++ b/plots/paper-sorting-loc-new.pdf
--- a/plots/paper-sorting-loc-new.svg
+++ b/plots/paper-sorting-loc-new.svg
--- a/plots/paper-sorting-sep-new.pdf
+++ b/plots/paper-sorting-sep-new.pdf
--- a/plots/paper-sorting-sep-new.svg
+++ b/plots/paper-sorting-sep-new.svg
--- a/plots/paper-sorting-subseq-new.pdf
+++ b/plots/paper-sorting-subseq-new.pdf
--- a/plots/paper-sorting-subseq-new.svg
+++ b/plots/paper-sorting-subseq-new.svg
--- a/plots/paper-sorting-uniform-new.pdf
+++ b/plots/paper-sorting-uniform-new.pdf
--- a/plots/paper-sorting-uniform-new.svg
+++ b/plots/paper-sorting-uniform-new.svg
--- a/smooth_heap.py
+++ b/smooth_heap.py