dis/gen_input.py


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117

#!/usr/bin/python3
#####
# Copyright 2020 Joshua Bakita
#
# This program generates input data for the DIS benchmark suite on stdout
# given a requested working set size.
#####


from ctypes import sizeof, c_double, c_int, c_short
from math import sqrt, floor
import sys # For argv and stderr

USAGE = """Usage: {} <benchmark> <template> <WSS in bytes>"""

# Check input
if (len(sys.argv) < 4):
    print(USAGE.format(sys.argv[0]), file=sys.stderr)
    exit(1);

# Don't try to understand the logic in these functions, see WSS_DOCS.md
def setup_field(params, wss):
    params[0] = wss
    return params

def setup_matrix(params, wss):
    nnZR = 0.80 # 8% seems average, but it's too fast to compute. Use 80%.
    si = sizeof(c_int)
    sd = sizeof(c_double)
    # s is size double, i is size int, z in nnZR
    # This formula is out of a solver
    d = (sqrt(sd*sd*(81-4*nnZR) + 4*sd*(wss - si*nnZR + 9*si) - 4) - 9*sd - 2*si) / (2*sd)
    params[1] = floor(d);
    # Make sure that we don't add more elements than the matrix size
    params[2] = floor(d*d*nnZR)
    # Set error as low as possible to slow things down
    params[4] = 1.0e-7
    if params[1] <= 0 or params[2] <= 0:
        raise Exception("WSS too small for matrix benchmark!")
    return params

def setup_neighborhood(params, wss):
    bitDepth = 15
    bitDepthAlloc = sizeof(c_int) * (2**(bitDepth + 1) - 1)
    dim = sqrt((wss - bitDepthAlloc) / sizeof(c_short))
    params[1] = bitDepth
    params[2] = floor(dim)
    if params[1] <= 0 or params[2] <= 0:
        raise Exception("WSS too small for neighborhood benchmark!")
    # Cap maximum line thinkness to the image size
    params[5] = min(params[2]-1, int(params[5]))
    # Cap line lengths to the image size
    params[6] = min(params[2]-1, int(params[6]))
    params[7] = min(params[2]-1, int(params[7]))
    return params

def setup_pointer(params, wss):
    n = 1; # Only use one "thread"
    f = (wss - sizeof(c_int) * 4 * n) / sizeof(c_int)
    params[0] = floor(f)
    params[4] = floor(n)
    if params[0] <= 0 or params[4] <= 0:
        raise Exception("WSS too small for pointer benchmark!")
    return params

def setup_transitive(params, wss):
    n = sqrt(wss / (sizeof(c_int) * 2))
    params[0] = floor(n)
    # Fix edges at 50%
    params[1] = floor(params[0] * 0.5)
    if params[0] <= 0:
        raise Exception("WSS too small for transitive benchmark!")
    return params

def setup_update(params, wss):
    f = wss / sizeof(c_int)
    params[0] = floor(f)
    if params[0] <= 0:
        raise Exception("WSS too small for update benchmark!")
    # Don't do more than 10M hops (keeps time array feasible)
    params[2] = min(10000000, int(params[2]))
    # Enforce size requirements
    params[4] = min(params[0]-1, int(params[4]))
    params[5] = min(params[0]-1, int(params[5]))
    params[6] = min(params[0]-1, int(params[6]))
    return params

def setup_random_walk(params, wss):
    params[0] = wss
    return params

BENCH_TO_PARAMS = {"field":setup_field, "matrix":setup_matrix, "neighborhood":setup_neighborhood, "pointer":setup_pointer, "transitive":setup_transitive, "update":setup_update, "random_walk":setup_random_walk}

# Main logic
benchmark_name = sys.argv[1]
if benchmark_name not in BENCH_TO_PARAMS.keys():
    print("Invalid benchmark name.", file=sys.stderr)
    exit(2)

wss = int(sys.argv[3])
if wss <= 0:
    print("Invalid working set size", file=sys.stderr)
    exit(3)

with open(sys.argv[2], "r") as template:
    # We expect the initialization params to all be on the first line
    params = template.readline().split()
    mutated_params = BENCH_TO_PARAMS[benchmark_name](params, wss);
    print("Using", " ".join(map(lambda x: str(x), mutated_params)), "for", benchmark_name, "stressmark", file=sys.stderr)
    print(" ".join(map(lambda x: str(x), mutated_params)))
    if benchmark_name == "pointer":
        # Clone the data format used in the template
        for i in range(0,10):
            print("10 " + str(mutated_params[0]-10) + " " + str(mutated_params[0]-10))
    else:
        print(template.read())