remove some of the unneeded parts

author: Bjoern Brandenburg <bbb@Serenity.local> 2009-01-11 20:20:33 -0500
committer: Bjoern Brandenburg <bbb@Serenity.local> 2009-01-11 20:20:33 -0500
commit: 6ccfe134d4bff05f457fc97d03f9f3692ab99adb (patch)
tree: 1a9bf1e8ef02a4c88bb5ff40c15a29f551cc6a23
parent: 1fa1d31e516adc4c7e2c6f800b44d169a5d2d3ee (diff)
4 files changed, 0 insertions, 270 deletions
diff --git a/TODO b/TODO
deleted file mode 100644
index 4160836..0000000
--- a/TODO
+++ /dev/null
@@ -1,3 +0,0 @@
-FEATURES:
-        - extract a reusable line plotter, like plot_scatter
diff --git a/csv2graph b/csv2graph
deleted file mode 100755
index 8f7d795..0000000
--- a/csv2graph
+++ /dev/null
@@ -1,23 +0,0 @@
-#!/bin/bash
-FILE=$1
-shift
-if [ ! -f "$FILE" ] ; then
-    echo "Usage: csv2graph <csv file>"
-fi
-CUM=`mktemp`
-DIST=`mktemp`
-OUT=`echo $FILE | sed s/csv/png/`
-analyze -adist    -b1000 "$FILE" --csv -n -i $* > $DIST
-analyze -adist -c -b1000 "$FILE" --csv -n -i $* > $CUM
-if [ -s $CUM ] && [ -s $DIST ]; then
-    plot_dist $DIST $CUM $OUT "$FILE: $*"
-    rm $DIST $CUM
-else
-    echo "$FILE: Empty."
-fi
diff --git a/csv_tool b/csv_tool
deleted file mode 100755
index 17ad949..0000000
--- a/csv_tool
+++ /dev/null
@@ -1,214 +0,0 @@
-#!/usr/bin/env python
-"""
-Do stuff with csv files.
-"""
-import optparse
-import defapp
-import csv
-import operator
-import os.path
-from collections import defaultdict as defdict
-from itertools   import izip
-o = optparse.make_option
-opts = [
-    o('-c', '--column', action='append', dest='col', type='int',
-      help='The column(s) on which to operate.'),
-    o(None, '--write-to-file', action='store_true', dest='write_to_file',
-      help='Write the output of operation xyz on file abc.csv to xyz_abc.csv.'),
-    o('-u', '--upper-bound', action='store_true', dest='upper_bound',
-      help="The linear regression is modified to represent an upper bound."),
-#     o(None, '--degree', action='store', type='float', dest='thruthiness',
-#       help='Not quite absolut truth.'),
-    ]
-defaults = {
-    'col'           : [],
-    'write_to_file' : False,
-    'upper_bound'   : False,
-    }
-def pair_iter(it):
-    it = iter(it)
-    while True:
-        yield (it.next(), it.next())
-def make_vector_op(op):
-    def vector_op(a, b, defvalue=0):
-        if len(a) > len(b):
-            shorter = b
-            longer  = a
-        else:
-            shorter = a
-            longer  = b
-        c = list(longer)
-        for i in xrange(len(shorter)):
-            c[i] = op(longer[i], shorter[i])
-        for i in xrange(len(shorter), len(longer)):
-            c[i] = op(longer[i], defvalue)
-        return c
-    return vector_op
-def make_scalar_op(op):
-    def scalar_op(scalar, a):
-        return [op(x, scalar) for x in a]
-    return scalar_op
-row_add = make_vector_op(operator.add)
-row_min = make_vector_op(min)
-row_max = make_vector_op(max)
-def row_reduce(row_op, fixup=lambda key, rows, res: res):
-    def _reduce(order, by_key):
-        for key in order:
-            if key in by_key:
-                rows  = by_key[key]
-                res   = reduce(row_op, rows)
-                del by_key[key]
-                yield fixup(key, rows, res)
-    return _reduce
-row_mul = make_scalar_op(operator.mul)
-row_div = make_scalar_op(operator.div)
-def transpose(rows):
-    rows = list(rows)
-    if rows:
-        r = len(rows)
-        c = max([len(x) for x in rows])
-        def at(x, y):
-            try:
-                return rows[x][y]
-            except IndexError:
-                return 0
-        for i in xrange(c):
-            yield [at(j, i) for j in xrange(r) ]
-def reorder_columns(rows, xchg_pairs):
-    for r in rows:
-        for (x,y) in xchg_pairs:
-            r[x], r[y] = r[y], r[x]
-        yield r
-def select_columns(rows, cols):
-    for r in rows:
-        yield [r[x] for x in cols]
-def numpy_lstsq(x, y):
-    from numpy import ones, array
-    from numpy.linalg import lstsq
-    A = ones((len(y), 2), dtype=float)
-    A[:,0] = array(x)
-    b      = array(y)
-    return lstsq(A, b)[0]
-def max_delta(c0, c1, x, y):
-    return max([float(y) - (c0 + c1 * float(x)) for (x,y) in izip(x, y)])
-def least_squares(rows, xy_pairs, upper_bound):
-    cols = []
-    for (x, y) in xy_pairs:
-        cols += [x, y]
-    rows = select_columns(rows, cols)
-    cols = transpose(rows)
-    for ((x, y), (xval, yval)) in izip(xy_pairs, pair_iter(cols)):
-        c1, c0 = numpy_lstsq(xval, yval)
-        if upper_bound:
-            c0 += max_delta(c0, c1, xval, yval)
-        yield [x + 1, y + 1, c0, c1]
-def select_by_key(rows, col, cast=None):
-    by_key = defdict(list)
-    order  = []
-    for r in rows:
-        key = r[col]
-        if cast:
-            by_key[key] += [[cast(x) for x in r]]
-        else:
-            by_key[key] += [r]
-        order += [key]
-    return (order, by_key)
-class CsvApp(defapp.App):
-    def __init__(self):
-        defapp.App.__init__(self, opts, defaults)
-        # fixup human-friendly offsets
-        if not self.options.col:
-            self.options.col = [1]
-        self.options.col = [x - 1 for x in self.options.col]
-        self.options.col_pairs = list(pair_iter(self.options.col))
-    def transform(self, make_iterator, ordered=True):
-        """
-        Read a file, pass the rows in the file to an iterator factory, and
-        write out the output of the iterator. The iterator performs the
-        desired transformation.
-        """
-        files = list(self.args)
-        del files[0]
-        for fn in files:
-            try:
-                # read in content
-                rows = csv.reader(open(fn, 'r'))
-                # set up transformation
-                if ordered:
-                    (order, by_key) = select_by_key(rows, self.options.col[0],
-                                                    float)
-                    rows = make_iterator(order, by_key)
-                else:
-                    rows = make_iterator(rows)
-                # write out
-                outfile = self.outfile()
-                if self.options.write_to_file:
-                    (dir, file) = os.path.split(fn)
-                    fn = os.path.join(dir, self.args[0] + '_' + file)
-                    outfile = open(fn, 'w')
-                csv.writer(outfile).writerows(rows)
-                if self.options.write_to_file:
-                    outfile.close()
-            except IOError, ex:
-                self.err("%s:%s"  % (fn, str(ex)))
-            except IndexError, ex:
-                self.err("%s: Sorry, index out of range." % fn)
-    def do_avg(self, _):
-        def fixup_avg(key, rows, res):
-            res = row_div(len(rows), res)
-            res[self.options.col[0]] = key
-            return res
-        self.transform(row_reduce(row_add, fixup_avg))
-    def do_max(self, _):
-        self.transform(row_reduce(row_max))
-    def do_min(self, _):
-        self.transform(row_reduce(row_min))
-    def do_transpose(self, _):
-        self.transform(transpose, ordered=False)
-    def do_reorder(self, _):
-        self.transform(lambda rows: reorder_columns(
-                rows, self.options.col_pairs), ordered=False)
-    def do_select(self, _):
-        self.transform(lambda rows: select_columns(
-                rows, self.options.col), ordered=False)
-    def do_lstsqrs(self, _):
-        self.transform(
-            lambda rows: least_squares(rows, self.options.col_pairs,
-                                       self.options.upper_bound),
-            ordered=False)
-if __name__ == '__main__':
-    CsvApp().launch()
diff --git a/plot_dist b/plot_dist
deleted file mode 100755
index 18cb48c..0000000
--- a/plot_dist
+++ /dev/null
@@ -1,30 +0,0 @@
-#!/bin/bash
-CSV1=$1
-CSV2=$2
-OUT=$3
-TITLE=$4
-if [ ! -f "$CSV1" ] || [ ! -f "$CSV2"  ] ||
-   [ "" == "$OUT" ] ; then
-    echo "Usage: plot_dist <normal.csv> <cumulative.csv> <out.png> <title>"
-    exit 1
-fi
-gnuplot <<EOM
-set terminal png picsize 1024 768
-set out '/dev/null'
-plot     '$CSV1' title 'distribution' with lines
-replot   '$CSV2' title 'distribution (cumulative)' axes x1y2 with lines
-set ylabel  'probability'
-set y2label 'probability (cumulative)'
-set xlabel  'overhead (in us)'
-set y2tics
-set y2range [0.0:1.0]
-set title '$TITLE'
-set key top left
-set out '$OUT'
-replot
-set out
-EOM
author	Bjoern Brandenburg <bbb@Serenity.local>	2009-01-11 20:20:33 -0500
committer	Bjoern Brandenburg <bbb@Serenity.local>	2009-01-11 20:20:33 -0500
commit	6ccfe134d4bff05f457fc97d03f9f3692ab99adb (patch)
tree	1a9bf1e8ef02a4c88bb5ff40c15a29f551cc6a23
parent	1fa1d31e516adc4c7e2c6f800b44d169a5d2d3ee (diff)

diff --git a/TODO b/TODO
deleted file mode 100644
index 4160836..0000000
--- a/TODO
+++ /dev/null
@@ -1,3 +0,0 @@
1
2	FEATURES:
3	- extract a reusable line plotter, like plot_scatter


diff --git a/csv2graph b/csv2graph
deleted file mode 100755
index 8f7d795..0000000
--- a/csv2graph
+++ /dev/null
@@ -1,23 +0,0 @@
1	#!/bin/bash
2
3	FILE=$1
4
5	shift
6
7	if [ ! -f "$FILE" ] ; then
8	echo "Usage: csv2graph <csv file>"
9	fi
10
11	CUM=`mktemp`
12	DIST=`mktemp`
13	OUT=`echo $FILE | sed s/csv/png/`
14
15	analyze -adist -b1000 "$FILE" --csv -n -i $* > $DIST
16	analyze -adist -c -b1000 "$FILE" --csv -n -i $* > $CUM
17
18	if [ -s $CUM ] && [ -s $DIST ]; then
19	plot_dist $DIST $CUM $OUT "$FILE: $*"
20	rm $DIST $CUM
21	else
22	echo "$FILE: Empty."
23	fi


diff --git a/csv_tool b/csv_tool
deleted file mode 100755
index 17ad949..0000000
--- a/csv_tool
+++ /dev/null
@@ -1,214 +0,0 @@
1	#!/usr/bin/env python
2
3	"""
4	Do stuff with csv files.
5	"""
6
7	import optparse
8	import defapp
9
10	import csv
11	import operator
12	import os.path
13	from collections import defaultdict as defdict
14	from itertools import izip
15
16	o = optparse.make_option
17
18	opts = [
19
20	o('-c', '--column', action='append', dest='col', type='int',
21	help='The column(s) on which to operate.'),
22
23	o(None, '--write-to-file', action='store_true', dest='write_to_file',
24	help='Write the output of operation xyz on file abc.csv to xyz_abc.csv.'),
25
26	o('-u', '--upper-bound', action='store_true', dest='upper_bound',
27	help="The linear regression is modified to represent an upper bound."),
28
29	# o(None, '--degree', action='store', type='float', dest='thruthiness',
30	# help='Not quite absolut truth.'),
31	]
32
33	defaults = {
34	'col' : [],
35	'write_to_file' : False,
36	'upper_bound' : False,
37	}
38
39	def pair_iter(it):
40	it = iter(it)
41	while True:
42	yield (it.next(), it.next())
43
44	def make_vector_op(op):
45	def vector_op(a, b, defvalue=0):
46	if len(a) > len(b):
47	shorter = b
48	longer = a
49	else:
50	shorter = a
51	longer = b
52	c = list(longer)
53	for i in xrange(len(shorter)):
54	c[i] = op(longer[i], shorter[i])
55	for i in xrange(len(shorter), len(longer)):
56	c[i] = op(longer[i], defvalue)
57	return c
58	return vector_op
59
60	def make_scalar_op(op):
61	def scalar_op(scalar, a):
62	return [op(x, scalar) for x in a]
63	return scalar_op
64
65	row_add = make_vector_op(operator.add)
66	row_min = make_vector_op(min)
67	row_max = make_vector_op(max)
68
69	def row_reduce(row_op, fixup=lambda key, rows, res: res):
70	def _reduce(order, by_key):
71	for key in order:
72	if key in by_key:
73	rows = by_key[key]
74	res = reduce(row_op, rows)
75	del by_key[key]
76	yield fixup(key, rows, res)
77	return _reduce
78
79
80	row_mul = make_scalar_op(operator.mul)
81	row_div = make_scalar_op(operator.div)
82
83	def transpose(rows):
84	rows = list(rows)
85	if rows:
86	r = len(rows)
87	c = max([len(x) for x in rows])
88	def at(x, y):
89	try:
90	return rows[x][y]
91	except IndexError:
92	return 0
93	for i in xrange(c):
94	yield [at(j, i) for j in xrange(r) ]
95
96	def reorder_columns(rows, xchg_pairs):
97	for r in rows:
98	for (x,y) in xchg_pairs:
99	r[x], r[y] = r[y], r[x]
100	yield r
101
102	def select_columns(rows, cols):
103	for r in rows:
104	yield [r[x] for x in cols]
105
106	def numpy_lstsq(x, y):
107	from numpy import ones, array
108	from numpy.linalg import lstsq
109	A = ones((len(y), 2), dtype=float)
110	A[:,0] = array(x)
111	b = array(y)
112	return lstsq(A, b)[0]
113
114	def max_delta(c0, c1, x, y):
115	return max([float(y) - (c0 + c1 * float(x)) for (x,y) in izip(x, y)])
116
117	def least_squares(rows, xy_pairs, upper_bound):
118	cols = []
119	for (x, y) in xy_pairs:
120	cols += [x, y]
121	rows = select_columns(rows, cols)
122	cols = transpose(rows)
123	for ((x, y), (xval, yval)) in izip(xy_pairs, pair_iter(cols)):
124	c1, c0 = numpy_lstsq(xval, yval)
125	if upper_bound:
126	c0 += max_delta(c0, c1, xval, yval)
127	yield [x + 1, y + 1, c0, c1]
128
129	def select_by_key(rows, col, cast=None):
130	by_key = defdict(list)
131	order = []
132	for r in rows:
133	key = r[col]
134	if cast:
135	by_key[key] += [[cast(x) for x in r]]
136	else:
137	by_key[key] += [r]
138	order += [key]
139	return (order, by_key)
140
141	class CsvApp(defapp.App):
142	def __init__(self):
143	defapp.App.__init__(self, opts, defaults)
144	# fixup human-friendly offsets
145	if not self.options.col:
146	self.options.col = [1]
147	self.options.col = [x - 1 for x in self.options.col]
148	self.options.col_pairs = list(pair_iter(self.options.col))
149
150	def transform(self, make_iterator, ordered=True):
151	"""
152	Read a file, pass the rows in the file to an iterator factory, and
153	write out the output of the iterator. The iterator performs the
154	desired transformation.
155	"""
156	files = list(self.args)
157	del files[0]
158	for fn in files:
159	try:
160	# read in content
161	rows = csv.reader(open(fn, 'r'))
162	# set up transformation
163	if ordered:
164	(order, by_key) = select_by_key(rows, self.options.col[0],
165	float)
166	rows = make_iterator(order, by_key)
167	else:
168	rows = make_iterator(rows)
169	# write out
170	outfile = self.outfile()
171	if self.options.write_to_file:
172	(dir, file) = os.path.split(fn)
173	fn = os.path.join(dir, self.args[0] + '_' + file)
174	outfile = open(fn, 'w')
175	csv.writer(outfile).writerows(rows)
176	if self.options.write_to_file:
177	outfile.close()
178	except IOError, ex:
179	self.err("%s:%s" % (fn, str(ex)))
180	except IndexError, ex:
181	self.err("%s: Sorry, index out of range." % fn)
182
183	def do_avg(self, _):
184	def fixup_avg(key, rows, res):
185	res = row_div(len(rows), res)
186	res[self.options.col[0]] = key
187	return res
188	self.transform(row_reduce(row_add, fixup_avg))
189
190	def do_max(self, _):
191	self.transform(row_reduce(row_max))
192
193	def do_min(self, _):
194	self.transform(row_reduce(row_min))
195
196	def do_transpose(self, _):
197	self.transform(transpose, ordered=False)
198
199	def do_reorder(self, _):
200	self.transform(lambda rows: reorder_columns(
201	rows, self.options.col_pairs), ordered=False)
202
203	def do_select(self, _):
204	self.transform(lambda rows: select_columns(
205	rows, self.options.col), ordered=False)
206
207	def do_lstsqrs(self, _):
208	self.transform(
209	lambda rows: least_squares(rows, self.options.col_pairs,
210	self.options.upper_bound),
211	ordered=False)
212
213	if __name__ == '__main__':
214	CsvApp().launch()


diff --git a/plot_dist b/plot_dist
deleted file mode 100755
index 18cb48c..0000000
--- a/plot_dist
+++ /dev/null
@@ -1,30 +0,0 @@
1	#!/bin/bash
2
3	CSV1=$1
4	CSV2=$2
5	OUT=$3
6	TITLE=$4
7
8	if [ ! -f "$CSV1" ] || [ ! -f "$CSV2" ] ||
9	[ "" == "$OUT" ] ; then
10	echo "Usage: plot_dist <normal.csv> <cumulative.csv> <out.png> <title>"
11	exit 1
12	fi
13
14	gnuplot <<EOM
15	set terminal png picsize 1024 768
16	set out '/dev/null'
17	plot '$CSV1' title 'distribution' with lines
18	replot '$CSV2' title 'distribution (cumulative)' axes x1y2 with lines
19	set ylabel 'probability'
20	set y2label 'probability (cumulative)'
21	set xlabel 'overhead (in us)'
22	set y2tics
23	set y2range [0.0:1.0]
24	set title '$TITLE'
25	set key top left
26	set out '$OUT'
27	replot
28	set out
29	EOM
30