#!/usr/bin/env python

import sys
import time
import optparse

from os.path import basename
from os import listdir

from tempfile import NamedTemporaryFile as Tmp

from plot import decode, Plot
from gnuplot import curve

SCHEDULERS = ['MC', 'MC-MERGE', 'MC-MERGE-REDIR']
COLS = {'plugin':       0,
        'overhead':     1,
        'n_tasks':      2,
        'samples':      3,
        'filtered':     4,
        'max':          5,
        'avg':          6,
        'min':          7,
        'med':          8,
        'std':          9,
        'var':          10,
        'iqr_max':      11,
        'iqr_min':      12}


def parse_args():
    p = optparse.OptionParser(description='make graphs')
    p.add_option('--paper', dest='paper', action='store_true', default=False)
    return p.parse_args()

def usage(msg):
    print >>sys.stderr, msg
    sys.exit(1)

def get_csv_files(directory):
    a = []
    for f in listdir(directory):
        bn = basename(f)
        if f.startswith('scheduler') and f.endswith('.csv'):
            a.append(f)
    return a

def gnuplot_col(col_name):
    # gnuplot is 1-indexed
    return 1 + COLS[col_name]

def get_sched_title(sched):
    SCHEDULERS = {'MC': 'Basic:',
            'MC-MERGE': 'IM + TM:',
            'MC-MERGE-REDIR': 'All:'}
    return SCHEDULERS[sched]

def get_overhead_title(ov):
    OV = {'LVLA-SCHED': 'A',
          'LVLB-SCHED': 'B',
          'LVLC-SCHED': 'C',
          'LVLA-RELEASE': 'A',
          'LVLB-RELEASE': 'B',
          'LVLC-RELEASE': 'C',
}
    return OV[ov]

def get_line_style(sched, o_type):
    S = {   'MC' :              {'LVLA': 1, 'LVLB': 4, 'LVLC': 7},
            'MC-MERGE':         {'LVLA': 2, 'LVLB': 5, 'LVLC': 8},
            'MC-MERGE-REDIR':   {'LVLA': 3, 'LVLB': 6, 'LVLC': 9}}
    o = o_type.split('-')[0]
    return 'linespoints linestyle {0}'.format(S[sched][o])

def get_graph_fname(directory, o_type, levels, ycol_type):
    return '{0}/overhead={1}-levels={2}-type={3}'.format(directory, o_type,
            levels, ycol_type)

def set_plot_opts(opts, p):
    p.rounded_caps = True
    p.font = 'Helvetica'
    p.key = 'off'
    p.monochrome = False
    p.dashed_lines = True
    p.xrange = (18, 122)
    p.yrange = (0, '')

    if opts.paper:
        ext = 'pdf'
        p.size = ('8.5cm', '5.25cm')
        line_width = 1.5
        point_size = 0.3
        p.font_size = '5pt'
    else:
        ext = 'png'
        p.size = (1024, 768)
        line_width = 3.0
        point_size = 1.5
        p.font_size = 'font "/usr/share/fonts/truetype/ttf-dejavu/DejaVuSans.ttf" 18'
    p.output = '{0}.{1}'.format(p.output, ext)
    p.format = ext

    p.line_styles = [
        (1, 'lt 1 pt 1 lw {0} ps {1} lc rgbcolor "#000000"'.format(line_width, point_size)),
        (2, 'lt 1 pt 4 lw {0} ps {1} lc rgbcolor "#ff0000"'.format(line_width, point_size)),
        (3, 'lt 1 pt 7 lw {0} ps {1} lc rgbcolor "#0000ff"'.format(line_width, point_size)),
        (4, 'lt 2 pt 1 lw {0} ps {1} lc rgbcolor "#000000"'.format(line_width, point_size)),
        (5, 'lt 2 pt 4 lw {0} ps {1} lc rgbcolor "#ff0000"'.format(line_width, point_size)),
        (6, 'lt 2 pt 7 lw {0} ps {1} lc rgbcolor "#0000ff"'.format(line_width, point_size)),
        (7, 'lt 3 pt 1 lw {0} ps {1} lc rgbcolor "#000000"'.format(line_width, point_size)),
        (8, 'lt 3 pt 4 lw {0} ps {1} lc rgbcolor "#ff0000"'.format(line_width, point_size)),
        (9, 'lt 3 pt 7 lw {0} ps {1} lc rgbcolor "#0000ff"'.format(line_width, point_size)),
        ]

def get_data_matrix(fname):
    ret = []
    with open(fname, 'r') as f:
        for row in f:
            new_row = []
            for field in row.split(','):
                s_field = field.strip()
                try:
                    conv = float(s_field)
                except ValueError:
                    conv = s_field
                new_row.append(conv)
            ret.append(new_row)
    return ret


def include_level_a_releases(data_dir, o_type, scheduler, ycol):
    fmt_f = '{0}/scheduler={1}_overhead={2}.csv'
    a_fname = fmt_f.format(data_dir, scheduler, 'LVLA-RELEASE')
    b_c_fname = fmt_f.format(data_dir, scheduler, 'RELEASE')
    a_data = get_data_matrix(a_fname)
    b_c_data = get_data_matrix(b_c_fname)
    new_data = []

    for i, a_row in enumerate(a_data):
        b_c_row = b_c_data[i]
        # make a copy of a_row
        new_row = list(a_row)
        if gnuplot_col('max') == ycol:
            idx = COLS['max']
            new_row[idx] = max(a_row[idx], b_c_row[idx])
        elif gnuplot_col('avg') == ycol:
            avg_col = COLS['avg']
            a_samples = a_row[COLS['samples']]
            b_c_samples = b_c_row[COLS['samples']]
            a_filtered = a_row[COLS['filtered']]
            b_c_filtered = b_c_row[COLS['filtered']]
            a_avg = a_row[avg_col]
            b_c_avg = b_c_row[avg_col]
            n_a = a_samples - a_filtered
            n_b_c = b_c_samples - b_c_filtered
            new_avg = (a_avg * n_a + b_c_avg * n_b_c) / (n_a + n_b_c)
            new_row[avg_col] = new_avg
        else:
            raise RuntimeError("Don't know how to merge this column.")
        new_data.append(new_row)
    f = Tmp()
    for row in new_data:
        f.write(', '.join(map(str, row)))
        f.write('\n')
    f.file.flush()
    return (f.name, f)

def add_key_to_plot(p):
    p.key = 'on tmargin center horizontal maxcolumns 3'
    p.size = ('8.5cm', '6.25cm')

def plot_release(opts, data_dir, ycol_name, title, levels):
    levels = levels.upper()
    refs = [] # need to save reference to file handle so it is not deleted
    p = Plot()
    p.output = get_graph_fname(data_dir, 'RELEASE', levels, ycol_name)

    for o_type in ['LVL{0}-RELEASE'.format(l) for l in levels]:
        for sched in SCHEDULERS:
            # if o_type == 'RELEASE':
            #     # we have to make the regular release include the level-A
            #     # releases
            #     fname, ref = include_level_a_releases(data_dir, o_type,
            #             sched, ycol)
            #     refs.append(ref)
            # else:
            fname = '{0}/scheduler={1}_overhead={2}.csv'.format(data_dir, sched, o_type)
            ti = '{0} {1}'.format(get_sched_title(sched), get_overhead_title(o_type))
            c = curve(fname=fname, xcol=gnuplot_col('n_tasks'),
                    ycol=gnuplot_col(ycol_name), title=ti,
                    style=get_line_style(sched, o_type))
            p.curves += [c]
    p.xlabel = 'number of tasks'
    p.ylabel = 'overhead (microseconds)'
    set_plot_opts(opts, p)
    if 'avg' == ycol_name and 'ABC' == levels:
        add_key_to_plot(p)
    p.gnuplot_exec()

def plot_release_jim(opts, data_dir, ycol, title, fname):
    """Jim just wanted level-A without any techniques and with all our techniques."""
    p = Plot()
    p.output = '{0}/{1}'.format(data_dir, fname)
    refs = [] # need to save reference to file handle so it is not deleted

    for sched in ['MC', 'MC-MERGE-REDIR']:
        o_type = 'LVLA-RELEASE'
        fname = '{0}/scheduler={1}_overhead={2}.csv'.format(data_dir, sched, o_type)
        ti = '{0} {1}'.format(get_sched_title(sched), get_overhead_title(o_type))
        p.curves += [curve(fname=fname, xcol=gnuplot_col('n_tasks'), ycol=ycol, title=ti)]
    p.xlabel = 'number of tasks'
    p.ylabel = 'overhead (microseconds)'
    set_plot_opts(opts, p)
    p.key = 'top left'
    p.title = 'level-A worst-case release overhead'
    p.gnuplot_exec()

def plot_sched(opts, data_dir, ycol_name, title, levels):
    levels = levels.upper()
    p = Plot()
    p.output = get_graph_fname(data_dir, 'SCHED', levels, ycol_name)

    for o_type in ['LVL{0}-SCHED'.format(l) for l in levels]:
        for sched in SCHEDULERS:
            fname = '{0}/scheduler={1}_overhead={2}.csv'.format(data_dir, sched, o_type)
            ti = '{0} {1}'.format(get_sched_title(sched), get_overhead_title(o_type))
            c = curve(fname=fname, xcol=gnuplot_col('n_tasks'),
                    ycol=gnuplot_col(ycol_name), title=ti,
                    style=get_line_style(sched, o_type))
            p.curves += [c]
    p.xlabel = 'number of tasks'
    p.ylabel = 'overhead (microseconds)'
    set_plot_opts(opts, p)
    if 'avg' == ycol_name and 'ABC' == levels:
        add_key_to_plot(p)
    p.gnuplot_exec()


def main():

    opts, extra = parse_args()

    if len(extra) < 1:
        usage('missing args')

    data_dir = extra[0]
    for levels in ('ABC', 'AC', 'BC'):
        plot_sched(opts, data_dir, 'max', 'worst-case scheduling overhead', levels)
        plot_release(opts, data_dir, 'max', 'worst-case release overhead', levels)
        plot_sched(opts, data_dir, 'avg', 'average-case scheduling overhead', levels)
        plot_release(opts, data_dir, 'avg', 'average-case release overhead', levels)
    #plot_release_jim(opts, data_dir, 'max', 'worst-case release overhead', 'overhead=RELEASE_type=MAX_for-jim=1')
    
if __name__ == '__main__':
    main()