data/analyse.py
author Eugen Sawin <sawine@me73.com>
Fri, 04 Jun 2010 13:48:28 +0200
changeset 0 feede61efa96
permissions -rwxr-xr-x
Final version.
sawine@0
     1
#!/usr/bin/python
sawine@0
     2
sawine@0
     3
import dflowlog
sawine@0
     4
from dflowlog import dflow_fields as fields
sawine@0
     5
from filter import filter
sawine@0
     6
import sys
sawine@0
     7
from datetime import datetime
sawine@0
     8
from datetime import timedelta
sawine@0
     9
from optparse import OptionParser
sawine@0
    10
sawine@0
    11
sawine@0
    12
def get_datetime(row, value):
	"""Parse one timestamp column of a log row into a datetime.

	row   -- indexable log record
	value -- column name; it is looked up in the module-level `fields`
	         mapping to obtain the index into `row`

	The cell must consist of a date and a time separated by whitespace,
	written as "YYYY-MM-DD HH:MM:SS"; anything else raises ValueError.
	"""
	cell = row[fields[value]]
	date_part, time_part = cell.split()
	# Split both halves before converting, so a malformed layout is
	# reported ahead of a malformed number.
	y, mo, d = date_part.split("-")
	h, mi, s = time_part.split(":")
	return datetime(*[int(piece) for piece in (y, mo, d, h, mi, s)])
sawine@0
    17
sawine@0
    18
def time_diff(dt1, dt2):
	"""Return the signed difference dt1 - dt2 in whole minutes.

	dt1, dt2 -- datetime objects

	The magnitude is truncated towards zero (left-over seconds are
	dropped), then negated when dt1 is earlier than dt2.  The result is
	always an int.
	"""
	gap = abs(dt1 - dt2)
	# Floor division keeps the result integral on Python 3 as well; a plain
	# "/" would yield fractional minutes there (e.g. 1.5), which callers
	# would then write out verbatim.
	minutes = gap.days * 24 * 60 + gap.seconds // 60
	if dt1 < dt2:
		return -minutes
	return minutes
sawine@0
    24
sawine@0
    25
def diff(values, plans):
	"""Append the minute difference between two time columns to every plan.

	values -- sequence whose first two items name the columns to compare
	plans  -- iterable of mutable log rows

	Each row is extended in place with str(time_diff(first, second)) and
	the same row objects are returned in a new list, in input order.
	"""
	result = []
	for row in plans:
		result.append(row)
		first = get_datetime(row, values[0])
		second = get_datetime(row, values[1])
		# The row in `result` is the caller's row, so this mutates the input.
		row.append(str(time_diff(first, second)))
	return result
sawine@0
    33
sawine@0
    34
def column_diff(values, plans):
	"""Append to each plan its minimum time separation within its flow point.

	values -- sequence whose first item names the time column to compare
	plans  -- collection of mutable log rows

	Rows are grouped by their "flow_point" column (groups in first-seen
	order).  For every row, the smallest absolute time_diff (in minutes) to
	any other row of the same group is appended as a string, provided it
	is below 999.  Rows are mutated in place and returned group by group.
	"""
	column = values[0]

	# Distinct flow points, in order of first appearance.
	seen_points = []
	for row in plans:
		point = row[fields["flow_point"]]
		if point not in seen_points:
			seen_points.append(point)

	result = []
	for point in seen_points:
		# presumably the rows whose flow_point equals `point` -- the helper
		# comes from the project's filter module; verify there.
		group = filter("flow_point", point, plans)
		for row in group:
			own_time = get_datetime(row, column)
			separations = [
				abs(time_diff(get_datetime(other, column), own_time))
				for other in group
				if other is not row
			]
			# 999 doubles as the "no neighbour" marker.
			# NOTE(review): a real separation of 999 minutes or more is
			# therefore not appended either -- confirm this is intended.
			closest = min([999] + separations)
			if closest < 999:
				row.append(str(closest))
			result.append(row)
	return result
sawine@0
    56
sawine@0
    57
if __name__ == "__main__":
	# Command-line entry point: pick an analysis mode, load the logs either
	# from files or through dflowlog.parse_pipe, run the analysis and print
	# the extended rows.
	#
	# Each mode maps to (handler, index of the first csv_logs argument).
	modes = {"diff": (diff, 3),
				"cdiff": (column_diff, 2)}
	# An explicit newline keeps the second usage form on its own line; a
	# backslash continuation inside the literal would embed the source
	# indentation into the help text instead.
	arg_parser = OptionParser(usage="usage: %prog [options] diff column1 column2 csv_logs\n"
									"       %prog [options] cdiff column csv_logs")
	arg_parser.add_option("-f", "--files",
				action="store_true", dest="files_mode",
				help="csv_logs are files")
	arg_parser.set_defaults(files_mode=False)
	(options, args) = arg_parser.parse_args()

	# Report bad invocations through the parser (usage text + exit status 2)
	# rather than failing with an IndexError/KeyError traceback.
	if not args or args[0] not in modes:
		arg_parser.error("expected a mode (diff or cdiff) as the first argument")
	analyse, first_log = modes[args[0]]
	if len(args) < first_log:
		arg_parser.error("mode '%s' needs %d column argument(s)"
							% (args[0], first_log - 1))

	log_args = args[first_log:]
	if options.files_mode:
		plans = dflowlog.parse_files(log_args)
	else:
		plans = dflowlog.parse_pipe(log_args)

	# The handler receives everything after the mode name; it only reads
	# the leading column name(s).
	plans = analyse(args[1:], plans)

	dflowlog.print_logs(plans)
sawine@0
    78
	
sawine@0
    79