annotate scripts/timeline_view.py @ 1946:1d08f8aee098

Merge WAC paper
author Dave Moffat <me@davemoffat.com>
date Thu, 24 Sep 2015 09:52:08 +0100
parents 4988c805ff9e
children 1b6fa37d46a4 235594325b84
rev   line source
me@1942 1 #!/usr/bin/python
me@1942 2
me@1942 3 import xml.etree.ElementTree as ET
me@1942 4 import os # list files in directory
me@1942 5 import sys # command line arguments
me@1942 6 import matplotlib.pyplot as plt # plots
me@1942 7 import matplotlib.patches as patches # rectangles
me@1942 8
# COMMAND LINE ARGUMENTS

# Validate the argument count explicitly rather than with `assert`: assert
# statements are removed when Python runs with -O, which would leave
# folder_name undefined for the rest of the script.
if len(sys.argv) > 2:
    sys.exit("timeline_view takes at most 1 command line argument\n"
             "Use: python timeline_view.py [XML_files_location]")

# XML results files location
if len(sys.argv) == 1:
    folder_name = "../saves"  # Looks in 'saves/' folder from 'scripts/' folder
    print("Use: python timeline_view.py [XML_files_location]")
    print("Using default path: " + folder_name)
else:
    folder_name = sys.argv[1]  # First command line argument is folder

# check if folder_name exists
if not os.path.exists(folder_name):
    # the folder is not there
    print("Folder '" + folder_name + "' does not exist.")
    sys.exit()  # terminate script execution
elif not os.access(folder_name, os.W_OK):
    # The folder exists but is not writable. The folder itself is tested
    # (not its parent directory) because the timelines are written inside it;
    # os.path.dirname() of a bare name such as 'saves' is '', which made the
    # previous check report missing privileges even for a writable folder.
    # This stays a warning: the script carries on, as it did before.
    print("No write privileges in folder '" + folder_name + "'.")
me@1942 30
me@1942 31
# CONFIGURATION

# Output directory for the generated timelines ('saves/timelines/' when the
# default results folder is used)
timeline_folder = folder_name + '/timelines/'

# Font settings applied to every plot
font = dict(weight='bold', size=16)
plt.rc('font', **font)

# Colours to cycle through, one per audio element
colormap = list('brgcmyk')

# If enabled, the x-axis shows time per audioholder, not total test time
show_audioholder_time = True

# Bar height (<1 to avoid overlapping)
bar_height = 0.6

# Figure size: width and height
fig_width, fig_height = 25, 5
me@1942 54
me@1942 55
# CODE
#
# For every XML results file in folder_name, draw one timeline per page
# (audioholder): each audio element gets a horizontal row, and every listen
# event is drawn as a coloured bar from its start to its stop time. Each
# non-empty timeline is saved as '<subject>-<page>.pdf' in timeline_folder.

# create timeline_folder if not yet created
if not os.path.exists(timeline_folder):
    os.makedirs(timeline_folder)

# get every XML file in folder
for file_name in os.listdir(folder_name):
    if not file_name.endswith(".xml"):
        continue

    tree = ET.parse(os.path.join(folder_name, file_name))
    root = tree.getroot()
    subject_id = file_name[:-4]  # drop '.xml'

    time_offset = 0  # test starts at zero

    # ONE TIMELINE PER PAGE - make new plot per page
    for audioholder in root.findall("./audioholder"):  # iterate over pages
        page_name = audioholder.get('id')  # get page name

        if page_name is None:
            # Ignore 'empty' audioholders. `continue` (not `break`) so that
            # the pages following an empty one are still plotted.
            continue

        # SORT AUDIO ELEMENTS ALPHABETICALLY (by their 'id' attribute).
        # Sorting with a key never has to compare the Element objects
        # themselves when two ids are equal.
        audioelements = sorted(audioholder.findall("./audioelement"),
                               key=lambda elem: elem.get("id"))

        N_audioelements = len(audioelements)  # number of audio elements for this page
        audioelements_names = []  # store names of audioelements
        plot_empty = True  # stays True until at least one event is drawn

        # get axes handle
        fig = plt.figure(figsize=(fig_width, fig_height))
        ax = fig.add_subplot(111)

        # `increment` is the row index: 0 for the first (topmost) element
        for increment, audioelement in enumerate(audioelements):
            audio_id = str(audioelement.get('id'))
            audioelements_names.append(audio_id)

            # for this audioelement, loop over all listen events
            listen_events = audioelement.findall("./metric/metricresult/[@name='elementListenTracker']/event")
            for event in listen_events:
                # mark this plot as not empty
                plot_empty = False

                # get testtime: start and stop, relative to time_offset
                testtime = event.find('testtime')
                start_time = float(testtime.get('start')) - time_offset
                stop_time = float(testtime.get('stop')) - time_offset

                # event lines: full-height vertical markers at start and stop
                ax.plot([start_time, start_time],  # x-values
                        [0, N_audioelements + 1],  # y-values
                        color='k')
                ax.plot([stop_time, stop_time],  # x-values
                        [0, N_audioelements + 1],  # y-values
                        color='k')

                # plot time: bar centred on this element's row
                ax.add_patch(
                    patches.Rectangle(
                        (start_time, N_audioelements - increment - bar_height / 2),  # (x, y)
                        stop_time - start_time,  # width
                        bar_height,  # height
                        color=colormap[increment % len(colormap)]  # colour
                    )
                )

        # subtract total audioholder length from subsequent audioholder event times
        # NOTE(review): the offset is replaced, not accumulated - this assumes
        # 'testTime' is measured from the start of the whole test; confirm.
        audioholder_time = audioholder.find("./metric/metricresult/[@id='testTime']")
        if audioholder_time is not None and show_audioholder_time:
            time_offset = float(audioholder_time.text)

        if not plot_empty:
            # set plot parameters
            plt.title('Timeline ' + file_name + ": " + page_name)
            plt.xlabel('Time [seconds]')
            plt.ylabel('Fragment')
            plt.ylim(0, N_audioelements + 1)

            # y-ticks: fragment IDs, top to bottom
            plt.yticks(range(N_audioelements, 0, -1), audioelements_names)  # show fragment names

            # plt.show()  # uncomment to show plot; comment when just saving

            plt.savefig(timeline_folder + subject_id + "-" + page_name + ".pdf", bbox_inches='tight')

        # Close the figure whether or not it was saved: pyplot keeps every
        # figure alive until it is closed, so empty pages used to leak one
        # figure each.
        plt.close(fig)

        # TODO: if 'nonsensical' or unknown: dashed line until next event
        # TODO: Vertical lines for fragment looping point
me@1942 159