annotate scripts/timeline_view.py @ 1103:2051868b21f0

Hotfix: Updated schema. <audioelement>, <surveyelement> and <commentquestion> have optional name attribute.
author Nicholas Jillings <n.g.r.jillings@se14.qmul.ac.uk>
date Wed, 09 Mar 2016 11:29:16 +0000
parents 0a15fa67bda1
children 1b6fa37d46a4 235594325b84
rev   line source
#!/usr/bin/python
"""Draw one listening timeline per test page for every XML results file.

For each '*.xml' file in the results folder, every <audioholder> (page) that
has an 'id' attribute is turned into one figure: each <audioelement> of the
page gets its own row, and every 'elementListenTracker' event is drawn as a
coloured bar from its 'start' to its 'stop' test time, bracketed by vertical
black lines. Pages that contain at least one event are saved as
'<folder>/timelines/<xml name without extension>-<page id>.pdf'.

Use: python timeline_view.py [XML_files_location]
"""

import xml.etree.ElementTree as ET
import os # list files in directory
import sys # command line arguments
import matplotlib.pyplot as plt # plots
import matplotlib.patches as patches # rectangles

# COMMAND LINE ARGUMENTS

usage = "Use: python timeline_view.py [XML_files_location]"

# Explicit check instead of `assert`: assertions are stripped under
# `python -O`, which would leave folder_name undefined further down.
if len(sys.argv) > 2:
    sys.exit("timeline_view takes at most 1 command line argument\n" + usage)

# XML results files location
if len(sys.argv) == 1:
    folder_name = "../saves" # Looks in 'saves/' folder from 'scripts/' folder
    print(usage)
    print("Using default path: " + folder_name)
else:
    folder_name = sys.argv[1] # First command line argument is folder

# check if folder_name exists
if not os.path.exists(folder_name):
    # the folder is not there
    print("Folder '"+folder_name+"' does not exist.")
    sys.exit() # terminate script execution
elif not os.access(folder_name, os.W_OK):
    # The folder exists but is not writable. Test the folder itself: its
    # dirname is the *parent* directory (and '' for a bare relative name,
    # which os.access always rejects). Kept as a warning only, as before.
    print("No write privileges in folder '"+folder_name+"'.")


# CONFIGURATION

# Folder where to store timelines
timeline_folder = os.path.join(folder_name, 'timelines') # Stores in 'saves/timelines/'

# Font settings
font = {'weight' : 'bold',
        'size'   : 16}
plt.rc('font', **font)

# Colours to cycle through, one per audioelement row
colormap = ['b', 'r', 'g', 'c', 'm', 'y', 'k']

# if enabled, x-axis shows time per audioholder, not total test time
show_audioholder_time = True

# bar height (<1 to avoid overlapping)
bar_height = 0.6

# figure size
fig_width = 25
fig_height = 5


# CODE

# create timeline_folder if not yet created
if not os.path.exists(timeline_folder):
    os.makedirs(timeline_folder)

# get every XML file in folder
for file_name in os.listdir(folder_name):
    if not file_name.endswith(".xml"):
        continue

    tree = ET.parse(os.path.join(folder_name, file_name))
    root = tree.getroot()
    subject_id = file_name[:-4] # drop '.xml'

    time_offset = 0 # test starts at zero

    # ONE TIMELINE PER PAGE - make new plot per page
    for audioholder in root.findall("./audioholder"): # iterate over pages
        page_name = audioholder.get('id') # get page name

        if page_name is None: # ignore 'empty' audioholders...
            continue          # ...but keep processing the pages after them

        # SORT AUDIO ELEMENTS ALPHABETICALLY
        # Sort on the id only, so elements sharing an id are never compared
        # with each other (Element objects have no defined ordering).
        audioelements = sorted(audioholder.findall("./audioelement"),
                               key=lambda elem: elem.get("id") or "")

        N_audioelements = len(audioelements) # number of audio elements for this page
        audioelements_names = [] # store names of audioelements
        plot_empty = True # becomes False once any event is plotted

        # get axes handle
        fig = plt.figure(figsize=(fig_width, fig_height))
        ax = fig.add_subplot(111) #, aspect='equal'

        # one row per audioelement, first element on the top row
        for increment, audioelement in enumerate(audioelements):
            audioelements_names.append(str(audioelement.get('id')))
            row = N_audioelements - increment
            colour = colormap[increment % len(colormap)]

            # for this audioelement, loop over all listen events
            listen_events = audioelement.findall("./metric/metricresult/[@name='elementListenTracker']/event")
            for event in listen_events:
                testtime = event.find('testtime')
                if testtime is None: # nothing to draw without start/stop times
                    continue

                # mark this plot as not empty
                plot_empty = False

                # get testtime: start and stop
                start_time = float(testtime.get('start')) - time_offset
                stop_time = float(testtime.get('stop')) - time_offset

                # event lines: full-height markers at start and stop
                for x_value in (start_time, stop_time):
                    ax.plot([x_value, x_value],       # x-values
                            [0, N_audioelements+1],   # y-values
                            color='k')

                # plot time: bar centred on this audioelement's row
                ax.add_patch(
                    patches.Rectangle(
                        (start_time, row - bar_height/2), # (x, y)
                        stop_time - start_time,           # width
                        bar_height,                       # height
                        color=colour                      # colour
                    )
                )

        # subtract total audioholder length from subsequent audioholder event times
        # NOTE(review): the offset is replaced, not accumulated. That is only
        # right if 'testTime' is a running total -- confirm against the
        # results file format.
        audioholder_time = audioholder.find("./metric/metricresult/[@id='testTime']")
        if audioholder_time is not None and show_audioholder_time:
            time_offset = float(audioholder_time.text)

        if not plot_empty:
            # set plot parameters
            ax.set_title('Timeline ' + file_name + ": " + page_name)
            ax.set_xlabel('Time [seconds]')
            ax.set_ylabel('Fragment')
            ax.set_ylim(0, N_audioelements+1)

            # y-ticks: fragment IDs, top to bottom
            ax.set_yticks(list(range(N_audioelements, 0, -1)))
            ax.set_yticklabels(audioelements_names) # show fragment names

            #plt.show() # uncomment to show plot; comment when just saving

            fig.savefig(os.path.join(timeline_folder, subject_id+"-"+page_name+".pdf"),
                        bbox_inches='tight')

        # Always release the figure, including for pages with no events;
        # otherwise empty pages leave figures open for the whole run.
        plt.close(fig)

    #TODO: if 'nonsensical' or unknown: dashed line until next event
    #TODO: Vertical lines for fragment looping point
djmoffat@1099 159