annotate docs/SMC15/smc2015template.tex @ 1645:08dcb9b22a88

Updated example project.xml to reflect new project specifications.
author Nicholas Jillings <nickjillings@users.noreply.github.com>
date Fri, 10 Apr 2015 12:23:57 +0100
parents 06e4d36ca9d7
children e0abe55f5514
rev   line source
nickjillings@1642 1 % -----------------------------------------------
nickjillings@1642 2 % Template for SMC 2012
nickjillings@1642 3 % adapted from the template for SMC 2011, which was adapted from that of SMC 2010
nickjillings@1642 4 % -----------------------------------------------
nickjillings@1642 5
nickjillings@1642 6 \documentclass{article}
nickjillings@1642 7 \usepackage{smc2015}
nickjillings@1642 8 \usepackage{times}
nickjillings@1642 9 \usepackage{ifpdf}
nickjillings@1642 10 \usepackage[english]{babel}
nickjillings@1642 11 \usepackage{cite}
nickjillings@1642 12
nickjillings@1642 13 %%%%%%%%%%%%%%%%%%%%%%%% Some useful packages %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
nickjillings@1642 14 %%%%%%%%%%%%%%%%%%%%%%%% See related documentation %%%%%%%%%%%%%%%%%%%%%%%%%%
nickjillings@1642 15 %\usepackage{amsmath} % popular packages from Am. Math. Soc. Please use the
nickjillings@1642 16 %\usepackage{amssymb} % related math environments (split, subequation, cases,
nickjillings@1642 17 %\usepackage{amsfonts}% multline, etc.)
nickjillings@1642 18 %\usepackage{bm} % Bold Math package, defines the command \bf{}
nickjillings@1642 19 %\usepackage{paralist}% extended list environments
nickjillings@1642 20 %%subfig.sty is the modern replacement for subfigure.sty. However, subfig.sty
nickjillings@1642 21 %%requires and automatically loads caption.sty which overrides class handling
nickjillings@1642 22 %%of captions. To prevent this problem, preload caption.sty with caption=false
nickjillings@1642 23 %\usepackage[caption=false]{caption}
nickjillings@1642 24 %\usepackage[font=footnotesize]{subfig}
nickjillings@1642 25
nickjillings@1642 26
nickjillings@1642 27 %user defined variables
nickjillings@1642 28 \def\papertitle{APE FOR WEB: A BROWSER-BASED EVALUATION TOOL FOR AUDIO} %?
nickjillings@1642 29 \def\firstauthor{Nicholas Jillings}
nickjillings@1642 30 \def\secondauthor{Brecht De Man}
nickjillings@1642 31 \def\thirdauthor{David Moffat}
nickjillings@1642 32 \def\fourthauthor{Joshua D. Reiss}
nickjillings@1642 33
nickjillings@1642 34 % adds the automatic
nickjillings@1642 35 % Saves a lot of ouptut space in PDF... after conversion with the distiller
nickjillings@1642 36 % Delete if you cannot get PS fonts working on your system.
nickjillings@1642 37
nickjillings@1642 38 % pdf-tex settings: detect automatically if run by latex or pdflatex
nickjillings@1642 39 \newif\ifpdf
nickjillings@1642 40 \ifx\pdfoutput\relax
nickjillings@1642 41 \else
nickjillings@1642 42 \ifcase\pdfoutput
nickjillings@1642 43 \pdffalse
nickjillings@1642 44 \else
nickjillings@1642 45 \pdftrue
nickjillings@1642 46 \fi
nickjillings@1642 47
nickjillings@1642 48 \ifpdf % compiling with pdflatex
nickjillings@1642 49 \usepackage[pdftex,
nickjillings@1642 50 pdftitle={\papertitle},
nickjillings@1642 51 pdfauthor={\firstauthor, \secondauthor, \thirdauthor},
nickjillings@1642 52 bookmarksnumbered, % use section numbers with bookmarks
nickjillings@1642 53 pdfstartview=XYZ % start with zoom=100% instead of full screen;
nickjillings@1642 54 % especially useful if working with a big screen :-)
nickjillings@1642 55 ]{hyperref}
nickjillings@1642 56 %\pdfcompresslevel=9
nickjillings@1642 57
nickjillings@1642 58 \usepackage[pdftex]{graphicx}
nickjillings@1642 59 % declare the path(s) where your graphic files are and their extensions so
nickjillings@1642 60 %you won't have to specify these with every instance of \includegraphics
nickjillings@1642 61 \graphicspath{{./figures/}}
nickjillings@1642 62 \DeclareGraphicsExtensions{.pdf,.jpeg,.png}
nickjillings@1642 63
nickjillings@1642 64 \usepackage[figure,table]{hypcap}
nickjillings@1642 65
nickjillings@1642 66 \else % compiling with latex
nickjillings@1642 67 \usepackage[dvips,
nickjillings@1642 68 bookmarksnumbered, % use section numbers with bookmarks
nickjillings@1642 69 pdfstartview=XYZ % start with zoom=100% instead of full screen
nickjillings@1642 70 ]{hyperref} % hyperrefs are active in the pdf file after conversion
nickjillings@1642 71
nickjillings@1642 72 \usepackage[dvips]{epsfig,graphicx}
nickjillings@1642 73 % declare the path(s) where your graphic files are and their extensions so
nickjillings@1642 74 %you won't have to specify these with every instance of \includegraphics
nickjillings@1642 75 \graphicspath{{./figures/}}
nickjillings@1642 76 \DeclareGraphicsExtensions{.eps}
nickjillings@1642 77
nickjillings@1642 78 \usepackage[figure,table]{hypcap}
nickjillings@1642 79 \fi
nickjillings@1642 80
nickjillings@1642 81 %setup the hyperref package - make the links black without a surrounding frame
nickjillings@1642 82 \hypersetup{
nickjillings@1642 83 colorlinks,%
nickjillings@1642 84 citecolor=black,%
nickjillings@1642 85 filecolor=black,%
nickjillings@1642 86 linkcolor=black,%
nickjillings@1642 87 urlcolor=black
nickjillings@1642 88 }
nickjillings@1642 89
nickjillings@1642 90
nickjillings@1642 91 % Title.
nickjillings@1642 92 % ------
nickjillings@1642 93 \title{\papertitle}
nickjillings@1642 94
nickjillings@1642 95 % Authors
nickjillings@1642 96 % Please note that submissions are NOT anonymous, therefore
nickjillings@1642 97 % authors' names have to be VISIBLE in your manuscript.
nickjillings@1642 98 %
nickjillings@1642 99 % Single address
nickjillings@1642 100 % To use with only one author or several with the same address
nickjillings@1642 101 % ---------------
nickjillings@1642 102 %\oneauthor
nickjillings@1642 103 % {\firstauthor} {Affiliation1 \\ %
nickjillings@1642 104 % {\tt \href{mailto:author1@smcnetwork.org}{author1@smcnetwork.org}}}
nickjillings@1642 105
nickjillings@1642 106 %Two addresses
nickjillings@1642 107 %--------------
nickjillings@1642 108 % \twoauthors
nickjillings@1642 109 % {\firstauthor} {Affiliation1 \\ %
nickjillings@1642 110 % {\tt \href{mailto:author1@smcnetwork.org}{author1@smcnetwork.org}}}
nickjillings@1642 111 % {\secondauthor} {Affiliation2 \\ %
nickjillings@1642 112 % {\tt \href{mailto:author2@smcnetwork.org}{author2@smcnetwork.org}}}
nickjillings@1642 113
nickjillings@1642 114
nickjillings@1642 115
nickjillings@1642 116 % FIX!!!
nickjillings@1642 117 \fourauthors
nickjillings@1642 118 {\firstauthor} {%Affiliation1 \\
nickjillings@1642 119 {\tt \href{mailto:b.deman@qmul.ac.uk}{n.g.r.jillings@se14.qmul.ac.uk, }}}
nickjillings@1642 120 {\secondauthor} {%Affiliation2\\ %
nickjillings@1642 121 {\tt \href{mailto:n.g.r.jillings@se14.qmul.ac.uk}{\{b.deman,}}}
nickjillings@1642 122 {\thirdauthor} {%Affiliation3\\ %
nickjillings@1642 123 {\tt \href{mailto:d.j.moffat@qmul.ac.uk}{d.j.moffat, }}}
nickjillings@1642 124 {\fourthauthor} {%Affiliation4\\ %
nickjillings@1642 125 {\tt \href{mailto:joshua.reiss@qmul.ac.uk}{joshua.reiss\}@qmul.ac.uk}}}
nickjillings@1642 126
nickjillings@1642 127 % ***************************************** the document starts here ***************
nickjillings@1642 128 \begin{document}
nickjillings@1642 129 %
nickjillings@1642 130 \capstartfalse
nickjillings@1642 131 \maketitle
nickjillings@1642 132 \capstarttrue
nickjillings@1642 133 %
nickjillings@1642 134 \begin{abstract}
nickjillings@1642 135 Place your abstract at the top left column on the first page.
nickjillings@1642 136 Please write about 150-200 words that specifically highlight the purpose of your work,
nickjillings@1642 137 its context, and provide a brief synopsis of your results.
nickjillings@1642 138 Avoid equations in this part.\\
nickjillings@1642 139 TOTAL PAPER: Minimum 4 pages, 6 preferred, max. 8 (6 for demos/posters)\\
nickjillings@1642 140 \end{abstract}
nickjillings@1642 141 %
nickjillings@1642 142
nickjillings@1642 143 \section{Introduction}\label{sec:introduction}
nickjillings@1642 144
nickjillings@1642 145 background (types of research where this type of perceptual evaluation of audio is relevant)\\
nickjillings@1642 146
nickjillings@1642 147 multiple stimulus perceptual evaluation (reference to Bech etc.)\\
nickjillings@1642 148
nickjillings@1642 149 prior work: \cite{deman2014b} in MATLAB, much less easy to deploy, and often stops working due to version updates \\
nickjillings@1642 150
nickjillings@1642 151 goal, what are we trying to do? \\
nickjillings@1642 152
nickjillings@1642 153 [Previously, due to limited functionality of HTML, ..., it was not possible to design this type of interfaces with such high quality audio... ]
nickjillings@1642 154
nickjillings@1642 155
nickjillings@1642 156 \section{Design considerations}\label{sec:designconsiderations}
nickjillings@1642 157
nickjillings@1642 158 We present a browser-based perceptual evaluation tool for audio that ... \\
nickjillings@1642 159
nickjillings@1642 160 see \cite{deman2014b}: requirements informed by research on music production (see my work and that of others' in the group), such as randomisation, playback of high quality audio, some degree of flexibility in terms of configuration, ... \\
nickjillings@1642 161
nickjillings@1642 162
nickjillings@1642 163 \section{Implementation}\label{sec:implementation}
nickjillings@1642 164 %[Nick???]
nickjillings@1642 165
nickjillings@1642 166 %section on overall architecture\\
nickjillings@1642 167
nickjillings@1642 168 %section with overview of the structure of the input and output files, perhaps with graph or table
nickjillings@1642 169
nickjillings@1642 170 The tool runs entirely inside the browser through the new HTML5 Web Audio API. The API is supported by most major web browsers (except Internet Explorer) and allows for constructing a chain of audio processing elements to produce a high quality, real time signal process to manipulate audio streams. The API supports multi-channel processing and has an accurate playback timer for precise scheduled playback control. The web audio API is controlled through the browser JavaScript and is therefore highly controllable. The Web Audio API processing is all controlled in a separate thread to the main JavaScript thread, meaning there is no blocking due to real time processing.
nickjillings@1642 171
nickjillings@1642 172 \subsection{Architecture}\label{sec:architecture}
nickjillings@1642 173
nickjillings@1642 174 The web tool itself is split into several files to operate:
nickjillings@1642 175 \begin{itemize}
nickjillings@1642 176 \item apeTool.html: The main index file to load the scripts, this is the file the browser must request to load
nickjillings@1642 177 \item core.js: Contains functions and objects to manage the audio control, audio objects for testing and loading of files
nickjillings@1642 178 \item ape.js: Parses setup files to create the interface as instructed, following the same style chain as the MATLAB APE Tool.
nickjillings@1642 179 \end{itemize}
nickjillings@1642 180
nickjillings@1642 181 The HTML file loads the core.js file with it along with a few other ancillary files (such as the jQuery javascript extensions), the browser JavaScript begins to execute the on page instructions, which gives the URL of the test setup XML document (outlined in the next section). The core.js parses this document and executes the function in ape.js to build the web page with the given audio files. The reason for separating these two files is to allow for further interface designs (such as Mushra or A-B tests) to be used, which would still require the same underlying core functions outlined in core.js
nickjillings@1642 182
nickjillings@1642 183 The ape.js file has only two main functions: loadInterface(xmlDoc) and interfaceXMLSave(). The first function is called to build the interface once the setup document has been loaded. This includes creating the slider interface to rate the tracks and creating the comment boxes bellow. The bars in the slider ranking at the top of the page are randomly spaced. It also instructs the audio engine in the core.js to create the audio objects. The audio objects are custom built audio nodes built on the web audio API. They consist of a bufferSourceNode (a node which holds a buffer of audio samples for playback) and a gainNode. These are then connected to the audioEngine (itself a custom web audio node) containing a gainNode (where the various audio Objects connect to) for summation before passing the output to the destination Node, a fixed node created where the browser then passes the audio information to the system sound device.
nickjillings@1642 184
nickjillings@1642 185 When an audioObject is created, the URL of the audio sample to load is given to it. This is downloaded into the browser asynchronously using the XMLHttpRequest object. This allows for downloading of any file into the JavaScript environment for further processing. It is particularly useful for the web audio API because it supports downloading of files in their binary form, allowing a perfect copy. Once the asynchronous download is complete, the file is then decoded using the web audio API offline decoder. This uses the browser available decoding schemes to decode the audio files into raw float32 arrays, which are in-turn passed to the relevant audioObject bufferSourceNode for playback.
nickjillings@1642 186
nickjillings@1642 187 Browsers support various audio file formats and are not consistent in any format. One sure format that all browsers support is the WAV format. Although not a compact, web friendly format, most transport systems are of a high enough bandwidth this should not be a problem. However one problem is that of sample rate. On loading, the browser uses the sample rate assigned by the system sound device. The browser does not have the ability to request a different sound rate. Therefore the default operation when an audio file is loaded with a different sample rate to that of the system is to convert the sample rate. To provide a check for this, the desired sample rate can be supplied with the setup XML and checked against. If the sample rates do not match, a browser alert window is shown asking for the sample rate to be correctly adjusted. This happens before any loading or decoding of audio files. Only once the sample rates match will the system actually fetch any files, keeping down requests for the larger files until they are actually needed.
nickjillings@1642 188
nickjillings@1642 189 During playback, the playback nodes loop indefinitely until playback is stopped. The gain nodes in the audioObjects enable dynamic muting of nodes. When a bar in the sliding ranking is clicked, the audio engine mutes all audioObjects and un-mutes the clicked one. Therefore, if the audio samples are perfectly aligned up and of the same sample length, they will remain perfectly aligned with each other.
nickjillings@1642 190
nickjillings@1642 191 \subsection{Setup and Results Formats}\label{sec:setupresultsformats}
nickjillings@1642 192
nickjillings@1642 193 Setup and the results both use the common XML document format to outline the various parameters. The setup file contains all the information needed to initialise a test session. Several Nodes can be defined to outline the audio samples to use, questions to be asked and any pre- or post-test questions or instructions. Having one document to modify allows for quick manipulation in a 'human readable' form to create new tests, or adjust current ones, without needing to edit which web files.
nickjillings@1642 194
nickjillings@1642 195 The results file is dynamically generated by the interface upon clicking the submit button. There will be checks, depending on the setup file, to ensure that all tracks have been evaluated and their positions in the slider moved. The XML returned contains a node per audioObject and contains its rating in the slider and any comments written in its associated comment box. The rating returned is normalised to be within a integer range of 0 to 100. This normalises the pixel representation of different browser windows. If a window for instance is only 1280 wide, reporting its pixel position is not representative to a display with a width of 1920.
nickjillings@1642 196
nickjillings@1642 197 The pre- and post-test options allow for comments or questions to be presented before or after the test. These are automatically generated based upon the given setup XML and allow nearly any form of question and comment to be included in a window on its own. Questions are stored and presented in the response section labelled 'pretest' and 'posttest' along with the question ID and its response. Questions can be made optionally mandatory. Example questions may involve entering mixing experience or listening environment.
nickjillings@1642 198
nickjillings@1642 199 The results will also contain information collected by any defined pre/post questions. These are referenced against the setup XML by using the same ID as well as printing in the same question, so readable responses can be obtained. Future development will also evolve to include any session data, such as the browser the tool was used in, how long the test took and any other metrics. Currently the results files are downloaded on the user side of the browser as a .xml file to be manually returned. However the end goal is to allow the XML files to be submitted over the web to a receiving server to store them, allowing for automated collection.
nickjillings@1642 200
nickjillings@1642 201 Here is an example of the setup XML and the results XML:
nickjillings@1642 202 % Should we include an Example of the input and output XML structure??
nickjillings@1642 203
nickjillings@1642 204 \section{Applications}\label{sec:applications} %?
nickjillings@1642 205 discussion of use of this toolbox (possibly based on a quick mock test using my research data, to be repeated with a large number of participants and more data later)\\
nickjillings@1642 206
nickjillings@1642 207 \subsection{Listening Environment Standardisation}
nickjillings@1642 208
nickjillings@1642 209 In order to reduce the impact of having a non-standardised listening environment and unobservable participants, a series of pre-test standard questions have been put together to ask every participant. The first part of this is that every participant is asked to carry out the test, wherever possible, with a pair of quality headphones.
nickjillings@1642 210
nickjillings@1642 211 \begin{itemize}
nickjillings@1642 212 \item Name (text box)
nickjillings@1642 213 \item I am happy for name to be used in an academic publication (check box)
nickjillings@1642 214 \item First Language (text box)
nickjillings@1642 215 \item Location eg. country, city (text box)
nickjillings@1642 216 \item Playback System (ratio box (Headphones or Speaker))
nickjillings@1642 217 \item Make and Model of Playback System (text box)
nickjillings@1642 218 \item Please assess how good you believe your hearing to be, where 1 is deaf, 10 is professional critical listener (Dropdown box 1-10)
nickjillings@1642 219 \end{itemize}
nickjillings@1642 220
nickjillings@1642 221
nickjillings@1642 222 There are also a series of considerations that have been made towards ensuring there is a standardised listening environment, so it is possible to
nickjillings@1642 223 \begin{itemize}
nickjillings@1642 224 \item Begin with standardised listening test - to confirm listening experience
nickjillings@1642 225 \item Perform loudness equalisation on all tracks
nickjillings@1642 226 \\** OR THIS SHOULD BE DONE BEFORE THE EXPERIMENT
nickjillings@1642 227 \item Randomise order of tests
nickjillings@1642 228 \item Randomise order of tracks in each test
nickjillings@1642 229 \item Repeat each experiment a number of times
nickjillings@1642 230 \\** TO REMOVE THE FAMILIARISATION WITH EXPERIMENT VARIABLE
nickjillings@1642 231 \\** TO ENSURE CONSISTENCY OF USER
nickjillings@1642 232 \item Track all user interactions with system
nickjillings@1642 233 \end{itemize}
nickjillings@1642 234
nickjillings@1642 235
nickjillings@1642 236
nickjillings@1642 237
nickjillings@1642 238
nickjillings@1642 239 \section{Conclusions and future work}\label{sec:conclusions}
nickjillings@1642 240
nickjillings@1642 241 In this paper we have presented an approach to creating a browser-based listening test environment that can be used for a variety of types of perceptual evaluation of audio.
nickjillings@1642 242 Specifically, we discussed the use of the toolbox in the context of assessment of preference for different production practices, with identical source material.
nickjillings@1642 243 The purpose of this paper is to outline the design of this tool, to describe our implementation using basic HTML5 functionality, and to discuss design challenges and limitations of our approach. % or something
nickjillings@1642 244
nickjillings@1642 245 % future work
nickjillings@1642 246 Further work may include the development of other common test designs, such as [...], and [...]. In addition, [...].
nickjillings@1642 247
nickjillings@1642 248 \begin{itemize}
nickjillings@1642 249 \item Options for MUSHRA style experiment with vertical slide per track, APE style experiment where all tracks are on a single horizontal axis, or AB test
nickjillings@1642 250 \end{itemize}
nickjillings@1642 251
nickjillings@1642 252
nickjillings@1642 253 ...
nickjillings@1642 254
nickjillings@1642 255 The source code of this tool can be found on \url{code.soundsoftware.ac.uk/projects/browserevaluationtool}.
nickjillings@1642 256
nickjillings@1642 257
nickjillings@1642 258 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
nickjillings@1642 259 %bibliography here
nickjillings@1642 260 \bibliography{smc2015template}
nickjillings@1642 261
nickjillings@1642 262
nickjillings@1642 263
nickjillings@1642 264 \end{document}
nickjillings@1642 265
nickjillings@1642 266
nickjillings@1642 267
nickjillings@1642 268 % RUBBISH
nickjillings@1642 269
nickjillings@1642 270 %\subsection{Equations}
nickjillings@1642 271 %Equations of importance,
nickjillings@1642 272 %or to which you refer later,
nickjillings@1642 273 %should be placed on separated lines and numbered.
nickjillings@1642 274 %The number should be on the right side, in parentheses.
nickjillings@1642 275 %\begin{equation}
nickjillings@1642 276 %E=mc^{2+\delta}.
nickjillings@1642 277 %\label{eq:Emc2}
nickjillings@1642 278 %\end{equation}
nickjillings@1642 279 %Refer to equations like so:
nickjillings@1642 280 %As (\ref{eq:Emc2}) shows,
nickjillings@1642 281 %I do not completely trust Special Relativity.
nickjillings@1642 282 %
nickjillings@1642 283 %\subsection{Figures, Tables and Captions}
nickjillings@1642 284 %\begin{table}[t]
nickjillings@1642 285 % \begin{center}
nickjillings@1642 286 % \begin{tabular}{|l|l|}
nickjillings@1642 287 % \hline
nickjillings@1642 288 % String value & Numeric value \\
nickjillings@1642 289 % \hline
nickjillings@1642 290 % Hej SMC & 2015 \\
nickjillings@1642 291 % \hline
nickjillings@1642 292 % \end{tabular}
nickjillings@1642 293 %\end{center}
nickjillings@1642 294 % \caption{Table captions should be placed below the table, exactly like this,
nickjillings@1642 295 % but using words different from these.}
nickjillings@1642 296 % \label{tab:example}
nickjillings@1642 297 %\end{table}
nickjillings@1642 298
nickjillings@1642 299 %\begin{figure}[t]
nickjillings@1642 300 %\figbox{
nickjillings@1642 301 %\subfloat[][]{\includegraphics[width=60mm]{figure}\label{fig:subfigex_a}}\\
nickjillings@1642 302 %\subfloat[][]{\includegraphics[width=80mm]{figure}\label{fig:subfigex_b}}
nickjillings@1642 303 %}
nickjillings@1642 304 %\caption{Here's an example using the subfig package.\label{fig:subfigex} }
nickjillings@1642 305 %\end{figure}
nickjillings@1642 306
nickjillings@1642 307
nickjillings@1642 308
nickjillings@1642 309
nickjillings@1642 310
nickjillings@1642 311 %\begin{acknowledgments}
nickjillings@1642 312 %You may acknowledge people, projects,
nickjillings@1642 313 %funding agencies, etc.
nickjillings@1642 314 %which can be included after the second-level heading
nickjillings@1642 315 %``Acknowledgments'' (with no numbering).
nickjillings@1642 316 %\end{acknowledgments}
nickjillings@1642 317