webaudioevaluationtool: docs/SMC15/smc2015template.tex annotate

annotate docs/SMC15/smc2015template.tex @ 694:869ed636f7c0

Edit to project Spec Doc

author	Dave Moffat <djmoffat@users.noreply.github.com>
date	Thu, 09 Apr 2015 16:30:08 +0100
parents	a74cb47e779c
children	b95d1ede4c91

rev	line source
djmoffat@693	1 % -----------------------------------------------
djmoffat@693	2 % Template for SMC 2012
djmoffat@693	3 % adapted from the template for SMC 2011, which was adapted from that of SMC 2010
djmoffat@693	4 % -----------------------------------------------
djmoffat@693	5
djmoffat@693	6 \documentclass{article}
djmoffat@693	7 \usepackage{smc2015}
djmoffat@693	8 \usepackage{times}
djmoffat@693	9 \usepackage{ifpdf}
djmoffat@693	10 \usepackage[english]{babel}
djmoffat@693	11 \usepackage{cite}
djmoffat@693	12
djmoffat@693	13 %%%%%%%%%%%%%%%%%%%%%%%% Some useful packages %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
djmoffat@693	14 %%%%%%%%%%%%%%%%%%%%%%%% See related documentation %%%%%%%%%%%%%%%%%%%%%%%%%%
djmoffat@693	15 %\usepackage{amsmath} % popular packages from Am. Math. Soc. Please use the
djmoffat@693	16 %\usepackage{amssymb} % related math environments (split, subequation, cases,
djmoffat@693	17 %\usepackage{amsfonts}% multline, etc.)
djmoffat@693	18 %\usepackage{bm} % Bold Math package, defines the command \bf{}
djmoffat@693	19 %\usepackage{paralist}% extended list environments
djmoffat@693	20 %%subfig.sty is the modern replacement for subfigure.sty. However, subfig.sty
djmoffat@693	21 %%requires and automatically loads caption.sty which overrides class handling
djmoffat@693	22 %%of captions. To prevent this problem, preload caption.sty with caption=false
djmoffat@693	23 %\usepackage[caption=false]{caption}
djmoffat@693	24 %\usepackage[font=footnotesize]{subfig}
djmoffat@693	25
djmoffat@693	26
djmoffat@693	27 %user defined variables
djmoffat@694	28 \def\papertitle{APE FOR WEB: A BROWSER-BASED EVALUATION TOOL FOR AUDIO} %?
djmoffat@694	29 \def\firstauthor{Nicholas Jillings}
djmoffat@694	30 \def\secondauthor{Brecht De Man}
djmoffat@693	31 \def\thirdauthor{David Moffat}
djmoffat@693	32 \def\fourthauthor{Joshua D. Reiss}
djmoffat@693	33
djmoffat@693	34 % adds the automatic
djmoffat@693	35 % Saves a lot of ouptut space in PDF... after conversion with the distiller
djmoffat@693	36 % Delete if you cannot get PS fonts working on your system.
djmoffat@693	37
djmoffat@693	38 % pdf-tex settings: detect automatically if run by latex or pdflatex
djmoffat@693	39 \newif\ifpdf
djmoffat@693	40 \ifx\pdfoutput\relax
djmoffat@693	41 \else
djmoffat@693	42 \ifcase\pdfoutput
djmoffat@693	43 \pdffalse
djmoffat@693	44 \else
djmoffat@693	45 \pdftrue
djmoffat@693	46 \fi
djmoffat@693	47
djmoffat@693	48 \ifpdf % compiling with pdflatex
djmoffat@693	49 \usepackage[pdftex,
djmoffat@693	50 pdftitle={\papertitle},
djmoffat@693	51 pdfauthor={\firstauthor, \secondauthor, \thirdauthor},
djmoffat@693	52 bookmarksnumbered, % use section numbers with bookmarks
djmoffat@693	53 pdfstartview=XYZ % start with zoom=100% instead of full screen;
djmoffat@693	54 % especially useful if working with a big screen :-)
djmoffat@693	55 ]{hyperref}
djmoffat@693	56 %\pdfcompresslevel=9
djmoffat@693	57
djmoffat@693	58 \usepackage[pdftex]{graphicx}
djmoffat@693	59 % declare the path(s) where your graphic files are and their extensions so
djmoffat@693	60 %you won't have to specify these with every instance of \includegraphics
djmoffat@693	61 \graphicspath{{./figures/}}
djmoffat@693	62 \DeclareGraphicsExtensions{.pdf,.jpeg,.png}
djmoffat@693	63
djmoffat@693	64 \usepackage[figure,table]{hypcap}
djmoffat@693	65
djmoffat@693	66 \else % compiling with latex
djmoffat@693	67 \usepackage[dvips,
djmoffat@693	68 bookmarksnumbered, % use section numbers with bookmarks
djmoffat@693	69 pdfstartview=XYZ % start with zoom=100% instead of full screen
djmoffat@693	70 ]{hyperref} % hyperrefs are active in the pdf file after conversion
djmoffat@693	71
djmoffat@693	72 \usepackage[dvips]{epsfig,graphicx}
djmoffat@693	73 % declare the path(s) where your graphic files are and their extensions so
djmoffat@693	74 %you won't have to specify these with every instance of \includegraphics
djmoffat@693	75 \graphicspath{{./figures/}}
djmoffat@693	76 \DeclareGraphicsExtensions{.eps}
djmoffat@693	77
djmoffat@693	78 \usepackage[figure,table]{hypcap}
djmoffat@693	79 \fi
djmoffat@693	80
djmoffat@693	81 %setup the hyperref package - make the links black without a surrounding frame
djmoffat@693	82 \hypersetup{
djmoffat@693	83 colorlinks,%
djmoffat@693	84 citecolor=black,%
djmoffat@693	85 filecolor=black,%
djmoffat@693	86 linkcolor=black,%
djmoffat@693	87 urlcolor=black
djmoffat@693	88 }
djmoffat@693	89
djmoffat@693	90
djmoffat@693	91 % Title.
djmoffat@693	92 % ------
djmoffat@693	93 \title{\papertitle}
djmoffat@693	94
djmoffat@693	95 % Authors
djmoffat@693	96 % Please note that submissions are NOT anonymous, therefore
djmoffat@693	97 % authors' names have to be VISIBLE in your manuscript.
djmoffat@693	98 %
djmoffat@693	99 % Single address
djmoffat@693	100 % To use with only one author or several with the same address
djmoffat@693	101 % ---------------
djmoffat@693	102 %\oneauthor
djmoffat@693	103 % {\firstauthor} {Affiliation1 \\ %
djmoffat@693	104 % {\tt \href{mailto:author1@smcnetwork.org}{author1@smcnetwork.org}}}
djmoffat@693	105
djmoffat@693	106 %Two addresses
djmoffat@693	107 %--------------
djmoffat@693	108 % \twoauthors
djmoffat@693	109 % {\firstauthor} {Affiliation1 \\ %
djmoffat@693	110 % {\tt \href{mailto:author1@smcnetwork.org}{author1@smcnetwork.org}}}
djmoffat@693	111 % {\secondauthor} {Affiliation2 \\ %
djmoffat@693	112 % {\tt \href{mailto:author2@smcnetwork.org}{author2@smcnetwork.org}}}
djmoffat@693	113
djmoffat@694	114
djmoffat@694	115
djmoffat@694	116 % FIX!!!
djmoffat@693	117 \fourauthors
djmoffat@693	118 {\firstauthor} {%Affiliation1 \\
djmoffat@694	119 {\tt \href{mailto:b.deman@qmul.ac.uk}{n.g.r.jillings@se14.qmul.ac.uk, }}}
djmoffat@693	120 {\secondauthor} {%Affiliation2\\ %
djmoffat@694	121 {\tt \href{mailto:n.g.r.jillings@se14.qmul.ac.uk}{\{b.deman,}}}
djmoffat@693	122 {\thirdauthor} {%Affiliation3\\ %
djmoffat@694	123 {\tt \href{mailto:d.j.moffat@qmul.ac.uk}{d.j.moffat, }}}
djmoffat@693	124 {\fourthauthor} {%Affiliation4\\ %
djmoffat@694	125 {\tt \href{mailto:joshua.reiss@qmul.ac.uk}{joshua.reiss\}@qmul.ac.uk}}}
djmoffat@693	126
djmoffat@693	127 % *************************************** the document starts here *************
djmoffat@693	128 \begin{document}
djmoffat@693	129 %
djmoffat@693	130 \capstartfalse
djmoffat@693	131 \maketitle
djmoffat@693	132 \capstarttrue
djmoffat@693	133 %
djmoffat@693	134 \begin{abstract}
djmoffat@693	135 Place your abstract at the top left column on the first page.
djmoffat@693	136 Please write about 150-200 words that specifically highlight the purpose of your work,
djmoffat@693	137 its context, and provide a brief synopsis of your results.
djmoffat@694	138 Avoid equations in this part.\\
djmoffat@694	139 TOTAL PAPER: Minimum 4 pages, 6 preferred, max. 8 (6 for demos/posters)\\
djmoffat@693	140 \end{abstract}
djmoffat@693	141 %
djmoffat@693	142
djmoffat@693	143 \section{Introduction}\label{sec:introduction}
djmoffat@693	144
djmoffat@694	145 background (types of research where this type of perceptual evaluation of audio is relevant)\\
djmoffat@694	146
djmoffat@694	147 multiple stimulus perceptual evaluation (reference to Bech etc.)\\
djmoffat@694	148
djmoffat@694	149 prior work: \cite{deman2014b} in MATLAB, much less easy to deploy, and often stops working due to version updates \\
djmoffat@694	150
djmoffat@693	151 goal, what are we trying to do? \\
djmoffat@693	152
djmoffat@694	153 [Previously, due to limited functionality of HTML, ..., it was not possible to design this type of interfaces with such high quality audio... ]
djmoffat@693	154
djmoffat@693	155
djmoffat@694	156 \section{Design considerations}\label{sec:designconsiderations}
djmoffat@693	157
djmoffat@694	158 We present a browser-based perceptual evaluation tool for audio that ... \\
djmoffat@693	159
djmoffat@694	160 see \cite{deman2014b}: requirements informed by research on music production (see my work and that of others' in the group), such as randomisation, playback of high quality audio, some degree of flexibility in terms of configuration, ... \\
djmoffat@694	161
djmoffat@694	162
djmoffat@694	163 \section{Implementation}\label{sec:implementation}
djmoffat@694	164 %[Nick???]
djmoffat@694	165
djmoffat@694	166 %section on overall architecture\\
djmoffat@694	167
djmoffat@694	168 %section with overview of the structure of the input and output files, perhaps with graph or table
djmoffat@694	169
djmoffat@694	170 The tool runs entirely inside the browser through the new HTML5 Web Audio API. The API is supported by most major web browsers (except Internet Explorer) and allows for constructing a chain of audio processing elements to produce a high quality, real time signal process to manipulate audio streams. The API supports multi-channel processing and has an accurate playback timer for precise scheduled playback control. The web audio API is controlled through the browser JavaScript and is therefore highly controllable. The Web Audio API processing is all controlled in a separate thread to the main JavaScript thread, meaning there is no blocking due to real time processing.
djmoffat@694	171
djmoffat@694	172 \subsection{Architecture}\label{sec:architecture}
djmoffat@694	173
djmoffat@694	174 The web tool itself is split into several files to operate:
djmoffat@694	175 \begin{itemize}
djmoffat@694	176 \item apeTool.html: The main index file to load the scripts, this is the file the browser must request to load
djmoffat@694	177 \item core.js: Contains functions and objects to manage the audio control, audio objects for testing and loading of files
djmoffat@694	178 \item ape.js: Parses setup files to create the interface as instructed, following the same style chain as the MATLAB APE Tool.
djmoffat@694	179 \end{itemize}
djmoffat@694	180
djmoffat@694	181 The HTML file loads the core.js file with it along with a few other ancillary files (such as the jQuery javascript extensions), the browser JavaScript begins to execute the on page instructions, which gives the URL of the test setup XML document (outlined in the next section). The core.js parses this document and executes the function in ape.js to build the web page with the given audio files. The reason for separating these two files is to allow for further interface designs (such as Mushra or A-B tests) to be used, which would still require the same underlying core functions outlined in core.js
djmoffat@694	182
djmoffat@694	183 The ape.js file has only two main functions: loadInterface(xmlDoc) and interfaceXMLSave(). The first function is called to build the interface once the setup document has been loaded. This includes creating the slider interface to rate the tracks and creating the comment boxes bellow. The bars in the slider ranking at the top of the page are randomly spaced. It also instructs the audio engine in the core.js to create the audio objects. The audio objects are custom built audio nodes built on the web audio API. They consist of a bufferSourceNode (a node which holds a buffer of audio samples for playback) and a gainNode. These are then connected to the audioEngine (itself a custom web audio node) containing a gainNode (where the various audio Objects connect to) for summation before passing the output to the destination Node, a fixed node created where the browser then passes the audio information to the system sound device.
djmoffat@694	184
djmoffat@694	185 When an audioObject is created, the URL of the audio sample to load is given to it. This is downloaded into the browser asynchronously using the XMLHttpRequest object. This allows for downloading of any file into the JavaScript environment for further processing. It is particularly useful for the web audio API because it supports downloading of files in their binary form, allowing a perfect copy. Once the asynchronous download is complete, the file is then decoded using the web audio API offline decoder. This uses the browser available decoding schemes to decode the audio files into raw float32 arrays, which are in-turn passed to the relevant audioObject bufferSourceNode for playback.
djmoffat@694	186
djmoffat@694	187 Browsers support various audio file formats and are not consistent in any format. One sure format that all browsers support is the WAV format. Although not a compact, web friendly format, most transport systems are of a high enough bandwidth this should not be a problem. However one problem is that of sample rate. On loading, the browser uses the sample rate assigned by the system sound device. The browser does not have the ability to request a different sound rate. Therefore the default operation when an audio file is loaded with a different sample rate to that of the system is to convert the sample rate. To provide a check for this, the desired sample rate can be supplied with the setup XML and checked against. If the sample rates do not match, a browser alert window is shown asking for the sample rate to be correctly adjusted. This happens before any loading or decoding of audio files. Only once the sample rates match will the system actually fetch any files, keeping down requests for the larger files until they are actually needed.
djmoffat@694	188
djmoffat@694	189 During playback, the playback nodes loop indefinitely until playback is stopped. The gain nodes in the audioObjects enable dynamic muting of nodes. When a bar in the sliding ranking is clicked, the audio engine mutes all audioObjects and un-mutes the clicked one. Therefore, if the audio samples are perfectly aligned up and of the same sample length, they will remain perfectly aligned with each other.
djmoffat@694	190
djmoffat@694	191 \subsection{Setup and Results Formats}\label{sec:setupresultsformats}
djmoffat@694	192
djmoffat@694	193 Setup and the results both use the common XML document format to outline the various parameters. The setup file contains all the information needed to initialise a test session. Several Nodes can be defined to outline the audio samples to use, questions to be asked and any pre- or post-test questions or instructions. Having one document to modify allows for quick manipulation in a 'human readable' form to create new tests, or adjust current ones, without needing to edit which web files.
djmoffat@694	194
djmoffat@694	195 The results file is dynamically generated by the interface upon clicking the submit button. There will be checks, depending on the setup file, to ensure that all tracks have been evaluated and their positions in the slider moved. The XML returned contains a node per audioObject and contains its rating in the slider and any comments written in its associated comment box. The rating returned is normalised to be within a integer range of 0 to 100. This normalises the pixel representation of different browser windows. If a window for instance is only 1280 wide, reporting its pixel position is not representative to a display with a width of 1920.
djmoffat@694	196
djmoffat@694	197 The pre- and post-test options allow for comments or questions to be presented before or after the test. These are automatically generated based upon the given setup XML and allow nearly any form of question and comment to be included in a window on its own. Questions are stored and presented in the response section labelled 'pretest' and 'posttest' along with the question ID and its response. Questions can be made optionally mandatory. Example questions may involve entering mixing experience or listening environment.
djmoffat@694	198
djmoffat@694	199 The results will also contain information collected by any defined pre/post questions. These are referenced against the setup XML by using the same ID as well as printing in the same question, so readable responses can be obtained. Future development will also evolve to include any session data, such as the browser the tool was used in, how long the test took and any other metrics. Currently the results files are downloaded on the user side of the browser as a .xml file to be manually returned. However the end goal is to allow the XML files to be submitted over the web to a receiving server to store them, allowing for automated collection.
djmoffat@694	200
djmoffat@694	201 Here is an example of the setup XML and the results XML:
djmoffat@694	202 % Should we include an Example of the input and output XML structure??
djmoffat@694	203
djmoffat@694	204 \section{Applications}\label{sec:applications} %?
djmoffat@694	205
djmoffat@694	206 \subsection{Listening Environment Standardisation}
djmoffat@694	207
djmoffat@694	208
djmoffat@694	209 discussion of use of this toolbox (possibly based on a quick mock test using my research data, to be repeated with a large number of participants and more data later)\\
djmoffat@694	210
djmoffat@694	211
djmoffat@694	212 \section{Conclusions and future work}\label{sec:conclusions}
djmoffat@694	213
djmoffat@694	214 In this paper we have presented an approach to creating a browser-based listening test environment that can be used for a variety of types of perceptual evaluation of audio.
djmoffat@694	215 Specifically, we discussed the use of the toolbox in the context of assessment of preference for different production practices, with identical source material.
djmoffat@694	216 The purpose of this paper is to outline the design of this tool, to describe our implementation using basic HTML5 functionality, and to discuss design challenges and limitations of our approach. % or something
djmoffat@694	217
djmoffat@694	218 % future work
djmoffat@694	219 Further work may include the development of other common test designs, such as [...], and [...]. In addition, [...].
djmoffat@694	220
djmoffat@694	221 ...
djmoffat@694	222
djmoffat@694	223 The source code of this tool can be found on \url{code.soundsoftware.ac.uk/projects/browserevaluationtool}.
djmoffat@694	224
djmoffat@694	225
djmoffat@694	226 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
djmoffat@694	227 %bibliography here
djmoffat@694	228 \bibliography{smc2015template}
djmoffat@694	229
djmoffat@694	230
djmoffat@694	231
djmoffat@694	232 \end{document}
djmoffat@694	233
djmoffat@694	234
djmoffat@694	235
djmoffat@694	236 % RUBBISH
djmoffat@693	237
djmoffat@693	238 %\subsection{Equations}
djmoffat@693	239 %Equations of importance,
djmoffat@693	240 %or to which you refer later,
djmoffat@693	241 %should be placed on separated lines and numbered.
djmoffat@693	242 %The number should be on the right side, in parentheses.
djmoffat@693	243 %\begin{equation}
djmoffat@693	244 %E=mc^{2+\delta}.
djmoffat@693	245 %\label{eq:Emc2}
djmoffat@693	246 %\end{equation}
djmoffat@693	247 %Refer to equations like so:
djmoffat@693	248 %As (\ref{eq:Emc2}) shows,
djmoffat@693	249 %I do not completely trust Special Relativity.
djmoffat@693	250 %
djmoffat@693	251 %\subsection{Figures, Tables and Captions}
djmoffat@693	252 %\begin{table}[t]
djmoffat@693	253 % \begin{center}
djmoffat@693	254 % \begin{tabular}{\|l\|l\|}
djmoffat@693	255 % \hline
djmoffat@693	256 % String value & Numeric value \\
djmoffat@693	257 % \hline
djmoffat@693	258 % Hej SMC & 2015 \\
djmoffat@693	259 % \hline
djmoffat@693	260 % \end{tabular}
djmoffat@693	261 %\end{center}
djmoffat@693	262 % \caption{Table captions should be placed below the table, exactly like this,
djmoffat@693	263 % but using words different from these.}
djmoffat@693	264 % \label{tab:example}
djmoffat@693	265 %\end{table}
djmoffat@693	266
djmoffat@693	267 %\begin{figure}[t]
djmoffat@693	268 %\figbox{
djmoffat@693	269 %\subfloat[][]{\includegraphics[width=60mm]{figure}\label{fig:subfigex_a}}\\
djmoffat@693	270 %\subfloat[][]{\includegraphics[width=80mm]{figure}\label{fig:subfigex_b}}
djmoffat@693	271 %}
djmoffat@693	272 %\caption{Here's an example using the subfig package.\label{fig:subfigex} }
djmoffat@693	273 %\end{figure}
djmoffat@693	274
djmoffat@693	275
djmoffat@694	276
djmoffat@693	277
djmoffat@693	278
djmoffat@693	279 %\begin{acknowledgments}
djmoffat@693	280 %You may acknowledge people, projects,
djmoffat@693	281 %funding agencies, etc.
djmoffat@693	282 %which can be included after the second-level heading
djmoffat@693	283 %``Acknowledgments'' (with no numbering).
djmoffat@693	284 %\end{acknowledgments}
djmoffat@693	285

Mercurial > hg > webaudioevaluationtool

annotate docs/SMC15/smc2015template.tex @ 694:869ed636f7c0