annotate musicweb.tex @ 8:d4d732b8b9cb

intro
author mariano
date Fri, 29 Apr 2016 09:37:29 +0100
parents 1b88c2531512
children 9866ea2d3b9a
rev   line source
alo@0 1 \documentclass{llncs}
alo@0 2 \usepackage{graphicx}
alo@0 3
alo@0 4 \usepackage{amsmath,cite}
alo@0 5 \usepackage{pifont}
alo@0 6 \usepackage{listings}
alo@0 7 \usepackage{courier}
alo@0 8 \usepackage{adjustbox}
alo@0 9 \usepackage{url}
alo@0 10 \usepackage[ngerman,english]{babel}
alo@0 11 \usepackage[utf8]{inputenc}
alo@0 12 \newcommand{\cmark}{\fontsize{14}{14}\textbullet\selectfont}
alo@0 13 \usepackage[usenames,dvipsnames]{color}
alo@0 14
alo@0 15 \lstdefinelanguage{sparql} {
alo@0 16 morekeywords={SELECT, WHERE, a, COUNT, GROUP, ORDER, BY, HAVING, as, DISTINCT, OPTIONAL},
alo@0 17 sensitive=true,
alo@0 18 morecomment=[l][\color{ForestGreen}\bfseries\selectfont]{\#\ },
alo@0 19 moredelim=[s][\color{ForestGreen}\bfseries\selectfont]{?}{\ }, %variable
alo@0 20 moredelim=[s][\color{NavyBlue}\bfseries\selectfont]{@}{\ }, %prefix
alo@0 21 moredelim=[s][\color{OrangeRed}\bfseries\selectfont]{<}{>}, %red URIs
alo@0 22 morestring=[b][\color{ForestGreen}]\", %green strings
alo@0 23 morestring=[b]",
alo@0 24 }
alo@0 25
alo@0 26 \lstdefinestyle{sparql}{
alo@0 27 language=sparql,
alo@0 28 basicstyle=\footnotesize\ttfamily\bfseries,
alo@0 29 % basicstyle=\ttfamily,
alo@0 30 keywordstyle=\color{blue}\bfseries,
alo@0 31 identifierstyle=,
alo@0 32 commentstyle=\color{ForestGreen}\bfseries,
alo@0 33 stringstyle=\color{BlueGreen}\ttfamily,
alo@0 34 showstringspaces=false,
alo@0 35 emph={context},emphstyle=\color{BrickRed}\bfseries,
alo@0 36 frame = lines,
alo@0 37 %aboveskip = 15pt,
alo@0 38 %framexbottommargin = 5pt,
alo@0 39 %framextopmargin = 5pt,
alo@0 40 aboveskip = 10pt,
alo@0 41 framexbottommargin = 2pt,
alo@0 42 framextopmargin = 2pt,
alo@0 43 captionpos=b,
alo@0 44 escapechar=~,
alo@0 45 breaklines=true,
alo@0 46 breakatwhitespace=true,
alo@0 47 breakindent=20pt,
alo@0 48 xleftmargin=5pt,
alo@0 49 xrightmargin=5pt,
alo@0 50 basewidth={0.55em,0.45em},
alo@0 51 %basewidth={0.50em,0.6em},
alo@0 52 fontadjust=true,
alo@0 53 % lineskip={-1.5pt},
alo@0 54 % columns=[c]spaceflexible, %make the long artist URI fit
alo@0 55 %float = h!,
alo@0 56 }
alo@0 57
alo@0 58 \renewcommand{\lstlistingname}{{\bf Listing}}
alo@0 59
alo@0 60
alo@0 61 \lstdefinelanguage{ttl} {
alo@0 62 morekeywords={a},
alo@0 63 sensitive=true,
alo@0 64 % morecomment=[l][\color{ForestGreen}\bfseries\fontsize{10}{2}\selectfont]{\#\ },
alo@0 65 % moredelim=[s][\color{ForestGreen}\bfseries\fontsize{10}{2}\selectfont]{\#\ }{\ },
alo@0 66 % moredelim=[s][\color{NavyBlue}\bfseries\fontsize{10}{2}\selectfont]{@}{\ }, %prefix
alo@0 67 % moredelim=[s][\color{OrangeRed}\bfseries\fontsize{10}{2}\selectfont]{<}{>}, %red URIs
alo@0 68 morecomment=[l][\color{ForestGreen}\ttfamily\bfseries\selectfont]{\#\ },
alo@0 69 moredelim=[s][\color{NavyBlue}\ttfamily\bfseries\selectfont]{@}{\ }, %prefix
alo@0 70 moredelim=[s][\color{OrangeRed}\ttfamily\bfseries\selectfont]{<}{>}, %red URIs
alo@0 71 morestring=[b][\color{ForestGreen}]\", %green strings
alo@0 72 morestring=[b]",
alo@0 73 }
alo@0 74
alo@0 75 \lstdefinestyle{ttl}{
alo@0 76 language=ttl,
alo@0 77 basicstyle=\footnotesize\ttfamily\bfseries,
alo@0 78 keywordstyle=\color{blue}\bfseries,
alo@0 79 identifierstyle=,
alo@0 80 commentstyle=\color{ForestGreen}\bfseries,
alo@0 81 stringstyle=\color{BlueGreen}\bfseries,
alo@0 82 showstringspaces=false,
alo@0 83 emph={context},emphstyle=\color{BrickRed}\bfseries,
alo@0 84 frame = lines,
alo@0 85 framexbottommargin = 5pt,
alo@0 86 framextopmargin = 5pt,
alo@0 87 captionpos=b,
alo@0 88 escapechar=~,
alo@0 89 breaklines=true,
alo@0 90 breakatwhitespace=true,
alo@0 91 breakindent=20pt,
alo@0 92 aboveskip = 15pt,
alo@0 93 xleftmargin=5pt,
alo@0 94 xrightmargin=5pt,
alo@0 95 basewidth={0.55em,0.45em},
alo@0 96 % basewidth={0.50em,0.6em},
alo@0 97 fontadjust=true,
alo@0 98 lineskip={-1.5pt},
alo@0 99 % columns=[c]spaceflexible, %make the long artist URI fit
alo@0 100 % float = h!,
alo@0 101 }
alo@0 102
alo@0 103 \lstdefinelanguage{json} {
alo@0 104 sensitive=true,
alo@0 105 %morecomment=[l]{@},
alo@0 106 moredelim=[s][\color{ForestGreen}]{?}{\ }, %green variables
alo@0 107 moredelim=[s][\color{OrangeRed}\fontsize{7}{2}\selectfont]{<}{>}, %red URIs
alo@0 108 morestring=[b][\color{Gray}]\",
alo@0 109 morestring=[b]",
alo@0 110 }
alo@0 111
alo@0 112 \lstdefinestyle{json}{
alo@0 113 language=json,
alo@0 114 keywords={type,context},
alo@0 115 basicstyle=\fontsize{7}{8}\bfseries\ttfamily,
alo@0 116 keywordstyle=\color{blue}\bfseries,
alo@0 117 identifierstyle=,
alo@0 118 commentstyle=\color{Gray}\bfseries,
alo@0 119 stringstyle=\color{OliveGreen}\ttfamily,
alo@0 120 showstringspaces=false,
alo@0 121 emph={context},emphstyle=\color{BrickRed}\bfseries,
alo@0 122 frame = lines,
alo@0 123 framexbottommargin = 5pt,
alo@0 124 framextopmargin = 5pt,
alo@0 125 tabsize=4,
alo@0 126 captionpos=b,
alo@0 127 escapechar=~,
alo@0 128 breaklines=false,
alo@0 129 xleftmargin=5pt,
alo@0 130 xrightmargin=5pt,
alo@0 131 basewidth={0.50em,0.45em},
alo@0 132 %basewidth={0.50em,0.6em},
alo@0 133 fontadjust=true,
alo@0 134 columns=[c]spaceflexible, %make the long artist URI fit
alo@0 135 float = ht,
alo@0 136 }
alo@0 137
alo@0 138 \renewcommand{\labelitemi}{$\bullet$}
alo@0 139
alo@0 140 \begin{document}
alo@0 141
alo@1 142 \mainmatter
alo@1 143
alo@3 144 \title{MusicWeb: an open linked semantic platform for music metadata}
alo@1 145
alo@1 146 \author{Mariano Mora-Mcginity \and Alo Allik \and Gy\"orgy Fazekas \and Mark Sandler }
alo@1 147 %
alo@1 148
alo@1 149 \institute{Queen Mary University of London, \\
alo@1 150 \email{\{m.mora-mcginity, a.allik, g.fazekas, mark.sandler\}@qmul.ac.uk}}
alo@1 151
alo@1 152 \maketitle
alo@0 153
alo@1 154 \begin{abstract}
alo@1 155
gyorgyf@2 156 % MusicWeb is a web site that provides users a browsing, searching and linking platform of music artist and group information by integrating open linked semantic metadata from various Semantic Web, music recommendation and social media data sources, including DBpedia.org, sameas.org, MusicBrainz, the Music Ontology, Last.FM, Youtube, and Echonest. The front portal includes suggested links to selected artists and a search functionality from where users can navigate to individual artists pages. Each artist page contains a biography, links to online audio and a video player with a side menu displaying a selection of Youtube videos. Further it provides lists of YAGO categories linking each artist to other artists by various commonalities such as style, geographical location, instrumentation, record label as well as more obscure categories, for example, artists who have received the same award, have shared the same fate, or belonged to the same organisation or religion. The artist connections are further enhanced by thematic analysis of journal articles and blog posts as well as content-based music information retrieval similarity measures.
gyorgyf@2 157
gyorgyf@2 158 This paper presents MusicWeb, a novel platform for linking music artists within a web-based application for discovering connections between them. MusicWeb provides a browsing experience using connections that are either extra-musical or tangential to music, such as the artists' political affiliation or social influence, or intra-musical, such as the artists' main instrument or most favoured musical key. The platform integrates open linked semantic metadata from various Semantic Web, music recommendation and social media data sources including DBpedia.org, sameas.org, MusicBrainz, the Music Ontology, Last.FM and Youtube as well as content-derived information. The front portal includes suggested links to selected artists and a search functionality from where users can navigate to individual artists pages. Each artist page contains a biography and links to online audio and a video resources. Connections are made using YAGO categories linking artist by various commonalities such as style, geographical location, instrumentation, record label as well as more obscure categories, for instance, artists who have received the same award, have shared the same fate, or belonged to the same organisation or religion. These connections are further enhanced by thematic analysis of journal articles and blog posts as well as content-based similarity measures focussing on high level musical categories.
alo@0 159
alo@1 160 \keywords{Semantic Web, Linked Open Data, music metadata, semantic audio analysis, music information retrieval }
alo@1 161 \end{abstract}
alo@1 162
alo@0 163 \section{Introduction}\label{sec:introduction}
mariano@8 164 In recent years we have witnessed an explosion of information, a consequence of millions of users producing and consuming web resources. Researchers and industry have recognised the potential of this data, and have endeavoured to develop methods to handle such a vast amount of information: to understand and manage it, to transform into knowledge. Multimedia content providers have devoted a lot of energy to analysing consumer preference, in an effort to offer customised user experiences. Music stream services, for instance, carry out extensive analysis trying to identify patterns in user's listening habits, and researchers are striving to refine multimedia recommendation algorithms. There are two main approaches to music recommendation\cite{Song2012}: the first is known as \emph{collaborative filtering}\cite{Su2009}, which recommends music items based on the choices of similar users. There are, however, limitations in user-preference based systems: recommendations based solely on user preference can easily lead to a ''rich-club phenomenon''\cite{Zhou2004}, in which short-tail popular music is heavily reinforced whereas most of the music available online is ignored and remains unknown\cite{Celma2010}. The second most significant model of music recommendation is based on audio content analysis, or \emph{music information retrieval}. This analysis extracts low to high-level audio features such as tempo, key, metric structure, melodic and harmonic sequences, instrument recognition and song segmentation, which are then used to measure music similarity\cite{Aucoutourier2002}, to carry out genre classification or to identify the mood of the song\cite{Kim2010}. Music discovery websites such as Last.fm\footnote{http://www.last.fm}, Allmusic\footnote{http://www.allmusic.com} or Pandora\footnote{http://www.pandora.com} have successfully developed hybrid systems which combine both approaches.
mariano@8 165
mariano@4 166 \begin{itemize}
mariano@8 167 \item NOTE: The problem with this is that it does not offer music \emph{discovery}!
mariano@8 168 \item Music metadata can improve this
mariano@8 169 \item Pachet's patper on metadata identifies three different kinds of music metadata
mariano@4 170 \begin{itemize}
mariano@8 171 \item Editorial metadata
mariano@8 172 \item Cultural metadata
mariano@8 173 \item Acoustic metadata
mariano@4 174 \end{itemize}
mariano@4 175 \end{itemize}
mariano@5 176
mariano@8 177
mariano@8 178
mariano@4 179 \section{Background}\label{sec:background}
mariano@4 180 \begin{itemize}
mariano@4 181 \item Information management
mariano@4 182 \item Some references to semantic web audio
mariano@4 183 \item Linked musicians: echonest, musicbrainz
mariano@4 184 \item Smart music
alo@0 185
mariano@4 186 \end{itemize}
mariano@6 187
alo@1 188 \section{MusicWeb: Yago linking}\label{sec:yago}
alo@0 189
alo@1 190 \section{MUSIC: linking by topic}\label{sec:music}
mariano@4 191 \begin{itemize}
mariano@4 192 \item Semantic analysis\cite{Landauer1998}
mariano@4 193 \item Topic modeling\cite{Blei2012}
mariano@4 194 \item Entity recognition
mariano@4 195 \item Hierarchical bayesian modeling
mariano@4 196 \item Authors, journals, keywords, tags
mariano@4 197
mariano@4 198 \end{itemize}
alo@1 199 \section{Content-based information retrieval}\label{sec:mir}
alo@0 200
alo@0 201 \section{Discussion}\label{sec:discussion}
alo@0 202
alo@0 203 \section{Conclusions}\label{sec:conclusions}
alo@0 204
alo@0 205 %
alo@0 206 % ---- Bibliography ----
alo@0 207 %
alo@0 208 \vspace{-1em}\begin{thebibliography}{5}
alo@0 209 %
alo@0 210
mariano@8 211 \bibitem{Song2012}
mariano@6 212 Y.~Song, S.~Dixon and M.~Pearce.
mariano@6 213 \newblock A survey of music recommendation systems and future perspectives
mariano@6 214 \newblock In {\em Proceedings of the 9th International Symposium on Computer Music Modelling and Retrieval}, 2012.
mariano@8 215
mariano@8 216 \bibitem{Su2009}
mariano@8 217 X.~Su and T. M. ~Khoshgoftaar.
mariano@8 218 \newblock A Survey of Collaborative Filtering Techniques.
mariano@8 219 \newblock In {\em Advances in Artificial Intelligence,(Section 3):1–19}, 2009.
mariano@8 220
mariano@6 221 \bibitem{Zhou2004}
mariano@6 222 S.~Zhou and R. J.~Mondrag\'on
mariano@6 223 \newblock The rich-club phenomenon in the Internet topology
mariano@6 224 \newblock In {\em Communications Letters, IEEE}, 2004
mariano@6 225
mariano@6 226 \bibitem{Celma2010}
mariano@6 227 O.~Celma
mariano@6 228 \newblock Music Recommendation and Discovery:The Long Tail, Long Fail, and Long Play in the Digital Music Space.
mariano@6 229 \newblock Springer Verlag, Heidelberg, 2010.
mariano@8 230
mariano@8 231 \bibitem{Aucoutourier2002}
mariano@8 232 J. J.~Aucouturier and F~Pachet.
mariano@8 233 \newblock Music Similarity Measures: What is the Use.
mariano@8 234 \newblock In {emProceedings of the ISMIR, pages 157–163}, 2002.
mariano@8 235
mariano@8 236 \bibitem{Kim2010}
mariano@8 237 Y.E.~Kim, E.M.~Schmidt, R.~Migneco, B.G.~Morton, P.~Richardson, J.~Scott, J.A.~Speck and D.~Turnbull.
mariano@8 238 \newblock Music Emotion Recognition: A State of the Art Review.
mariano@8 239 \newblock In {\em Proc. of the 11th Intl. Society for Music Information Retrieval (ISMIR) Conf}, 2010.
mariano@8 240
mariano@8 241 \bibitem{FazekasRJS10_OMRAS2}
mariano@6 242 G.~Fazekas, Y.~Raimond, K.~Jakobson, and M.~Sandler.
mariano@6 243 \newblock An overview of semantic web activities in the {OMRAS2} project.
mariano@6 244 \newblock {\em Journal of New Music Research (JNMR)}, 39(4), 2010.
mariano@6 245
mariano@6 246 \bibitem{Porter:ISMIR:15}
mariano@6 247 A.~Porter, D.~Bogdanov, R.~Kaye, R.~Tsukanov, and X.~Serra.
mariano@6 248 \newblock Acousticbrainz: a community platform for gathering music information
mariano@6 249 obtained from audio.
mariano@6 250 \newblock In {\em 16th International Society for Music Information Retrieval
alo@0 251 (ISMIR) Conference}, 2015.
alo@0 252
alo@0 253 \bibitem{DBLP:conf/ismir/RaimondASG07}
alo@0 254 Y~Raimond, S.~Abdallah, M.~Sandler, and F.~Giasson.
alo@0 255 \newblock The music ontology.
alo@0 256 \newblock In {\em Proceedings of the 8th International Conference on Music
alo@0 257 Information Retrieval, ISMIR 2007, Vienna, Austria, September 23-27}, 2007.
mariano@4 258
mariano@6 259
mariano@6 260 \bibitem{Landauer1998}
mariano@4 261 T.~Landauer, P.~Folt, and D.~Laham.
mariano@4 262 \newblock An introduction to latent semantic analysis
mariano@4 263 \newblock In {\em Discourse processes, 25}, 1998
mariano@4 264
mariano@4 265 \bibitem{Blei2012}
mariano@4 266 D.~Blei, A.~ Ng, and M.I.~Jordan.
mariano@4 267 \newblock Latent Dirichlet Allocation.
mariano@4 268 \newblock In {\em Journal of Machine Learning Research, 3(4-5), 993–1022}, 2012
mariano@6 269
mariano@6 270
alo@0 271 \end{thebibliography}
alo@0 272
alo@0 273 \end{document}