% Document class and packages.
\documentclass{llncs}
\usepackage{graphicx}

\usepackage{amsmath,cite}
\usepackage{pifont}
\usepackage{listings}
\usepackage{courier}
\usepackage{adjustbox}
\usepackage{url}
\usepackage[ngerman,english]{babel}
\usepackage[utf8]{inputenc}
% \cmark: a bullet set at 14pt.
% \selectfont has to come BEFORE the glyph for \fontsize to take effect, and the
% inner group keeps the size change from leaking into the text that follows.
\newcommand{\cmark}{{\fontsize{14}{14}\selectfont\textbullet}}
\usepackage[usenames,dvipsnames]{color}

% Listings language "sparql": case-sensitive keywords plus coloured delimiters.
\lstdefinelanguage{sparql} {
  morekeywords={SELECT, WHERE, a, COUNT, GROUP, ORDER, BY, HAVING, as, DISTINCT, OPTIONAL},
  sensitive=true,
  % line comments start with "# "
  morecomment=[l][\color{ForestGreen}\bfseries\selectfont]{\#\ },
  moredelim=[s][\color{ForestGreen}\bfseries\selectfont]{?}{\ }, %variable
  moredelim=[s][\color{NavyBlue}\bfseries\selectfont]{@}{\ }, %prefix
  moredelim=[s][\color{OrangeRed}\bfseries\selectfont]{<}{>}, %red URIs
  morestring=[b][\color{ForestGreen}]\", %green strings
  morestring=[b]",
}

% Listings style "sparql": small bold typewriter text framed by rules above and
% below, caption underneath, "~" as the escape-to-LaTeX character, and long
% lines broken at whitespace.
\lstdefinestyle{sparql}{
  language=sparql,
  basicstyle=\footnotesize\ttfamily\bfseries,
  % basicstyle=\ttfamily,
  keywordstyle=\color{blue}\bfseries,
  identifierstyle=,
  commentstyle=\color{ForestGreen}\bfseries,
  stringstyle=\color{BlueGreen}\ttfamily,
  showstringspaces=false,
  emph={context},emphstyle=\color{BrickRed}\bfseries,
  frame = lines,
  %aboveskip = 15pt,
  %framexbottommargin = 5pt,
  %framextopmargin = 5pt,
  aboveskip = 10pt,
  framexbottommargin = 2pt,
  framextopmargin = 2pt,
  captionpos=b,
  escapechar=~,
  breaklines=true,
  breakatwhitespace=true,
  breakindent=20pt,
  xleftmargin=5pt,
  xrightmargin=5pt,
  basewidth={0.55em,0.45em},
  %basewidth={0.50em,0.6em},
  fontadjust=true,
  % lineskip={-1.5pt},
  % columns=[c]spaceflexible, %make the long artist URI fit
  %float = h!,
}

% Caption label for listings, set in bold (\textbf replaces the obsolete {\bf ...}).
\renewcommand{\lstlistingname}{\textbf{Listing}}


% Listings language "ttl": "a" is the only keyword; same delimiter colouring as
% the uncommented entries below show.
\lstdefinelanguage{ttl} {
  morekeywords={a},
  sensitive=true,
  % morecomment=[l][\color{ForestGreen}\bfseries\fontsize{10}{2}\selectfont]{\#\ },
  % moredelim=[s][\color{ForestGreen}\bfseries\fontsize{10}{2}\selectfont]{\#\ }{\ },
  % moredelim=[s][\color{NavyBlue}\bfseries\fontsize{10}{2}\selectfont]{@}{\ }, %prefix
  % moredelim=[s][\color{OrangeRed}\bfseries\fontsize{10}{2}\selectfont]{<}{>}, %red URIs
  morecomment=[l][\color{ForestGreen}\ttfamily\bfseries\selectfont]{\#\ },
  moredelim=[s][\color{NavyBlue}\ttfamily\bfseries\selectfont]{@}{\ }, %prefix
  moredelim=[s][\color{OrangeRed}\ttfamily\bfseries\selectfont]{<}{>}, %red URIs
  morestring=[b][\color{ForestGreen}]\", %green strings
  morestring=[b]",
}

% Listings style "ttl": like the sparql style but with larger frame margins,
% more space above, and a negative lineskip to tighten the lines.
\lstdefinestyle{ttl}{
  language=ttl,
  basicstyle=\footnotesize\ttfamily\bfseries,
  keywordstyle=\color{blue}\bfseries,
  identifierstyle=,
  commentstyle=\color{ForestGreen}\bfseries,
  stringstyle=\color{BlueGreen}\bfseries,
  showstringspaces=false,
  emph={context},emphstyle=\color{BrickRed}\bfseries,
  frame = lines,
  framexbottommargin = 5pt,
  framextopmargin = 5pt,
  captionpos=b,
  escapechar=~,
  breaklines=true,
  breakatwhitespace=true,
  breakindent=20pt,
  aboveskip = 15pt,
  xleftmargin=5pt,
  xrightmargin=5pt,
  basewidth={0.55em,0.45em},
  % basewidth={0.50em,0.6em},
  fontadjust=true,
  lineskip={-1.5pt},
  % columns=[c]spaceflexible, %make the long artist URI fit
  % float = h!,
}

% Listings language "json": no keywords of its own (the style below adds them).
\lstdefinelanguage{json} {
  sensitive=true,
  %morecomment=[l]{@},
  moredelim=[s][\color{ForestGreen}]{?}{\ }, %green variables
  moredelim=[s][\color{OrangeRed}\fontsize{7}{2}\selectfont]{<}{>}, %red URIs
  morestring=[b][\color{Gray}]\",
  morestring=[b]",
}

% Listings style "json": 7pt bold typewriter text, no line breaking, flexible
% columns, and typeset as a float ([ht]).
\lstdefinestyle{json}{
  language=json,
  keywords={type,context},
  basicstyle=\fontsize{7}{8}\bfseries\ttfamily,
  keywordstyle=\color{blue}\bfseries,
  identifierstyle=,
  commentstyle=\color{Gray}\bfseries,
  stringstyle=\color{OliveGreen}\ttfamily,
  showstringspaces=false,
  emph={context},emphstyle=\color{BrickRed}\bfseries,
  frame = lines,
  framexbottommargin = 5pt,
  framextopmargin = 5pt,
  tabsize=4,
  captionpos=b,
  escapechar=~,
  breaklines=false,
  xleftmargin=5pt,
  xrightmargin=5pt,
  basewidth={0.50em,0.45em},
  %basewidth={0.50em,0.6em},
  fontadjust=true,
  columns=[c]spaceflexible, %make the long artist URI fit
  float = ht,
}

% First-level itemize label.
\renewcommand{\labelitemi}{$\bullet$}

\begin{document}

\mainmatter

\title{MusicWeb: an open linked semantic platform for music metadata}

\author{Mariano Mora-Mcginity \and Alo Allik \and Gy\"orgy Fazekas \and Mark Sandler }
%

\institute{Queen Mary University of London, \\
\email{\{m.mora-mcginity, a.allik, g.fazekas, mark.sandler\}@qmul.ac.uk}}

\maketitle

\begin{abstract}

% MusicWeb is a web site that provides users a browsing, searching and linking platform of music artist and group information by integrating open linked semantic metadata from various Semantic Web, music recommendation and social media data sources, including DBpedia.org, sameas.org, MusicBrainz, the Music Ontology, Last.FM, Youtube, and Echonest. The front portal includes suggested links to selected artists and a search functionality from where users can navigate to individual artists pages. Each artist page contains a biography, links to online audio and a video player with a side menu displaying a selection of Youtube videos.
% Further it provides lists of YAGO categories linking each artist to other artists by various commonalities such as style, geographical location, instrumentation, record label as well as more obscure categories, for example, artists who have received the same award, have shared the same fate, or belonged to the same organisation or religion. The artist connections are further enhanced by thematic analysis of journal articles and blog posts as well as content-based music information retrieval similarity measures.

This paper presents MusicWeb, a novel platform for linking music artists within a web-based application for discovering connections between them. MusicWeb provides a browsing experience using connections that are either extra-musical or tangential to music, such as the artists' political affiliation or social influence, or intra-musical, such as the artists' main instrument or most favoured musical key. The platform integrates open linked semantic metadata from various Semantic Web, music recommendation and social media data sources including DBpedia.org, sameas.org, MusicBrainz, the Music Ontology, Last.FM and Youtube as well as content-derived information. The front portal includes suggested links to selected artists and a search functionality from where users can navigate to individual artist pages. Each artist page contains a biography and links to online audio and video resources. Connections are made using YAGO categories linking artists by various commonalities such as style, geographical location, instrumentation, record label as well as more obscure categories, for instance, artists who have received the same award, have shared the same fate, or belonged to the same organisation or religion. These connections are further enhanced by thematic analysis of journal articles and blog posts as well as content-based similarity measures focussing on high-level musical categories.

\keywords{Semantic Web, Linked Open Data, music metadata, semantic audio analysis, music information retrieval }
\end{abstract}

\section{Introduction}\label{sec:introduction}
In recent years we have witnessed an explosion of information, a consequence of millions of users producing and consuming web resources. Researchers and industry have recognised the potential of this data, and have endeavoured to develop methods to handle such a vast amount of information: to understand and manage it, to transform it into knowledge. Multimedia content providers have devoted a lot of energy to analysing consumer preference, in an effort to offer customised user experiences. Music streaming services, for instance, carry out extensive analysis trying to identify patterns in users' listening habits, and researchers are striving to refine multimedia recommendation algorithms~\cite{Song2012}. There are, however, limitations in user-preference based approaches: recommendations based solely on user preference can very easily lead to a ``rich-club phenomenon''~\cite{Zhou2004}, in which the short-tail popular music is heavily reinforced whereas most of the music available online is ignored and remains unknown~\cite{Celma2010}. Music recommendation systems such as
\begin{itemize}
\item Why are we doing this?
\begin{itemize}
\item What does the application do?
\item Why is this a good thing?
\item Who is it good for?: User experience.
\item Who is it potentially good for?

\end{itemize}
\end{itemize}

\section{Background}\label{sec:background}
\begin{itemize}
\item Information management
\item Music data collection: Spotify has acquired Echonest for \$100 million.
\item Music recommendation systems: many recommendation systems are based on identifying trends in user listening patterns: it is likely that a user who likes a particular artist will also like another artist because other users have shown this tendency.
\item Some references to semantic web audio
\item Linked musicians: echonest, musicbrainz
\item Smart music

\end{itemize}

\section{MusicWeb: Yago linking}\label{sec:yago}

\section{MUSIC: linking by topic}\label{sec:music}
\begin{itemize}
\item Semantic analysis~\cite{Landauer1998}
\item Topic modeling~\cite{Blei2012}
\item Entity recognition
\item Hierarchical Bayesian modeling
\item Authors, journals, keywords, tags

\end{itemize}
\section{Content-based information retrieval}\label{sec:mir}

\section{Discussion}\label{sec:discussion}

\section{Conclusions}\label{sec:conclusions}

%
% ---- Bibliography ----
%
\vspace{-1em}\begin{thebibliography}{5}
%

\bibitem{Song2012}
Y.~Song, S.~Dixon and M.~Pearce.
\newblock A survey of music recommendation systems and future perspectives.
\newblock In {\em Proceedings of the 9th International Symposium on Computer Music Modelling and Retrieval}, 2012.

\bibitem{Zhou2004}
S.~Zhou and R.~J.~Mondrag\'on.
\newblock The rich-club phenomenon in the Internet topology.
\newblock In {\em Communications Letters, IEEE}, 2004.

\bibitem{Celma2010}
O.~Celma.
\newblock Music Recommendation and Discovery: The Long Tail, Long Fail, and Long Play in the Digital Music Space.
\newblock Springer Verlag, Heidelberg, 2010.

\bibitem{FazekasRJS10_OMRAS2}
G.~Fazekas, Y.~Raimond, K.~Jacobson, and M.~Sandler.
\newblock An overview of semantic web activities in the {OMRAS2} project.
\newblock {\em Journal of New Music Research (JNMR)}, 39(4), 2010.

\bibitem{Porter:ISMIR:15}
A.~Porter, D.~Bogdanov, R.~Kaye, R.~Tsukanov, and X.~Serra.
\newblock Acousticbrainz: a community platform for gathering music information
obtained from audio.
\newblock In {\em 16th International Society for Music Information Retrieval
(ISMIR) Conference}, 2015.

\bibitem{DBLP:conf/ismir/RaimondASG07}
Y.~Raimond, S.~Abdallah, M.~Sandler, and F.~Giasson.
\newblock The music ontology.
\newblock In {\em Proceedings of the 8th International Conference on Music
Information Retrieval, ISMIR 2007, Vienna, Austria, September 23--27}, 2007.


\bibitem{Landauer1998}
T.~Landauer, P.~Foltz, and D.~Laham.
\newblock An introduction to latent semantic analysis.
\newblock In {\em Discourse processes, 25}, 1998.

\bibitem{Blei2012}
D.~Blei, A.~Ng, and M.~I.~Jordan.
\newblock Latent Dirichlet Allocation.
\newblock In {\em Journal of Machine Learning Research, 3(4--5), 993--1022}, 2003.


\end{thebibliography}

\end{document}