diff --git a/HHU_Logo.pdf b/HHU_Logo.pdf new file mode 100644 index 0000000000000000000000000000000000000000..0e1c2e35c260b9e4b43dadd9b6eb11f4d9fc94f0 Binary files /dev/null and b/HHU_Logo.pdf differ diff --git a/frontpage.tex b/frontpage.tex new file mode 100644 index 0000000000000000000000000000000000000000..bca604a59512cdd26e02dff40757b96da6c8c900 --- /dev/null +++ b/frontpage.tex @@ -0,0 +1,34 @@ +\newgeometry{left=15mm,right=15mm, top=3cm, bottom=2cm} +\begin{titlepage} +\vspace*{-1.5cm} + \raisebox{17mm}{ + \begin{minipage}[t]{90mm} + \begin{center} + {\Large Department of Computer Science\\} + {\normalsize + Data \& Knowledge Engineering\\ + } + \vspace{3mm} + {\small Universitätsstr. 1 \hspace{5ex} D--40225 Düsseldorf\\} + \end{center} + \end{minipage} + } + \hfill + \includegraphics[width=130pt]{unilogo.eps} + \vspace{14em} + \begin{center} + {\Large Submission} + \end{center} + \begin{center} + \baselineskip=55pt + \textbf{\huge \titel} + \baselineskip=0 pt + \end{center} +\vfill + \begin{center} + \textbf{\Large + \bearbeiter + } + \end{center} +\end{titlepage} +\restoregeometry \ No newline at end of file diff --git a/introduction.tex b/introduction.tex new file mode 100644 index 0000000000000000000000000000000000000000..1ce6306bbc071df875f0e11538e7680328e2f747 --- /dev/null +++ b/introduction.tex @@ -0,0 +1,21 @@ +\section{Introduction} +Today, \textit{recommender systems} are finding their way into our everyday life to an increasing extent, often without us noticing. +More and more areas of life are therefore subject to constant optimisation. +Companies such as \textit{Netflix}, \textit{Amazon} and \textit{YouTube} adapt their product proposals to the individual wishes of their customers. +To make this possible, the various \textit{collaborative-filtering} and \textit{content-based} \textit{recommender systems} are used.
+ +Since \citet{JuKa90} first presented \textit{recommender systems} as a kind of intelligent bookcase, much effort has been put into the development and research of such systems. +The most diverse subject areas were not only illuminated by the industry. + A whole new branch of research also opened up for science. + + In their work ``On the Difficulty of Evaluating Baselines: A Study on Recommender Systems'' \citet{Rendle19} show that current research on the \textit{MovieLens10M} dataset leads in a wrong direction. + In addition to general problems, they particularly list wrong working methods and misunderstood \textit{baselines} by breaking them with a number of simple methods such as \textit{matrix-factorization}. + + They were able to beat the existing baselines by not taking them for granted. + On the contrary, they questioned them and transferred well evaluated and understood properties of the baselines from the \textit{Netflix-Challenge} to them. + +As a result, they were not only able to beat the \textit{baselines} reported for the \textit{MovieLens10M}, but also the newer methods from the last 5 years of research. Therefore, it can be assumed that the current and former results obtained on the \textit{MovieLens10M} dataset were not sufficient to be considered as a true baseline. Thus they show the community a critical error which can be found not only in the evaluation of \textit{recommender systems} but also in other scientific areas. + +As a first problem, the authors point out that scientific papers whose focus is on better understanding and improving existing \textit{baselines} do not receive recognition because they do not seem innovative enough. In contrast to industry, which tenders horrendous prizes for researching and improving such \textit{baselines}, there is a lack of such motivation in the scientific field.
From the authors' point of view, the scientific work on the \textit{MovieLens10M} dataset is misdirected, because one-off evaluations lead to one-hit-wonders, which are then used as a starting point for further work. Thus \citet{Rendle19} point out as a second point of criticism that the need for further basic research for the \textit{MovieLens10M} dataset is not yet exhausted. + +This submission takes a critical look at the topic presented by \citet{Rendle19}. In addition, basic terms and the results obtained are presented in a way that is comprehensible to the inexperienced reader. \ No newline at end of file diff --git a/references.bib b/references.bib new file mode 100644 index 0000000000000000000000000000000000000000..71e2152dacc11067a3378e702565dab6b4ab7f4f --- /dev/null +++ b/references.bib @@ -0,0 +1,29 @@ +@book{JuKa90, + author = {Karlgren, Jussi}, + institution = {KTH, Computer and Systems Sciences, DSV}, + institution = {Stockholm University}, + publisher = {Department of Computer and Systems Sciences, Stockholm University}, + title = {An algebra for recommendations : Using reader data as a basis for measuring document proximity}, + series = {SYSLAB technical reports}, + number = {179}, + pages = {1--11}, + abstract = {A measure for proximity between documents is defined, based on data from readers. This proximity measure can be further investigated as a tool document retrieval, and as to provide data for concept formation experiments.
+ }, + year = {1990} +} + +@article{Rendle19, + author = {Steffen Rendle and + Li Zhang and + Yehuda Koren}, + title = {On the Difficulty of Evaluating Baselines: {A} Study on Recommender + Systems}, + journal = {CoRR}, + volume = {abs/1905.01395}, + year = {2019}, + url = {http://arxiv.org/abs/1905.01395}, + archivePrefix = {arXiv}, + eprint = {1905.01395}, + timestamp = {Mon, 27 May 2019 13:15:00 +0200}, + biburl = {https://dblp.org/rec/bib/journals/corr/abs-1905-01395}, + bibsource = {dblp computer science bibliography, https://dblp.org} +} diff --git a/submission.pdf b/submission.pdf new file mode 100644 index 0000000000000000000000000000000000000000..27e09aa140cd03912cc567e266226d4a05ea5da7 Binary files /dev/null and b/submission.pdf differ diff --git a/submission.tex b/submission.tex new file mode 100644 index 0000000000000000000000000000000000000000..d98a4976b53cd02cfbd01c3e416791c0ca0d28fb --- /dev/null +++ b/submission.tex @@ -0,0 +1,69 @@ +%%%%%%%%%%%%%%%%%%%%%%%%% +% Inserting a new reference: $BibTeX % +% Change in the document: $LuaLaTeX % +%%%%%%%%%%%%%%%%%%%%%%%%% +\documentclass[11pt]{article} +\usepackage[singlespacing]{setspace} +\usepackage{sectsty} +\sectionfont{\fontsize{14pt}{0}\selectfont} +\usepackage{fontspec} +\setmainfont{Arial} +% inputenc is intentionally not loaded: with fontspec (LuaLaTeX) the source is read as UTF-8 natively +\usepackage{amsmath} +\usepackage{amsfonts} +\usepackage{amssymb} +\usepackage{geometry} +\usepackage{fancyhdr} +\usepackage{lastpage} +\usepackage[english]{babel} +\usepackage[round]{natbib} +\usepackage[usenames,dvipsnames]{xcolor} +\usepackage{hyperref} % clickable citations +\geometry{a4paper,left=15mm,right=15mm, top=5mm, bottom=1cm,includeheadfoot} +\usepackage{graphicx} +\usepackage{subcaption} +\usepackage{amsthm} +\usepackage{algorithm} +\usepackage{algorithmic} +\usepackage{bbold} +\usepackage{tikz} +\usepackage{multirow} +\parindent 6pt +\usepackage[]{titlesec} +\titlespacing*{\section} +{0pt}{0pt}{6pt} +\usepackage{footmisc} +\setlength{\abovedisplayskip}{0pt}
+\renewcommand{\footrulewidth}{0.5pt} +\pagestyle{fancy} +\rhead{\today} +\rfoot{Page \thepage\ / \pageref{LastPage}} +\cfoot{} +\lhead{\bfseries \large Submission - \bearbeiter} +\definecolor{hhuUniBlau}{RGB}{0,106,179} +\hypersetup{ + colorlinks, + citecolor=hhuUniBlau, + linkcolor=black, + urlcolor=hhuUniBlau} + +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% Fill in these fields! % +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +\newcommand{\Datum}{\today} +\newcommand{\bearbeiter}{Marc Feger B.Sc.} +\newcommand{\titel}{On the Difficulty of Evaluating Baselines\\ +A Study on Recommender Systems} +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +\begin{document} +\input{frontpage} +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% The content starts here! % +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +\input{introduction} + +\newpage +\bibliography{references} +\bibliographystyle{plainnat} +\end{document} diff --git a/unilogo-eps-converted-to.pdf b/unilogo-eps-converted-to.pdf new file mode 100644 index 0000000000000000000000000000000000000000..727003997f6e762907759aebbe7bda25803a7307 Binary files /dev/null and b/unilogo-eps-converted-to.pdf differ diff --git a/unilogo.eps b/unilogo.eps new file mode 100755 index 0000000000000000000000000000000000000000..5fe5f83e8c5bd597eae6287a651d399628d5199b Binary files /dev/null and b/unilogo.eps differ