forked from alshedivat/al-folio
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathpapers.bib
224 lines (203 loc) · 26.1 KB
/
papers.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
---
---
@inproceedings{melchiorre2024modular,
title = {Modular Debiasing of Latent User Representations in Prototype-based Recommender Systems},
author = {Melchiorre, Alessandro B. and Masoudian, Shahed and Kumar, Deepak and Schedl, Markus},
booktitle = {Proceedings of 2024 Joint European Conference on Machine Learning and Knowledge Discovery in Databases (ECML PKDD)},
abstract = {Recommender Systems (RSs) may inadvertently perpetuate biases based on protected attributes like gender, religion, or ethnicity. Left unaddressed, these biases can lead to unfair system behavior and privacy concerns. Interpretable RS models provide a promising avenue for understanding and mitigating such biases. In this work, we propose a novel approach to debias interpretable RS models by introducing user-specific scaling weights to the interpretable user representations of prototype-based RSs. This reduces the influence of the protected attributes on the RS's prediction while preserving recommendation utility. By decoupling the scaling weights from the original representations, users can control the degree of invariance of recommendations to their protected characteristics. Moreover, by defining distinct sets of weights for each attribute, the user can further specify which attributes the recommendations should be agnostic to. We apply our method to ProtoMF, a state-of-the-art prototype-based RS model that models users by their similarities to prototypes. We employ two debiasing strategies to learn the scaling weights and conduct experiments on ML-1M and LFM2B-DB datasets aiming at making the user representations agnostic to age and gender. The results show that our approach effectively reduces the influence of the protected attributes on the representations on both datasets, showcasing flexibility in bias mitigation, while only marginally affecting recommendation quality. Finally, we assess the effects of the debiasing weights and provide qualitative evidence, particularly focusing on movie recommendations, of genre patterns identified by ProtoMF that correlate with specific genders.},
year = {2024},
bibtex_show = {true},
selected = {true},
pdf = {melchiorre2024modular.pdf},
preview = {melchiorre2024modular_preview.png},
bibtex_show = {true},
}
@article{melchiorre2023emomtb,
abbr = {Journal},
title = {Emotion-aware Music Tower Blocks (EmoMTB): An Intelligent Audiovisual Interface for Music Discovery and Recommendation},
author = {Melchiorre, Alessandro B. and Penz, David and Ganh\"or, Christian and Lesota, Oleg and Fragoso, Vasco and Fritzl, Florian and Parada-Cabaleiro, Emilia and Schubert, Franz and Schedl, Markus},
journal = {International Journal of Multimedia Information Retrieval (IJMIR)},
abstract = {Music listening has experienced a sharp increase during the last decade thanks to music streaming and recommendation services. While they offer text-based search functionality and provide recommendation lists of remarkable utility, their typical mode of interaction is unidimensional, i.e., they provide lists of consecutive tracks, which are commonly inspected in sequential order by the user. The user experience with such systems is heavily affected by cognition biases (e.g., position bias, human tendency to pay more attention to first positions of ordered lists) as well as algorithmic biases (e.g., popularity bias, the tendency of recommender systems to overrepresent popular items). This may cause dissatisfaction among the users by disabling them to find novel music to enjoy. In light of such systems and biases, we propose an intelligent audiovisual music exploration system named EmoMTB. It allows the user to browse the entirety of a given collection in a free non-linear fashion. The navigation is assisted by a set of personalized emotion-aware recommendations which serve as starting points for the exploration experience. EmoMTB adopts the metaphor of a city, in which each track (visualized as a colored cube) represents one floor of a building. Highly similar tracks are located in the same building, moderately similar ones form neighborhoods that mostly correspond to genres. Tracks situated between distinct neighborhoods create a gradual transition between genres. Users can navigate this music city using their smartphones as control devices. They can explore districts of well-known music or decide to leave their comfort zone. In addition, EmoMTB integrates an emotion-aware music recommendation system that re-ranks the list of suggested starting points for exploration according to the user’s self-identified emotion or the collective emotion expressed in EmoMTB’s Twitter channel. Evaluation of EmoMTB has been carried out in a three-fold way: by quantifying the homogeneity of the clustering underlying the construction of the city, by measuring the accuracy of the emotion predictor, and by carrying out a web-based survey composed of open questions to obtain qualitative feedback from users.},
doi = {10.1007/s13735-023-00275-8},
pdf = {melchiorre2023emomtb.pdf},
preview = {melchiorre2023emomtb_preview.jpg},
volume = {12},
number = {13},
year = {2023},
bibtex_show = {true},
html = {https://link.springer.com/article/10.1007/s13735-023-00275-8}
}
@inproceedings{melchiorre2022protomf,
title = {ProtoMF: Prototype-based Matrix Factorization for Effective and Explainable Recommendations},
author = {Melchiorre, Alessandro B. and Rekabsaz, Navid and Ganh\"or, Christian and Schedl, Markus},
booktitle = {Proceedings of the 16th ACM Conference on Recommender Systems (RecSys)},
year = {2022},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
abstract = {Recent studies show the benefits of reformulating common machine learning models through the concept of prototypes -- representatives of the underlying data, used to calculate the prediction score as a linear combination of similarities of a data point to prototypes. Such prototype-based formulation of a model, in addition to preserving (sometimes enhancing) the performance, enables explainability of the model's decisions, as the prediction can be linearly broken down into the contributions of distinct definable prototypes. Following this direction, we extend the idea of prototypes to the recommender system domain by introducing ProtoMF, a novel collaborative filtering algorithm. ProtoMF learns sets of user/item prototypes that represent the general consumption characteristics of users/items in the underlying dataset. Using these prototypes, ProtoMF then represents users and items as vectors of similarities to the corresponding prototypes. These user/item representations are ultimately leveraged to make recommendations that are both effective in terms of accuracy metrics, and explainable through the interpretation of prototypes' contributions to the affinity scores. We conduct experiments on three datasets to assess both the effectiveness and the explainability of ProtoMF. Addressing the former, we show that ProtoMF exhibits higher Hit~Ratio and NDCG compared to other relevant collaborative filtering approaches. As for the latter, we qualitatively show how ProtoMF can provide explainable recommendations and how its explanation capabilities can expose the existence of statistical biases in the learned representations, which we exemplify for the case of gender bias.},
bibtex_show = {true},
pdf = {melchiorre2022protomf.pdf},
selected = {true},
preview = {melchiorre2022protomf_preview.png},
youtube = {https://www.youtube.com/watch?v=qQD0oFdTlSs},
doi ={10.1145/3523227.3546756},
slides = {melchiorre2022protomf_slides.pdf},
html = {https://dl.acm.org/doi/10.1145/3523227.3546756},
isbn = {9781450392785},
pages = {246–256},
numpages = {11},
keywords = {prototypes, bias, recommender systems, explainability},
location = {Seattle, WA, USA},
series = {RecSys '22}
}
@inproceedings{lesota2022exploring,
title = {Exploring Cross-group Discrepancies in Calibrated Popularity for Accuracy/Fairness Trade-off Optimization},
author = {Lesota, Oleg and Brandl, Stefan and Wenzel, Matthias and Melchiorre, Alessandro B. and Lex, Elisabeth and Rekabsaz, Navid and Schedl, Markus},
booktitle = {Proceedings of the 2nd Workshop on Multi-Objective Recommender Systems co-located with 16th ACM Conference on Recommender Systems (RecSys 2022), Seattle, WA, USA, 18th-23rd September},
year={2022},
preview = {lesota2022exploring_preview.png},
html = {https://ceur-ws.org/Vol-3268/paper5.pdf},
abstract = {Popularity bias is an important issue in recommender systems, as it affects end-users, content creators, and content provider platforms alike. It can cause users to miss out on less popular items that would fit their preference, prevent new content creators from finding their audience, and force providers to pay higher royalties for serving expensive popular content. Over the past years, various approaches to mitigate popularity bias in recommender systems have been proposed. Among them, post-processing methods are widely accepted due to their versatility and ease of implementation. While previous studies have investigated the effects of different post-processing techniques on accuracy and fairness of recommendations, the influence of different algorithms on different user groups have not received much attention in this context. Addressing this research gap, we study the effect of a recent mitigation strategy, Calibrated Popularity, in conjunction with a selection of state-of-the-art recommender algorithms including BPR, ItemKNN, LightGCN, MultiVAE, and NeuMF. We show that these algorithms demonstrate different characteristics in terms of the trade-off between accuracy and fairness, both within and between various user groups defined by gender and inclination towards consumption of mainstream items. Finally, we demonstrate how these discrepancies can be exploited to achieve a more effective trade-off between utility and fairness of recommender systems.},
bibtex_show = {true},
location = {Seattle, WA, USA},
}
@inproceedings{melchiorre2022emomtb,
title = {EmoMTB: Emotion-aware Music Tower Blocks},
author = {Melchiorre, Alessandro B. and Penz, David and Ganh\"or, Christian and Lesota, Oleg and Fragoso, Vasco and Fritzl, Florian and Parada-Cabaleiro, Emilia and Schubert, Franz and Schedl, Markus},
booktitle = {Proceedings of the 2022 International Conference on Multimedia Retrieval (ICMR)},
year = {2022},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
abstract = {We introduce Emotion-aware Music Tower Blocks (EmoMTB), an audiovisual interface to explore large music collections. It creates a musical landscape, by adopting the metaphor of a city, where similar songs are grouped into the same building and nearby buildings form neighborhoods of particular genres. In order to personalize the user experience, an underlying classifier monitors textual user-generated content, by predicting their emotional state and adapting the audiovisual elements of the interface accordingly. EmoMTB enables users to explore different musical styles either within their comfort zone or outside of it. Besides, tailoring the results of the recommender engine to match the affective state of the user, EmoMTB offers a unique way to discover and enjoy music.
EmoMTB supports exploring a collection of circa half a million streamed songs using a regular smartphone as a control interface to navigate in the landscape.},
bibtex_show = {true},
html = {https://dl.acm.org/doi/10.1145/3512527.3531351},
pages = {206-–210},
youtube = {https://www.youtube.com/watch?v=JKgAlWObc-0},
pdf = {melchiorre2022emomtb.pdf},
preview = {melchiorre2022emomtb_preview.png},
doi = {10.1145/3512527.3531351}
}
@article{afchar2022explainability,
abbr = {Article with Deezer},
title = {Explainability in Music Recommender Systems},
author = {Afchar, Darius* and Melchiorre, Alessandro B.* and Schedl, Markus and Hennequin, Romain and Epure, Elena V. and Moussallam, Manuel},
journal = {AI Magazine},
volume = {43},
issue = {2},
abstract = {The most common way to listen to recorded music nowadays is via streaming platforms which provide access to tens of millions of tracks. To assist users in effectively browsing these large catalogs, the integration of Music Recommender Systems (MRSs) has become essential. Current real-world MRSs are often quite complex and optimized for recommendation accuracy. They combine several building blocks based on collaborative filtering and content-based recommendation. This complexity can hinder the ability to explain recommendations to end users, which is particularly important for recommendations perceived as unexpected or inappropriate. While pure recommendation performance often correlates with user satisfaction, explainability has a positive impact on other factors such as trust and forgiveness, which are ultimately essential to maintain user loyalty. In this article, we discuss how explainability can be addressed in the context of MRSs. We provide perspectives on how explainability could improve music recommendation algorithms and enhance user experience. First, we review common dimensions and goals of recommenders' explainability and in general of eXplainable Artificial Intelligence (XAI), and elaborate on the extent to which these apply -- or need to be adapted -- to the specific characteristics of music consumption and recommendation. Then, we show how explainability components can be integrated within a MRS and in what form explanations can be provided. Since the evaluation of explanation quality is decoupled from pure accuracy-based evaluation criteria, we also discuss requirements and strategies for evaluating explanations of music recommendations. Finally, we describe the current challenges for introducing explainability within a large-scale industrial music recommender system and provide research perspectives.},
year = {2022},
arxiv = {https://arxiv.org/abs/2201.10528},
html = {https://ojs.aaai.org/index.php/aimagazine/article/view/21743},
selected = {true},
pages = {190--208},
pdf = {afchar2022explainability.pdf},
preview = {afchar2022explainability_preview.png},
doi= {10.1002/aaai.12056},
bibtex_show = {true}
}
@inproceedings{lesota2021analyzing,
title = {Analyzing Item Popularity Bias of Music Recommender Systems: Are Different Genders Equally Affected?},
author = {Lesota, Oleg and Melchiorre, Alessandro B. and Rekabsaz, Navid and Brandl, Stefan and Kowald, Dominik and Lex, Elisabeth and Schedl, Markus},
booktitle = {Fifteenth ACM Conference on Recommender Systems (RecSys)},
pages = {601--606},
year = {2021},
isbn = {9781450384582},
preview = {lesota2021analyzing_preview.png},
publisher = {Association for Computing Machinery},
html = {https://doi.org/10.1145/3460231.3478843},
abstract = {Several studies have identified discrepancies between the popularity of items in user profiles and the corresponding recommendation lists. Such behavior, which concerns a variety of recommendation algorithms, is referred to as popularity bias. Existing work predominantly adopts simple statistical measures, such as the difference of mean or median popularity, to quantify popularity bias. Moreover, it does so irrespective of user characteristics other than the inclination to popular content. In this work, in contrast, we propose to investigate popularity differences (between the user profile and recommendation list) in terms of median, a variety of statistical moments, as well as similarity measures that consider the entire popularity distributions (Kullback-Leibler divergence and Kendall’s τ rank-order correlation). This results in a more detailed picture of the characteristics of popularity bias. Furthermore, we investigate whether such algorithmic popularity bias affects users of different genders in the same way. We focus on music recommendation and conduct experiments on the recently released standardized LFM-2b dataset, containing listening profiles of Last.fm users. We investigate the algorithmic popularity bias of seven common recommendation algorithms (five collaborative filtering and two baselines). Our experiments show that (1) the studied metrics provide novel insights into popularity bias in comparison with only using average differences, (2) algorithms less inclined towards popularity bias amplification do not necessarily perform worse in terms of utility (NDCG), (3) the majority of the investigated recommenders intensify the popularity bias of the female users. },
bibtex_show = {true},
numpages = {6},
keywords = {popularity bias, fairness, gender, music recommendation},
location = {Amsterdam, Netherlands},
series = {RecSys '21},
doi = {10.1145/3460231.3478843},
html = {https://dl.acm.org/doi/10.1145/3460231.3478843},
arxiv = {https://arxiv.org/abs/2108.06973}
}
@article{melchiorre2021investigating,
abbr = {Journal},
title = {Investigating Gender Fairness of Recommendation Algorithms in the Music Domain},
author = {Melchiorre, Alessandro B. and Rekabsaz, Navid and Parada-Cabaleiro, Emilia and Brandl, Stefan and Lesota, Oleg and Schedl, Markus},
journal = {Information Processing \& Management (IPM)},
volume = {58},
number = {5},
pages = {102666},
year = {2021},
abstract = {Although recommender systems (RSs) play a crucial role in our society, previous studies have revealed that the performance of RSs may considerably differ between groups of individuals with different characteristics or from different demographics. In this case, a RS is considered to be unfair when it does not perform equally well for different groups of users. Considering the importance of RSs in the distribution and consumption of musical content worldwide, a careful evaluation of fairness in the context of music RSs is crucial. To this end, we first introduce LFM-2b, a novel large-scale real-world dataset of music listening records, comprising a subset to investigate bias of RSs regarding users’ demographics. We then define a notion of fairness based on the performance gap of a RS between the users with different demographics, and evaluate a variety of collaborative filtering algorithms in terms of accuracy and beyond-accuracy metrics to explore the fairness in the RS results toward a specific gender group. We observe the existence of significant discrepancies (unfairness) between the performance of algorithms across male and female user groups. Based on these discrepancies, we explore to what extent recommender algorithms lead to intensifying the underlying population bias in the final results. We also study the effect of a resampling strategy, commonly used as debiasing method , which yields slight improvements in the fairness measures of various algorithms while maintaining their accuracy and beyond-accuracy performance.},
publisher = {Elsevier},
bibtex_show = {true},
html = {https://www.sciencedirect.com/science/article/pii/S0306457321001540},
selected = {true},
pdf = {melchiorre2021investigating.pdf},
preview = {melchiorre2021investigating_preview.png},
doi = {10.1016/j.ipm.2021.102666}
}
@inproceedings{melchiorre2021lemons,
title = {LEMONS: Listenable Explanations for Music recOmmeNder Systems},
author = {Melchiorre, Alessandro B. and Haunschmid, Verena and Schedl, Markus and Widmer, Gerhard},
booktitle = {European Conference on Information Retrieval (ECIR)},
pages = {531--536},
year = {2021},
publisher = {Springer International Publishing},
abstract = {Although current music recommender systems suggest new tracks to their users, they do not provide listenable explanations of why a user should listen to them. LEMONS (Demonstration video: https://youtu.be/giSPrPnZ7mc) is a new system that addresses this gap by (1) adopting a deep learning approach to generate audio content-based recommendations from the audio tracks and (2) providing listenable explanations based on the time-source segmentation of the recommended tracks using the recently proposed audioLIME},
bibtex_show = {true},
html = {https://link.springer.com/chapter/10.1007/978-3-030-72240-1_60},
pdf = {melchiorre2021lemons.pdf},
youtube = {https://www.youtube.com/watch?v=giSPrPnZ7mc},
preview = {melchiorre2021lemons_preview.png},
poster = {melchiorre2021lemons_poster.pdf},
doi = {10.1007/978-3-030-72240-1_60}
}
@inproceedings{liu2020pandemics,
title = {Pandemics, Music, and Collective Sentiment: Evidence from the Outbreak of COVID-19},
author = {Liu, Meijun and Zangerle, Eva and Hu, Xiao and Melchiorre, Alessandro B. and Schedl, Markus},
booktitle = {Proceedings of the 21st International Society for Music Information Retrieval Conference (ISMIR)},
pages = {157-165},
year = {2020},
abstract = {The COVID-19 pandemic causes a massive global health crisis and produces substantial economic and social distress, which in turn may cause stress and anxiety among people. Real-world events play a key role in shaping collective sentiment in a society. As people listen to music daily everywhere in the world, the sentiment of music being listened to can reflect the mood of the listeners and serve as a measure of collective sentiment. However, the exact relationship between real-world events and the sentiment of music being listened to is not clear. Driven by this research gap, we use the unexpected outbreak of COVID-19 as a natural experiment to explore how users' sentiment of music being listened to evolves before and during the outbreak of the pandemic. We employ causal inference approaches on an extended version of the LFM-1b dataset of listening events shared on Last.fm, to examine the impact of the pandemic on the sentiment of music listened to by users in different countries. We find that, after the first COVID-19 case in a country was confirmed, the sentiment of artists users listened to becomes more negative. This negative effect is pronounced for males while females' music emotion is less influenced by the outbreak of the COVID-19 pandemic. We further find a negative association between the number of new weekly COVID-19 cases and users' music sentiment. Our results provide empirical evidence that public sentiment can be monitored based on collective music listening behaviors, which can contribute to research in related disciplines.},
bibtex_show = {true},
html = {https://program.ismir2020.net/poster_1-19.html},
preview = {liu2020pandemics_preview.png}
}
@inproceedings{melchiorre2020personalitybias,
author = {Melchiorre, Alessandro B. and Zangerle, Eva and Schedl, Markus},
title = {Personality Bias of Music Recommendation Algorithms},
year = {2020},
isbn = {9781450375832},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
html = {https://doi.org/10.1145/3383313.3412223},
abstract = {Recommender systems, like other tools that make use of machine learning, are known to create or increase certain biases. Earlier work has already unveiled different performance of recommender systems for different user groups, depending on gender, age, country, and consumption behavior. In this work, we study user bias in terms of another aspect, i.e., users’ personality. We investigate to which extent state-of-the-art recommendation algorithms yield different accuracy scores depending on the users’ personality traits. We focus on the music domain and create a dataset of Twitter users’ music consumption behavior and personality traits, measuring the latter in terms of the OCEAN model. Investigating recall@K and NDCG@K of the recommendation algorithms SLIM, embarrassingly shallow autoencoders for sparse data (EASE), and variational autoencoders for collaborative filtering (Mult-VAE) on this dataset, we find several significant differences in performance between user groups scoring high vs. groups scoring low on several personality traits.},
booktitle = {Fourteenth ACM Conference on Recommender Systems (RecSys)},
pages = {533–538},
numpages = {6},
bibtex_show = {true},
pdf = {melchiorre2020personalitybias.pdf},
preview = {melchiorre2020personalitybias_preview.png},
slides = {melchiorre2020personalitybias_slides.pdf},
youtube = {https://www.youtube.com/watch?v=3-3ubWNW3q8},
poster = {melchiorre2020personalitybias_poster.pdf},
doi = {10.1145/3383313.3412223}
}
@inproceedings{melchiorre2020personalitycorrelates,
author = {Melchiorre, Alessandro B. and Schedl, Markus},
title = {Personality Correlates of Music Audio Preferences for Modelling Music Listeners},
year = {2020},
isbn = {9781450368612},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3340631.3394874},
html = {https://doi.org/10.1145/3340631.3394874},
abstract = {Past studies have shown that personality has a significant association with user behaviour and preferences, not least towards music. This makes personality information a promising aspect for user modelling in personalised recommender systems and similar domains. In contrast to existing studies, which investigate personality correlates of music preferences via genres or styles, we study such correlates by modelling music preferences at a finer-grained content level, using audio features of the music users listen to. Leveraging listening and personality information of more than 1,300 Last.fm users, we identify several significant medium and weak correlations between music audio features and personality traits, the latter defined by the five-factor model. Our results provide useful insights into the relationship between personality and music preference, which can be valuable for music recommender systems in terms of more personalised recommendations.},
booktitle = {Proceedings of the 28th ACM Conference on User Modeling, Adaptation and Personalization (UMAP)},
pages = {313–317},
numpages = {5},
bibtex_show = {true},
pdf = {melchiorre2020personalitycorrelates.pdf},
preview = {melchiorre2020personalitycorrelates_preview.png},
slides = {melchiorre2020personalitycorrelates_slides.pdf},
youtube = {https://www.youtube.com/watch?v=6z4l06b69Do&t=197s},
doi = {10.1145/3340631.3394874}
}