-
Notifications
You must be signed in to change notification settings - Fork 33
/
paper.bib
452 lines (393 loc) · 15.7 KB
/
paper.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
@inproceedings{six2012ethnic_fingerprinter,
  author    = {Joren Six and Olmo Cornelis},
  title     = {A Robust Audio Fingerprinter Based on Pitch Class Histograms - Applications for Ethnic Music Archives},
  booktitle = {{Proceedings of the Folk Music Analysis conference (FMA 2012)}},
  year      = {2012},
}
% NOTE(review): volume 33 looks like citation-export residue for a conference paper - confirm or drop.
@inproceedings{velasco2011constructing,
  author    = {Velasco, Gino Angelo and Holighaus, Nicki and D{\"o}rfler, Monika and Grill, Thomas},
  title     = {Constructing an invertible constant-{Q} transform with non-stationary {Gabor} frames},
  booktitle = {{Proceedings of the 14th International Conference on Digital Audio Effects (DAFx-11)}},
  volume    = {33},
  year      = {2011},
}
@inproceedings{six2014tarsosdsp,
  title     = {{TarsosDSP, a Real-Time Audio Processing Framework in Java}},
  author    = {Joren Six and Olmo Cornelis and Marc Leman},
  year      = 2014,
  booktitle = {{Proceedings of the 53rd AES Conference (AES 53rd)}},
}
@inproceedings{herre2002scalable,
  author       = {Herre, J{\"u}rgen and Hellmuth, Oliver and Cremer, Markus},
  title        = {Scalable robust audio fingerprinting using {MPEG-7} content description},
  booktitle    = {Multimedia Signal Processing, 2002 IEEE Workshop on},
  organization = {IEEE},
  year         = {2002},
  pages        = {165--168},
  doi          = {10.1109/MMSP.2002.1203273},
}
@inproceedings{Wang2003a,
  author    = {Wang, Avery L.},
  title     = {An Industrial-Strength Audio Search Algorithm},
  booktitle = {Proceedings of the 4th {I}nternational {S}ymposium on {M}usic {I}nformation {R}etrieval ({ISMIR} 2003)},
  location  = {Baltimore, MD, USA},
  year      = {2003},
  pages     = {7--13},
  doi       = {10.5281/zenodo.1416340},
}
@inproceedings{fenet2011pitch_shift_fingerprinting,
  author    = {Fenet, Sébastien and Richard, Gaël and Grenier, Yves},
  title     = {{A Scalable Audio Fingerprint Method with Robustness to Pitch-Shifting}},
  booktitle = {Proceedings of the 12th {I}nternational {S}ymposium on {M}usic {I}nformation {R}etrieval ({ISMIR} 2011)},
  year      = {2011},
  pages     = {121--126},
  doi       = {10.5281/zenodo.1417593},
}
@article{holighaus2012framework,
  author    = {Holighaus, Nicki and D{\"o}rfler, Monika and Velasco, Gino Angelo and Grill, Thomas},
  title     = {A framework for invertible, real-time constant-{Q} transforms},
  journal   = {IEEE Transactions on Audio, Speech, and Language Processing},
  volume    = {21},
  number    = {4},
  pages     = {775--785},
  year      = {2012},
  publisher = {IEEE},
  doi       = {10.1109/TASL.2012.2234114},
}
@inproceedings{six2018dupapps,
  author    = {Six, Joren and Bressan, Federica and Leman, Marc},
  editor    = {Serra, Giuseppe and Tasso, Carlo},
  title     = {Applications of Duplicate Detection in Music Archives: From Metadata Comparison to Storage Optimisation},
  booktitle = {Digital Libraries and Multimedia Archives},
  publisher = {Springer International Publishing},
  address   = {Cham},
  year      = {2018},
  pages     = {101--113},
  isbn      = {978-3-319-73165-0},
  doi       = {10.1007/978-3-319-73165-0_10},
}
@article{cano2005fingerprinting_overview,
  author    = {Cano, Pedro and Batlle, Eloi and Kalker, Ton and Haitsma, Jaap},
  title     = {A Review of Audio Fingerprinting},
  journal   = {The Journal of VLSI Signal Processing},
  volume    = {41},
  number    = {3},
  pages     = {271--284},
  year      = {2005},
  publisher = {Springer Netherlands},
  issn      = {0922-5773},
  keywords  = {Engineering},
  doi       = {10.1007/s11265-005-4151-3},
}
@inproceedings{fma2017fma,
  title     = {{FMA: a dataset for music analysis}},
  author    = {Michaël Defferrard and Kirell Benzi and Pierre Vandergheynst and Xavier Bresson},
  booktitle = {Proceedings of the 18th {I}nternational {S}ymposium on {M}usic {I}nformation {R}etrieval ({ISMIR} 2017)},
  doi       = {10.5281/zenodo.1414728},
  year      = {2017},
}
@article{brown1991calculation,
  author    = {Brown, Judith C},
  title     = {Calculation of a constant {Q} spectral transform},
  journal   = {The Journal of the Acoustical Society of America},
  volume    = {89},
  number    = {1},
  pages     = {425--434},
  year      = {1991},
  publisher = {Acoustical Society of America},
  doi       = {10.1121/1.400476},
}
@article{brown1992efficient,
  author    = {Brown, Judith C and Puckette, Miller S},
  title     = {An efficient algorithm for the calculation of a constant {Q} transform},
  journal   = {The Journal of the Acoustical Society of America},
  volume    = {92},
  number    = {5},
  pages     = {2698--2701},
  year      = {1992},
  publisher = {Acoustical Society of America},
  doi       = {10.1121/1.404385},
}
@article{comer1979ubiquitous,
  author    = {Comer, Douglas},
  title     = {The Ubiquitous {B-Tree}},
  journal   = {ACM Computing Surveys (CSUR)},
  volume    = {11},
  number    = {2},
  pages     = {121--137},
  year      = {1979},
  publisher = {ACM New York, NY, USA},
}
@inproceedings{9044274,
  author    = {Mehmood, Zahid and Ashfaq Qazi, Khurram and Tahir, Muhammad and Muhammad Yousaf, Rehan and Sardaraz, Muhammad},
  title     = {Potential Barriers to Music Fingerprinting Algorithms in the Presence of Background Noise},
  booktitle = {6th Conference on Data Science and Machine Learning Applications (CDMA 2020)},
  year      = {2020},
  pages     = {25--30},
  doi       = {10.1109/CDMA47397.2020.00010},
}
@inproceedings{dlfm2017_mirchiving,
  author    = {de Valk, Reinier and Volk, Anja and Holzapfel, Andre and Pikrakis, Aggelos and Kroher, Nadine and Six, Joren},
  title     = {MIRchiving: Challenges and Opportunities of Connecting MIR Research and Digital Music Archives},
  booktitle = {Proceedings of the 4th International Workshop on Digital Libraries for Musicology},
  series    = {DLfM '17},
  location  = {Shanghai, China},
  publisher = {ACM},
  address   = {New York, NY, USA},
  year      = {2017},
  pages     = {25--28},
  numpages  = {4},
  isbn      = {978-1-4503-5347-2},
  doi       = {10.1145/3144749.3144755},
  url       = {http://doi.acm.org/10.1145/3144749.3144755},
  acmid     = {3144755},
  keywords  = {Applying MIR, collaboration, digital music archives, documentation},
}
@inproceedings{sonnleitner2014quad_based_fingerprinter,
  title     = {{Quad-based audio fingerprinting robust to time and frequency scaling}},
  author    = {Reinhard Sonnleitner and Gerhard Widmer},
  year      = {2014},
  booktitle = {{Proceedings of the 17th International Conference on Digital Audio Effects (DAFx-14)}},
}
@inproceedings{ellis2014labrosafp,
  author    = {Ellis, Daniel},
  title     = {The 2014 {LabROSA} audio fingerprint system},
  booktitle = {{MIREX abstracts of the 15th International Symposium on Music Information Retrieval (ISMIR 2014)}},
  year      = {2014},
}
@inproceedings{neuralfp,
  author    = {Chang, Sungkyun and Lee, Donmoon and Park, Jeongsoo and Lim, Hyungui and Lee, Kyogu and Ko, Karam and Han, Yoonchang},
  title     = {Neural Audio Fingerprint for High-Specific Audio Retrieval Based on Contrastive Learning},
  booktitle = {IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP 2021)},
  year      = {2021},
  pages     = {3025--3029},
  doi       = {10.1109/ICASSP39728.2021.9414337},
}
@patent{wang2003patent,
  author      = {Wang, A Li-chun and Culbert, Daniel},
  title       = {Robust and invariant audio pattern matching},
  journal     = {Patent US7627477 B},
  volume      = {2},
  number      = {US7627477 B},
  nationality = {US},
  year        = {2003},
  yearfiled   = {2003},
}
@inproceedings{sonnleitner2016landmark,
  author    = {Sonnleitner, Reinhard and Arzt, Andreas and Widmer, Gerhard},
  title     = {Landmark-based audio fingerprinting for {DJ} mix monitoring},
  booktitle = {{Proceedings of the 17th International Symposium on Music Information Retrieval (ISMIR 2016)}},
  pages     = {185--191},
  year      = {2016},
  doi       = {10.5281/zenodo.1417008},
}
@inproceedings{six2021panakovtwo,
  author    = {Six, Joren},
  title     = {{Panako 2.0 : updates for an acoustic fingerprinting system}},
  booktitle = {{Extended abstracts for the Late-Breaking Demo Session of the 22nd International Society for Music Information Retrieval Conference (ISMIR 2021)}},
  location  = {Online},
  year      = {2021},
  keywords  = {Acoustic fingerprinting},
  language  = {eng},
}
@inproceedings{six2014panako,
  title     = {{Panako - A scalable acoustic fingerprinting system handling time-scale and pitch modification}},
  author    = {Six, Joren and Leman, Marc},
  booktitle = {{Proceedings of the 15th ISMIR Conference (ISMIR 2014)}},
  year      = {2014},
  pages     = {1--6},
  doi       = {10.5281/zenodo.1416190},
}
@inproceedings{six2017framework,
  author       = {Six, Joren and Leman, Marc},
  title        = {A framework to provide fine-grained time-dependent context for active listening experiences},
  booktitle    = {Audio Engineering Society Conference: 2017 AES International Conference on Semantic Audio},
  organization = {Audio Engineering Society},
  year         = {2017},
}
@article{weck2023data,
  author        = {Weck, Benno and Serra, Xavier},
  title         = {Data leakage in cross-modal retrieval training: A case study},
  journal       = {arXiv e-prints},
  year          = {2023},
  eprint        = {2302.12258},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.2302.12258},
}
% NOTE(review): this DOI is the same one carried by the dataset entry schwarz_diemo_2018_1422385 - confirm it identifies the paper and not only the dataset.
@inproceedings{black2018unmixdb,
  author    = {Schwarz, Diemo and Fourer, Dominique},
  title     = {{UnmixDB}: A Dataset for {DJ}-Mix Information Retrieval},
  booktitle = {{Proceedings of the 19th International Symposium on Music Information Retrieval (ISMIR 2018)}},
  year      = {2018},
  doi       = {10.5281/zenodo.1422385},
}
@dataset{schwarz_diemo_2018_1422385,
  title     = {{UnmixDB: A Dataset for DJ-Mix Information Retrieval}},
  author    = {Schwarz, Diemo and Fourer, Dominique},
  publisher = {Zenodo},
  version   = 1,
  year      = 2018,
  month     = sep,
  doi       = {10.5281/zenodo.1422385},
  url       = {https://doi.org/10.5281/zenodo.1422385},
}
@inproceedings{haitsma2002fingerprinter,
  author    = {Haitsma, Jaap and Kalker, Ton},
  title     = {A Highly Robust Audio Fingerprinting System},
  booktitle = {Proceedings of the 3rd {I}nternational {S}ymposium on {M}usic {I}nformation {R}etrieval ({ISMIR} 2002)},
  year      = {2002},
  doi       = {10.5281/zenodo.1417973},
  url       = {http://ismir2002.ismir.net/proceedings/02-FP04-2.pdf},
}
@inproceedings{kim2020djset,
  author    = {Taejun Kim and Minsuk Choi and Evan Sacks and Yi-Hsuan Yang and Juhan Nam},
  title     = {A Computational Analysis of Real-World {DJ} Mixes using Mix-To-Track Subsequence Alignment},
  booktitle = {Proceedings of the 21st International Society for Music Information Retrieval Conference (ISMIR), 2020},
  year      = {2020},
  doi       = {10.5281/zenodo.4245544},
}
@inproceedings{six2020olaf,
  author    = {Joren Six},
  title     = {{OLAF}: Overly Lightweight Acoustic Fingerprinting},
  booktitle = {{Extended abstracts for the Late-Breaking Demo Session of the 21st International Society for Music Information Retrieval Conference (ISMIR 2020)}},
  year      = {2020},
}
@article{six2022panako,
  author  = {Six, Joren},
  title   = {Panako: a scalable audio search system},
  journal = {Journal of Open Source Software},
  volume  = {7},
  number  = {78},
  pages   = {4554},
  year    = {2022},
  doi     = {10.21105/joss.04554},
}
@article{six2015synchronizing,
  author    = {Six, Joren and Leman, Marc},
  title     = {Synchronizing multimodal recordings using audio-to-audio alignment: An application of acoustic fingerprinting to facilitate music interaction research},
  journal   = {Journal on Multimodal User Interfaces},
  publisher = {Springer},
  volume    = {9},
  pages     = {223--229},
  year      = {2015},
  doi       = {10.1007/s12193-015-0196-1},
}
% NOTE(review): year set to 1999 to agree with the 9899:1999 edition named in the title and key; if the 2011 edition was intended, the title needs updating instead.
@book{ISO1999,
  author    = {{ISO}},
  title     = {{ISO/IEC 9899:1999 Information technology --- Programming languages --- C}},
  publisher = {International Organization for Standardization},
  address   = {Geneva, Switzerland},
  year      = 1999,
  keywords  = {C Specification Standard},
}
@inproceedings{cortes2022baf,
  author    = {Cortès, Guillem and Ciurana, Alex and Molina, Emilio and Miron, Marius and Meyers, Owen and Six, Joren and Serra, Xavier},
  title     = {{BAF: an audio fingerprinting dataset for broadcast monitoring}},
  booktitle = {{Proceedings of the 23rd International Society for Music Information Retrieval Conference (ISMIR 2022)}},
  location  = {Bengaluru, India},
  pages     = {908--916},
  year      = {2022},
  doi       = {10.5281/zenodo.7343030},
  url       = {http://dx.doi.org/10.5281/zenodo.7343030},
  keywords  = {Acoustic fingerprinting},
  language  = {eng},
}
@incollection{six2023duplicates,
  author    = {Six, Joren and Bressan, Federica and Renders, Koen},
  title     = {Duplicate Detection for Digital Audio Archive Management: Two Case Studies},
  editor    = {Biswas, Anupam and Wennekes, Emile and Wieczorkowska, Alicja and Laskar, Rabul Hussain},
  booktitle = {Advances in Speech and Music Technology: Computational Aspects and Applications},
  publisher = {Springer International Publishing},
  address   = {Cham},
  year      = {2023},
  pages     = {311--329},
  isbn      = {978-3-031-18444-4},
  doi       = {10.1007/978-3-031-18444-4_16},
  url       = {https://doi.org/10.1007/978-3-031-18444-4_16},
  abstract  = {This chapter focuses on identification of duplicate audio material in large digital music archives. The music information retrieval (MIR) problem to efficiently find duplicate in large collections is a solved problem. There are even off-the-shelf systems available to find duplicates. The applications of this technology, however, are still too unknown and underexploited.},
}
@misc{calgorithms,
  title     = {C Algorithms: a collection of common Computer Science algorithms},
  author    = {Simon Howard},
  publisher = {GitHub},
  journal   = {GitHub repository},
  url       = {https://github.com/fragglet/c-algorithms},
  year      = {2020},
}
@misc{audfprint,
  title     = {audfprint: Landmark-based audio fingerprinting},
  author    = {Dan Ellis},
  publisher = {GitHub},
  journal   = {GitHub repository},
  url       = {https://github.com/dpwe/audfprint},
  year      = {2019},
}
@misc{pffft,
  title     = {{PFFFT}: a pretty fast {FFT}},
  author    = {Julien Pommier},
  publisher = {BitBucket},
  journal   = {BitBucket repository},
  url       = {https://bitbucket.org/jpommier/pffft/src/master/},
  year      = {2022},
}
@misc{zig,
  title     = {Zig: a general-purpose programming language and toolchain for maintaining robust, optimal, and reusable software.},
  author    = {Andrew Kelley and contributors},
  publisher = {GitHub},
  journal   = {GitHub repository},
  url       = {https://github.com/ziglang/zig},
  year      = {2023},
}
@misc{lmdb,
  author    = {Howard Chu},
  title     = {{LMDB}: Lightning Memory-Mapped Database},
  year      = {2022},
  publisher = {OpenLDAP},
  journal   = {OpenLDAP repository},
  url       = {https://git.openldap.org/openldap/openldap/tree/mdb.master},
}
@misc{doxygen,
  title     = {Doxygen: the de facto standard tool for generating documentation from annotated C++ sources.},
  author    = {Dimitri van Heesch},
  publisher = {Doxygen},
  journal   = {Doxygen website},
  url       = {https://www.doxygen.nl/},
  year      = {2023},
}
@misc{chromaprint,
  author    = {Lukáš Lalinský and contributors},
  title     = {Chromaprint: an audio fingerprint library developed for the {AcoustID} project.},
  year      = {2023},
  publisher = {GitHub},
  journal   = {GitHub repository},
  url       = {https://github.com/acoustid/chromaprint},
}
@misc{dejavu,
  author    = {Will Drevo},
  title     = {Dejavu: Audio fingerprinting and recognition algorithm implemented in {Python}.},
  year      = {2020},
  publisher = {GitHub},
  journal   = {GitHub repository},
  url       = {https://github.com/worldveil/dejavu},
}
@inproceedings{spectromap,
  author    = {L{\'o}pez-Garc{\'i}a, Aar{\'o}n
               and Mart{\'i}nez-Rodr{\'i}guez, Brian
               and Liern, Vicente},
  editor    = {Montiel, Mariana
               and Agust{\'i}n-Aquino, Octavio A.
               and G{\'o}mez, Francisco
               and Kastine, Jeremy
               and Lluis-Puebla, Emilio
               and Milam, Brent},
  title     = {A Proposal to Compare the Similarity Between Musical Products. One More Step for Automated Plagiarism Detection?},
  booktitle = {Mathematics and Computation in Music},
  publisher = {Springer International Publishing},
  address   = {Cham},
  year      = {2022},
  pages     = {192--204},
  doi       = {10.1007/978-3-031-07015-0_16},
}