-
Notifications
You must be signed in to change notification settings - Fork 0
/
literatura.bib
311 lines (282 loc) · 10.4 KB
/
literatura.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
% Overview article on automatic music transcription (IEEE Signal Processing Magazine).
@article{benetos2019overview,
  author  = {Benetos, Emmanouil and Dixon, Simon and Duan, Zhiyao and Ewert, Sebastian},
  title   = {Automatic Music Transcription: An Overview},
  journal = {IEEE Signal Processing Magazine},
  year    = {2019},
  volume  = {36},
  number  = {1},
  pages   = {20--30},
  doi     = {10.1109/MSP.2018.2869928}
}
% arXiv preprint on framewise piano transcription.
@misc{kelz2016potential,
  author        = {Rainer Kelz and Matthias Dorfer and Filip Korzeniowski and Sebastian Böck and Andreas Arzt and Gerhard Widmer},
  title         = {On the Potential of Simple Framewise Approaches to Piano Transcription},
  eprint        = {1612.05153},
  archivePrefix = {arXiv},
  primaryClass  = {cs.SD},
  year          = {2016}
}
% Workshop paper: the venue is a proceedings volume, so it is an inproceedings
% entry with the venue in booktitle rather than an article with a journal.
@inproceedings{smaragdis2003nmf,
  author    = {Smaragdis, Paris and Brown, Judith},
  title     = {Non-negative matrix factorization for polyphonic music transcription},
  booktitle = {Proceedings of IEEE Workshop on Applications of Signal Processing to Audio and Acoustics},
  year      = {2003},
  month     = nov,
  pages     = {177--180},
  isbn      = {0-7803-7850-4},
  doi       = {10.1109/ASPAA.2003.1285860}
}
% Nature article introducing non-negative matrix factorization for parts-based learning.
@article{lee1999learning,
  author  = {Lee, Daniel D. and Seung, H. Sebastian},
  title   = {Learning the parts of objects by non-negative matrix factorization},
  journal = {Nature},
  year    = {1999},
  month   = oct,
  volume  = {401},
  number  = {6755},
  pages   = {788--791},
  doi     = {10.1038/44565}
}
% Journal article on end-to-end neural polyphonic piano transcription.
@article{sigtia2016endtoend,
  author  = {Sigtia, Siddharth and Benetos, Emmanouil and Dixon, Simon},
  title   = {An End-to-End Neural Network for Polyphonic Piano Music Transcription},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  year    = {2016},
  volume  = {24},
  number  = {5},
  pages   = {927--939},
  doi     = {10.1109/TASLP.2016.2533858}
}
% ICASSP 2014 paper on onset detection with convolutional networks.
% Empty volume/number placeholders from the publisher export are omitted.
@inproceedings{schluter2014onsetcnn,
  author    = {Schlüter, Jan and Böck, Sebastian},
  title     = {Improved musical onset detection with Convolutional Neural Networks},
  booktitle = {2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  year      = {2014},
  pages     = {6979--6983},
  doi       = {10.1109/ICASSP.2014.6854953}
}
% ICMLA 2012 paper on chord recognition with convolutional networks.
% The empty number placeholder from the publisher export is omitted.
@inproceedings{humphrey2012rethinking,
  author    = {Humphrey, Eric J. and Bello, Juan P.},
  title     = {Rethinking Automatic Chord Recognition with Convolutional Neural Networks},
  booktitle = {2012 11th International Conference on Machine Learning and Applications},
  year      = {2012},
  volume    = {2},
  pages     = {357--362},
  doi       = {10.1109/ICMLA.2012.220}
}
% Journal article on multipitch estimation combining spectral and temporal representations.
@article{su2015spectral,
  author  = {Su, Li and Yang, Yi-Hsuan},
  title   = {Combining Spectral and Temporal Representations for Multipitch Estimation of Polyphonic Music},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  year    = {2015},
  volume  = {23},
  number  = {10},
  pages   = {1600--1612},
  doi     = {10.1109/TASLP.2015.2442411}
}
% arXiv preprint: the "Onsets and Frames" piano transcription model.
@misc{hawthorne2018onsets,
  author        = {Curtis Hawthorne and Erich Elsen and Jialin Song and Adam Roberts and Ian Simon and Colin Raffel and Jesse Engel and Sageev Oore and Douglas Eck},
  title         = {Onsets and Frames: Dual-Objective Piano Transcription},
  eprint        = {1710.11153},
  archivePrefix = {arXiv},
  primaryClass  = {cs.SD},
  year          = {2018}
}
% Web resource: the MIREX wiki home page (biblatex online entry).
@online{mirex,
  title   = {MIREX Wiki},
  url     = {https://www.music-ir.org/mirex/wiki/MIREX_HOME},
  urldate = {2021-08-04},
  date    = {2021-06}
}
% Report describing the MAPS piano database. An article entry requires a
% journal, which this work does not have, so it is typed as a report.
% NOTE(review): institution and the reading of "11" as the total page count
% come from the public record of this report, not from this file -- confirm.
@techreport{maps_orig,
  author      = {Emiya, Valentin and Bertin, Nancy and David, Bertrand and Badeau, Roland},
  title       = {{MAPS} - A piano database for multipitch estimation and automatic transcription of music},
  type        = {Research Report},
  institution = {Télécom ParisTech},
  year        = {2010},
  month       = jul,
  pagetotal   = {11}
}
% Journal article on multipitch estimation of piano sounds.
% The journal name is stored in natural order instead of the inverted index form.
@article{maps,
  author  = {Emiya, Valentin and Badeau, Roland and David, Bertrand},
  title   = {Multipitch Estimation of Piano Sounds Using a New Probabilistic Spectral Smoothness Principle},
  journal = {IEEE Transactions on Audio, Speech, and Language Processing},
  year    = {2010},
  month   = sep,
  volume  = {18},
  pages   = {1643--1654},
  doi     = {10.1109/TASL.2009.2038819}
}
% Journal article defining the constant-Q spectral transform.
% The former eprint field held a DOI resolver URL, which is not an eprint
% identifier, so it is omitted; doi and url already carry that link.
@article{brown1991cqt,
  author  = {Brown, Judith C.},
  title   = {Calculation of a constant {Q} spectral transform},
  journal = {The Journal of the Acoustical Society of America},
  year    = {1991},
  volume  = {89},
  number  = {1},
  pages   = {425--434},
  doi     = {10.1121/1.400476},
  url     = {https://doi.org/10.1121/1.400476}
}
% arXiv preprint comparing audio preprocessing methods for music tagging networks.
@misc{choi2021comparison,
  author        = {Keunwoo Choi and György Fazekas and Kyunghyun Cho and Mark Sandler},
  title         = {A Comparison of Audio Signal Preprocessing Methods for Deep Neural Networks on Music Tagging},
  eprint        = {1709.01922},
  archivePrefix = {arXiv},
  primaryClass  = {cs.SD},
  year          = {2021}
}
% Book on the psychology of hearing.
@book{moore2012psy,
  title     = {An Introduction to the Psychology of Hearing},
  author    = {Brian C. J. Moore},
  publisher = {Brill},
  year      = {2012}
}
% Conference paper introducing the librosa library.
% The proceedings title belongs in booktitle (required for inproceedings),
% not in publisher.
@inproceedings{mcfee2015librosa,
  author    = {McFee, Brian and Raffel, Colin and Liang, Dawen and Ellis, Daniel and McVicar, Matt and Battenberg, Eric and Nieto, Oriol},
  title     = {{librosa}: Audio and Music Signal Analysis in {Python}},
  booktitle = {Proceedings of the 14th Python in Science Conference},
  year      = {2015},
  month     = jan,
  pages     = {18--24},
  doi       = {10.25080/Majora-7b98e3ed-003}
}
% Late-breaking/demo conference paper describing the pretty_midi library.
% The venue is a proceedings volume, so it is stored in booktitle.
@inproceedings{raffael2014pretty_midi,
  author    = {Raffel, Colin and Ellis, Daniel P. W.},
  title     = {Intuitive Analysis, Creation and Manipulation of {MIDI} Data with {pretty\_midi}},
  booktitle = {Proceedings of the 15th International Conference on Music Information Retrieval Late Breaking and Demo Papers},
  year      = {2014},
  pages     = {84--93}
}
% TensorFlow software citation.
% Names use the unambiguous "Last, First" form; accents are written as braced
% special characters and the hard-coded ties between name parts are removed so
% that the bibliography style controls spacing and abbreviation.
@misc{tensorflow2015whitepaper,
  author  = {Abadi, Mart{\'\i}n and Agarwal, Ashish and Barham, Paul and Brevdo, Eugene and Chen, Zhifeng and Citro, Craig and Corrado, Greg S. and Davis, Andy and Dean, Jeffrey and Devin, Matthieu and Ghemawat, Sanjay and Goodfellow, Ian and Harp, Andrew and Irving, Geoffrey and Isard, Michael and Jia, Yangqing and Jozefowicz, Rafal and Kaiser, Lukasz and Kudlur, Manjunath and Levenberg, Josh and Man{\'e}, Dandelion and Monga, Rajat and Moore, Sherry and Murray, Derek and Olah, Chris and Schuster, Mike and Shlens, Jonathon and Steiner, Benoit and Sutskever, Ilya and Talwar, Kunal and Tucker, Paul and Vanhoucke, Vincent and Vasudevan, Vijay and Vi{\'e}gas, Fernanda and Vinyals, Oriol and Warden, Pete and Wattenberg, Martin and Wicke, Martin and Yu, Yuan and Zheng, Xiaoqiang},
  title   = {{TensorFlow}: Large-Scale Machine Learning on Heterogeneous Systems},
  year    = {2015},
  note    = {Software available from tensorflow.org},
  url     = {https://www.tensorflow.org/},
  urldate = {2021-08-04}
}
% JMLR article introducing dropout regularisation.
@article{nitish2014dropout,
  author  = {Srivastava, Nitish and Hinton, Geoffrey and Krizhevsky, Alex and Sutskever, Ilya and Salakhutdinov, Ruslan},
  title   = {Dropout: A Simple Way to Prevent Neural Networks from Overfitting},
  journal = {Journal of Machine Learning Research},
  year    = {2014},
  volume  = {15},
  number  = {56},
  pages   = {1929--1958},
  url     = {http://jmlr.org/papers/v15/srivastava14a.html}
}
% Conference paper on monophonic transcription via autocorrelation.
% The booktitle parenthesis is now closed. The previous page value "2000--257"
% mixed the year into the range.
% NOTE(review): the end page 260 comes from commonly cited records of this
% paper, not from this file -- confirm against the proceedings.
@inproceedings{monti2000monophonic,
  author    = {Monti, Giuliano and Sandler, Mark},
  title     = {Monophonic transcription with autocorrelation},
  booktitle = {Proceedings of the {COST} {G-6} Conference on Digital Audio Effects ({DAFX-00})},
  year      = {2000},
  pages     = {257--260}
}
% arXiv preprint describing the Adam optimiser.
% primaryClass is supplied so the entry matches the other arXiv entries here.
@misc{kingma2017adam,
  author        = {Kingma, Diederik P. and Ba, Jimmy},
  title         = {{Adam}: A Method for Stochastic Optimization},
  year          = {2017},
  eprint        = {1412.6980},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG}
}
% PhD thesis (Stanford) on segmentation and analysis of musical sound.
% The degree label is implied by the entry type, so the former volume value
% "Ph.D." is omitted. The report identifier is kept in note, because thesis
% styles do not print a number field.
@phdthesis{moorer1975digital,
  author   = {Moorer, James A.},
  title    = {On the Segmentation and Analysis of Continuous Musical Sound by Digital Computer},
  school   = {Stanford University},
  address  = {Stanford, CA},
  year     = {1975},
  note     = {Report STAN-M-3},
  keywords = {analysis, continuous musical sound, digital computer, segmentation},
  url      = {https://ccrma.stanford.edu/files/papers/stanm3.pdf},
  urldate  = {2021-08-08}
}
% Computer Music Journal article on the Kansei Music System.
@article{katayose1989kensei,
  author    = {Haruhiro Katayose and Seiji Inokuchi},
  title     = {The Kansei Music System},
  journal   = {Computer Music Journal},
  publisher = {The MIT Press},
  year      = {1989},
  volume    = {13},
  number    = {4},
  pages     = {72--77},
  issn      = {01489267, 15315169},
  url       = {http://www.jstor.org/stable/3679555}
}
% PhD thesis (MIT) titled "Structure out of sound".
% The degree label is implied by the entry type, so the former volume value
% "Ph.D." and the empty number/address placeholders are omitted; the address
% is filled with the school's city.
@phdthesis{hawley1993structure,
  author   = {Hawley, Michael Jerome},
  title    = {Structure out of sound},
  school   = {Massachusetts Institute of Technology},
  address  = {Cambridge, MA},
  year     = {1993},
  keywords = {Architecture. Program in Media Arts and Sciences},
  url      = {http://hdl.handle.net/1721.1/29068},
  urldate  = {2021-08-08}
}
% Journal article on connectionist transcription of polyphonic piano music.
@article{marolt2004sonic,
  author    = {Marolt, Matija},
  title     = {A connectionist approach to automatic transcription of polyphonic piano music},
  journal   = {IEEE Transactions on Multimedia},
  publisher = {IEEE},
  year      = {2004},
  volume    = {6},
  number    = {3},
  pages     = {439--449}
}
% ICASSP 2012 paper on piano note transcription with recurrent networks.
% Empty volume/number placeholders from the publisher export are omitted.
@inproceedings{bock2012rnn,
  author    = {Böck, Sebastian and Schedl, Markus},
  title     = {Polyphonic piano note transcription with recurrent neural networks},
  booktitle = {2012 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  year      = {2012},
  pages     = {121--124},
  doi       = {10.1109/ICASSP.2012.6287832}
}
% Conference paper on a hybrid recurrent network for music transcription.
% booktitle is required for inproceedings. The venue follows from the ICASSP
% 2015 DOI prefix and is worded like the other ICASSP entries in this file.
@inproceedings{sigtia2015hybrid,
  author    = {Sigtia, Siddharth and Benetos, Emmanouil and Boulanger-Lewandowski, Nicolas and Weyde, Tillman and Garcez, Artur and Dixon, Simon},
  title     = {A hybrid recurrent neural network for music transcription},
  booktitle = {2015 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  year      = {2015},
  month     = apr,
  pages     = {2061--2065},
  doi       = {10.1109/ICASSP.2015.7178333}
}
% Journal article surveying melody transcription approaches and their evaluation.
% The journal name is stored in natural order instead of the inverted index form.
@article{poliner2007melody,
  author  = {Poliner, Graham and Ellis, Daniel and Ehmann, Andreas and Gómez, Emilia and Streich, Sebastian and Ong, Beesuan},
  title   = {Melody Transcription From Music Audio: Approaches and Evaluation},
  journal = {IEEE Transactions on Audio, Speech, and Language Processing},
  year    = {2007},
  month   = jun,
  volume  = {15},
  pages   = {1247--1256},
  doi     = {10.1109/TASL.2006.889797}
}
% Conference paper on melody pitch contour extraction from polyphonic audio.
% The identifier 10.1.1.122.7773 is a CiteSeerX document id, not a registered
% DOI, so it is kept in note instead of doi (where it would produce a dead link).
% NOTE(review): volume and organization look like search-engine export
% artifacts -- verify against the proceedings.
@inproceedings{dressler2005extraction,
  author       = {Dressler, Karin},
  title        = {Extraction of the melody pitch contour from polyphonic audio},
  booktitle    = {Proc. 6th International Conference on Music Information Retrieval},
  year         = {2005},
  volume       = {110},
  organization = {Citeseer},
  note         = {CiteSeerX 10.1.1.122.7773}
}
% arXiv preprint on piano transcription with an autoregressive multi-state note model.
@misc{kwon2020polyphonic,
  author        = {Taegyun Kwon and Dasaem Jeong and Juhan Nam},
  title         = {Polyphonic Piano Transcription Using Autoregressive Multi-State Note Model},
  eprint        = {2010.01104},
  archivePrefix = {arXiv},
  primaryClass  = {eess.AS},
  year          = {2020}
}
% ICASSP 2019 paper on ADSR-based polyphonic piano note transcription.
% The booktitle drops the duplicated "ICASSP 2019-" export prefix and is
% worded like the other ICASSP entries in this file.
@inproceedings{kelz2019deep,
  author       = {Kelz, Rainer and Böck, Sebastian and Widmer, Gerhard},
  title        = {Deep polyphonic {ADSR} piano note transcription},
  booktitle    = {2019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  year         = {2019},
  pages        = {246--250},
  organization = {IEEE}
}