-
Notifications
You must be signed in to change notification settings - Fork 33
/
mir-datasets.yaml
1797 lines (1559 loc) · 40.7 KB
/
mir-datasets.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
200DrumMachines:
url: http://www.hexawe.net/mess/200.Drum.Machines
metadata: audio samples
contents: 7371 one-shots
audio: 'yes'
AAM:
url: https://zenodo.org/record/5794629
metadata:
- onsets
- pitches
- instruments
- melody instrument
- keys
- chords
- tempos
- beats
- segments
contents: 3,000 music tracks (with single instrument multitracks)
audio: 'yes'
AccoMontage2:
url: https://github.com/billyblu2000/accomontage2
metadata: song harmonization and accompaniment arrangement based on a lead melody
contents:
audio: 'no'
ACM_MIRUM:
url: http://www.marsyas.info/tempo
metadata: tempo
contents: 1410 excerpts (60s)
audio: 'yes'
ADC2004:
url: http://labrosa.ee.columbia.edu/projects/melody
metadata: predominant pitch
contents: 20 excerpts
audio: 'yes'
AcousticBrainz-Genre:
url: https://mtg.github.io/acousticbrainz-genre-dataset/
metadata: 15-31 genres with 265-745 subgenres
contents: audio features for about 2000000 songs
audio: 'no'
AED:
url: https://data.vision.ee.ethz.ch/cvl/ae_dataset/
title: Acoustic Event Dataset
metadata: 28 event classes
contents: 5223 audio snippets
audio: 'yes'
AIST-Dance-DB:
url: https://aistdancedb.ongaaccel.jp
title: AIST Dance Video Database
metadata: street dance videos
contents: 13,940 videos for 60 pieces
audio: 'yes'
Amg1608:
url: https://amg1608.blogspot.ch
metadata: valence & arousal
contents: 1608 excerpts (30s)
audio: 'no'
AMT-pilot:
url: https://github.com/chordify/CASD
metadata: structure by multiple annotators
contents: 8 songs
audio: 'yes'
APL:
url: https://archive.org/details/Automatic_Practice_Logging
title: Automatic Practice Logging
metadata: piano practice
contents: 620 segments
audio: 'yes'
artist20:
url: http://labrosa.ee.columbia.edu/projects/artistid
metadata: 20 artists
contents: 1413 songs
audio: 'no'
ASAP:
url: https://github.com/fosfrancesco/asap-dataset
metadata:
- aligned MIDI/audio performances and MIDI/XML scores
- beats
- downbeats
- time signatures
- key signatures
contents: 1068 MIDI performances, 520 audio performances, 222 scores
audio: yes (see MAESTRO)
ATEPP:
url: https://zenodo.org/record/6564406#.Y5QnkezP3OQ
metadata:
- symbolic music MIDI
- musicXML
- classification tasks
- expressive piano performances
contents: 1742 performances (~1000 hours) by 49 pianists, covering 1580 movements by 25 composers
audio: ''
AudioSet:
url: https://research.google.com/audioset/index.html
metadata: 632 event classes
contents: 2084320 clips (10s)
audio: 'no'
bach10:
url: http://www2.ece.rochester.edu/projects/air/resource.html
metadata: aligned multitrack MIDI
contents: 10 chorales
audio: 'yes'
BAF:
url: https://github.com/guillemcortes/baf-dataset/
metadata:
- audio fingerprinting
- music monitoring in broadcast
contents: 2,000 tracks from Epidemic Sound and 3,425 TV audio recordings (60s)
audio: 'yes'
ballroom:
url: http://mtg.upf.edu/ismir2004/contest/tempoContest/node5.html
metadata:
- 8 genres
- tempo
- beats: https://github.com/CPJKU/BallroomAnnotations
- bars / downbeats: https://github.com/CPJKU/BallroomAnnotations
contents: 698 excerpts (30s)
audio: 'yes'
beatboxset1:
url: http://archive.org/details/beatboxset1
metadata: percussion annotation
contents: 14 clips
audio: 'yes'
BPS-FH:
title: BPS-FH Beethoven Piano Sonata with Function Harmony
url: https://github.com/Tsung-Ping/functional-harmony
metadata: functional annotation
contents: 32 sonatas
audio: 'no'
C224a:
url: http://www.cp.jku.at/people/schedl/datasets.html
metadata: 14 genres
contents: 224 artists
audio: 'no'
C3ka:
url: http://www.cp.jku.at/people/schedl/datasets.html
metadata: 18 genres
contents: 3000 artists
audio: 'no'
C49ka-C111ka:
url: http://www.cp.jku.at/people/schedl/datasets.html
metadata: genres
contents: 48800/110588 artists
audio: 'no'
CAL500:
url: http://calab1.ucsd.edu/~datasets/
metadata: tags
contents: 502 songs
audio: 'yes'
CAL10k:
url: http://calab1.ucsd.edu/~datasets/
metadata: tags
contents: 10870 songs
audio: 'no'
CarnaticRhythm:
url: http://compmusic.upf.edu/carnatic-rhythm-dataset
metadata:
- sama
- beats
contents: 176 pieces
audio: on request
CASD:
title: Chordify Annotator Subjectivity Dataset
url: https://github.com/chordify/CASD
metadata:
- chords by 4 annotators
contents: 50 songs
audio: 'no'
CBFdataset:
url: https://zenodo.org/record/3250223
metadata:
- 4 playing techniques (Chinese Bamboo Flute)
contents: 10 performers
audio: 'yes'
CCMixter:
url: http://www.loria.fr/~aliutkus/kam/
metadata:
- vocal track
- background track
contents: 50 mixes
audio: 'yes'
ChoCo:
url: https://github.com/smashub/choco
title: ChoCo, the Chord Corpus
metadata:
- chords
- keys
- knowledge graph: https://polifonia.disi.unibo.it/choco/
contents: 20K+ songs/pieces
audio: 'no'
ChoralMusicSeparation:
url: https://github.com/RetroCirce/Choral_Music_Separation
metadata:
- JSB chorales
- separation
contents: 8.2-hour-long choral music dataset from the JSB Chorales Dataset
audio: 'yes'
Chopin22:
url: http://iwk.mdw.ac.at/goebl/mp3.html
metadata:
- aligned MIDI
contents: 44 recordings
audio: 'yes'
Clotho:
url: https://zenodo.org/record/3490684
metadata:
- 5 descriptive captions
contents: 4981 snippets
audio: 'yes'
CMMSD:
url: https://sourceforge.net/projects/segmentationgt/
metadata:
- note/rest/transition
- onsets
- vibrato
contents: 36 excerpts
audio: 'no'
Codaich:
url: http://jmir.sourceforge.net/Codaich.html
metadata: 55 genres
contents: 26420 songs
audio: 'no'
corpusCOFLA:
url: http://www.cofla-project.com/?page_id=170
metadata:
- editorial
- predominant melody
contents: 1800 flamenco recordings
audio: 'no'
covers80:
url: http://labrosa.ee.columbia.edu/projects/coversongs/covers80/
metadata: cover songs
contents: 80 song pairs
audio: 'yes'
Cross-Composer:
url: https://www.audiolabs-erlangen.de/resources/MIR/cross-comp
metadata:
- 11 composers
- piece
- key
- era
- instrumentation
contents: 1100 chromagrams and chord labels
audio: 'no'
Cross-Era:
url: https://www.audiolabs-erlangen.de/resources/MIR/cross-era
metadata:
- composer
- piece
- key
- era
- instrumentation
contents: 2000 chromagrams and chord labels
audio: 'no'
CSD:
url: https://zenodo.org/record/2649950
title: Choral Singing Dataset
metadata:
- f0
- MIDI
contents: 48 recordings
audio: 'yes'
dadaGP:
url: https://github.com/dada-bots/dadaGP
title: dadaGP dataset
metadata:
- guitarPro tablatures
- encoder and decoder python tool to and from text and token format
- symbolic music generation
contents: a total of 26,181 songs in guitarPro/token format for symbolic music generation
audio: 'no'
DALI:
url: https://github.com/gabolsgabs/DALI
title: Dataset of synchronised Audio, LyrIcs and vocal notes
metadata: aligned notes and lyrics
contents: 5358 songs
audio: 'no'
DAMP:
url: https://ccrma.stanford.edu/damp/
metadata:
- karaoke performances
- aligned lyrics: https://drive.google.com/drive/folders/1hGuE0Drv3tbN-YNRDzJJMHfzKH6e4O2A
- pronunciation assessment: https://drive.google.com/drive/folders/19JPEWSBAM0ssatjBIJzAzjClxi2abt8w
contents: 34000 monophonic recordings
audio: 'yes'
Da-TACOS:
url: https://mtg.github.io/da-tacos/
metadata: cover songs
contents: 25000 songs
audio: 'no'
DCS:
url: https://www.audiolabs-erlangen.de/resources/MIR/2020-DagstuhlChoirSet
title: Dagstuhl ChoirSet
metadata:
- beats
- time-aligned scores
- F0
contents: 81 takes
audio: 'yes'
DEAM:
url: http://cvml.unige.ch/databases/DEAM
title: DEAM - The MediaEval Database for Emotional Analysis of Music
metadata: valence & arousal
contents: 1802 excerpts
audio: 'yes'
DEAPDataset:
url: http://www.eecs.qmul.ac.uk/mmv/datasets/deap/readme.html
metadata:
- valence & arousal
- dominance
- physiological data
contents: 120 music video excerpts
audio: 'no'
DESED:
url: https://github.com/turpaultn/DESED
metadata: 10 audio event classes
contents: approx. 20k 10s clips (unlabeled, weakly/strongly labeled)
audio: 'yes'
DREANSS:
url: http://mtg.upf.edu/download/datasets/dreanss
metadata:
- onset times
- percussion instruments
contents: 18 excerpts
audio: 'yes'
DrumPt:
url: https://github.com/cwu307/DrumPtDataset
metadata: 4 playing techniques
contents: approx. 2000 annotations
audio: yes (see ENST)
DSD100:
url: https://sigsep.github.io/datasets/dsd100.html
metadata:
- multitrack recordings
- stems for vocals, drums, bass and accompaniment
contents: 100 songs
audio: 'yes'
emoMusic:
url: http://cvml.unige.ch/databases/emoMusic
metadata: arousal & valence
contents: 744 excerpts (45s)
audio: 'yes'
EMusic:
url: http://cvml.unige.ch/databases/emoMusic
metadata: arousal & valence
contents: 100 excerpts (experimental music)
audio: 'yes'
EMO-Soundscapes:
url: http://cvml.unige.ch/databases/emoMusic
metadata: arousal & valence
contents: 1213 soundscape recordings
audio: 'yes'
Emotify:
url: http://www.projects.science.uu.nl/memotion/emotifydata
metadata: induced emotion
contents: 400 excerpts
audio: 'yes'
EnsembleSet:
url: https://zenodo.org/record/6519024#.Y52xKex_pTZ
metadata:
- source separation
- synthesized with Spitfire BBC Symphony Orchestra Professional Library
- 20 different mix/microphone configurations
contents: 80 tracks (6+ hours) featuring a range of string, wind, and brass instruments arranged as chamber ensembles
audio: 'yes'
ENST-Drums:
url: http://www.tsi.telecom-paristech.fr/aao/en/2010/02/19/enst-drums-an-extensive-audio-visual-database-for-drum-signals-processing/
metadata:
- onset times
- perc. instruments
- playing technique: https://github.com/cwu307/DrumPtDataset
contents: 318 segments
audio: 'yes'
Erkomaishvili:
url: https://www.audiolabs-erlangen.de/resources/MIR/2019-GeorgianMusic-Erkomaishvili
title: Erkomaishvili Dataset
metadata:
- sheet music
- structure
- F0
- note onsets
contents: 118 tracks
audio: 'yes'
Extendedballroom:
url: http://anasynth.ircam.fr/home/media/ExtendedBallroom/
metadata:
- 9 genres
- tempo
contents: 4000 excerpts (30s)
audio: downloadable
ExtraSensory:
url: http://extrasensory.ucsd.edu/
metadata: 51 context labels
contents: 300000 sensor recordings from 60 users
audio: 'yes'
ffuhrmann:
url: http://www.dtic.upf.edu/~ffuhrmann/PhD/data
metadata: 11 predom. instr.
contents: 6951 excerpts from 220 songs
audio: yes/no
FlaBase:
url: http://mtg.upf.edu/download/datasets/flabase
title: Flamenco database
metadata:
- editorial
- biographical
- musicological information on flamenco
- 1102 artists
- 74 palos
- 2860 albums
contents: 13311 tracks
audio: 'no'
FifteenSongs:
url: https://github.com/grateful-dead-live/fifteen-songs-dataset
metadata: Grateful Dead
contents: 15 Grateful Dead songs with lead sheets
audio: 'yes'
FMA-small:
url: https://github.com/mdeff/fma
metadata: 8 genres
contents: 8000 excerpts (30s)
audio: 'yes'
FMA-medium:
url: https://github.com/mdeff/fma
metadata: 16 genres
contents: 25000 excerpts (30s)
audio: 'yes'
FMA-large:
url: https://github.com/mdeff/fma
metadata: 161 genres
contents: 106574 excerpts (30s)
audio: 'yes'
FMA-full:
url: https://github.com/mdeff/fma
metadata: 161 genres
contents: 106574 songs
audio: 'yes'
Freesound-Loop-Dataset:
url: https://zenodo.org/record/3967852
metadata: tempo, key, instrumentation, genre
contents: 3000 annotated loops, 9455 loops total
audio: 'yes'
FSD-Kaggle2019:
url: https://zenodo.org/record/3612637
metadata: 80 tags
contents: 29000 clips
audio: 'yes'
Fugue:
url: http://algomus.fr/data
title: Fugue Analyses
metadata:
- fugue structure
- patterns
- cadences
contents: 36 fugues (Bach & Shostakovich)
audio: 'no'
GiantStepsTempo:
url: https://github.com/GiantSteps/giantsteps-tempo-dataset
metadata: tempo
contents: 664 files
audio: 'no'
GiantStepsTempo:alternate:
url: http://www.tagtraum.com/download/schreiber_new_giantsteps_tempo.zip
metadata: tempo
contents: 664 files
audio: 'no'
GiantStepsKey:
url: https://github.com/GiantSteps/giantsteps-key-dataset
metadata:
- key
contents: 604 files
audio: 'no'
GNMID14:
url: https://developer.gracenote.com/mid2014
title: Gracenote Music Identification 2014
metadata:
- timestamp
- country
contents: 110M music ID matches
audio: 'no'
GoodSounds:
url: http://mtg.upf.edu/download/datasets/good-sounds
metadata:
- 12 instruments
- pitch
- sound quality
contents: 8750 notes
audio: 'yes'
GPT:
url: http://mac.citi.sinica.edu.tw/GuitarTranscription
metadata: 7 guitar playing techniques
contents: 6580 clips
audio: 'yes'
GMD:
url: http://di.ionio.gr/hilab/gmd
title: Greek Music Dataset
metadata:
- genre
- valence
- arousal
contents: 1400 songs
audio: 'downloadable'
GrooveMD:
url: https://magenta.tensorflow.org/datasets/groove
title: Groove MIDI Dataset
metadata:
- drummer/session id
- drum timing
contents: 1150 MIDI recordings
audio: 'rendered'
ExpandedGrooveMD:
url: https://g.co/magenta/e-gmd
title: Expanded Groove MIDI Dataset
metadata:
- drummer/session id
- drum timing
- kit name
contents: 45537 midi/audio pairs
audio: 'rendered'
GSD:
url: https://github.com/ashispati/GuitarSoloDetection/tree/master/Dataset
title: Guitar Solo Dataset
metadata: start/stop of guitar solos
contents: 60 songs
audio: 'no'
GTZAN:
url: http://marsyas.info/downloads/datasets.html
metadata:
- 10 genres
- tempo labels: http://www.marsyas.info/tempo/
- key labels (lerch): https://github.com/alexanderlerch/data_set
- key labels (li): http://visal.cs.cityu.edu.hk/downloads/#gtzankeys
- beat/downbeat: http://anasynth.ircam.fr/home/media/GTZAN-rhythm
- metrical levels: http://www.isophonics.net/content/metrical-structure-annotations-gtzan-dataset
contents: 1000 excerpts (30s)
audio: 'yes'
GuitarSet:
url: https://guitarset.weebly.com/
metadata:
- midi
- pitch
- beat
- chords
contents: 360 guitar excerpts (30s) with hexaphonic audio
audio: 'yes'
GZ_IsoTech:
url: https://ccmusic-database.github.io/en/database/ccm.html#GZTech
metadata: Guzheng
contents: 2824
audio: 'yes'
Hainsworth:
url: http://www.marsyas.info/tempo/ # FIXME: this is the same Marsyas tempo page that ACM_MIRUM points to; verify the actual Hainsworth source URL
metadata: tempo
contents: 245 excerpts (60s)
audio: 'yes'
HarmonixSet:
url: https://github.com/urinieto/harmonixset
metadata:
- beats
- downbeats
- structure
contents: 912 pop songs
audio: 'no'
HED:
url: http://coconuts-palm-lab.com/EH/HED.zip
metadata:
- emotion annotations
- harmonisation and tempo arrangements
contents: 4000 tracks with emotion annotations
audio: 'yes'
HHDS:
url: http://goo.gl/5Hu51y
metadata:
- multitrack
- style
- tempo
contents: 18 songs
audio: 'yes'
holzapfel:onset:
url: https://kth.box.com/s/o151l3rqtglhmeszah06wmvpcmpat6w9
metadata: onset times
contents: 78 excerpts
audio: 'yes'
homburg:
url: http://www-ai.cs.uni-dortmund.de/audio.html
metadata: 9 genres
contents: 1889 excerpts (10s)
audio: 'yes'
HookTheory:
url: https://github.com/chrisdonahue/sheetsage
metadata:
- aligned melody and harmony annotations
contents: 50 hours of aligned melody and harmony annotations
audio: 'yes'
IADS:
url: http://csea.phhp.ufl.edu/media/iadsmessage.html
metadata:
- valence & arousal
- dominance
contents: 111 sound snippets
audio: 'yes'
IDMT-PIANO-MM:
url: https://www.idmt.fraunhofer.de/en/publications/datasets/piano-mm.html
metadata:
- classical and jazz piano recordings
contents: 432 piano recordings (around four hours)
audio: 'yes'
IDMT-SMT-Bass:
url: http://www.idmt.fraunhofer.de/en/business_units/smt/bass.html
metadata: bass performance styles
contents: 4300 excerpts
audio: 'yes'
IDMT-SMT-Audio-Effects:
url: http://www.idmt.fraunhofer.de/en/business_units/smt/audio_effects.html
metadata: effects on bass and guitar notes
contents: 55044 recordings
audio: 'yes'
IDMT-SMT-Bass-SINGLE-TRACK:
url: http://www.idmt.fraunhofer.de/en/business_units/smt/bass_lines.html
metadata: style annotated bass lines
contents: 17 bass lines (?)
audio: 'yes'
IDMT-SMT-Drum:
url: http://www.idmt.fraunhofer.de/en/business_units/smt/drums.html
metadata:
- onset times
- perc. instruments
contents: 518 files
audio: 'yes'
IDMT-SMT-Guitar:
url: http://www.idmt.fraunhofer.de/en/business_units/smt/guitar.html
metadata: 9 guitar playing techniques
contents: 4700+400 note events
audio: 'yes'
IDMT-MT:
url: https://www.jyu.fi/hytk/fi/laitokset/mutku/en/research/projects2/past-projects/coe/materials/Multitrack
title: IDMT Multitrack
metadata:
- multitrack
- style
contents: 12 songs
audio: 'yes'
iKala:
url: http://mac.citi.sinica.edu.tw/ikala/
metadata:
- singing voice tracks
- background tracks
contents: 252 excerpts (30s)
audio: 'yes'
INRIA:EuroVision:
url: http://musicdata.gforge.inria.fr/structureAnnotation.html
metadata: structure
contents: 124 songs
audio: 'no'
INRIA:Quaero:
url: http://musicdata.gforge.inria.fr/structureAnnotation.html
metadata: structure
contents: 159 songs
audio: 'no'
UIOWA:MIS:
url: http://theremin.music.uiowa.edu/MIS.html
metadata: single instrument notes
contents: many
audio: 'yes'
IRMAS:
url: http://www.mtg.upf.edu/download/datasets/irmas
metadata: 11 instruments
contents: 2874 excerpts
audio: 'yes'
ISMIR2004Genre:
url: http://ismir2004.ismir.net/genre_contest/index.html
metadata: 6 genres
contents: 729 excerpts (30s)
audio: 'yes'
ISMIR2004Tempo:
url: http://mtg.upf.edu/ismir2004/contest/tempoContest/node6.html
metadata: tempo
contents: 465 excerpts (20s)
audio: 'yes'
JAAH:
url: https://github.com/MTG/JAAH
title: Jazz Audio-Aligned Harmony Dataset
metadata:
- structure
- key
- chords
- beats
contents: 113 songs
audio: 'no'
Jamendo-VAD:
url: https://jobim.ofai.at/download/jamendo.tgz
metadata: voice activity
contents: 61+16+16 songs
audio: 'yes'
JGDB:
url: https://ccrma.stanford.edu/~jga/ismir2010/ismir2010.html
metadata:
- multitrack
- MIDI
contents: randomly generated excerpts
audio: 'yes'
JKU-ScoFo:
url: http://www.cp.jku.at/resources/2019_RLScoFo_TISMIR
metadata:
- audio
- MIDI
contents: 16 recordings
audio: 'yes'
Jordan:Classical:
url: http://jblsmith.github.io/projects/masters-thesis/
metadata: structure
contents: 15 pieces
audio: 'yes'
Jordan:Jazz:
url: http://jblsmith.github.io/projects/masters-thesis/
metadata: structure
contents: 15 pieces
audio: 'yes'
JLSDD:
url: https://github.com/ELVIS-Project/mass-duos-corpus-josquin-larue/tree/Methodologies-for-Creating-Symbolic-Music-Corpora
title: Josquin La Rue Secure Duo Dataset
metadata: symbolic scores
contents: 77 duos (Josquin & La Rue)
audio: 'no'
KUGDastgahi:
url: https://phaidra.kug.ac.at/view/o:127195
metadata: dastgahi music
contents: 213 solo recordings by four professional musicians
audio: 'yes'
LabROSA:APT:
url: http://labrosa.ee.columbia.edu/projects/piano/
metadata: MIDI
contents: 29 piano excerpts
audio: 'yes'
LabROSA:MIDI:
url: http://labrosa.ee.columbia.edu/sounds/music/
metadata:
- audio
- MIDI
contents: 4 songs
audio: 'yes'
last.fm:
url: https://zenodo.org/record/6090214
title: last.fm-1K and last.fm-360K
metadata: user listening habits from last.fm
contents: 992 users
audio: 'no'
LIND:
url: https://purl.stanford.edu/zy061bp9773
title: Lyrical Influence Networks Dataset
metadata: lyrics-based artist and genre graphs
contents: 42802 artists/214 genres
audio: 'no'
LFM-1b:
url: http://www.cp.jku.at/datasets/LFM-1b
metadata: listening habits
contents: 120000 users
audio: 'no'
LMD:
url: https://colinraffel.com/projects/lmd/
title: Lakh MIDI Dataset
metadata:
- MIDI
- tempo: http://www.tagtraum.com/download/schreiber_tempo_cnn_ismir2018.zip
- key: http://www.tagtraum.com/download/lmd-key.zip
contents: 176581 MIDI files
audio: 'no'
LMD - Latin:
url: http://www.ppgia.pucpr.br/~silla/lmd/
metadata: 10 genres
contents: 3160 songs
audio: 'no'
LocalifyMusicEvents-USA-2019:
url: https://github.com/JimiLab/LocalifyMusicEventData
metadata:
- music events
- socioeconomic indicators
contents: 308051 music events that took place in 2019 and from 1139 US cities
audio: 'no'
Lyra:
url: https://github.com/pxaris/lyra-dataset
metadata: a dataset for Greek Traditional and Folk music that includes 1570 pieces
contents: 1570 songs
audio: 'yes'
M-DJCUE:
url: https://github.com/MZehren/M-DJCUE
metadata: cue points
contents: 134 tracks
audio: 'no'
MAESTRO:
url: https://magenta.tensorflow.org/datasets/maestro
metadata:
- audio aligned midi
- velocity
- sustain
contents: 172 hours of piano
audio: 'yes'
magnatagatune:
url: http://mirg.city.ac.uk/codeapps/the-magnatagatune-dataset
metadata:
- similarity
- tags
contents: 25863 excerpts (30s)
audio: 'yes'
MAPS:
url: http://www.tsi.telecom-paristech.fr/aao/en/2010/07/08/maps-database-a-piano-database-for-multipitch-estimation-and-automatic-transcription-of-music/
metadata:
- piano notes/chords/pieces
- tempo/key: http://c4dm.eecs.qmul.ac.uk/ycart/a-maps.html
contents: 238 pieces
audio: 'yes'
MARD:
url: http://mtg.upf.edu/download/datasets/mard
metadata: album reviews
contents: 66566 songs
audio: 'no'
MARG-AMT:
url: http://marg.snu.ac.kr/?page_id=767
metadata:
- MIDI pitch
- onset/offset times
contents: 30 melodies
audio: 'yes'
MAST:
url: https://github.com/barisbozkurt/MASTmelody_dataset
metadata: vocal performance assessment
contents: 1018 performances
audio: 'no'
MAST-Rhythm:
url: https://zenodo.org/record/2620357
metadata: rhythm performance assessment
contents: 3721 performances
audio: 'yes'
McGill Billboard:
url: http://ddmal.music.mcgill.ca/billboard
metadata: chords
contents: 740 songs
audio: 'no'
MDBDrums:
url: https://github.com/CarlSouthall/MDBDrums
metadata:
- onset times
- perc. instrument
- playing technique
contents: 23 excerpts
audio: 'yes'
MedleyDB:
url: http://medleydb.weebly.com
metadata:
- multitrack
- genre
- melody f0
- instrument activation
contents: 122 songs
audio: 'yes'
Medley-solos-DB:
title: "Medley-solos-DB: a cross-collection dataset for musical instrument recognition"
url: https://zenodo.org/record/2582103
metadata: 8 instruments
contents: 21572 excerpts
audio: 'yes'
MeloSol:
url: https://davidjohnbaker1.github.io/melosol/
metadata:
- melody
- monophonic