-
Notifications
You must be signed in to change notification settings - Fork 23
/
3_extract.py
35 lines (32 loc) · 1005 Bytes
/
3_extract.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
import math
from jukemir import CACHE_DIR
REPRESENTATIONS = ["chroma", "mfcc", "choi", "musicnn", "clmr", "jukebox"]
DATASET_SIZES = [
("gtzan_ff", 930),
("giantsteps_clips", 7035),
("magnatagatune", 25860),
("emomusic", 744),
]
BATCH_SIZE = 256
CMD_TEMPLATE = """
docker run \\
-it \\
--rm \\
-v {cache_dir}/processed/{dataset}/wav:/input \\
-v {cache_dir}/representations/{dataset}/{representation}:/output \\
jukemir/representations_{representation} \\
--batch_size {batch_size} \\
--batch_idx {batch_idx}
""".strip()
for dataset, dataset_size in DATASET_SIZES:
for representation in REPRESENTATIONS:
for batch_idx in range(math.ceil(dataset_size / BATCH_SIZE)):
print(
CMD_TEMPLATE.format(
cache_dir=CACHE_DIR,
dataset=dataset,
representation=representation,
batch_size=BATCH_SIZE,
batch_idx=batch_idx,
)
)