File size: 1,068 Bytes
4427a9f
7f6eb84
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0030bc6
b6800ef
c95adc4
7f6eb84
 
 
 
ec63e8e
 
7f6eb84
 
 
 
ec63e8e
 
 
 
7f6eb84
 
 
 
 
 
 
 
 
0030bc6
 
 
 
 
7f6eb84
0030bc6
 
ec63e8e
7f6eb84
0030bc6
e6fd727
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
# Run-level settings. The code that consumes these keys is not in this file.
# NOTE(review): training_fn looks like a dotted "<module>.<function>" path to
# the training entry point — confirm how the launcher resolves it.
training_fn: wav2vec2.train_huggingface
# NOTE(review): presumably the compute device string; trainer.accelerator in
# this file is set to gpu — confirm the two are meant to agree.
device: cuda
# NOTE(review): presumably a random seed — confirm what it seeds.
seed: 42
# Class labels, anchored as `dance_ids` so that both dataset entries can reuse
# the exact same list through the `*dance_ids` alias.
# Items are quoted so they always load as strings.
# NOTE(review): the three-letter codes look like dance-style abbreviations —
# confirm against the datasets' label vocabulary.
dance_ids: &dance_ids
  - 'BCH'
  - 'CHA'
  - 'JIV'
  - 'ECS'
  - 'QST'
  - 'RMB'
  - 'SFT'
  - 'SLS'
  - 'SMB'
  - 'SWZ'
  - 'TGO'
  - 'VWZ'
  - 'WCS'

# Data loading settings.
# NOTE(review): key names suggest DataLoader-style options — confirm against
# the consuming data module.
data_module:
  batch_size: 64
  num_workers: 5
  # NOTE(review): presumably the fraction of the data held out for testing
  # (0.2 = 20%) — confirm.
  test_proportion: 0.2

# Datasets, keyed by what look like dotted class paths.
# NOTE(review): presumably each key is imported and instantiated with its
# nested mapping as keyword arguments — confirm against the loader.
datasets:
  preprocessing.dataset.Music4DanceDataset:
    # Relative paths. NOTE(review): confirm which working directory they are
    # resolved against.
    song_data_path: ../../s3_connections/music4dance/songs_cleaned.csv
    song_audio_path: ../../s3_connections/music4dance
    # Reuses the top-level dance_ids list via alias.
    class_list: *dance_ids
    # Canonical lowercase boolean; loads as false on YAML 1.1 and 1.2 parsers.
    multi_label: false
    min_votes: 1
    audio_window_jitter: 0.7
  preprocessing.dataset.BestBallroomDataset:
    audio_dir: ../../s3_connections/ballroom-songs
    # Reuses the top-level dance_ids list via alias.
    class_list: *dance_ids
    audio_window_jitter: 0.7

# Model hyperparameters.
model:
  # NOTE(review): what "channels" refers to depends on the model code, which
  # is not in this file — confirm.
  n_channels: 128

# Feature extractor settings (masking and noise parameters).
feature_extractor:
  mask_count: 0 # Don't mask the data
  snr_mean: 15.0 # Pretty much eliminate the noise
  # NOTE(review): with mask_count at 0, the two mask sizes below presumably
  # have no effect — confirm against the feature extractor.
  freq_mask_size: 10
  time_mask_size: 80

# Trainer settings.
# NOTE(review): these key names match PyTorch Lightning `Trainer` arguments —
# presumably they are forwarded to it; confirm.
trainer:
  log_every_n_steps: 15
  accelerator: gpu
  max_epochs: 50
  min_epochs: 7
  # Canonical lowercase boolean; loads as false on YAML 1.1 and 1.2 parsers.
  fast_dev_run: false
  # Left commented out, so no gradient_clip_val is set from this file.
  # gradient_clip_val: 0.5
  # NOTE(review): if this is Lightning's option, an integer 1 restricts
  # training to a single batch (a debugging aid) — confirm this is intended
  # alongside max_epochs: 50.
  overfit_batches: 1

# Training-environment settings; only the learning rate is set here.
training_environment:
  learning_rate: 0.00053