p-alonso committed on
Commit
cb49d44
·
verified ·
1 Parent(s): 88ca33c

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. config.gin +99 -0
  2. model.ckpt +3 -0
config.gin ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Parameters for AudioDataModule:
2
+ # ==============================================================================
3
+ AudioDataModule.num_workers = 20
4
+
5
+ # Parameters for AudioDataset:
6
+ # ==============================================================================
7
+ AudioDataset.half_precision = True
8
+ AudioDataset.mono = True
9
+ AudioDataset.new_freq = 16000
10
+ AudioDataset.num_frames = 480000
11
+ AudioDataset.orig_freq = 16000
12
+
13
+ # Parameters for build_dev_datamodule:
14
+ # ==============================================================================
15
+ build_dev_datamodule.datamodule = @discotube
16
+
17
+ # Parameters for build_module:
18
+ # ==============================================================================
19
+ build_module.ckpt_path = 'model.ckpt'
20
+ build_module.module = @modules.maskingmodel.MaskingModel
21
+ build_module.net = @nets.conformer.Conformer
22
+ build_module.representation = @nets.melspectrogram.MelSpectrogram
23
+
24
+ # Parameters for Conformer:
25
+ # ==============================================================================
26
+ Conformer.alpha_deepnorm = 2.6321480259049848
27
+ Conformer.beta_deepnorm = 0.022386873579657126
28
+ Conformer.conv_kernel_size = 5
29
+ Conformer.depth = 24
30
+ Conformer.dropout = 0.2
31
+ Conformer.embed_dim = 1024
32
+ Conformer.input_dropout = 0.0
33
+ Conformer.mlp_ratio = 4.0
34
+ Conformer.mlp_residual_factor = 4.0
35
+ Conformer.num_heads = 8
36
+ Conformer.num_patches = 460
37
+ Conformer.patch_size = (96, 4)
38
+ Conformer.use_deepnorm = True
39
+ Conformer.use_rope = True
40
+
41
+ # Parameters for CosineAnnealingCallback:
42
+ # ==============================================================================
43
+ CosineAnnealingCallback.eta_min = 1e-07
44
+ CosineAnnealingCallback.warmup_steps = 30000
45
+
46
+ # Parameters for DiscotubeAudioDataModule:
47
+ # ==============================================================================
48
+ DiscotubeAudioDataModule.batch_size = 32
49
+ DiscotubeAudioDataModule.data_dir = ''
50
+ DiscotubeAudioDataModule.filelist_train = ''
51
+ DiscotubeAudioDataModule.filelist_val = ''
52
+
53
+ # Parameters for MaskingModel:
54
+ # ==============================================================================
55
+ MaskingModel.codebook_dim = 16
56
+ MaskingModel.codebook_size = 8192
57
+ MaskingModel.diff_input = False
58
+ MaskingModel.lr = 0.0001
59
+ MaskingModel.mask_prob = 0.6
60
+ MaskingModel.mask_seconds = 0.4
61
+ MaskingModel.num_codebooks = 4
62
+ MaskingModel.plot_tokens = False
63
+ MaskingModel.seed = 0
64
+ MaskingModel.weight_decay = 0.01
65
+
66
+ # Parameters for MelSpectrogram:
67
+ # ==============================================================================
68
+ MelSpectrogram.freq_mask_param = 0
69
+ MelSpectrogram.hop_len = 256
70
+ MelSpectrogram.mel_scale = 'slaney'
71
+ MelSpectrogram.n_mel = 96
72
+ MelSpectrogram.norm = 'slaney'
73
+ MelSpectrogram.norm_mean = 2.06755686098554
74
+ MelSpectrogram.norm_std = 1.268292820667291
75
+ MelSpectrogram.power = 2
76
+ MelSpectrogram.sr = 16000
77
+ MelSpectrogram.stretch_factor = 1
78
+ MelSpectrogram.time_mask_param = 0
79
+ MelSpectrogram.win_len = 512
80
+ MelSpectrogram.patch_size = (96, 4)
81
+
82
+ # Parameters for train:
83
+ # ==============================================================================
84
+ train.params = \
85
+ {'accelerator': 'gpu',
86
+ 'devices': 4,
87
+ 'log_every_n_steps': 50,
88
+ 'max_steps': 400000,
89
+ 'num_nodes': 1,
90
+ 'num_sanity_val_steps': 0,
91
+ 'precision': 'bf16-mixed',
92
+ 'strategy': 'ddp_find_unused_parameters_true'}
93
+ train.wandb_params = \
94
+ {'entity': 'mtg-upf',
95
+ 'group': 'masking_conformer',
96
+ 'name': 'mask_conformer_rope_multi4_large',
97
+ 'offline': True,
98
+ 'project': 'mtg-ssl',
99
+ 'save_dir': '/gpfs/projects/upf97/logs/'}
model.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04384614600f75333e13c9ff950ceed1cf0fd296c44f7ce82aa32e2b4512e99a
3
+ size 7374069142