Some more changes to split files per program
Browse files
HuggingFace_Mistral_Transformer_Single_Instrument.ipynb
CHANGED
@@ -85,19 +85,19 @@
|
|
85 |
"# Our tokenizer's configuration\n",
|
86 |
"BEAT_RES = {(0, 1): 12, (1, 2): 4, (2, 4): 2, (4, 8): 1}\n",
|
87 |
"TOKENIZER_PARAMS = {\n",
|
88 |
-
" \"pitch_range\": (21,
|
89 |
" \"beat_res\": BEAT_RES,\n",
|
90 |
-
" \"num_velocities\":
|
91 |
" \"special_tokens\": [\"PAD\", \"BOS\", \"EOS\"],\n",
|
92 |
" \"use_chords\": True,\n",
|
93 |
" \"use_rests\": True,\n",
|
94 |
" \"use_tempos\": True,\n",
|
95 |
" \"use_time_signatures\": True,\n",
|
96 |
" \"use_programs\": False, # We want single track \n",
|
97 |
-
" \"one_token_stream_for_programs\":
|
98 |
" \"programs\": list(range(0, 128)), #-1 drums, skip drums\n",
|
99 |
" \"num_tempos\": 32,\n",
|
100 |
-
" \"tempo_range\": (
|
101 |
"}\n",
|
102 |
"config = TokenizerConfig(**TOKENIZER_PARAMS)\n",
|
103 |
"\n",
|
@@ -485,7 +485,7 @@
|
|
485 |
" \n",
|
486 |
")\n",
|
487 |
"\n",
|
488 |
-
"collator = DataCollator(tokenizer[\"PAD_None\"], copy_inputs_as_labels=True)\n",
|
489 |
"trainer = Trainer(\n",
|
490 |
" model=model,\n",
|
491 |
" args=training_config,\n",
|
|
|
85 |
"# Our tokenizer's configuration\n",
|
86 |
"BEAT_RES = {(0, 1): 12, (1, 2): 4, (2, 4): 2, (4, 8): 1}\n",
|
87 |
"TOKENIZER_PARAMS = {\n",
|
88 |
+
" \"pitch_range\": (21, 108),\n",
|
89 |
" \"beat_res\": BEAT_RES,\n",
|
90 |
+
" \"num_velocities\": 32,\n",
|
91 |
" \"special_tokens\": [\"PAD\", \"BOS\", \"EOS\"],\n",
|
92 |
" \"use_chords\": True,\n",
|
93 |
" \"use_rests\": True,\n",
|
94 |
" \"use_tempos\": True,\n",
|
95 |
" \"use_time_signatures\": True,\n",
|
96 |
" \"use_programs\": False, # We want single track \n",
|
97 |
+
" \"one_token_stream_for_programs\": False, # We want single track\n",
|
98 |
" \"programs\": list(range(0, 128)), #-1 drums, skip drums\n",
|
99 |
" \"num_tempos\": 32,\n",
|
100 |
+
" \"tempo_range\": (40, 250), # (min_tempo, max_tempo)\n",
|
101 |
"}\n",
|
102 |
"config = TokenizerConfig(**TOKENIZER_PARAMS)\n",
|
103 |
"\n",
|
|
|
485 |
" \n",
|
486 |
")\n",
|
487 |
"\n",
|
488 |
+
"collator = DataCollator(tokenizer[\"PAD_None\"], copy_inputs_as_labels=True, pad_on_left=True)  # Not sure about pad_on_left; it might give better results\n",
|
489 |
"trainer = Trainer(\n",
|
490 |
" model=model,\n",
|
491 |
" args=training_config,\n",
|