adricl committed on
Commit
4c06149
·
1 Parent(s): 0c2af15

Some more changes to split files per program

Browse files
HuggingFace_Mistral_Transformer_Single_Instrument.ipynb CHANGED
@@ -85,19 +85,19 @@
85
  "# Our tokenizer's configuration\n",
86
  "BEAT_RES = {(0, 1): 12, (1, 2): 4, (2, 4): 2, (4, 8): 1}\n",
87
  "TOKENIZER_PARAMS = {\n",
88
- " \"pitch_range\": (21, 109),\n",
89
  " \"beat_res\": BEAT_RES,\n",
90
- " \"num_velocities\": 24,\n",
91
  " \"special_tokens\": [\"PAD\", \"BOS\", \"EOS\"],\n",
92
  " \"use_chords\": True,\n",
93
  " \"use_rests\": True,\n",
94
  " \"use_tempos\": True,\n",
95
  " \"use_time_signatures\": True,\n",
96
  " \"use_programs\": False, # We want single track \n",
97
- " \"one_token_stream_for_programs\": True,\n",
98
  " \"programs\": list(range(0, 128)), #-1 drums, skip drums\n",
99
  " \"num_tempos\": 32,\n",
100
- " \"tempo_range\": (50, 200), # (min_tempo, max_tempo)\n",
101
  "}\n",
102
  "config = TokenizerConfig(**TOKENIZER_PARAMS)\n",
103
  "\n",
@@ -485,7 +485,7 @@
485
  " \n",
486
  ")\n",
487
  "\n",
488
- "collator = DataCollator(tokenizer[\"PAD_None\"], copy_inputs_as_labels=True)\n",
489
  "trainer = Trainer(\n",
490
  " model=model,\n",
491
  " args=training_config,\n",
 
85
  "# Our tokenizer's configuration\n",
86
  "BEAT_RES = {(0, 1): 12, (1, 2): 4, (2, 4): 2, (4, 8): 1}\n",
87
  "TOKENIZER_PARAMS = {\n",
88
+ " \"pitch_range\": (21, 108),\n",
89
  " \"beat_res\": BEAT_RES,\n",
90
+ " \"num_velocities\": 32,\n",
91
  " \"special_tokens\": [\"PAD\", \"BOS\", \"EOS\"],\n",
92
  " \"use_chords\": True,\n",
93
  " \"use_rests\": True,\n",
94
  " \"use_tempos\": True,\n",
95
  " \"use_time_signatures\": True,\n",
96
  " \"use_programs\": False, # We want single track \n",
97
+ " \"one_token_stream_for_programs\": False, # We want single track\n",
98
  " \"programs\": list(range(0, 128)), #-1 drums, skip drums\n",
99
  " \"num_tempos\": 32,\n",
100
+ " \"tempo_range\": (40, 250), # (min_tempo, max_tempo)\n",
101
  "}\n",
102
  "config = TokenizerConfig(**TOKENIZER_PARAMS)\n",
103
  "\n",
 
485
  " \n",
486
  ")\n",
487
  "\n",
488
+ "collator = DataCollator(tokenizer[\"PAD_None\"], copy_inputs_as_labels=True, pad_on_left=True) #not sure about the pad_on_left, it might get better results\n",
489
  "trainer = Trainer(\n",
490
  " model=model,\n",
491
  " args=training_config,\n",