Update README.md
Browse files
README.md
CHANGED
|
@@ -7,6 +7,7 @@ language:
|
|
| 7 |
base_model:
|
| 8 |
- Qwen/Qwen2.5-Coder-32B-Instruct
|
| 9 |
pipeline_tag: text-generation
|
|
|
|
| 10 |
---
|
| 11 |
|
| 12 |
# Model Card for OlympicCoder-32B
|
|
@@ -77,4 +78,4 @@ The following hyperparameters were used during training on 16 H100 nodes:
|
|
| 77 |
- lr_scheduler_type: cosine_with_min_lr
|
| 78 |
- min_lr_rate: 0.1
|
| 79 |
- lr_scheduler_warmup_ratio: 0.03
|
| 80 |
-
- num_epochs: 10.0
|
|
|
|
| 7 |
base_model:
|
| 8 |
- Qwen/Qwen2.5-Coder-32B-Instruct
|
| 9 |
pipeline_tag: text-generation
|
| 10 |
+
library_name: transformers
|
| 11 |
---
|
| 12 |
|
| 13 |
# Model Card for OlympicCoder-32B
|
|
|
|
| 78 |
- lr_scheduler_type: cosine_with_min_lr
|
| 79 |
- min_lr_rate: 0.1
|
| 80 |
- lr_scheduler_warmup_ratio: 0.03
|
| 81 |
+
- num_epochs: 10.0
|