tokyotech-llm/Llama-3.1-8B-code-ablation-exp3-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0012500
8B
•
Updated
•
5
•
1
tokyotech-llm/Llama-3.1-8B-code-ablation-exp3-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0010000
tokyotech-llm/Llama-3.1-8B-code-ablation-exp3-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0007500
8B
•
Updated
•
4
tokyotech-llm/Llama-3.1-8B-code-ablation-exp3-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0005000
tokyotech-llm/Llama-3.1-8B-code-ablation-exp3-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0002500
8B
•
Updated
•
36
tokyotech-llm/Llama-3.1-8B-code-ablation-exp2-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0012500
tokyotech-llm/Llama-3.1-8B-code-ablation-exp2-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0010000
tokyotech-llm/Llama-3.1-8B-code-ablation-exp2-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0007500
tokyotech-llm/Llama-3.1-8B-code-ablation-exp2-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0005000
tokyotech-llm/Llama-3.1-8B-code-ablation-exp2-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0002500
8B
•
Updated
•
6
tokyotech-llm/Llama-3.1-8B-code-ablation-exp1-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0012500
8B
•
Updated
•
5
tokyotech-llm/Llama-3.1-8B-code-ablation-exp1-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0010000
tokyotech-llm/Llama-3.1-8B-code-ablation-exp1-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0007500
8B
•
Updated
•
6
tokyotech-llm/Llama-3.1-8B-code-ablation-exp1-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0005000
8B
•
Updated
•
7
tokyotech-llm/Llama-3.1-8B-code-ablation-exp1-LR2.5e-5-MINLR2.5E-6-WD0.1-iter0002500
tokyotech-llm/Llama-3.1-Swallow-8B-v0.5
8B
•
Updated
•
2.96k
•
8
tokyotech-llm/Llama-3.3-Swallow-70B-Instruct-v0.4
Text Generation
•
71B
•
Updated
•
2.74k
•
•
12
tokyotech-llm/Llama-3.1-Swallow-8B-Instruct-v0.5
Text Generation
•
8B
•
Updated
•
32.9k
•
•
17
tokyotech-llm/Llama-3.3-Swallow-70B-v0.4
Text Generation
•
71B
•
Updated
•
1.35k
•
4
tokyotech-llm/Gemma-2-Llama-Swallow-27b-it-v0.1
Text Generation
•
Updated
•
170
•
2
tokyotech-llm/Gemma-2-Llama-Swallow-9b-it-v0.1
Text Generation
•
Updated
•
638
•
•
4
tokyotech-llm/Gemma-2-Llama-Swallow-2b-it-v0.1
Text Generation
•
Updated
•
719
•
4
tokyotech-llm/Gemma-2-Llama-Swallow-2b-pt-v0.1
Text Generation
•
Updated
•
5.42k
tokyotech-llm/Gemma-2-Llama-Swallow-27b-pt-v0.1
Text Generation
•
27B
•
Updated
•
124
•
1
tokyotech-llm/Gemma-2-Llama-Swallow-9b-pt-v0.1
Text Generation
•
Updated
•
356
•
1
tokyotech-llm/Llama-3.1-8B-math-ablation-exp1-LR2.5e-5-WD0.1-iter0012500
8B
•
Updated
•
3
tokyotech-llm/Llama-3.1-8B-math-ablation-exp1-LR2.5e-5-WD0.1-iter0010000
8B
•
Updated
•
4
tokyotech-llm/Llama-3.1-8B-math-ablation-exp1-LR2.5e-5-WD0.1-iter0007500
8B
•
Updated
•
3
tokyotech-llm/Llama-3.1-8B-math-ablation-exp1-LR2.5e-5-WD0.1-iter0005000
8B
•
Updated
•
8
tokyotech-llm/Llama-3.1-8B-math-ablation-exp1-LR2.5e-5-WD0.1-iter0002500
8B
•
Updated
•
3