Automatic Speech Recognition
Transformers
PyTorch
TensorBoard
Georgian
wav2vec2
mozilla-foundation/common_voice_8_0
Generated from Trainer
robust-speech-event
hf-asr-leaderboard
Eval Results (legacy)
Instructions to use arampacha/wav2vec2-xls-r-1b-ka with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use arampacha/wav2vec2-xls-r-1b-ka with Transformers:
```python
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("automatic-speech-recognition", model="arampacha/wav2vec2-xls-r-1b-ka")
```

```python
# Load model directly
from transformers import AutoProcessor, AutoModelForCTC

processor = AutoProcessor.from_pretrained("arampacha/wav2vec2-xls-r-1b-ka")
model = AutoModelForCTC.from_pretrained("arampacha/wav2vec2-xls-r-1b-ka")
```
- Notebooks
- Google Colab
- Kaggle
| { | |
| "best_metric": 0.10217397660017014, | |
| "best_model_checkpoint": "/workspace/output/ka/wav2vec2-xls-r-1b-ka-2/checkpoint-4000", | |
| "epoch": 64.512, | |
| "global_step": 4000, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.61, | |
| "learning_rate": 1.7678499999999997e-05, | |
| "loss": 5.1431, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 3.22, | |
| "learning_rate": 3.500349999999999e-05, | |
| "loss": 2.6801, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 4.83, | |
| "learning_rate": 5.232849999999999e-05, | |
| "loss": 1.4529, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 6.45, | |
| "learning_rate": 6.965349999999999e-05, | |
| "loss": 1.2839, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 6.45, | |
| "eval_cer": 0.05568531627678561, | |
| "eval_loss": 0.22294116020202637, | |
| "eval_runtime": 52.1848, | |
| "eval_samples_per_second": 25.774, | |
| "eval_steps_per_second": 0.422, | |
| "eval_wer": 0.3608917324802559, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 8.06, | |
| "learning_rate": 7e-05, | |
| "loss": 1.2486, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 9.67, | |
| "learning_rate": 7e-05, | |
| "loss": 1.139, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 11.29, | |
| "learning_rate": 7e-05, | |
| "loss": 1.0481, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 12.9, | |
| "learning_rate": 7e-05, | |
| "loss": 0.9775, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 12.9, | |
| "eval_cer": 0.03166960125528526, | |
| "eval_loss": 0.127132385969162, | |
| "eval_runtime": 50.7158, | |
| "eval_samples_per_second": 26.52, | |
| "eval_steps_per_second": 0.434, | |
| "eval_wer": 0.2202339298210537, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 14.51, | |
| "learning_rate": 7e-05, | |
| "loss": 0.9449, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 16.13, | |
| "learning_rate": 7e-05, | |
| "loss": 0.9374, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 17.74, | |
| "learning_rate": 7e-05, | |
| "loss": 0.9197, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 19.35, | |
| "learning_rate": 7e-05, | |
| "loss": 0.9045, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 19.35, | |
| "eval_cer": 0.02939379783678896, | |
| "eval_loss": 0.12676405906677246, | |
| "eval_runtime": 50.6864, | |
| "eval_samples_per_second": 26.536, | |
| "eval_steps_per_second": 0.434, | |
| "eval_wer": 0.20303908827351794, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 20.96, | |
| "learning_rate": 7e-05, | |
| "loss": 0.8889, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 22.58, | |
| "learning_rate": 7e-05, | |
| "loss": 0.8873, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 24.19, | |
| "learning_rate": 7e-05, | |
| "loss": 0.8828, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 25.8, | |
| "learning_rate": 7e-05, | |
| "loss": 0.8652, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 25.8, | |
| "eval_cer": 0.028746990549426858, | |
| "eval_loss": 0.12111534923315048, | |
| "eval_runtime": 50.502, | |
| "eval_samples_per_second": 26.633, | |
| "eval_steps_per_second": 0.436, | |
| "eval_wer": 0.19404178746376088, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 27.42, | |
| "learning_rate": 7e-05, | |
| "loss": 0.8775, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 29.03, | |
| "learning_rate": 7e-05, | |
| "loss": 0.8587, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 30.64, | |
| "learning_rate": 7e-05, | |
| "loss": 0.8518, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 32.26, | |
| "learning_rate": 7e-05, | |
| "loss": 0.8505, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 32.26, | |
| "eval_cer": 0.027573155101991927, | |
| "eval_loss": 0.11918943375349045, | |
| "eval_runtime": 50.5112, | |
| "eval_samples_per_second": 26.628, | |
| "eval_steps_per_second": 0.436, | |
| "eval_wer": 0.19124262721183644, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 33.86, | |
| "learning_rate": 6.67415e-05, | |
| "loss": 0.8436, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 35.48, | |
| "learning_rate": 6.34165e-05, | |
| "loss": 0.8399, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 37.1, | |
| "learning_rate": 6.009149999999999e-05, | |
| "loss": 0.8258, | |
| "step": 2300 | |
| }, | |
| { | |
| "epoch": 38.7, | |
| "learning_rate": 5.679975e-05, | |
| "loss": 0.8168, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 38.7, | |
| "eval_cer": 0.025956136883586667, | |
| "eval_loss": 0.10860513150691986, | |
| "eval_runtime": 51.1919, | |
| "eval_samples_per_second": 26.274, | |
| "eval_steps_per_second": 0.43, | |
| "eval_wer": 0.17634709587123862, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 40.32, | |
| "learning_rate": 5.3474749999999995e-05, | |
| "loss": 0.8068, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 41.93, | |
| "learning_rate": 5.0149749999999995e-05, | |
| "loss": 0.7971, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 43.54, | |
| "learning_rate": 4.6824749999999996e-05, | |
| "loss": 0.7893, | |
| "step": 2700 | |
| }, | |
| { | |
| "epoch": 45.16, | |
| "learning_rate": 4.3499749999999996e-05, | |
| "loss": 0.7737, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 45.16, | |
| "eval_cer": 0.025620755327176687, | |
| "eval_loss": 0.10982357710599899, | |
| "eval_runtime": 50.6716, | |
| "eval_samples_per_second": 26.543, | |
| "eval_steps_per_second": 0.434, | |
| "eval_wer": 0.17534739578126562, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 46.77, | |
| "learning_rate": 4.017475e-05, | |
| "loss": 0.7748, | |
| "step": 2900 | |
| }, | |
| { | |
| "epoch": 48.38, | |
| "learning_rate": 3.684974999999999e-05, | |
| "loss": 0.762, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 49.99, | |
| "learning_rate": 3.352475e-05, | |
| "loss": 0.753, | |
| "step": 3100 | |
| }, | |
| { | |
| "epoch": 51.61, | |
| "learning_rate": 3.0199749999999995e-05, | |
| "loss": 0.744, | |
| "step": 3200 | |
| }, | |
| { | |
| "epoch": 51.61, | |
| "eval_cer": 0.02391989171966893, | |
| "eval_loss": 0.10541926324367523, | |
| "eval_runtime": 50.5525, | |
| "eval_samples_per_second": 26.606, | |
| "eval_steps_per_second": 0.435, | |
| "eval_wer": 0.16455063480955714, | |
| "step": 3200 | |
| }, | |
| { | |
| "epoch": 53.22, | |
| "learning_rate": 2.6874749999999995e-05, | |
| "loss": 0.7233, | |
| "step": 3300 | |
| }, | |
| { | |
| "epoch": 54.83, | |
| "learning_rate": 2.3549749999999996e-05, | |
| "loss": 0.725, | |
| "step": 3400 | |
| }, | |
| { | |
| "epoch": 56.45, | |
| "learning_rate": 2.0224749999999996e-05, | |
| "loss": 0.7158, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 58.06, | |
| "learning_rate": 1.6899749999999997e-05, | |
| "loss": 0.7114, | |
| "step": 3600 | |
| }, | |
| { | |
| "epoch": 58.06, | |
| "eval_cer": 0.022829901661336496, | |
| "eval_loss": 0.10338227450847626, | |
| "eval_runtime": 51.0232, | |
| "eval_samples_per_second": 26.361, | |
| "eval_steps_per_second": 0.431, | |
| "eval_wer": 0.15725282415275418, | |
| "step": 3600 | |
| }, | |
| { | |
| "epoch": 59.67, | |
| "learning_rate": 1.3574749999999999e-05, | |
| "loss": 0.696, | |
| "step": 3700 | |
| }, | |
| { | |
| "epoch": 61.29, | |
| "learning_rate": 1.0249750000000001e-05, | |
| "loss": 0.7046, | |
| "step": 3800 | |
| }, | |
| { | |
| "epoch": 62.9, | |
| "learning_rate": 6.924750000000003e-06, | |
| "loss": 0.6915, | |
| "step": 3900 | |
| }, | |
| { | |
| "epoch": 64.51, | |
| "learning_rate": 3.5997500000000035e-06, | |
| "loss": 0.6773, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 64.51, | |
| "eval_cer": 0.02207529315941404, | |
| "eval_loss": 0.10217397660017014, | |
| "eval_runtime": 50.9761, | |
| "eval_samples_per_second": 26.385, | |
| "eval_steps_per_second": 0.432, | |
| "eval_wer": 0.15265420373887834, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 64.51, | |
| "step": 4000, | |
| "total_flos": 3.3884437885491655e+20, | |
| "train_loss": 1.020361618041992, | |
| "train_runtime": 40092.8966, | |
| "train_samples_per_second": 12.77, | |
| "train_steps_per_second": 0.1 | |
| } | |
| ], | |
| "max_steps": 4000, | |
| "num_train_epochs": 65, | |
| "total_flos": 3.3884437885491655e+20, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |