Upload llama_1b_seq8k_bs2M_100B_gqa/0000050000/train_state_00063.json with huggingface_hub
Browse files
llama_1b_seq8k_bs2M_100B_gqa/0000050000/train_state_00063.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"step": 50000, "acc_step": 0, "data_loader_state": {"it_state": {"start_token": 40, "it_state": {"it_state": {"root_dir": "/mnt/hdfs/tiktok_aiic/user/liuqian", "sources": {"dclm_pro": 1.0}, "source_to_state": {"dclm_pro": {"file_path": "/mnt/hdfs/tiktok_aiic/user/liuqian/dclm_pro/dclm_pro.chunk.00063.jsonl", "position": 6595672358, "block_size": 1, "offset": 0, "current_iter": 0}}, "rng_state": {"bit_generator": "PCG64", "state": {"state": 334113584793861336619255535688624306195, "inc": 212233488579996093995791538832249536073}, "has_uint32": 0, "uinteger": 0}}, "add_bos": true, "add_eos": true, "name": "sp", "path": "/opt/tiger/Github-Repo/lingua/tokenizers/llama2/tokenizer.model"}, "output_seq_len": 8192, "n_views": 2}, "seq_idx": 848, "rng_state": {"bit_generator": "PCG64", "state": {"state": 10447236268337811388774289615661269301, "inc": 116309495240665725662210951802735177975}, "has_uint32": 1, "uinteger": 996174404}, "batch_size": 4, "prefetch_size": 1024}, "scheduler": {"base_lrs": [0.0004], "last_epoch": 50000, "verbose": false, "_step_count": 50001, "_get_lr_called_within_step": false, "_last_lr": [0.0004], "lr_lambdas": [{}]}}
|