Upload llama_1b_seq8k_bs2M_100B_gqa_64skyladder/0000030000/train_state_00037.json with huggingface_hub

Browse files

Files changed (1) hide show

llama_1b_seq8k_bs2M_100B_gqa_64skyladder/0000030000/train_state_00037.json +1 -0

llama_1b_seq8k_bs2M_100B_gqa_64skyladder/0000030000/train_state_00037.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"step": 30000, "acc_step": 0, "data_loader_state": {"it_state": {"start_token": 845, "it_state": {"it_state": {"root_dir": "/mnt/hdfs/tiktok_aiic/user/liuqian", "sources": {"dclm_pro": 1.0}, "source_to_state": {"dclm_pro": {"file_path": "/mnt/hdfs/tiktok_aiic/user/liuqian/dclm_pro/dclm_pro.chunk.00037.jsonl", "position": 3993861343, "block_size": 1, "offset": 0, "current_iter": 0}}, "rng_state": {"bit_generator": "PCG64", "state": {"state": 122131031923026501061526045476221272751, "inc": 318386594169462210370610108991610772715}, "has_uint32": 0, "uinteger": 0}}, "add_bos": true, "add_eos": true, "name": "sp", "path": "/opt/tiger/Github-Repo/lingua/tokenizers/llama2/tokenizer.model"}, "output_seq_len": 8192, "n_views": 2}, "seq_idx": 304, "rng_state": {"bit_generator": "PCG64", "state": {"state": 190759602785120137915843454697985761667, "inc": 302020966480363221226961946381524881597}, "has_uint32": 1, "uinteger": 1031082334}, "batch_size": 4, "prefetch_size": 1024}, "scheduler": {"base_lrs": [0.0004], "last_epoch": 30000, "verbose": false, "_step_count": 30001, "_get_lr_called_within_step": false, "_last_lr": [0.0004], "lr_lambdas": [{}]}}