Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +2 -0
- checkpoint_1388500/config.json +130 -0
- checkpoint_1388500/optimizer.tp00/.metadata +3 -0
- checkpoint_1388500/optimizer.tp00/__0_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__10_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__11_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__12_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__13_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__14_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__15_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__16_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__17_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__18_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__19_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__1_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__20_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__21_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__22_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__23_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__24_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__25_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__26_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__27_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__28_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__29_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__2_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__30_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__31_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__3_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__4_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__5_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__6_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__7_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__8_0.distcp +3 -0
- checkpoint_1388500/optimizer.tp00/__9_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/.metadata +3 -0
- checkpoint_1388500/sharded_model.tp00/__0_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__10_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__11_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__12_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__13_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__14_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__15_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__16_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__17_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__18_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__19_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__1_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__20_0.distcp +3 -0
- checkpoint_1388500/sharded_model.tp00/__21_0.distcp +3 -0
.gitattributes
CHANGED
|
@@ -13,3 +13,5 @@ checkpoint_1000000/optimizer.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
|
| 13 |
checkpoint_1000000/sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
| 14 |
optimizer.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
| 15 |
sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
| 13 |
checkpoint_1000000/sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
| 14 |
optimizer.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
| 15 |
sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
checkpoint_1388500/optimizer.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
checkpoint_1388500/sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1388500/config.json
ADDED
|
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"async_checkpointing": false,
|
| 3 |
+
"async_eval_ngpus": 0,
|
| 4 |
+
"batch_size": 2,
|
| 5 |
+
"chunk_parallel_size": 1,
|
| 6 |
+
"cluster": "tacc",
|
| 7 |
+
"data": "/scratch/10631/ryantlee/dolma/cc_en_head:10.865,/scratch/10631/ryantlee/dolma/cc_en_middle:13.038,/scratch/10631/ryantlee/dolma/cc_en_tail:12.314,/scratch/10631/ryantlee/dolma/starcoder:15.984,/scratch/10631/ryantlee/dolma/c4:4.193,/scratch/10631/ryantlee/dolma/reddit:4.841,/scratch/10631/ryantlee/dolma/arxiv:1.697,/scratch/10631/ryantlee/dolma/stackexchange:1.188,/scratch/10631/ryantlee/dolma/falcon:27.653,/scratch/10631/ryantlee/dolma/cc_news:0.866,/scratch/10631/ryantlee/dolma/open-web-math-train:0.763,/scratch/10631/ryantlee/dolma/algebraic-stack-train:0.763,/scratch/10631/ryantlee/dolma/pes2o:3.466,/scratch/10631/ryantlee/dolma/megawika:0.279,/scratch/10631/ryantlee/dolma/wiki:0.448,/scratch/10631/ryantlee/dolma/books:0.642,/scratch/10631/ryantlee/dolma/tulu_flan:1.000",
|
| 8 |
+
"disable_logging": false,
|
| 9 |
+
"disable_workers_print": true,
|
| 10 |
+
"dtype": "bf16",
|
| 11 |
+
"dump_dir": "/scratch/10631/ryantlee/saved_models/gecko1.2B_stage1",
|
| 12 |
+
"dump_freq": 500,
|
| 13 |
+
"enable_loss_tracker": false,
|
| 14 |
+
"eval_freq": 5000,
|
| 15 |
+
"finetuning_dir": "",
|
| 16 |
+
"fp32_reduce_scatter": true,
|
| 17 |
+
"gc_collect_freq": 50,
|
| 18 |
+
"gpu_check_level": 2,
|
| 19 |
+
"instruct": {
|
| 20 |
+
"no_loss_prompt": false,
|
| 21 |
+
"no_loss_truncated": false
|
| 22 |
+
},
|
| 23 |
+
"instruct_data": "",
|
| 24 |
+
"iter_jsonl": {
|
| 25 |
+
"buffer_size": 64,
|
| 26 |
+
"same_data": false
|
| 27 |
+
},
|
| 28 |
+
"iter_multi": {
|
| 29 |
+
"buffer_size": 512,
|
| 30 |
+
"ignore_extra_chunks": true,
|
| 31 |
+
"max_precompute": 20,
|
| 32 |
+
"multiprocess": true
|
| 33 |
+
},
|
| 34 |
+
"iter_type": "multi",
|
| 35 |
+
"keep_eval_checkpoints": true,
|
| 36 |
+
"keep_n_last_checkpoints": 5,
|
| 37 |
+
"log_freq": 10,
|
| 38 |
+
"log_wandb": false,
|
| 39 |
+
"loss_rescaling": false,
|
| 40 |
+
"model": {
|
| 41 |
+
"attention_dropout": 0.0,
|
| 42 |
+
"cema_ndim": 16,
|
| 43 |
+
"chunk_size": 2048,
|
| 44 |
+
"custom_bwd": true,
|
| 45 |
+
"dropout": 0.0,
|
| 46 |
+
"efficient_attn": "fused",
|
| 47 |
+
"ffn_hidden_dim": 6528,
|
| 48 |
+
"hidden_dropout": 0.0,
|
| 49 |
+
"init_mode": "he",
|
| 50 |
+
"layernorm_num_groups": 1,
|
| 51 |
+
"layerwise_ckpt": false,
|
| 52 |
+
"loss_parallel": false,
|
| 53 |
+
"memory_efficient_norm": true,
|
| 54 |
+
"model_dim": 2048,
|
| 55 |
+
"norm_affine": true,
|
| 56 |
+
"norm_eps": 1e-05,
|
| 57 |
+
"num_heads": 2,
|
| 58 |
+
"num_layers": 16,
|
| 59 |
+
"output_size": -1,
|
| 60 |
+
"recompute_attention": true,
|
| 61 |
+
"recompute_fc1_out": true,
|
| 62 |
+
"recompute_fc3_out": true,
|
| 63 |
+
"recompute_v": true,
|
| 64 |
+
"rescale_nffn": false,
|
| 65 |
+
"rope_base": null,
|
| 66 |
+
"scale_emb": false,
|
| 67 |
+
"share_emb": false,
|
| 68 |
+
"swiglu": true,
|
| 69 |
+
"timenorm_beta1": 0.999,
|
| 70 |
+
"timenorm_beta2": 0.9999,
|
| 71 |
+
"timenorm_num_groups": 32,
|
| 72 |
+
"two_hop_residual": false,
|
| 73 |
+
"value_dim": 4096,
|
| 74 |
+
"vocab_size": 50281,
|
| 75 |
+
"z_dim": 512
|
| 76 |
+
},
|
| 77 |
+
"model_parallel_size": 1,
|
| 78 |
+
"multi_segments": true,
|
| 79 |
+
"nccl_timeout": 1800,
|
| 80 |
+
"optim": {
|
| 81 |
+
"beta1": 0.9,
|
| 82 |
+
"beta2": 0.95,
|
| 83 |
+
"clip": 1.0,
|
| 84 |
+
"cycles": 1.0,
|
| 85 |
+
"epsilon": 1e-08,
|
| 86 |
+
"lr": 0.0004,
|
| 87 |
+
"lr_end_ratio": 0.05,
|
| 88 |
+
"lr_init_ratio": 0.0001,
|
| 89 |
+
"optim_state_dtype": null,
|
| 90 |
+
"scheduler": "cosine",
|
| 91 |
+
"warmup": 2000,
|
| 92 |
+
"weight_decay": 0.05
|
| 93 |
+
},
|
| 94 |
+
"reshard_after_forward": true,
|
| 95 |
+
"restore_dataloader_position": false,
|
| 96 |
+
"seed": 3,
|
| 97 |
+
"seq_len": 32768,
|
| 98 |
+
"slurm": {
|
| 99 |
+
"global_rank": 0,
|
| 100 |
+
"is_slurm_job": true,
|
| 101 |
+
"world_size": 32
|
| 102 |
+
},
|
| 103 |
+
"steps": 1907349,
|
| 104 |
+
"sync_check_freq": 10000,
|
| 105 |
+
"tokenizer": {
|
| 106 |
+
"data_tokenized": false,
|
| 107 |
+
"num_reserved_special_tokens": 0,
|
| 108 |
+
"path": "/work/10631/ryantlee/vista/OLMo1_tokenizer",
|
| 109 |
+
"type": "gptneox"
|
| 110 |
+
},
|
| 111 |
+
"valid": {
|
| 112 |
+
"batch_size": 2,
|
| 113 |
+
"gen_seq_len": 8192,
|
| 114 |
+
"majority_voting": 0,
|
| 115 |
+
"n_batches": 1,
|
| 116 |
+
"ppl_files_str": "/scratch/10631/ryantlee/dolma_val/validation_100k.jsonl",
|
| 117 |
+
"prompt_path": "",
|
| 118 |
+
"random_fewshots": false,
|
| 119 |
+
"seq_len": 32768,
|
| 120 |
+
"tasks_root_dir": "/scratch/10631/ryantlee/tasks",
|
| 121 |
+
"tasks_str": "boolq,hellaswag,nq",
|
| 122 |
+
"temperature": 1.0,
|
| 123 |
+
"top_k": 0,
|
| 124 |
+
"top_p": 0.0,
|
| 125 |
+
"use_sampling": false,
|
| 126 |
+
"write_eval": false
|
| 127 |
+
},
|
| 128 |
+
"wandb_entity": null,
|
| 129 |
+
"wandb_project": null
|
| 130 |
+
}
|
checkpoint_1388500/optimizer.tp00/.metadata
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da73f34f93c0d13e931538a0ac1a76af1cb931203bc09b2d9df29ddc85087e4d
|
| 3 |
+
size 4028123
|
checkpoint_1388500/optimizer.tp00/__0_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:049fe0e48590cf2379d5455ef48205c946305f765eb6bfffee4bd72298933c9e
|
| 3 |
+
size 335250656
|
checkpoint_1388500/optimizer.tp00/__10_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d17eff7f61b91d4eadde6705294c1b5661fdfd1c801c46b9d2ff96e1a3acf6c
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__11_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9763acbf9dacbe135e3204a63dfece065e970e80597e5410d136f1c54497c96
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__12_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:223a29c266c589da25b52831653b318bb0f741da25b3535d0ae655007aef7f32
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__13_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c500c268f91397422f556ab4ad2d4f3cfca17fb6595d4b163f96acb993397de
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__14_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1571268849956914d7e504a75a19af340f03b654d1de8ff06fc181253ea70bc
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__15_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0bf688da5b932f3d671b706d0465ef0b18d3445c65196a280380d6f44840f4b0
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__16_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e9804f1a6c1af3f9c5940c3422d2972af4c393944aa66376c6effd8802d6e1b
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__17_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c55ad2eeafaab4a431b0b483a762df9f9eb151839cfe8b86947262eeaaa0ca8
|
| 3 |
+
size 335062436
|
checkpoint_1388500/optimizer.tp00/__18_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:916289ff0152487e68793a523bd99521a0e83e7b5e51020785b34e32b79fe1d7
|
| 3 |
+
size 335062436
|
checkpoint_1388500/optimizer.tp00/__19_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:389de162f57bebc91f20a80343a0bff7957073789b3546b6c8590bcd9d6f7d59
|
| 3 |
+
size 335062436
|
checkpoint_1388500/optimizer.tp00/__1_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e905beb925ea17d55b2edf5b78b94bc69ed938489667ade44f5d8ba8bf5bc66d
|
| 3 |
+
size 335265996
|
checkpoint_1388500/optimizer.tp00/__20_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2eb6aab0a798ce5aae4202aeb00b901fe61a309b46e1733a0162b13fd624ba55
|
| 3 |
+
size 335061320
|
checkpoint_1388500/optimizer.tp00/__21_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c278c3c3907a23db83179960e7fefb423bcc9761dd19eca5c992656baa8fc315
|
| 3 |
+
size 335061320
|
checkpoint_1388500/optimizer.tp00/__22_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d4c695d025d5a75fdae0d0619053d41b82351115c767db58ebd00a040ada43b
|
| 3 |
+
size 335061320
|
checkpoint_1388500/optimizer.tp00/__23_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4fb0df5342ac3760842cfa867202df7435615717967dd35a3de0abeffd94b2fc
|
| 3 |
+
size 335061320
|
checkpoint_1388500/optimizer.tp00/__24_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2c66dd2076c09c8aa062803f945ef0ea7d89637370e6e0707205695f88674a5c
|
| 3 |
+
size 335061320
|
checkpoint_1388500/optimizer.tp00/__25_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a40c3ef7c2c5d49048447f121930d0b4ce15e259db428577604d71da4fc6dee
|
| 3 |
+
size 335061320
|
checkpoint_1388500/optimizer.tp00/__26_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2902c3633fc5b2d628ca026cc81a2a5ac6d078174ab03ac80f3cbbf8d099b77f
|
| 3 |
+
size 335061320
|
checkpoint_1388500/optimizer.tp00/__27_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d80b81d74d5b2126ae9ca69d4ac1df49cc06a721a9aa6b678b10f770c9f1801
|
| 3 |
+
size 335061320
|
checkpoint_1388500/optimizer.tp00/__28_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47ec6577abe8e154e1ce48bd136bcf903655e54a8f9651c7dc3efff0e85e880e
|
| 3 |
+
size 335073672
|
checkpoint_1388500/optimizer.tp00/__29_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80b08593db87f1eb6702b21cf9a9fbea0b7422cc98ecf5149fb0a57409e7dace
|
| 3 |
+
size 335061572
|
checkpoint_1388500/optimizer.tp00/__2_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf69eb21235d8a8b4a2729549cc074e1042b7a613035c2eee7e95011b29826be
|
| 3 |
+
size 335059404
|
checkpoint_1388500/optimizer.tp00/__30_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d78c8d3dc803c73b4a8160ef02ef0122ff301bc43756e2104f942ac3cddab2aa
|
| 3 |
+
size 335061572
|
checkpoint_1388500/optimizer.tp00/__31_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff2123392baa4bead18ad79e342ee92aac0a3278f6de32b64a83538f289f8f1d
|
| 3 |
+
size 334307908
|
checkpoint_1388500/optimizer.tp00/__3_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:057614543b7620fb69ca06cd529a826b195c820157a9db41c7ebbd2009c757ec
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__4_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45a1a118e7cd0629d7e53d38bbd284aaa250738ce0ed450c5c81608690897515
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__5_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0bfd578a25ef9458bb349693f088d527314041ff069534d12a4328a5ab14272
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__6_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa73fb42fada15f95e93529769c9e39af502d25fdafd69b1d5720ae64cbfee60
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__7_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4f6115b1b637fff4573bca1d3ea376c663034586c05a1f817aca4e2b2142fbd
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__8_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1b40a34ad6aaa897c1fe250126d88c8974a60a942680f53be77a0a03db85028
|
| 3 |
+
size 335061636
|
checkpoint_1388500/optimizer.tp00/__9_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a699312994e4edbf201d6036537175cd2ea007629a68494fb99cb9a806653450
|
| 3 |
+
size 335061636
|
checkpoint_1388500/sharded_model.tp00/.metadata
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ae2fcf7233815a312dd7795ef00a103201888044943b33f8a99ba7d0badc9d4
|
| 3 |
+
size 1775629
|
checkpoint_1388500/sharded_model.tp00/__0_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc4b2b2cd36140e753710064a4f92ab73d1ae3f13918b4628b0064b94f7eb40a
|
| 3 |
+
size 167625328
|
checkpoint_1388500/sharded_model.tp00/__10_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be8133092af31b977e85dae914e259a15ad99e13ce71f759a85f114c686082a7
|
| 3 |
+
size 167525764
|
checkpoint_1388500/sharded_model.tp00/__11_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd3364e95c95690342cbaf4c3aabdcda866c112c157ce6769af665fc2cda1cbb
|
| 3 |
+
size 167526816
|
checkpoint_1388500/sharded_model.tp00/__12_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb2e3cf3bd520af2399fa5af7395b524f27ad35f695f7459fadbb38b8fb26f33
|
| 3 |
+
size 167525572
|
checkpoint_1388500/sharded_model.tp00/__13_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5c7e8c7a0425cbfa720cc7856008649cc5bdf2524407d4361558a9a450bf79b
|
| 3 |
+
size 167525572
|
checkpoint_1388500/sharded_model.tp00/__14_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:693d377af06ec39d8e5524ebbcad94f1e738b48da7ebd445a034079014243fc3
|
| 3 |
+
size 167525636
|
checkpoint_1388500/sharded_model.tp00/__15_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a8e53d9e943a3b2a6ea176976248dca7891c8a896b56f3dd57d96d2515aa52c
|
| 3 |
+
size 167525572
|
checkpoint_1388500/sharded_model.tp00/__16_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:931a75ac0fff1a083ac2a6c86f09ad6aaf7f9855b4d8b6541e176c9f13a40bdb
|
| 3 |
+
size 167524456
|
checkpoint_1388500/sharded_model.tp00/__17_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f9866dfeed8bd16dd5acfc5b63cbffc08361a88cccb9ba796d524894bee99c1
|
| 3 |
+
size 167525636
|
checkpoint_1388500/sharded_model.tp00/__18_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f75ff3ee330072d8fe8159a785856a1d7fe927154ab68014c9e65c5652eb67f
|
| 3 |
+
size 167524456
|
checkpoint_1388500/sharded_model.tp00/__19_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e80500a94545eae3367bfe1af15e8e17a4b4ec4ebaae9ec004ddab89c4d02c2
|
| 3 |
+
size 167524456
|
checkpoint_1388500/sharded_model.tp00/__1_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b3363ab480fc14d6439fa83f3920c8a2dd45c97c3961d06a1eee65755c3a15d
|
| 3 |
+
size 167627020
|
checkpoint_1388500/sharded_model.tp00/__20_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23daa1f513be6d5daf9b9340ee7b4c090e7b670dca7cbb8347e283eb97023124
|
| 3 |
+
size 167527996
|
checkpoint_1388500/sharded_model.tp00/__21_0.distcp
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b890e697a540f3940a1a0f1467d0558a21ee75a1b4810d92551604e778da1d1c
|
| 3 |
+
size 167524456
|