ml-ryanlee committed on
Commit
a925e29
·
verified ·
1 Parent(s): f8665c2

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +2 -0
  2. checkpoint_1388500/config.json +130 -0
  3. checkpoint_1388500/optimizer.tp00/.metadata +3 -0
  4. checkpoint_1388500/optimizer.tp00/__0_0.distcp +3 -0
  5. checkpoint_1388500/optimizer.tp00/__10_0.distcp +3 -0
  6. checkpoint_1388500/optimizer.tp00/__11_0.distcp +3 -0
  7. checkpoint_1388500/optimizer.tp00/__12_0.distcp +3 -0
  8. checkpoint_1388500/optimizer.tp00/__13_0.distcp +3 -0
  9. checkpoint_1388500/optimizer.tp00/__14_0.distcp +3 -0
  10. checkpoint_1388500/optimizer.tp00/__15_0.distcp +3 -0
  11. checkpoint_1388500/optimizer.tp00/__16_0.distcp +3 -0
  12. checkpoint_1388500/optimizer.tp00/__17_0.distcp +3 -0
  13. checkpoint_1388500/optimizer.tp00/__18_0.distcp +3 -0
  14. checkpoint_1388500/optimizer.tp00/__19_0.distcp +3 -0
  15. checkpoint_1388500/optimizer.tp00/__1_0.distcp +3 -0
  16. checkpoint_1388500/optimizer.tp00/__20_0.distcp +3 -0
  17. checkpoint_1388500/optimizer.tp00/__21_0.distcp +3 -0
  18. checkpoint_1388500/optimizer.tp00/__22_0.distcp +3 -0
  19. checkpoint_1388500/optimizer.tp00/__23_0.distcp +3 -0
  20. checkpoint_1388500/optimizer.tp00/__24_0.distcp +3 -0
  21. checkpoint_1388500/optimizer.tp00/__25_0.distcp +3 -0
  22. checkpoint_1388500/optimizer.tp00/__26_0.distcp +3 -0
  23. checkpoint_1388500/optimizer.tp00/__27_0.distcp +3 -0
  24. checkpoint_1388500/optimizer.tp00/__28_0.distcp +3 -0
  25. checkpoint_1388500/optimizer.tp00/__29_0.distcp +3 -0
  26. checkpoint_1388500/optimizer.tp00/__2_0.distcp +3 -0
  27. checkpoint_1388500/optimizer.tp00/__30_0.distcp +3 -0
  28. checkpoint_1388500/optimizer.tp00/__31_0.distcp +3 -0
  29. checkpoint_1388500/optimizer.tp00/__3_0.distcp +3 -0
  30. checkpoint_1388500/optimizer.tp00/__4_0.distcp +3 -0
  31. checkpoint_1388500/optimizer.tp00/__5_0.distcp +3 -0
  32. checkpoint_1388500/optimizer.tp00/__6_0.distcp +3 -0
  33. checkpoint_1388500/optimizer.tp00/__7_0.distcp +3 -0
  34. checkpoint_1388500/optimizer.tp00/__8_0.distcp +3 -0
  35. checkpoint_1388500/optimizer.tp00/__9_0.distcp +3 -0
  36. checkpoint_1388500/sharded_model.tp00/.metadata +3 -0
  37. checkpoint_1388500/sharded_model.tp00/__0_0.distcp +3 -0
  38. checkpoint_1388500/sharded_model.tp00/__10_0.distcp +3 -0
  39. checkpoint_1388500/sharded_model.tp00/__11_0.distcp +3 -0
  40. checkpoint_1388500/sharded_model.tp00/__12_0.distcp +3 -0
  41. checkpoint_1388500/sharded_model.tp00/__13_0.distcp +3 -0
  42. checkpoint_1388500/sharded_model.tp00/__14_0.distcp +3 -0
  43. checkpoint_1388500/sharded_model.tp00/__15_0.distcp +3 -0
  44. checkpoint_1388500/sharded_model.tp00/__16_0.distcp +3 -0
  45. checkpoint_1388500/sharded_model.tp00/__17_0.distcp +3 -0
  46. checkpoint_1388500/sharded_model.tp00/__18_0.distcp +3 -0
  47. checkpoint_1388500/sharded_model.tp00/__19_0.distcp +3 -0
  48. checkpoint_1388500/sharded_model.tp00/__1_0.distcp +3 -0
  49. checkpoint_1388500/sharded_model.tp00/__20_0.distcp +3 -0
  50. checkpoint_1388500/sharded_model.tp00/__21_0.distcp +3 -0
.gitattributes CHANGED
@@ -13,3 +13,5 @@ checkpoint_1000000/optimizer.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
13
  checkpoint_1000000/sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
14
  optimizer.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
15
  sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
 
 
 
13
  checkpoint_1000000/sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
14
  optimizer.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
15
  sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
16
+ checkpoint_1388500/optimizer.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
17
+ checkpoint_1388500/sharded_model.tp00/.metadata filter=lfs diff=lfs merge=lfs -text
checkpoint_1388500/config.json ADDED
@@ -0,0 +1,130 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "async_checkpointing": false,
3
+ "async_eval_ngpus": 0,
4
+ "batch_size": 2,
5
+ "chunk_parallel_size": 1,
6
+ "cluster": "tacc",
7
+ "data": "/scratch/10631/ryantlee/dolma/cc_en_head:10.865,/scratch/10631/ryantlee/dolma/cc_en_middle:13.038,/scratch/10631/ryantlee/dolma/cc_en_tail:12.314,/scratch/10631/ryantlee/dolma/starcoder:15.984,/scratch/10631/ryantlee/dolma/c4:4.193,/scratch/10631/ryantlee/dolma/reddit:4.841,/scratch/10631/ryantlee/dolma/arxiv:1.697,/scratch/10631/ryantlee/dolma/stackexchange:1.188,/scratch/10631/ryantlee/dolma/falcon:27.653,/scratch/10631/ryantlee/dolma/cc_news:0.866,/scratch/10631/ryantlee/dolma/open-web-math-train:0.763,/scratch/10631/ryantlee/dolma/algebraic-stack-train:0.763,/scratch/10631/ryantlee/dolma/pes2o:3.466,/scratch/10631/ryantlee/dolma/megawika:0.279,/scratch/10631/ryantlee/dolma/wiki:0.448,/scratch/10631/ryantlee/dolma/books:0.642,/scratch/10631/ryantlee/dolma/tulu_flan:1.000",
8
+ "disable_logging": false,
9
+ "disable_workers_print": true,
10
+ "dtype": "bf16",
11
+ "dump_dir": "/scratch/10631/ryantlee/saved_models/gecko1.2B_stage1",
12
+ "dump_freq": 500,
13
+ "enable_loss_tracker": false,
14
+ "eval_freq": 5000,
15
+ "finetuning_dir": "",
16
+ "fp32_reduce_scatter": true,
17
+ "gc_collect_freq": 50,
18
+ "gpu_check_level": 2,
19
+ "instruct": {
20
+ "no_loss_prompt": false,
21
+ "no_loss_truncated": false
22
+ },
23
+ "instruct_data": "",
24
+ "iter_jsonl": {
25
+ "buffer_size": 64,
26
+ "same_data": false
27
+ },
28
+ "iter_multi": {
29
+ "buffer_size": 512,
30
+ "ignore_extra_chunks": true,
31
+ "max_precompute": 20,
32
+ "multiprocess": true
33
+ },
34
+ "iter_type": "multi",
35
+ "keep_eval_checkpoints": true,
36
+ "keep_n_last_checkpoints": 5,
37
+ "log_freq": 10,
38
+ "log_wandb": false,
39
+ "loss_rescaling": false,
40
+ "model": {
41
+ "attention_dropout": 0.0,
42
+ "cema_ndim": 16,
43
+ "chunk_size": 2048,
44
+ "custom_bwd": true,
45
+ "dropout": 0.0,
46
+ "efficient_attn": "fused",
47
+ "ffn_hidden_dim": 6528,
48
+ "hidden_dropout": 0.0,
49
+ "init_mode": "he",
50
+ "layernorm_num_groups": 1,
51
+ "layerwise_ckpt": false,
52
+ "loss_parallel": false,
53
+ "memory_efficient_norm": true,
54
+ "model_dim": 2048,
55
+ "norm_affine": true,
56
+ "norm_eps": 1e-05,
57
+ "num_heads": 2,
58
+ "num_layers": 16,
59
+ "output_size": -1,
60
+ "recompute_attention": true,
61
+ "recompute_fc1_out": true,
62
+ "recompute_fc3_out": true,
63
+ "recompute_v": true,
64
+ "rescale_nffn": false,
65
+ "rope_base": null,
66
+ "scale_emb": false,
67
+ "share_emb": false,
68
+ "swiglu": true,
69
+ "timenorm_beta1": 0.999,
70
+ "timenorm_beta2": 0.9999,
71
+ "timenorm_num_groups": 32,
72
+ "two_hop_residual": false,
73
+ "value_dim": 4096,
74
+ "vocab_size": 50281,
75
+ "z_dim": 512
76
+ },
77
+ "model_parallel_size": 1,
78
+ "multi_segments": true,
79
+ "nccl_timeout": 1800,
80
+ "optim": {
81
+ "beta1": 0.9,
82
+ "beta2": 0.95,
83
+ "clip": 1.0,
84
+ "cycles": 1.0,
85
+ "epsilon": 1e-08,
86
+ "lr": 0.0004,
87
+ "lr_end_ratio": 0.05,
88
+ "lr_init_ratio": 0.0001,
89
+ "optim_state_dtype": null,
90
+ "scheduler": "cosine",
91
+ "warmup": 2000,
92
+ "weight_decay": 0.05
93
+ },
94
+ "reshard_after_forward": true,
95
+ "restore_dataloader_position": false,
96
+ "seed": 3,
97
+ "seq_len": 32768,
98
+ "slurm": {
99
+ "global_rank": 0,
100
+ "is_slurm_job": true,
101
+ "world_size": 32
102
+ },
103
+ "steps": 1907349,
104
+ "sync_check_freq": 10000,
105
+ "tokenizer": {
106
+ "data_tokenized": false,
107
+ "num_reserved_special_tokens": 0,
108
+ "path": "/work/10631/ryantlee/vista/OLMo1_tokenizer",
109
+ "type": "gptneox"
110
+ },
111
+ "valid": {
112
+ "batch_size": 2,
113
+ "gen_seq_len": 8192,
114
+ "majority_voting": 0,
115
+ "n_batches": 1,
116
+ "ppl_files_str": "/scratch/10631/ryantlee/dolma_val/validation_100k.jsonl",
117
+ "prompt_path": "",
118
+ "random_fewshots": false,
119
+ "seq_len": 32768,
120
+ "tasks_root_dir": "/scratch/10631/ryantlee/tasks",
121
+ "tasks_str": "boolq,hellaswag,nq",
122
+ "temperature": 1.0,
123
+ "top_k": 0,
124
+ "top_p": 0.0,
125
+ "use_sampling": false,
126
+ "write_eval": false
127
+ },
128
+ "wandb_entity": null,
129
+ "wandb_project": null
130
+ }
checkpoint_1388500/optimizer.tp00/.metadata ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da73f34f93c0d13e931538a0ac1a76af1cb931203bc09b2d9df29ddc85087e4d
3
+ size 4028123
checkpoint_1388500/optimizer.tp00/__0_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:049fe0e48590cf2379d5455ef48205c946305f765eb6bfffee4bd72298933c9e
3
+ size 335250656
checkpoint_1388500/optimizer.tp00/__10_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d17eff7f61b91d4eadde6705294c1b5661fdfd1c801c46b9d2ff96e1a3acf6c
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__11_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9763acbf9dacbe135e3204a63dfece065e970e80597e5410d136f1c54497c96
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__12_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:223a29c266c589da25b52831653b318bb0f741da25b3535d0ae655007aef7f32
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__13_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c500c268f91397422f556ab4ad2d4f3cfca17fb6595d4b163f96acb993397de
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__14_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1571268849956914d7e504a75a19af340f03b654d1de8ff06fc181253ea70bc
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__15_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bf688da5b932f3d671b706d0465ef0b18d3445c65196a280380d6f44840f4b0
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__16_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e9804f1a6c1af3f9c5940c3422d2972af4c393944aa66376c6effd8802d6e1b
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__17_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c55ad2eeafaab4a431b0b483a762df9f9eb151839cfe8b86947262eeaaa0ca8
3
+ size 335062436
checkpoint_1388500/optimizer.tp00/__18_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:916289ff0152487e68793a523bd99521a0e83e7b5e51020785b34e32b79fe1d7
3
+ size 335062436
checkpoint_1388500/optimizer.tp00/__19_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:389de162f57bebc91f20a80343a0bff7957073789b3546b6c8590bcd9d6f7d59
3
+ size 335062436
checkpoint_1388500/optimizer.tp00/__1_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e905beb925ea17d55b2edf5b78b94bc69ed938489667ade44f5d8ba8bf5bc66d
3
+ size 335265996
checkpoint_1388500/optimizer.tp00/__20_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eb6aab0a798ce5aae4202aeb00b901fe61a309b46e1733a0162b13fd624ba55
3
+ size 335061320
checkpoint_1388500/optimizer.tp00/__21_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c278c3c3907a23db83179960e7fefb423bcc9761dd19eca5c992656baa8fc315
3
+ size 335061320
checkpoint_1388500/optimizer.tp00/__22_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d4c695d025d5a75fdae0d0619053d41b82351115c767db58ebd00a040ada43b
3
+ size 335061320
checkpoint_1388500/optimizer.tp00/__23_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fb0df5342ac3760842cfa867202df7435615717967dd35a3de0abeffd94b2fc
3
+ size 335061320
checkpoint_1388500/optimizer.tp00/__24_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c66dd2076c09c8aa062803f945ef0ea7d89637370e6e0707205695f88674a5c
3
+ size 335061320
checkpoint_1388500/optimizer.tp00/__25_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a40c3ef7c2c5d49048447f121930d0b4ce15e259db428577604d71da4fc6dee
3
+ size 335061320
checkpoint_1388500/optimizer.tp00/__26_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2902c3633fc5b2d628ca026cc81a2a5ac6d078174ab03ac80f3cbbf8d099b77f
3
+ size 335061320
checkpoint_1388500/optimizer.tp00/__27_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d80b81d74d5b2126ae9ca69d4ac1df49cc06a721a9aa6b678b10f770c9f1801
3
+ size 335061320
checkpoint_1388500/optimizer.tp00/__28_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47ec6577abe8e154e1ce48bd136bcf903655e54a8f9651c7dc3efff0e85e880e
3
+ size 335073672
checkpoint_1388500/optimizer.tp00/__29_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80b08593db87f1eb6702b21cf9a9fbea0b7422cc98ecf5149fb0a57409e7dace
3
+ size 335061572
checkpoint_1388500/optimizer.tp00/__2_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf69eb21235d8a8b4a2729549cc074e1042b7a613035c2eee7e95011b29826be
3
+ size 335059404
checkpoint_1388500/optimizer.tp00/__30_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d78c8d3dc803c73b4a8160ef02ef0122ff301bc43756e2104f942ac3cddab2aa
3
+ size 335061572
checkpoint_1388500/optimizer.tp00/__31_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff2123392baa4bead18ad79e342ee92aac0a3278f6de32b64a83538f289f8f1d
3
+ size 334307908
checkpoint_1388500/optimizer.tp00/__3_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:057614543b7620fb69ca06cd529a826b195c820157a9db41c7ebbd2009c757ec
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__4_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45a1a118e7cd0629d7e53d38bbd284aaa250738ce0ed450c5c81608690897515
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__5_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0bfd578a25ef9458bb349693f088d527314041ff069534d12a4328a5ab14272
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__6_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa73fb42fada15f95e93529769c9e39af502d25fdafd69b1d5720ae64cbfee60
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__7_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4f6115b1b637fff4573bca1d3ea376c663034586c05a1f817aca4e2b2142fbd
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__8_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1b40a34ad6aaa897c1fe250126d88c8974a60a942680f53be77a0a03db85028
3
+ size 335061636
checkpoint_1388500/optimizer.tp00/__9_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a699312994e4edbf201d6036537175cd2ea007629a68494fb99cb9a806653450
3
+ size 335061636
checkpoint_1388500/sharded_model.tp00/.metadata ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ae2fcf7233815a312dd7795ef00a103201888044943b33f8a99ba7d0badc9d4
3
+ size 1775629
checkpoint_1388500/sharded_model.tp00/__0_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc4b2b2cd36140e753710064a4f92ab73d1ae3f13918b4628b0064b94f7eb40a
3
+ size 167625328
checkpoint_1388500/sharded_model.tp00/__10_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be8133092af31b977e85dae914e259a15ad99e13ce71f759a85f114c686082a7
3
+ size 167525764
checkpoint_1388500/sharded_model.tp00/__11_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd3364e95c95690342cbaf4c3aabdcda866c112c157ce6769af665fc2cda1cbb
3
+ size 167526816
checkpoint_1388500/sharded_model.tp00/__12_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb2e3cf3bd520af2399fa5af7395b524f27ad35f695f7459fadbb38b8fb26f33
3
+ size 167525572
checkpoint_1388500/sharded_model.tp00/__13_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5c7e8c7a0425cbfa720cc7856008649cc5bdf2524407d4361558a9a450bf79b
3
+ size 167525572
checkpoint_1388500/sharded_model.tp00/__14_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:693d377af06ec39d8e5524ebbcad94f1e738b48da7ebd445a034079014243fc3
3
+ size 167525636
checkpoint_1388500/sharded_model.tp00/__15_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a8e53d9e943a3b2a6ea176976248dca7891c8a896b56f3dd57d96d2515aa52c
3
+ size 167525572
checkpoint_1388500/sharded_model.tp00/__16_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:931a75ac0fff1a083ac2a6c86f09ad6aaf7f9855b4d8b6541e176c9f13a40bdb
3
+ size 167524456
checkpoint_1388500/sharded_model.tp00/__17_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f9866dfeed8bd16dd5acfc5b63cbffc08361a88cccb9ba796d524894bee99c1
3
+ size 167525636
checkpoint_1388500/sharded_model.tp00/__18_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f75ff3ee330072d8fe8159a785856a1d7fe927154ab68014c9e65c5652eb67f
3
+ size 167524456
checkpoint_1388500/sharded_model.tp00/__19_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e80500a94545eae3367bfe1af15e8e17a4b4ec4ebaae9ec004ddab89c4d02c2
3
+ size 167524456
checkpoint_1388500/sharded_model.tp00/__1_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b3363ab480fc14d6439fa83f3920c8a2dd45c97c3961d06a1eee65755c3a15d
3
+ size 167627020
checkpoint_1388500/sharded_model.tp00/__20_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23daa1f513be6d5daf9b9340ee7b4c090e7b670dca7cbb8347e283eb97023124
3
+ size 167527996
checkpoint_1388500/sharded_model.tp00/__21_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b890e697a540f3940a1a0f1467d0558a21ee75a1b4810d92551604e778da1d1c
3
+ size 167524456