Ignatfhc committed on
Commit
2d49f26
·
verified ·
1 Parent(s): c10fdea

checkpoint 1

Browse files
Files changed (26) hide show
  1. .gitattributes +1 -0
  2. imdb/checkpoint-1/added_tokens.json +3 -0
  3. imdb/checkpoint-1/config.json +54 -0
  4. imdb/checkpoint-1/generation_config.json +7 -0
  5. imdb/checkpoint-1/model.safetensors +3 -0
  6. imdb/checkpoint-1/optimizer.pt +3 -0
  7. imdb/checkpoint-1/rng_state.pth +3 -0
  8. imdb/checkpoint-1/scaler.pt +3 -0
  9. imdb/checkpoint-1/scheduler.pt +3 -0
  10. imdb/checkpoint-1/special_tokens_map.json +27 -0
  11. imdb/checkpoint-1/tokenizer.json +3 -0
  12. imdb/checkpoint-1/tokenizer.model +3 -0
  13. imdb/checkpoint-1/tokenizer_config.json +0 -0
  14. imdb/checkpoint-1/trainer_state.json +41 -0
  15. imdb/checkpoint-1/training_args.bin +3 -0
  16. imdb/runs/Sep15_14-09-51_09b0c4cc94f0/events.out.tfevents.1757945394.09b0c4cc94f0.191.0 +3 -0
  17. imdb/runs/Sep15_14-11-12_09b0c4cc94f0/events.out.tfevents.1757945472.09b0c4cc94f0.191.1 +3 -0
  18. imdb/runs/Sep15_14-12-25_09b0c4cc94f0/events.out.tfevents.1757945546.09b0c4cc94f0.191.2 +3 -0
  19. imdb/runs/Sep15_14-13-16_09b0c4cc94f0/events.out.tfevents.1757945597.09b0c4cc94f0.191.3 +3 -0
  20. imdb/runs/Sep15_14-14-59_09b0c4cc94f0/events.out.tfevents.1757945700.09b0c4cc94f0.191.4 +3 -0
  21. imdb/runs/Sep15_14-16-59_09b0c4cc94f0/events.out.tfevents.1757945820.09b0c4cc94f0.191.5 +3 -0
  22. imdb/runs/Sep15_14-17-54_09b0c4cc94f0/events.out.tfevents.1757945875.09b0c4cc94f0.191.6 +3 -0
  23. imdb/runs/Sep15_14-18-53_09b0c4cc94f0/events.out.tfevents.1757945934.09b0c4cc94f0.191.7 +3 -0
  24. imdb/runs/Sep15_14-19-41_09b0c4cc94f0/events.out.tfevents.1757945981.09b0c4cc94f0.191.8 +3 -0
  25. imdb/runs/Sep15_14-20-27_09b0c4cc94f0/events.out.tfevents.1757946027.09b0c4cc94f0.191.9 +3 -0
  26. imdb/runs/Sep15_14-21-12_09b0c4cc94f0/events.out.tfevents.1757946072.09b0c4cc94f0.191.10 +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ imdb/checkpoint-1/tokenizer.json filter=lfs diff=lfs merge=lfs -text
imdb/checkpoint-1/added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
imdb/checkpoint-1/config.json ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_sliding_window_pattern": 6,
3
+ "architectures": [
4
+ "Gemma3ForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "attn_logit_softcapping": null,
9
+ "bos_token_id": 2,
10
+ "dtype": "float32",
11
+ "eos_token_id": 1,
12
+ "final_logit_softcapping": null,
13
+ "head_dim": 256,
14
+ "hidden_activation": "gelu_pytorch_tanh",
15
+ "hidden_size": 640,
16
+ "initializer_range": 0.02,
17
+ "intermediate_size": 2048,
18
+ "layer_types": [
19
+ "sliding_attention",
20
+ "sliding_attention",
21
+ "sliding_attention",
22
+ "sliding_attention",
23
+ "sliding_attention",
24
+ "full_attention",
25
+ "sliding_attention",
26
+ "sliding_attention",
27
+ "sliding_attention",
28
+ "sliding_attention",
29
+ "sliding_attention",
30
+ "full_attention",
31
+ "sliding_attention",
32
+ "sliding_attention",
33
+ "sliding_attention",
34
+ "sliding_attention",
35
+ "sliding_attention",
36
+ "full_attention"
37
+ ],
38
+ "max_position_embeddings": 32768,
39
+ "model_type": "gemma3_text",
40
+ "num_attention_heads": 4,
41
+ "num_hidden_layers": 18,
42
+ "num_key_value_heads": 1,
43
+ "pad_token_id": 1,
44
+ "query_pre_attn_scalar": 256,
45
+ "rms_norm_eps": 1e-06,
46
+ "rope_local_base_freq": 10000.0,
47
+ "rope_scaling": null,
48
+ "rope_theta": 1000000.0,
49
+ "sliding_window": 512,
50
+ "transformers_version": "4.56.1",
51
+ "use_bidirectional_attention": false,
52
+ "use_cache": true,
53
+ "vocab_size": 262145
54
+ }
imdb/checkpoint-1/generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 2,
4
+ "eos_token_id": 1,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.56.1"
7
+ }
imdb/checkpoint-1/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfd0102a948013901a3ffe97cf39cc2d670d86bad8dced4619bb088126fadbcc
3
+ size 1072421816
imdb/checkpoint-1/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c40072905a7f116cc301bc430c42cf9f9613403a2e72a2ae6d1060dfa5b6b5d
3
+ size 2169
imdb/checkpoint-1/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61c19bab1174704a4a4441475683bf1270277af15d2e2c95e964789128e482c4
3
+ size 14645
imdb/checkpoint-1/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9be1d3e9114d64374b079cefeec7fbeb79e328d8b599d6c744b89f08c2cc8641
3
+ size 1383
imdb/checkpoint-1/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:141ec64e4f4776fb65ab9ae37d90cb86998730d56d004f9aa30026767099dff6
3
+ size 1465
imdb/checkpoint-1/special_tokens_map.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "boi_token": "<start_of_image>",
3
+ "bos_token": {
4
+ "content": "<bos>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ "eoi_token": "<end_of_image>",
11
+ "eos_token": {
12
+ "content": "<eos>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false
17
+ },
18
+ "image_token": "<image_soft_token>",
19
+ "pad_token": "<eos>",
20
+ "unk_token": {
21
+ "content": "<unk>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false
26
+ }
27
+ }
imdb/checkpoint-1/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29f262de790b850fbbf7bba2c74c3271291ef3df8093143a028ab737bc1fff20
3
+ size 33384664
imdb/checkpoint-1/tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1299c11d7cf632ef3b4e11937501358ada021bbdf7c47638d13c0ee982f2e79c
3
+ size 4689074
imdb/checkpoint-1/tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff
 
imdb/checkpoint-1/trainer_state.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 1.0,
6
+ "eval_steps": 500,
7
+ "global_step": 1,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 1.0,
14
+ "grad_norm": NaN,
15
+ "learning_rate": 5e-05,
16
+ "loss": 7.0255,
17
+ "step": 1
18
+ }
19
+ ],
20
+ "logging_steps": 1,
21
+ "max_steps": 1,
22
+ "num_input_tokens_seen": 0,
23
+ "num_train_epochs": 9223372036854775807,
24
+ "save_steps": 1,
25
+ "stateful_callbacks": {
26
+ "TrainerControl": {
27
+ "args": {
28
+ "should_epoch_stop": false,
29
+ "should_evaluate": false,
30
+ "should_log": false,
31
+ "should_save": true,
32
+ "should_training_stop": true
33
+ },
34
+ "attributes": {}
35
+ }
36
+ },
37
+ "total_flos": 9631297536.0,
38
+ "train_batch_size": 1,
39
+ "trial_name": null,
40
+ "trial_params": null
41
+ }
imdb/checkpoint-1/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7e92b4179f9cb01415a278b5bb2cc86ca94d198f985c0defa23ac8da2bf2b81
3
+ size 5777
imdb/runs/Sep15_14-09-51_09b0c4cc94f0/events.out.tfevents.1757945394.09b0c4cc94f0.191.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdf1f85478cc7575be6ece3fe4d711441189bd13f716e2ea42545ddc5638e720
3
+ size 5684
imdb/runs/Sep15_14-11-12_09b0c4cc94f0/events.out.tfevents.1757945472.09b0c4cc94f0.191.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f204262a5a024cdcb2fa1dfebb848515502d87ce544e583945d54a139be06b6
3
+ size 5685
imdb/runs/Sep15_14-12-25_09b0c4cc94f0/events.out.tfevents.1757945546.09b0c4cc94f0.191.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75ada27154549692219dadd9f2b9192a5ebbb163434064e41d7654aa350c9941
3
+ size 5684
imdb/runs/Sep15_14-13-16_09b0c4cc94f0/events.out.tfevents.1757945597.09b0c4cc94f0.191.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f8f60cd74e6fab86b24f74d851317e7b27f1d4c982d6898dddd8d39c3493b65
3
+ size 5685
imdb/runs/Sep15_14-14-59_09b0c4cc94f0/events.out.tfevents.1757945700.09b0c4cc94f0.191.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e87435915b3677e7be9f3a85f886be668075cbff80025d1e70333b860b1905e
3
+ size 5685
imdb/runs/Sep15_14-16-59_09b0c4cc94f0/events.out.tfevents.1757945820.09b0c4cc94f0.191.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c412ae94dd6da2807a1b9e9ecc6d9c3328185188d0bf4fd47337d4b39d52de0b
3
+ size 5679
imdb/runs/Sep15_14-17-54_09b0c4cc94f0/events.out.tfevents.1757945875.09b0c4cc94f0.191.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07676aad0f43e45b975d377e26b66483d42480aa4b630ee159824e9aee0cadfa
3
+ size 5679
imdb/runs/Sep15_14-18-53_09b0c4cc94f0/events.out.tfevents.1757945934.09b0c4cc94f0.191.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef5ecf722247549d6376b9cf4addc418588d70aa6fd378e8ac36dbfffd77ca91
3
+ size 5680
imdb/runs/Sep15_14-19-41_09b0c4cc94f0/events.out.tfevents.1757945981.09b0c4cc94f0.191.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67c1df12d5c1084f454f67d8b657b22af2131c0941a7a08886ae5865c93b49ef
3
+ size 4184
imdb/runs/Sep15_14-20-27_09b0c4cc94f0/events.out.tfevents.1757946027.09b0c4cc94f0.191.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58c8b50c71be0718ee6ba2abc845f4f8700b08ba75a2a67ec570ebca7d5b8d0d
3
+ size 4184
imdb/runs/Sep15_14-21-12_09b0c4cc94f0/events.out.tfevents.1757946072.09b0c4cc94f0.191.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b14cb46696b0b1372812dd0f6eb37e1db9ac09ec7b2ed0469e8487e73017feb
3
+ size 5887