SubhrajitSain committed on
Commit
82b4fa6
verified
1 Parent(s): e346e65

Upload model

Browse files
Files changed (3) hide show
  1. config.json +5 -3
  2. generation_config.json +1 -1
  3. model.safetensors +2 -2
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "activation_function": "gelu_new",
3
  "architectures": [
4
  "GPT2LMHeadModel"
@@ -35,7 +36,8 @@
35
  "max_length": 50
36
  }
37
  },
38
- "transformers_version": "4.57.1",
39
- "use_cache": false,
40
- "vocab_size": 50257
 
41
  }
 
1
  {
2
+ "_name_or_path": "SubhrajitSain/anwgpt2-355m",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
36
  "max_length": 50
37
  }
38
  },
39
+ "torch_dtype": "float16",
40
+ "transformers_version": "4.41.2",
41
+ "use_cache": true,
42
+ "vocab_size": 50259
43
  }
generation_config.json CHANGED
@@ -5,5 +5,5 @@
5
  50256
6
  ],
7
  "pad_token_id": 50256,
8
- "transformers_version": "4.57.1"
9
  }
 
5
  50256
6
  ],
7
  "pad_token_id": 50256,
8
+ "transformers_version": "4.41.2"
9
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d658bedcbb682f29912ac124d7ab5b87650bceb61d42bdaed5c8b9dd82b8299e
3
- size 1419322880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5097f1b16ba2b7c48b9cc187db9da852244aaf6c9ddee8bacb7c5dd55f8407b6
3
+ size 709680472