625k steps, lr 6e-4, batch 4x8, training data rev1

Files changed (3)

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "heegyu/kogpt-j-base",
   "activation_function": "gelu_new",
   "architectures": [
     "GPTJForCausalLM"

 {
+  "_name_or_path": "heegyu/kogpt-j-base-24L",
   "activation_function": "gelu_new",
   "architectures": [
     "GPTJForCausalLM"

flax_model.msgpack ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:21a7eefe15868d842b8a84efcc21db03ba1d1bd3b225dfb242a7440867e0c7a8
+size 994786268

tokenizer_config.json CHANGED Viewed

@@ -19,7 +19,7 @@
   },
   "errors": "replace",
   "model_max_length": 1000000000000000019884624838656,
-  "name_or_path": "heegyu/kogpt-j-base",
   "pad_token": null,
   "special_tokens_map_file": null,
   "tokenizer_class": "GPT2Tokenizer",

   },
   "errors": "replace",
   "model_max_length": 1000000000000000019884624838656,
+  "name_or_path": "heegyu/kogpt-j-base-24L",
   "pad_token": null,
   "special_tokens_map_file": null,
   "tokenizer_class": "GPT2Tokenizer",