Upload config.json
config.json  CHANGED  (+2 -12)
@@ -4,19 +4,12 @@
     "GPT2LMHeadModel"
   ],
   "attn_pdrop": 0.1,
-  "auto_map": {
-    "AutoModelForCausalLM": "modeling_gpt2.GPT2LMHeadModel"
-  },
   "bos_token_id": 50256,
-  "do_sample": true,
   "embd_pdrop": 0.1,
   "eos_token_id": 50256,
   "gradient_checkpointing": false,
   "initializer_range": 0.02,
   "layer_norm_epsilon": 1e-05,
-  "length_penalty": 2.3,
-  "max_length": 64,
-  "min_length": 16,
   "model_type": "gpt2",
   "n_ctx": 2048,
   "n_embd": 2048,
@@ -24,10 +17,7 @@
   "n_inner": null,
   "n_layer": 24,
   "n_positions": 2048,
-  "no_repeat_ngram_size": 4,
-  "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.1,
-  "scale_attn_by_inverse_layer_idx": false,
   "scale_attn_weights": true,
   "summary_activation": null,
   "summary_first_dropout": 0.1,
@@ -35,7 +25,7 @@
   "summary_type": "cls_index",
   "summary_use_proj": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.
-  "use_cache":
+  "transformers_version": "4.10.3",
+  "use_cache": true,
   "vocab_size": 100000
 }
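
In effect, this commit drops the repo-specific "auto_map" entry (so the checkpoint loads through the built-in GPT2LMHeadModel rather than custom code shipped with the repo) and removes the hard-coded generation defaults from config.json. A minimal sketch of the resulting usage, assuming a hypothetical repo id (the repository is not named in this diff), with the deleted defaults passed explicitly at generation time instead:

from transformers import AutoModelForCausalLM, AutoTokenizer

repo_id = "your-org/your-gpt2-model"  # hypothetical placeholder; not taken from this diff

# With "auto_map" removed, trust_remote_code=True is no longer required:
# the stock GPT2LMHeadModel class handles the checkpoint.
tokenizer = AutoTokenizer.from_pretrained(repo_id)
model = AutoModelForCausalLM.from_pretrained(repo_id)

# The generation settings deleted from config.json can be supplied per call.
inputs = tokenizer("Hello, world", return_tensors="pt")
outputs = model.generate(
    **inputs,
    do_sample=True,          # was "do_sample": true
    max_length=64,           # was "max_length": 64
    min_length=16,           # was "min_length": 16
    length_penalty=2.3,      # was "length_penalty": 2.3
    no_repeat_ngram_size=4,  # was "no_repeat_ngram_size": 4
)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))

Note that length_penalty only takes effect under beam-search decoding, not plain sampling; it is included above merely to mirror the entries removed from the config.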