Hoang Pham committed on
Commit
cbd4ab9
·
verified ·
1 Parent(s): 613f7d2

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,6 +1,5 @@
1
  {
2
- "_name_or_path": "distilgpt2",
3
- "_num_labels": 1,
4
  "activation_function": "gelu_new",
5
  "architectures": [
6
  "GPT2LMHeadModel"
@@ -9,20 +8,14 @@
9
  "bos_token_id": 50256,
10
  "embd_pdrop": 0.1,
11
  "eos_token_id": 50256,
12
- "id2label": {
13
- "0": "LABEL_0"
14
- },
15
  "initializer_range": 0.02,
16
- "label2id": {
17
- "LABEL_0": 0
18
- },
19
  "layer_norm_epsilon": 1e-05,
20
  "model_type": "gpt2",
21
  "n_ctx": 1024,
22
  "n_embd": 768,
23
  "n_head": 12,
24
  "n_inner": null,
25
- "n_layer": 6,
26
  "n_positions": 1024,
27
  "reorder_and_upcast_attn": false,
28
  "resid_pdrop": 0.1,
 
1
  {
2
+ "_name_or_path": "gpt2",
 
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
8
  "bos_token_id": 50256,
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
 
 
 
11
  "initializer_range": 0.02,
 
 
 
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
  "n_embd": 768,
16
  "n_head": 12,
17
  "n_inner": null,
18
+ "n_layer": 12,
19
  "n_positions": 1024,
20
  "reorder_and_upcast_attn": false,
21
  "resid_pdrop": 0.1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a988075e8b7fe5b99273707075bf984354e5ceecf8303486a264319bac13542
3
- size 327657928
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5609ac6f01101d2bcb425aa64610463292a0fe69c5001c2522d8c213dfd822b8
3
+ size 497774208
runs/Dec26_14-07-41_4f87fa13cf4f/events.out.tfevents.1735222063.4f87fa13cf4f.45582.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42d90d36507cff8dc7b5c73957e780c540998ad2791ba8de0f4eaa382f5d1d9d
3
+ size 5919
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd4f2906cbf2f7f7bbd40826ec841400a6fa3bcde012ac5923d5be7e0c0c23fa
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f301c938db1cb6977900c5e27614e30ccd7fd4df22c121c98fedc0e91b2cf20
3
  size 5240