Commit
·
962cc10
1
Parent(s):
feaccc5
Training in progress, step 2000
Browse files- .gitignore +1 -0
- config.json +29 -0
- pytorch_model.bin +3 -0
- runs/Mar07_06-08-51_af02b8537d44/1646633357.0119393/events.out.tfevents.1646633357.af02b8537d44.818.1 +3 -0
- runs/Mar07_06-08-51_af02b8537d44/events.out.tfevents.1646633356.af02b8537d44.818.0 +3 -0
- runs/Mar07_06-11-29_af02b8537d44/1646633515.3078463/events.out.tfevents.1646633515.af02b8537d44.818.3 +3 -0
- runs/Mar07_06-11-29_af02b8537d44/events.out.tfevents.1646633515.af02b8537d44.818.2 +3 -0
- runs/Mar07_06-20-03_af02b8537d44/1646634028.9164531/events.out.tfevents.1646634028.af02b8537d44.818.5 +3 -0
- runs/Mar07_06-20-03_af02b8537d44/events.out.tfevents.1646634028.af02b8537d44.818.4 +3 -0
- runs/Mar07_06-22-12_af02b8537d44/1646634159.3245156/events.out.tfevents.1646634159.af02b8537d44.818.7 +3 -0
- runs/Mar07_06-22-12_af02b8537d44/events.out.tfevents.1646634159.af02b8537d44.818.6 +3 -0
- runs/Mar07_07-14-50_af02b8537d44/1646637318.5613942/events.out.tfevents.1646637318.af02b8537d44.818.9 +3 -0
- runs/Mar07_07-14-50_af02b8537d44/events.out.tfevents.1646637318.af02b8537d44.818.8 +3 -0
- training_args.bin +3 -0
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "google/byt5-small",
|
3 |
+
"architectures": [
|
4 |
+
"T5ForConditionalGeneration"
|
5 |
+
],
|
6 |
+
"d_ff": 3584,
|
7 |
+
"d_kv": 64,
|
8 |
+
"d_model": 1472,
|
9 |
+
"decoder_start_token_id": 0,
|
10 |
+
"dropout_rate": 0.1,
|
11 |
+
"eos_token_id": 1,
|
12 |
+
"feed_forward_proj": "gated-gelu",
|
13 |
+
"gradient_checkpointing": false,
|
14 |
+
"initializer_factor": 1.0,
|
15 |
+
"is_encoder_decoder": true,
|
16 |
+
"layer_norm_epsilon": 1e-06,
|
17 |
+
"model_type": "t5",
|
18 |
+
"num_decoder_layers": 4,
|
19 |
+
"num_heads": 6,
|
20 |
+
"num_layers": 12,
|
21 |
+
"pad_token_id": 0,
|
22 |
+
"relative_attention_num_buckets": 32,
|
23 |
+
"tie_word_embeddings": false,
|
24 |
+
"tokenizer_class": "ByT5Tokenizer",
|
25 |
+
"torch_dtype": "float32",
|
26 |
+
"transformers_version": "4.18.0.dev0",
|
27 |
+
"use_cache": true,
|
28 |
+
"vocab_size": 384
|
29 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e96660d64a21b2e0adc68bb871b38d9ed0f6f9cab57e50367797c5d40505afbe
|
3 |
+
size 1203128041
|
runs/Mar07_06-08-51_af02b8537d44/1646633357.0119393/events.out.tfevents.1646633357.af02b8537d44.818.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae6fab4d300fff0700436d511515392e5d5c1149898ccbe2a519b0b2bae2c704
|
3 |
+
size 4757
|
runs/Mar07_06-08-51_af02b8537d44/events.out.tfevents.1646633356.af02b8537d44.818.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc98dd38d6b824f1cc8021ea99470792731f21c33628f5b3bd7e44db642167d9
|
3 |
+
size 3330
|
runs/Mar07_06-11-29_af02b8537d44/1646633515.3078463/events.out.tfevents.1646633515.af02b8537d44.818.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d315803fdee8a9e2dc111eb818f1864c40617ccdfa0ee3d1477918458693f800
|
3 |
+
size 4757
|
runs/Mar07_06-11-29_af02b8537d44/events.out.tfevents.1646633515.af02b8537d44.818.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc7b4bbaf4ee76f10c4570c45c60b089e376a78f2f869db3358a0d47b2a735d4
|
3 |
+
size 3331
|
runs/Mar07_06-20-03_af02b8537d44/1646634028.9164531/events.out.tfevents.1646634028.af02b8537d44.818.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:293efbb95ae7abdde3c9b2b89f0aff95c0f068388de4d6901ec726006babece7
|
3 |
+
size 4757
|
runs/Mar07_06-20-03_af02b8537d44/events.out.tfevents.1646634028.af02b8537d44.818.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa6a387057c07be631248e89e197fc41d5ef79401ec152a46353e93fe2e86bd4
|
3 |
+
size 3331
|
runs/Mar07_06-22-12_af02b8537d44/1646634159.3245156/events.out.tfevents.1646634159.af02b8537d44.818.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3461fb6e17d66341de34733e72cf17491208c8126156d66c5ea7062e87284d52
|
3 |
+
size 4757
|
runs/Mar07_06-22-12_af02b8537d44/events.out.tfevents.1646634159.af02b8537d44.818.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6b398ade91222b5554a82549dc5823bcba796bdb3957c2923deb93f01b9bc27
|
3 |
+
size 3331
|
runs/Mar07_07-14-50_af02b8537d44/1646637318.5613942/events.out.tfevents.1646637318.af02b8537d44.818.9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63e3177e43e81536f7ad30e5c41c1f7c0a35eae226cb93cafc8c7e49b5b022ca
|
3 |
+
size 4757
|
runs/Mar07_07-14-50_af02b8537d44/events.out.tfevents.1646637318.af02b8537d44.818.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3b953c6dbf70bf088dad52d3fa6066d4acea030e7429d0c7c4921afc8b6b318
|
3 |
+
size 3959
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a73b08c46125496e93849fefb48ee849b156511da7f264d80235f8d78bb9d0cb
|
3 |
+
size 2991
|