dulcet-durian-136 training with t5-efficient-tiny base model
Browse files- config.json +4 -4
- onnx/decoder_model.onnx +2 -2
- onnx/decoder_model_fp16.onnx +3 -0
- onnx/decoder_model_merged.onnx +2 -2
- onnx/decoder_model_merged_fp16.onnx +3 -0
- onnx/decoder_model_merged_quantized.onnx +2 -2
- onnx/decoder_model_quantized.onnx +2 -2
- onnx/decoder_with_past_model.onnx +2 -2
- onnx/decoder_with_past_model_fp16.onnx +3 -0
- onnx/decoder_with_past_model_quantized.onnx +2 -2
- onnx/encoder_model.onnx +2 -2
- onnx/encoder_model_fp16.onnx +3 -0
- onnx/encoder_model_quantized.onnx +2 -2
- quantize_config.json +1 -1
config.json
CHANGED
|
@@ -1,12 +1,12 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "
|
| 3 |
"architectures": [
|
| 4 |
"T5ForConditionalGeneration"
|
| 5 |
],
|
| 6 |
"classifier_dropout": 0.0,
|
| 7 |
-
"d_ff":
|
| 8 |
"d_kv": 64,
|
| 9 |
-
"d_model":
|
| 10 |
"decoder_start_token_id": 0,
|
| 11 |
"dense_act_fn": "relu",
|
| 12 |
"dropout_rate": 0.1,
|
|
@@ -19,7 +19,7 @@
|
|
| 19 |
"model_type": "t5",
|
| 20 |
"n_positions": 512,
|
| 21 |
"num_decoder_layers": 4,
|
| 22 |
-
"num_heads":
|
| 23 |
"num_layers": 4,
|
| 24 |
"pad_token_id": 0,
|
| 25 |
"relative_attention_max_distance": 128,
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "dulcet-durian-136",
|
| 3 |
"architectures": [
|
| 4 |
"T5ForConditionalGeneration"
|
| 5 |
],
|
| 6 |
"classifier_dropout": 0.0,
|
| 7 |
+
"d_ff": 1024,
|
| 8 |
"d_kv": 64,
|
| 9 |
+
"d_model": 256,
|
| 10 |
"decoder_start_token_id": 0,
|
| 11 |
"dense_act_fn": "relu",
|
| 12 |
"dropout_rate": 0.1,
|
|
|
|
| 19 |
"model_type": "t5",
|
| 20 |
"n_positions": 512,
|
| 21 |
"num_decoder_layers": 4,
|
| 22 |
+
"num_heads": 4,
|
| 23 |
"num_layers": 4,
|
| 24 |
"pad_token_id": 0,
|
| 25 |
"relative_attention_max_distance": 128,
|
onnx/decoder_model.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b3f924580ed1fb94175f1f4520b3f1d723cf626016a5ec2cb206ca3ff3f0bda
|
| 3 |
+
size 49810798
|
onnx/decoder_model_fp16.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3fd9e09812d88af5fb1f89fc398120fb831e54039c9a290173a0d09f3c377bf
|
| 3 |
+
size 24967116
|
onnx/decoder_model_merged.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f179daee6bbc93ec07ebcbd4d69f6e51413f293d44fd6a3a45deb3df801aaf7
|
| 3 |
+
size 49934579
|
onnx/decoder_model_merged_fp16.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47033b8efbe3188d049726160cb3deca93453d1c05332a912b2692643f823b83
|
| 3 |
+
size 48902126
|
onnx/decoder_model_merged_quantized.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8b2b3f7c2438219ef677763e088d89f440ae1fbc2649d314d8cf410ab3fcd73
|
| 3 |
+
size 45733795
|
onnx/decoder_model_quantized.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb32c0f150b93b71443445b481465eac48ed36e67da9be2b54cc12598e3e249f
|
| 3 |
+
size 45568756
|
onnx/decoder_with_past_model.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84be9fe3fd001ecae01a5b866ff46469e4decc715819bcac7af4fbabf6539794
|
| 3 |
+
size 47692795
|
onnx/decoder_with_past_model_fp16.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f94c451121cdb73a772f822778f669def38770df54baf8468f326baa7b08ff98
|
| 3 |
+
size 23899674
|
onnx/decoder_with_past_model_quantized.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5125b3c19badeb55148498ecc58501dda392b82c64aae2f5717127e1e8f4b7d
|
| 3 |
+
size 45005314
|
onnx/encoder_model.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:039a737b275da31cfc474020e81514774adf871c44411ee548443554402accf8
|
| 3 |
+
size 45553423
|
onnx/encoder_model_fp16.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e4e9a8ca2f0549224bb3a961850253d96e922b024ddb9fd2f656a4970fa652db
|
| 3 |
+
size 22807586
|
onnx/encoder_model_quantized.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:927a680f7cb4bbcdd7d718a95c2c658731c27d0f204f02e947910b54ddf6f3fa
|
| 3 |
+
size 11515728
|
quantize_config.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"modes": [
|
| 3 |
-
"
|
| 4 |
],
|
| 5 |
"per_channel": true,
|
| 6 |
"reduce_range": true,
|
|
|
|
| 1 |
{
|
| 2 |
"modes": [
|
| 3 |
+
"fp16"
|
| 4 |
],
|
| 5 |
"per_channel": true,
|
| 6 |
"reduce_range": true,
|