eager-plant-323 model - no removed layers
Browse files- .gitattributes +4 -0
- config.json +2 -2
- generation_config.json +0 -0
- onnx/decoder_model.onnx +2 -2
- onnx/decoder_model_merged.onnx +2 -2
- onnx/decoder_model_merged_q4.onnx +3 -0
- onnx/decoder_model_merged_quantized.onnx +2 -2
- onnx/decoder_model_q4.onnx +3 -0
- onnx/decoder_model_quantized.onnx +2 -2
- onnx/decoder_with_past_model.onnx +2 -2
- onnx/decoder_with_past_model_q4.onnx +3 -0
- onnx/decoder_with_past_model_quantized.onnx +2 -2
- onnx/encoder_model.onnx +1 -1
- onnx/encoder_model_q4.onnx +3 -0
- onnx/encoder_model_quantized.onnx +1 -1
- quantize_config.json +1 -1
.gitattributes
CHANGED
@@ -55,3 +55,7 @@ onnx/decoder_model_merged_quantized.onnx_data filter=lfs diff=lfs merge=lfs -tex
|
|
55 |
onnx/decoder_with_past_model_fp16.onnx filter=lfs diff=lfs merge=lfs -text
|
56 |
onnx/decoder_with_past_model_quantized.onnx_data filter=lfs diff=lfs merge=lfs -text
|
57 |
onnx/encoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
55 |
onnx/decoder_with_past_model_fp16.onnx filter=lfs diff=lfs merge=lfs -text
|
56 |
onnx/decoder_with_past_model_quantized.onnx_data filter=lfs diff=lfs merge=lfs -text
|
57 |
onnx/encoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
|
58 |
+
onnx/decoder_model_merged_q4.onnx filter=lfs diff=lfs merge=lfs -text
|
59 |
+
onnx/decoder_model_q4.onnx filter=lfs diff=lfs merge=lfs -text
|
60 |
+
onnx/decoder_with_past_model_q4.onnx filter=lfs diff=lfs merge=lfs -text
|
61 |
+
onnx/encoder_model_q4.onnx filter=lfs diff=lfs merge=lfs -text
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"T5ForConditionalGeneration"
|
5 |
],
|
@@ -18,7 +18,7 @@
|
|
18 |
"layer_norm_epsilon": 1e-06,
|
19 |
"model_type": "t5",
|
20 |
"n_positions": 512,
|
21 |
-
"num_decoder_layers":
|
22 |
"num_heads": 6,
|
23 |
"num_layers": 8,
|
24 |
"output_past": true,
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "eager-plant-323",
|
3 |
"architectures": [
|
4 |
"T5ForConditionalGeneration"
|
5 |
],
|
|
|
18 |
"layer_norm_epsilon": 1e-06,
|
19 |
"model_type": "t5",
|
20 |
"n_positions": 512,
|
21 |
+
"num_decoder_layers": 8,
|
22 |
"num_heads": 6,
|
23 |
"num_layers": 8,
|
24 |
"output_past": true,
|
generation_config.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
onnx/decoder_model.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ccfd3430c89baf346caf4a250faa4da0c8b55e68a01e8272d887b18982b808f
|
3 |
+
size 232559765
|
onnx/decoder_model_merged.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26631dcf6242110611180fb493f7ac64570d2713f83786237b62251599809ef4
|
3 |
+
size 232798796
|
onnx/decoder_model_merged_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1462f8228098ac506856153660c21af14228219e897f91e09eeee5e9d06aaca2
|
3 |
+
size 92370214
|
onnx/decoder_model_merged_quantized.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d2e411095a8b75a7124ee5ba7699e8688a395a1ed5a9398f05e8208fe31b495
|
3 |
+
size 59198001
|
onnx/decoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e8620b66a490a1038a0ec7627871bbf0b55c611fdb0ce24b14e1d050e325ff3
|
3 |
+
size 92121184
|
onnx/decoder_model_quantized.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f15c7fc318265c50cd49f0d8a1e98f355870274c32d1358c83f2b8ad99bb552
|
3 |
+
size 58868682
|
onnx/decoder_with_past_model.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d93c2d87f7e3f2412c241edcaf1192b7a9a4b4594e69f918ea2733397a6c97c0
|
3 |
+
size 219930693
|
onnx/decoder_with_past_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aba09ce9a99af045ee525ac9719cdcead945f93d5c2e114c5861a915caa8e520
|
3 |
+
size 90106560
|
onnx/decoder_with_past_model_quantized.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:621ce8d2c22fb66d5e0f7fb0bc4198726d3fb1d418a7ee1d4948d1dee0650016
|
3 |
+
size 55630603
|
onnx/encoder_model.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 141467235
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d92762de4cd38898dd6c4004facf6148b55e224fd847cab65de9d4fa31fe0cb
|
3 |
size 141467235
|
onnx/encoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:edc8033b8256a8fbd7bf5f8b6c98a6ea99b817ff07ac6c82772b720246fa2737
|
3 |
+
size 77774564
|
onnx/encoder_model_quantized.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 35726832
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1afa42a0bf17ec78ee965342836a1bb41f8ecc391edddf527812183df9c83fa
|
3 |
size 35726832
|
quantize_config.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"modes": [
|
3 |
-
"
|
4 |
],
|
5 |
"per_channel": true,
|
6 |
"reduce_range": true,
|
|
|
1 |
{
|
2 |
"modes": [
|
3 |
+
"q4"
|
4 |
],
|
5 |
"per_channel": true,
|
6 |
"reduce_range": true,
|