ONNX
t5
rolf-mozilla committed on
Commit
999b59c
·
unverified ·
1 Parent(s): f567279

eager-plant-323 model - no removed layers

Browse files
.gitattributes CHANGED
@@ -55,3 +55,7 @@ onnx/decoder_model_merged_quantized.onnx_data filter=lfs diff=lfs merge=lfs -tex
55
  onnx/decoder_with_past_model_fp16.onnx filter=lfs diff=lfs merge=lfs -text
56
  onnx/decoder_with_past_model_quantized.onnx_data filter=lfs diff=lfs merge=lfs -text
57
  onnx/encoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
55
  onnx/decoder_with_past_model_fp16.onnx filter=lfs diff=lfs merge=lfs -text
56
  onnx/decoder_with_past_model_quantized.onnx_data filter=lfs diff=lfs merge=lfs -text
57
  onnx/encoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
58
+ onnx/decoder_model_merged_q4.onnx filter=lfs diff=lfs merge=lfs -text
59
+ onnx/decoder_model_q4.onnx filter=lfs diff=lfs merge=lfs -text
60
+ onnx/decoder_with_past_model_q4.onnx filter=lfs diff=lfs merge=lfs -text
61
+ onnx/encoder_model_q4.onnx filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "still-durian-309",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
@@ -18,7 +18,7 @@
18
  "layer_norm_epsilon": 1e-06,
19
  "model_type": "t5",
20
  "n_positions": 512,
21
- "num_decoder_layers": 3,
22
  "num_heads": 6,
23
  "num_layers": 8,
24
  "output_past": true,
 
1
  {
2
+ "_name_or_path": "eager-plant-323",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
 
18
  "layer_norm_epsilon": 1e-06,
19
  "model_type": "t5",
20
  "n_positions": 512,
21
+ "num_decoder_layers": 8,
22
  "num_heads": 6,
23
  "num_layers": 8,
24
  "output_past": true,
generation_config.json CHANGED
The diff for this file is too large to render. See raw diff
 
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d5c683daf8582019908023cfd96c044d6d80ed506b817b8e2c1e770800d1cd5
3
- size 169472581
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ccfd3430c89baf346caf4a250faa4da0c8b55e68a01e8272d887b18982b808f
3
+ size 232559765
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1c0722608a7ac8dcc72eff44c396211c58d0dec42fba8fd320e0002fb78188d
3
- size 169578960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26631dcf6242110611180fb493f7ac64570d2713f83786237b62251599809ef4
3
+ size 232798796
onnx/decoder_model_merged_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1462f8228098ac506856153660c21af14228219e897f91e09eeee5e9d06aaca2
3
+ size 92370214
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d2160f76ae6e90d21779e65dcd15aa2991ba1f45edbc23e5d55a192fc20842b
3
- size 42895015
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d2e411095a8b75a7124ee5ba7699e8688a395a1ed5a9398f05e8208fe31b495
3
+ size 59198001
onnx/decoder_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e8620b66a490a1038a0ec7627871bbf0b55c611fdb0ce24b14e1d050e325ff3
3
+ size 92121184
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c9557b1dcc44b7db91830c6ec1822f7b599752507fb7e74c1386b7c90f60fbd
3
- size 42753832
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f15c7fc318265c50cd49f0d8a1e98f355870274c32d1358c83f2b8ad99bb552
3
+ size 58868682
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71927dd32ee3df4dcc085ee6c52091530e84ae576ff1dbb8f66686d0c452b1e1
3
- size 164738287
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d93c2d87f7e3f2412c241edcaf1192b7a9a4b4594e69f918ea2733397a6c97c0
3
+ size 219930693
onnx/decoder_with_past_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aba09ce9a99af045ee525ac9719cdcead945f93d5c2e114c5861a915caa8e520
3
+ size 90106560
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6ae7050dc0ca3df5c06e221084994492267d86162910f9c94aa5f0e44bd5dc6
3
- size 41540983
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:621ce8d2c22fb66d5e0f7fb0bc4198726d3fb1d418a7ee1d4948d1dee0650016
3
+ size 55630603
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f24d6b82b25d1a04ff1de0f1426fafc8ffedd077571f037075e0a3a621c423be
3
  size 141467235
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d92762de4cd38898dd6c4004facf6148b55e224fd847cab65de9d4fa31fe0cb
3
  size 141467235
onnx/encoder_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edc8033b8256a8fbd7bf5f8b6c98a6ea99b817ff07ac6c82772b720246fa2737
3
+ size 77774564
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4c151184859c474309c13d1332d3aa3a4d5bc2d6f95d32ee35d071546c4a0fa
3
  size 35726832
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1afa42a0bf17ec78ee965342836a1bb41f8ecc391edddf527812183df9c83fa
3
  size 35726832
quantize_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "modes": [
3
- "q8"
4
  ],
5
  "per_channel": true,
6
  "reduce_range": true,
 
1
  {
2
  "modes": [
3
+ "q4"
4
  ],
5
  "per_channel": true,
6
  "reduce_range": true,