Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +103 -0

config.json CHANGED Viewed

@@ -35,7 +35,7 @@
   },
   "tie_word_embeddings": false,
   "tokenizer_class": "GPT2Tokenizer",
-  "transformers_version": "4.29.2",
   "use_cache": true,
   "vocab_size": 51200
 }

   },
   "tie_word_embeddings": false,
   "tokenizer_class": "GPT2Tokenizer",
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 51200
 }

generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 50256,
-  "transformers_version": "4.29.2"
 }

   "_from_model_config": true,
   "bos_token_id": 1,
   "eos_token_id": 50256,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:001ffadb35ae890965862447cb2a898a65d6773bb63bfc1e54e8eb5157d8b4b6
-size 1435433361

 version https://git-lfs.github.com/spec/v1
+oid sha256:6e253a493c957bf95f09bcdf7993e6b5a2d186c11ecceb26552b13c11a5056c6
+size 1435431277

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5144a56780c9634fd33f2c222c33e43d9c86d2bc10270d4e819f64761f5a00cc
-size 1436616692

 version https://git-lfs.github.com/spec/v1
+oid sha256:aab6c0373942118feca0695cae8731c0870b4aff536bd53520ad90dc02672348
+size 1440806543

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea712a8bc11dedd856351158bd57f7559cb5f76b9f5fbbfe0a287daaf2b0db70
-size 370397170

 version https://git-lfs.github.com/spec/v1
+oid sha256:aa7ebc46ccff17b6ceb88f22374d66b88e2a97e8db3cd2fa656d8407a8b21642
+size 373406712

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1211fd052d96727b54ec9ae545c18eb759aa112a79c72122526397dfe16226de
-size 368793710

 version https://git-lfs.github.com/spec/v1
+oid sha256:fb38edfc1cbf1dfff557ca96a9b7b4360eb7ee156b30a703c4f5e18de60dee6a
+size 367612429

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:58c23045d67dfe409d2482c2d63d12c2df4ced0fc501f762d1d4fe84564b7616
-size 1432225419

 version https://git-lfs.github.com/spec/v1
+oid sha256:66bfd6759c350ba9a1ce93618f279eca8ecc0e5c23b83d7c21eef10bf3ef236c
+size 1432223346

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b539fa9219b2f212463333eeb53f3a594f3b7df68c32dc4616d660085961ed52
-size 364276590

 version https://git-lfs.github.com/spec/v1
+oid sha256:fce1369c36d39319d1a6088d18edae2a4fd18e9bfadffc07eac4f4435fd128a8
+size 363095324

quantize_config.json ADDED Viewed

@@ -0,0 +1,103 @@

+{
+    "per_channel": false,
+    "reduce_range": false,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "MatMul",
+                "Tanh",
+                "Unsqueeze",
+                "Range",
+                "Add",
+                "Sqrt",
+                "Slice",
+                "Split",
+                "Sub",
+                "Where",
+                "Transpose",
+                "ReduceMean",
+                "Softmax",
+                "Shape",
+                "Mul",
+                "Equal",
+                "Reshape",
+                "Squeeze",
+                "Concat",
+                "Pow",
+                "Constant",
+                "ConstantOfShape",
+                "Expand",
+                "Cast",
+                "Gather",
+                "Div",
+                "Neg"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "MatMul",
+                "Tanh",
+                "Unsqueeze",
+                "Range",
+                "Add",
+                "Sqrt",
+                "Slice",
+                "Split",
+                "Sub",
+                "Where",
+                "Transpose",
+                "ReduceMean",
+                "Softmax",
+                "Shape",
+                "If",
+                "Mul",
+                "Equal",
+                "Reshape",
+                "Squeeze",
+                "Concat",
+                "Pow",
+                "Constant",
+                "ConstantOfShape",
+                "Expand",
+                "Cast",
+                "Gather",
+                "Div",
+                "Neg"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "MatMul",
+                "Tanh",
+                "Unsqueeze",
+                "Range",
+                "Add",
+                "Sqrt",
+                "Slice",
+                "Split",
+                "Sub",
+                "Where",
+                "Transpose",
+                "ReduceMean",
+                "Softmax",
+                "Shape",
+                "Mul",
+                "Equal",
+                "Reshape",
+                "Squeeze",
+                "Concat",
+                "Pow",
+                "Constant",
+                "ConstantOfShape",
+                "Expand",
+                "Cast",
+                "Gather",
+                "Div",
+                "Neg"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}