Flan Mini fine-tuned

Files changed (9) hide show

README.md +7 -0
config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +0 -3
onnx/decoder_model_merged.onnx +0 -3
onnx/decoder_with_past_model.onnx +0 -3
onnx/encoder_model.onnx +0 -3
quantize_config.json +139 -0
spiece.model +0 -3

README.md ADDED Viewed

	@@ -0,0 +1,7 @@

+---
+library_name: transformers.js
+---
+This repository provides https://huggingface.co/MBZUAI/LaMini-Flan-T5-783M with ONNX weights, making it compatible with Transformers.js.
+Note: Having a separate repo for ONNX weights is intended to be a temporary solution until WebML gains more traction. If you would like to make your models web-ready, we recommend converting to ONNX using [🤗 Optimum](https://huggingface.co/docs/optimum/index) and structuring your repo like this one (with ONNX weights located in a subfolder named `onnx`).

config.json CHANGED Viewed

@@ -26,7 +26,7 @@
   "relative_attention_max_distance": 128,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
-  "transformers_version": "4.33.2",
   "use_cache": true,
   "vocab_size": 32128
 }

   "relative_attention_max_distance": 128,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 32128
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
-  "transformers_version": "4.33.2"
 }

   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0af2d5176759dac258e16aa9b5421584e608a20bb8d1234871df44bf7cf2ef05
-size 1899966097

onnx/decoder_model_merged.onnx DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:27a50e179d5d00261fd29170f82abd0545d7d6e8fc1c13d5f4d3115743c440d1
-size 1900612149

onnx/decoder_with_past_model.onnx DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:450dff530ac7190bac7689ecf04f1b5ba3cd484dee7ce073ca2a46009a4fdb2b
-size 1698575515

onnx/encoder_model.onnx DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:c58209b472cdf3e7fea925f109fe7ee67d12d99368ccd8d18a18c75cce6a9e51
-size 1365283172

quantize_config.json ADDED Viewed

	@@ -0,0 +1,139 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Add",
+                "Less",
+                "ConstantOfShape",
+                "Mul",
+                "Pow",
+                "Gather",
+                "Shape",
+                "ReduceMean",
+                "MatMul",
+                "Range",
+                "Transpose",
+                "Neg",
+                "Expand",
+                "Sqrt",
+                "Min",
+                "Unsqueeze",
+                "Where",
+                "Div",
+                "Tile",
+                "Log",
+                "Concat",
+                "Cast",
+                "LessOrEqual",
+                "Reshape",
+                "Sub",
+                "Softmax",
+                "Tanh",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Add",
+                "Abs",
+                "Less",
+                "ConstantOfShape",
+                "Mul",
+                "Pow",
+                "Gather",
+                "Shape",
+                "ReduceMean",
+                "MatMul",
+                "Range",
+                "Transpose",
+                "Sqrt",
+                "Min",
+                "Unsqueeze",
+                "Where",
+                "Div",
+                "Greater",
+                "Log",
+                "Concat",
+                "Cast",
+                "Reshape",
+                "Sub",
+                "Softmax",
+                "Tanh",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "If",
+                "Add",
+                "Less",
+                "ConstantOfShape",
+                "Mul",
+                "Slice",
+                "Pow",
+                "Gather",
+                "Shape",
+                "ReduceMean",
+                "MatMul",
+                "Range",
+                "Transpose",
+                "Neg",
+                "Expand",
+                "Sqrt",
+                "Min",
+                "Unsqueeze",
+                "Where",
+                "Div",
+                "Tile",
+                "Log",
+                "Concat",
+                "Cast",
+                "LessOrEqual",
+                "Reshape",
+                "Sub",
+                "Softmax",
+                "Tanh",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Add",
+                "Less",
+                "ConstantOfShape",
+                "Mul",
+                "Slice",
+                "Pow",
+                "Gather",
+                "Shape",
+                "ReduceMean",
+                "MatMul",
+                "Range",
+                "Transpose",
+                "Neg",
+                "Expand",
+                "Sqrt",
+                "Min",
+                "Unsqueeze",
+                "Where",
+                "Div",
+                "Tile",
+                "Log",
+                "Concat",
+                "Cast",
+                "LessOrEqual",
+                "Reshape",
+                "Sub",
+                "Softmax",
+                "Tanh",
+                "Constant"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}

spiece.model DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d60acb128cf7b7f2536e8f38a5b18a05535c9e14c7a355904270e15b0945ea86
-size 791656