ngxson HF staff Xenova HF staff committed on
Commit
cdf8a31
·
verified ·
1 Parent(s): 9538930

Upload folder using huggingface_hub (#1)

Browse files

- Upload folder using huggingface_hub (449fbb0afcfaa00abd4b1b1320d2c834eb055a25)
- Update config.json (8736183eee68facec8494ca62bc6f79dca970e56)
- Update generation_config.json (ac457217e45a70fc4b7df868ff1e8909c2dc1385)
- Update config.json (03ac92f9bfcc8dc9affbbc3b19ed5dabb498c075)


Co-authored-by: Joshua <[email protected]>

.gitattributes CHANGED
@@ -34,3 +34,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
38
+ onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -35,6 +35,12 @@
35
  "tie_word_embeddings": true,
36
  "torch_dtype": "float32",
37
  "transformers_version": "4.47.1",
 
 
 
 
 
 
38
  "use_cache": true,
39
  "vocab_size": 128256
40
- }
 
35
  "tie_word_embeddings": true,
36
  "torch_dtype": "float32",
37
  "transformers_version": "4.47.1",
38
+ "transformers.js_config": {
39
+ "kv_cache_dtype": {
40
+ "q4f16": "float16",
41
+ "fp16": "float16"
42
+ }
43
+ },
44
  "use_cache": true,
45
  "vocab_size": 128256
46
+ }
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b1860a6bda206918f22bc4700a803196de792979a961a649d684b35a091d5b9
3
+ size 83590
onnx/model.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec00849ff44be3e1cfebae18aaaf06c9126da53e5daa1de285e740aab31c2716
3
+ size 4976812032
onnx/model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9a9db6cd7d88964dfa5fb7e89be9ae1b5371e9f6058fdd0998ca83fa52e6d98
3
+ size 1631947377
onnx/model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba1237166f263f7e28df2d91f9e0ec6e635df1e2b63f88c172409efb3081aff4
3
+ size 398674945
onnx/model_fp16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa6fe8cb21aa7b2a7f53a0f0b855c015a24e5ddd5fe1e60ac39c509b84b67572
3
+ size 2089811968
onnx/model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27f15664651c68f7ab03396778198743bcb0394e34933f6fe499a8a916909ffb
3
+ size 1269746162
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d6ab9eee4b33ae0d47ee4c1a8bed6df5b0fb9cd245a234b54071c424222f847
3
+ size 1692764177
onnx/model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc8b4d8c2ea5eba115f6ddf99badb7b3690a7b98566fd161259a96074eb3a187
3
+ size 1089697758
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:950a03f7cdfb3de8da8c1222ba262f2e00d309588e43765634d1b8ea4b19af78
3
+ size 1269746207
onnx/model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:950a03f7cdfb3de8da8c1222ba262f2e00d309588e43765634d1b8ea4b19af78
3
+ size 1269746207
special_tokens_map.json CHANGED
@@ -13,5 +13,11 @@
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
- "pad_token": "<|finetune_right_pad_id|>"
 
 
 
 
 
 
17
  }
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": {
17
+ "content": "<|finetune_right_pad_id|>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
  }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb9b85b70a1b34e497c3476c315b656613e7ed0b2db8c6cf62ec83d381c98737
3
- size 17209986
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c02b5c0c3fbb4b776c5ad9ede41ef8421ce0a8be84fa0bf5812fbbc80557e21
3
+ size 11574684
tokenizer_config.json CHANGED
@@ -2054,11 +2054,15 @@
2054
  "clean_up_tokenization_spaces": true,
2055
  "eos_token": "<|eot_id|>",
2056
  "extra_special_tokens": {},
 
2057
  "model_input_names": [
2058
  "input_ids",
2059
  "attention_mask"
2060
  ],
2061
  "model_max_length": 131072,
2062
  "pad_token": "<|finetune_right_pad_id|>",
2063
- "tokenizer_class": "PreTrainedTokenizerFast"
 
 
 
2064
  }
 
2054
  "clean_up_tokenization_spaces": true,
2055
  "eos_token": "<|eot_id|>",
2056
  "extra_special_tokens": {},
2057
+ "max_length": 32000,
2058
  "model_input_names": [
2059
  "input_ids",
2060
  "attention_mask"
2061
  ],
2062
  "model_max_length": 131072,
2063
  "pad_token": "<|finetune_right_pad_id|>",
2064
+ "stride": 0,
2065
+ "tokenizer_class": "PreTrainedTokenizerFast",
2066
+ "truncation_side": "right",
2067
+ "truncation_strategy": "longest_first"
2068
  }