Upload 56 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +73 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_neox",
|
3 |
+
"quantization": "q4f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"use_parallel_residual": false,
|
6 |
+
"hidden_size": 2560,
|
7 |
+
"intermediate_size": 10240,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"layer_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 50432,
|
12 |
+
"rotary_pct": 1.0,
|
13 |
+
"position_embedding_base": 10000,
|
14 |
+
"context_window_size": 2048,
|
15 |
+
"head_dim": 80,
|
16 |
+
"prefill_chunk_size": 2048,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"ffn_out_dtype": "float32",
|
19 |
+
"max_batch_size": 80
|
20 |
+
},
|
21 |
+
"vocab_size": 50432,
|
22 |
+
"context_window_size": 2048,
|
23 |
+
"sliding_window_size": -1,
|
24 |
+
"prefill_chunk_size": 2048,
|
25 |
+
"attention_sink_size": -1,
|
26 |
+
"tensor_parallel_shards": 1,
|
27 |
+
"mean_gen_len": 128,
|
28 |
+
"max_gen_len": 512,
|
29 |
+
"shift_fill_factor": 0.3,
|
30 |
+
"temperature": 0.7,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 0.95,
|
35 |
+
"conv_template": {
|
36 |
+
"name": "redpajama_chat",
|
37 |
+
"system_template": "{system_message}",
|
38 |
+
"system_message": "",
|
39 |
+
"add_role_after_system_message": true,
|
40 |
+
"roles": {
|
41 |
+
"user": "<human>",
|
42 |
+
"assistant": "<bot>"
|
43 |
+
},
|
44 |
+
"role_templates": {
|
45 |
+
"user": "{user_message}",
|
46 |
+
"assistant": "{assistant_message}",
|
47 |
+
"tool": "{tool_message}"
|
48 |
+
},
|
49 |
+
"messages": [],
|
50 |
+
"seps": [
|
51 |
+
"\n"
|
52 |
+
],
|
53 |
+
"role_content_sep": ": ",
|
54 |
+
"role_empty_sep": ":",
|
55 |
+
"stop_str": [
|
56 |
+
"<human>"
|
57 |
+
],
|
58 |
+
"stop_token_ids": [
|
59 |
+
0
|
60 |
+
],
|
61 |
+
"function_string": "",
|
62 |
+
"use_function_calling": false
|
63 |
+
},
|
64 |
+
"pad_token_id": 0,
|
65 |
+
"bos_token_id": 0,
|
66 |
+
"eos_token_id": 0,
|
67 |
+
"tokenizer_files": [
|
68 |
+
"tokenizer.json",
|
69 |
+
"tokenizer_config.json"
|
70 |
+
],
|
71 |
+
"token_table_postproc_method": "byte_level",
|
72 |
+
"version": "0.1.0"
|
73 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0bf72854d0eecb6149b96776290d4f588f0966293fd5282a629d9eee6afa222
|
3 |
+
size 64552960
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:517532087722385eb588aff2fe81d0a00457e3ed4a20901369e376d7cdad150d
|
3 |
+
size 22855680
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2731225ef5fa36c0a8d39831009b057a0e3933bfde305d68525c6dc974878f6
|
3 |
+
size 29537280
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ec34ef29bc37df8a660efedbeb14d24b94db54d6648480ef8a799fc8be77f93
|
3 |
+
size 29537280
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b5e56aace16824ed98144e650caca5021eb4ec17a8abbf6756ab8722edd9fb1
|
3 |
+
size 29532160
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3269f3222ead543f0650772ccea2bdfd34410d839e5aee12218338447dd47198
|
3 |
+
size 29537280
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b9a1051b69e4cb4dd320e44fe96d978998d856c1a09f171e87d7d790a5141ca
|
3 |
+
size 29537280
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d7b66ec0fd9893999d61422253f5b44ca762697697688189d4e374e6efe918e
|
3 |
+
size 29532160
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8658c857b229094ae26c2e2c11a4cb3484286313a0ea0b23b33064f67efb5309
|
3 |
+
size 29537280
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a37013d6e46a56d21051dcae94aee73c1ca9333d603463a59a37d75c0e6d6b30
|
3 |
+
size 29537280
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81c7be621ff21e1851948a72a8ccf607f5fd8022e75a0f8f93cb9af82006f152
|
3 |
+
size 29532160
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac0323ac533bed6c70afe445757b622fcf5dcea3a52512378200c6007077c137
|
3 |
+
size 29537280
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4395316ff5682c2a6d9386b9cf7e545cb7ff36ae561e948c1baf8b98fd4b62b
|
3 |
+
size 29537280
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5aa771aa3dedc07f4958d9ed24bc13d5c460d64676af0d3a6082662bcb846605
|
3 |
+
size 29537280
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f840c00f91d0d36a699b48a4fd59ac4a6a4afc2501c4f53609dbbd4a0369c9f9
|
3 |
+
size 29532160
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a894fff84dabad0033b6918c76c7653b1d8ad4529b50ca3b57e33860a635d6ed
|
3 |
+
size 29537280
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dae5ced419892a4d299fa43090d9c9a57cb09a59a069486b578d8c842506e3e0
|
3 |
+
size 29537280
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8a456f96f12a00d859de3d5995f507d4fcfbd4241d7a84ff4022c85f16cdf6f
|
3 |
+
size 29532160
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f226871fcfc9ad542a6d5c30ad91b2cdc142e2ea667569a17fb6ccf0894c7f15
|
3 |
+
size 29537280
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:803a8190c0b09a5dc3123c49088cde3c1401bcbc83b05ab62a4f184efe08aa9f
|
3 |
+
size 29537280
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cf3467751f3df32ca189cb6592839e6bdffb1d38b8bc0e1d1efa7809e870252
|
3 |
+
size 29532160
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0825686f98feedbf40d31f540c4ae03c45a3e7939de67bc4782ddb4773c5bc59
|
3 |
+
size 29537280
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46fde38dcf5fb22aebb191563d9fdb2ac744e85b07c5207ab0a1c6f1ad42258f
|
3 |
+
size 29537280
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8427b91520da0ca3e05e503cf5d35e44c67ff95c64c4e5bcc337d41a90424959
|
3 |
+
size 29532160
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:140b601c2c3b9983568987c04239546881e1f69d5609cf930ae9fa840c7abe49
|
3 |
+
size 29532160
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adc7008e353dd6e673b39217195bd993f751ce076255ec4a038a542cca3cd9df
|
3 |
+
size 29537280
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3b432ad6699754dd76f929ee60a1688c14580d4e4db607aaad8675bfcb88728
|
3 |
+
size 29537280
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea5ec5635f45dd213014f7fc6ef3cc59105b4dabddfc2007227a0ea04a093f3a
|
3 |
+
size 29532160
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8d61e3e4ef11bcfa0ce10caeaa254f9a880f4aade00e9b921e062413215541a
|
3 |
+
size 29537280
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1eba77695bc573493a22497cb4ea3e529c8b2e443abbf87842deaccd97420c0
|
3 |
+
size 29537280
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a04663656cfdfd3590e873c4d4ec53131c3a9d84f3e9b1f02c93c45a73094c8
|
3 |
+
size 29532160
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ece563e3dfd4683f01b73b8295084f9950123d4b81d548cc19be88fe518a6785
|
3 |
+
size 29537280
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b2d79b809fc7cecf2e85d6fefb0ded47f8ed9a2adba1bb82b9ea5fbdc4075b0
|
3 |
+
size 29537280
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82c47e303c92b7a2584478fd1660c4c63d4aed9add7e8209459e3a5ef6646396
|
3 |
+
size 29532160
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce37ce4e8375887d6927129074232f315610c84fb3cdc7ec4119b72d2d49870f
|
3 |
+
size 29537280
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:352bf44d311ef4330e15e0cc54d65fe9c69d9ef225bb49b1d03443e83892f120
|
3 |
+
size 29537280
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:951f7b2a96d465741e6050efe9f48fcb7b1a07e4f1f5bb12174a99d16940725a
|
3 |
+
size 29537280
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d9f5c7e577d702692f197e24926248c286d23f05b7cfd4883f6ea35c8e78d7c
|
3 |
+
size 29532160
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0e52de6d3b6862f449e831968356bb97d676a264f2b20fdc1cf3682a8870141
|
3 |
+
size 29537280
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:618d6f841ad74bc1fb9246bae6f17a83d7bdaa3cf17609f4099aef43ec6bae52
|
3 |
+
size 29537280
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ac93bc650662868bddcacbd9f2dd3d619f04964319331e8520641a596c1521b
|
3 |
+
size 29532160
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1a6f40f477e587c8e139f74825a60d9b03cb9838f3461b5bc23ffa4ed26e9d5
|
3 |
+
size 29537280
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12943ed5ff94f939700624ee2af4a53076cb0dfd4666eec2c1cda5f9dfff5877
|
3 |
+
size 29537280
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c760c4c241267eb84337b29a1fba6644cfd79859f080f17ea0cbc0b94b803e57
|
3 |
+
size 29532160
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fe3b24c2f8355d076738d557c792358445f1e7fbb5400b0b321edf71319889b
|
3 |
+
size 64552960
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5e127cd837309e19f198b2517340860df38bbac4c55bdaf7c6a6b05dc843418
|
3 |
+
size 29537280
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f37dbc1290a4fbb4e0e0c8906a88e3cba136b5cf5669d290a16dfb631e2a3e0
|
3 |
+
size 22830080
|