jeehwon committed on
Commit
e455b11
·
verified ·
1 Parent(s): c2b69c7

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +27 -0
  3. added_tokens.json +28 -0
  4. config.json +38 -0
  5. generation_config.json +13 -0
  6. merges.txt +0 -0
  7. model-00001-of-00095.safetensors +3 -0
  8. model-00002-of-00095.safetensors +3 -0
  9. model-00003-of-00095.safetensors +3 -0
  10. model-00004-of-00095.safetensors +3 -0
  11. model-00005-of-00095.safetensors +3 -0
  12. model-00006-of-00095.safetensors +3 -0
  13. model-00007-of-00095.safetensors +3 -0
  14. model-00008-of-00095.safetensors +3 -0
  15. model-00009-of-00095.safetensors +3 -0
  16. model-00010-of-00095.safetensors +3 -0
  17. model-00011-of-00095.safetensors +3 -0
  18. model-00012-of-00095.safetensors +3 -0
  19. model-00013-of-00095.safetensors +3 -0
  20. model-00014-of-00095.safetensors +3 -0
  21. model-00015-of-00095.safetensors +3 -0
  22. model-00016-of-00095.safetensors +3 -0
  23. model-00017-of-00095.safetensors +3 -0
  24. model-00018-of-00095.safetensors +3 -0
  25. model-00019-of-00095.safetensors +3 -0
  26. model-00020-of-00095.safetensors +3 -0
  27. model-00021-of-00095.safetensors +3 -0
  28. model-00022-of-00095.safetensors +3 -0
  29. model-00023-of-00095.safetensors +3 -0
  30. model-00024-of-00095.safetensors +3 -0
  31. model-00025-of-00095.safetensors +3 -0
  32. model-00026-of-00095.safetensors +3 -0
  33. model-00027-of-00095.safetensors +3 -0
  34. model-00028-of-00095.safetensors +3 -0
  35. model-00029-of-00095.safetensors +3 -0
  36. model-00030-of-00095.safetensors +3 -0
  37. model-00031-of-00095.safetensors +3 -0
  38. model-00032-of-00095.safetensors +3 -0
  39. model-00033-of-00095.safetensors +3 -0
  40. model-00034-of-00095.safetensors +3 -0
  41. model-00035-of-00095.safetensors +3 -0
  42. model-00036-of-00095.safetensors +3 -0
  43. model-00037-of-00095.safetensors +3 -0
  44. model-00038-of-00095.safetensors +3 -0
  45. model-00039-of-00095.safetensors +3 -0
  46. model-00040-of-00095.safetensors +3 -0
  47. model-00041-of-00095.safetensors +3 -0
  48. model-00042-of-00095.safetensors +3 -0
  49. model-00043-of-00095.safetensors +3 -0
  50. model-00044-of-00095.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Modified Model: Qwen/Qwen3-235B-A22B
2
+
3
+ ## Configuration
4
+ - Base model: Qwen/Qwen3-235B-A22B
5
+ - Minimum scale factor: 0.5
6
+ - Smoothness: 10.0
7
+ - Sample size: 1000
8
+ - Window size: 4
9
+ - N-gram weights: [0.5, 0.3, 0.2]
10
+
11
+ ## Unicode Ranges
12
+ - Range 1: 0x4e00 - 0x9fff
13
+ - Range 2: 0x3400 - 0x4dbf
14
+ - Range 3: 0x20000 - 0x2a6df
15
+ - Range 4: 0xf900 - 0xfaff
16
+ - Range 5: 0x2e80 - 0x2eff
17
+ - Range 6: 0x2f00 - 0x2fdf
18
+ - Range 7: 0x2ff0 - 0x2fff
19
+ - Range 8: 0x3000 - 0x303f
20
+ - Range 9: 0x31c0 - 0x31ef
21
+ - Range 10: 0x3200 - 0x32ff
22
+ - Range 11: 0x3300 - 0x33ff
23
+
24
+ ## Statistics
25
+ - Target tokens: 26,153
26
+ - Broken tokens: 1,457
27
+ - Modified tokens: 27,564
added_tokens.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</think>": 151668,
3
+ "</tool_call>": 151658,
4
+ "</tool_response>": 151666,
5
+ "<think>": 151667,
6
+ "<tool_call>": 151657,
7
+ "<tool_response>": 151665,
8
+ "<|box_end|>": 151649,
9
+ "<|box_start|>": 151648,
10
+ "<|endoftext|>": 151643,
11
+ "<|file_sep|>": 151664,
12
+ "<|fim_middle|>": 151660,
13
+ "<|fim_pad|>": 151662,
14
+ "<|fim_prefix|>": 151659,
15
+ "<|fim_suffix|>": 151661,
16
+ "<|im_end|>": 151645,
17
+ "<|im_start|>": 151644,
18
+ "<|image_pad|>": 151655,
19
+ "<|object_ref_end|>": 151647,
20
+ "<|object_ref_start|>": 151646,
21
+ "<|quad_end|>": 151651,
22
+ "<|quad_start|>": 151650,
23
+ "<|repo_name|>": 151663,
24
+ "<|video_pad|>": 151656,
25
+ "<|vision_end|>": 151653,
26
+ "<|vision_pad|>": 151654,
27
+ "<|vision_start|>": 151652
28
+ }
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen3MoeForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 151643,
8
+ "decoder_sparse_step": 1,
9
+ "eos_token_id": 151645,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 4096,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 12288,
15
+ "max_position_embeddings": 40960,
16
+ "max_window_layers": 94,
17
+ "mlp_only_layers": [],
18
+ "model_type": "qwen3_moe",
19
+ "moe_intermediate_size": 1536,
20
+ "norm_topk_prob": true,
21
+ "num_attention_heads": 64,
22
+ "num_experts": 128,
23
+ "num_experts_per_tok": 8,
24
+ "num_hidden_layers": 94,
25
+ "num_key_value_heads": 4,
26
+ "output_router_logits": false,
27
+ "rms_norm_eps": 1e-06,
28
+ "rope_scaling": null,
29
+ "rope_theta": 1000000.0,
30
+ "router_aux_loss_coef": 0.001,
31
+ "sliding_window": null,
32
+ "tie_word_embeddings": false,
33
+ "torch_dtype": "bfloat16",
34
+ "transformers_version": "4.51.3",
35
+ "use_cache": true,
36
+ "use_sliding_window": false,
37
+ "vocab_size": 151936
38
+ }
generation_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "pad_token_id": 151643,
9
+ "temperature": 0.6,
10
+ "top_k": 20,
11
+ "top_p": 0.95,
12
+ "transformers_version": "4.51.3"
13
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44518d32283e922fe0a0d1ab05b3a5fc90b3b7c6b7e89d0c6913c782ba82d915
3
+ size 4999647472
model-00002-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3760131c5a7c2d22da6f4a40f0d4fdf9b0dd4a64d7b824cc137ba2961536c999
3
+ size 4988141728
model-00003-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:120af6e205aea86baaf957b05518f5fe792d991be77410fc0d5c0b4405b6e8c4
3
+ size 4988141728
model-00004-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c15e35e9646baf640cc6edc7283423735ae369d6f8a8e9d53582e34397c18c34
3
+ size 4988141728
model-00005-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e815c879560529cf5499af48393b7b2e1ba914146c9e98e12016d54dce7ea79d
3
+ size 4988141728
model-00006-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:380b3e9deb0158e86534da933daaf6f02620089b886ea57cd5710c13d78ae0bb
3
+ size 4988141728
model-00007-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f4adb52dfec880689a0abe1d0a2644f6587db05608fc5195d30712cf756ec3c
3
+ size 4988141728
model-00008-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e2a8455afb34349d491699c9f87d7f1b0b01f05bb8f717b4e7fd10489151986
3
+ size 4988141728
model-00009-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ea52db9e30e55fb9f6bf16bb002a2657c59628674a3cc0fe557ab3666b06d61
3
+ size 4988141728
model-00010-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6c4a4e99178a442f8fff20ae0fe3e35f48566619fdcdc42d73a8d2db556c222
3
+ size 4988141728
model-00011-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2abb853ff1cd9b79693b5185abb458acb5c402eec642532e0121ee01b957c846
3
+ size 4988142048
model-00012-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11e723649eb454a506df7e8508300d8ede91f31192508b58b020de3efe3e5007
3
+ size 4988142120
model-00013-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58227b0e328b7bfe476ce420ec99a2501c6089fd52c90de242c77b709ef299c9
3
+ size 4988142120
model-00014-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9079b9c821b7fe456e1cb63fc80e5ad7eb18c0f7ae8bf1c092252591cee465e4
3
+ size 4988142120
model-00015-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73fe6978122c476ab0dfade6ee4a5a6b3f73d72f98ed74bde6ccbc22c0901333
3
+ size 4988142120
model-00016-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2637ff19b833112d43d4e7d7ec4b6fca932d01161288e35e5015994f6a062a5
3
+ size 4988142120
model-00017-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ec006a3f123126ad18a8350567b3f9b656f4601042c468c33f1399d5359e6bf
3
+ size 4988142120
model-00018-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06287d2b1d255e9f55af0ff826a5294162bd632af0e9a0890b19e1150858751f
3
+ size 4988142120
model-00019-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f26231d8207bec1a66e7ec7a7c3bf32e6867e56d779ef3906423c0f5776415
3
+ size 4988142120
model-00020-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09fede2cd15c6a2216b0d4521c7d8480b3a0650a13ab0648d9f28550d030a649
3
+ size 4988142120
model-00021-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0013efae89b040dd1d458656f50db6c072c26f5ff0e05d21ac966834e8f32eca
3
+ size 4988142120
model-00022-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81d895a2cc28611a781beb4cce7522403ab57362bcf8e180b12fbaab854f93d9
3
+ size 4988142120
model-00023-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6bd2b8fb1b9acdde30065cbda7483034b5f8d47068b318181b22be6555c5915
3
+ size 4988142120
model-00024-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25530a34a496de186e6ba9427b6e4b47f34f6001f0339c4b3d89d52fcc8141d0
3
+ size 4988142120
model-00025-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70fa5d0cb7b36d31566a4298768bc5c9c87dab9c014f1d3ddf4172028d7d50c1
3
+ size 4988142120
model-00026-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81ae6701340f4e4de6776170befa394220d68fda8e9840972cc567d71b9c202e
3
+ size 4988142120
model-00027-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd00635d186ad16344f69fb81609ac9eb6d820137e7ba648af0a21faa3393d91
3
+ size 4988142120
model-00028-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff2aa0df63b5b5018a591b5211de33c47588a457a2e92076f84bf6587458f9c8
3
+ size 4988142120
model-00029-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02aa7a1b674836a25bf398973e0f977b84610e9c8301c24167c63552796b82f1
3
+ size 4988142120
model-00030-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75741f0735379294cb074ac0c8b9cf99ec62668f7b5c0700b761d1412858fabe
3
+ size 4988142120
model-00031-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c95381ed9ccc1b1218a94e145b2349f02dd605ff0b1d667053e5a96a80ebe62
3
+ size 4988142120
model-00032-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b2f51adb680f492ea045f9a51b72216a00715af707cd5fead878ad3a74b6e6b
3
+ size 4988142120
model-00033-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed3f2c3abfeacbd10f42d0d44b65fd0478c33e2eedb8ff70c5ba1943049972b8
3
+ size 4988142120
model-00034-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fe7118d5f3504d2e8b06581042bd9e43e94ee6d48a19d1121085253af7b0833
3
+ size 4988142120
model-00035-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f98be5afa224d6593407ec15a9e8b9f0ca9c859d1bd37b3e58d4496038325b3e
3
+ size 4988142120
model-00036-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bff736b60aef07caf7a9ecf0cb4b6c4f878760cb206c281b120e8c71f70c7ee5
3
+ size 4988142120
model-00037-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37e4ae19d6a42ee3dc55914644e67a8c6c35d94ecc3788f65a44ae46520376a0
3
+ size 4988142120
model-00038-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fd5bb50c531e2041b82a0dd1b83e34d8a99bf69d2910de497e7293a49c50469
3
+ size 4988142120
model-00039-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:815cf65bd55b5168a9f3d8d8495fcdbeefb67b16abb1832674d656998bed5808
3
+ size 4988142120
model-00040-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f6cd6588c74ae00003bb8334e2cee85ce35c8e3ae008ba254eaa7b43c3af3bd
3
+ size 4988142120
model-00041-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05f72698222324d5db5846a35badb8fa0a0c9214cc20f6468e798c35124ce29c
3
+ size 4988142120
model-00042-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5b269a4d966065ee09d4a5f7f840435bbfebef519b9317735ae83721b934cd0
3
+ size 4988142120
model-00043-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a19a1c8ff6e38cff2a05943b91bfc197e3689b93732cc6a82177516498120e
3
+ size 4988142120
model-00044-of-00095.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13be03e0397d175c693dd8ad7f874a6aa29ace8b77c16d86d708eb97787a78ef
3
+ size 4988142120