winglian committed on
Commit
25e440b
·
verified ·
1 Parent(s): 75edf2d

Converted ./Llama-4-Maverick-17B-128E-Linearized to BNB with nf4 and bf16

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. chat_template.json +3 -0
  3. config.json +83 -0
  4. generation_config.json +7 -0
  5. model-00001-of-00042.safetensors +3 -0
  6. model-00002-of-00042.safetensors +3 -0
  7. model-00003-of-00042.safetensors +3 -0
  8. model-00004-of-00042.safetensors +3 -0
  9. model-00005-of-00042.safetensors +3 -0
  10. model-00006-of-00042.safetensors +3 -0
  11. model-00007-of-00042.safetensors +3 -0
  12. model-00008-of-00042.safetensors +3 -0
  13. model-00009-of-00042.safetensors +3 -0
  14. model-00010-of-00042.safetensors +3 -0
  15. model-00011-of-00042.safetensors +3 -0
  16. model-00012-of-00042.safetensors +3 -0
  17. model-00013-of-00042.safetensors +3 -0
  18. model-00014-of-00042.safetensors +3 -0
  19. model-00015-of-00042.safetensors +3 -0
  20. model-00016-of-00042.safetensors +3 -0
  21. model-00017-of-00042.safetensors +3 -0
  22. model-00018-of-00042.safetensors +3 -0
  23. model-00019-of-00042.safetensors +3 -0
  24. model-00020-of-00042.safetensors +3 -0
  25. model-00021-of-00042.safetensors +3 -0
  26. model-00022-of-00042.safetensors +3 -0
  27. model-00023-of-00042.safetensors +3 -0
  28. model-00024-of-00042.safetensors +3 -0
  29. model-00025-of-00042.safetensors +3 -0
  30. model-00026-of-00042.safetensors +3 -0
  31. model-00027-of-00042.safetensors +3 -0
  32. model-00028-of-00042.safetensors +3 -0
  33. model-00029-of-00042.safetensors +3 -0
  34. model-00030-of-00042.safetensors +3 -0
  35. model-00031-of-00042.safetensors +3 -0
  36. model-00032-of-00042.safetensors +3 -0
  37. model-00033-of-00042.safetensors +3 -0
  38. model-00034-of-00042.safetensors +3 -0
  39. model-00035-of-00042.safetensors +3 -0
  40. model-00036-of-00042.safetensors +3 -0
  41. model-00037-of-00042.safetensors +3 -0
  42. model-00038-of-00042.safetensors +3 -0
  43. model-00039-of-00042.safetensors +3 -0
  44. model-00040-of-00042.safetensors +3 -0
  45. model-00041-of-00042.safetensors +3 -0
  46. model-00042-of-00042.safetensors +3 -0
  47. model.safetensors.index.json +0 -0
  48. preprocessor_config.json +33 -0
  49. processor_config.json +6 -0
  50. special_tokens_map.json +23 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
chat_template.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "chat_template": "{{- bos_token }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- if strftime_now is defined %}\n {%- set date_string = strftime_now(\"%d %b %Y\") %}\n {%- else %}\n {%- set date_string = \"26 Jul 2024\" %}\n {%- endif %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %} \n {%- if messages[0]['content'] is string %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- else %}\n {#- FIXME: The processor requires an array, always. #}\n {%- set system_message = messages[0]['content'][0]['text']|trim %}\n {%- endif %}\n {%- set messages = messages[1:] %}\n {%- set user_supplied_system_message = true %}\n{%- else %}\n {%- set system_message = \"\" %}\n {%- set user_supplied_system_message = false %}\n{%- endif %}\n\n{#- System message if the user supplied one #}\n{%- if user_supplied_system_message %}\n {{- \"<|header_start|>system<|header_end|>\n\n\" }}\n {%- if tools is not none %}\n {{- \"Environment: ipython\n\" }}\n {%- endif %}\n {%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\n\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\n\n\" }}\n {%- endfor %}\n {%- endif %}\n {{- system_message }}\n {{- \"<|eot|>\" }}\n{%- endif %}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|header_start|>user<|header_end|>\n\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\n\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\n\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\n\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|header_start|>' + message['role'] + '<|header_end|>\n\n' }}\n {%- if message['content'] is string %}\n {{- message['content'] }}\n {%- else %}\n {%- for content in message['content'] %}\n {%- if content['type'] == 'image' %}\n {{- '<|image|>' }}\n {%- elif content['type'] == 'text' %}\n {{- content['text'] }}\n {%- endif %}\n {%- endfor %}\n {%- endif %}\n {{- \"<|eot|>\" }}\n {%- elif 'tool_calls' in message and message.tool_calls|length > 0 %}\n {{- '<|header_start|>assistant<|header_end|>\n\n' -}}\n {{- '<|python_start|>' }}\n {%- if message['content'] is string %}\n {{- message['content'] }}\n {%- else %}\n {%- for content in message['content'] %}\n {%- if content['type'] == 'image' %}\n {{- '<|image|>' }}\n {%- elif content['type'] == 'text' %}\n {{- content['text'] }}\n {%- endif %}\n {%- endfor %}\n {%- endif %}\n {{- '<|python_end|>' }}\n {%- for tool_call in message.tool_calls %}\n {{- '{\"name\": \"' + tool_call.function.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.function.arguments | tojson }}\n {{- \"}\" }}\n {%- endfor %}\n {{- \"<|eot|>\" }}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|header_start|>ipython<|header_end|>\n\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|header_start|>assistant<|header_end|>\n\n' }}\n{%- endif %}\n"
3
+ }
config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Llama4ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_chunk_size": 8192,
7
+ "attention_dropout": 0.0,
8
+ "attn_scale": 0.1,
9
+ "attn_temperature_tuning": 4,
10
+ "bos_token_id": 200000,
11
+ "eos_token_id": 200001,
12
+ "floor_scale": 8192,
13
+ "for_llm_compressor": false,
14
+ "head_dim": 128,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 5120,
17
+ "initializer_range": 0.02,
18
+ "interleave_moe_layer_step": 2,
19
+ "intermediate_size": 8192,
20
+ "intermediate_size_mlp": 16384,
21
+ "max_position_embeddings": 262144,
22
+ "model_type": "llama4_text",
23
+ "moe_layers": [
24
+ 1,
25
+ 3,
26
+ 5,
27
+ 7,
28
+ 9,
29
+ 11,
30
+ 13,
31
+ 15,
32
+ 17,
33
+ 19,
34
+ 21,
35
+ 23,
36
+ 25,
37
+ 27,
38
+ 29,
39
+ 31,
40
+ 33,
41
+ 35,
42
+ 37,
43
+ 39,
44
+ 41,
45
+ 43,
46
+ 45,
47
+ 47
48
+ ],
49
+ "no_rope_layers": 4,
50
+ "num_attention_heads": 40,
51
+ "num_experts_per_tok": 1,
52
+ "num_hidden_layers": 48,
53
+ "num_key_value_heads": 8,
54
+ "num_local_experts": 128,
55
+ "output_router_logits": false,
56
+ "pad_token_id": 200018,
57
+ "quantization_config": {
58
+ "_load_in_4bit": true,
59
+ "_load_in_8bit": false,
60
+ "bnb_4bit_compute_dtype": "bfloat16",
61
+ "bnb_4bit_quant_storage": "bfloat16",
62
+ "bnb_4bit_quant_type": "nf4",
63
+ "bnb_4bit_use_double_quant": true,
64
+ "llm_int8_enable_fp32_cpu_offload": false,
65
+ "llm_int8_has_fp16_weight": false,
66
+ "llm_int8_skip_modules": null,
67
+ "llm_int8_threshold": 6.0,
68
+ "load_in_4bit": true,
69
+ "load_in_8bit": false,
70
+ "quant_method": "bitsandbytes"
71
+ },
72
+ "rms_norm_eps": 1e-05,
73
+ "rope_scaling": null,
74
+ "rope_theta": 500000.0,
75
+ "router_aux_loss_coef": 0.001,
76
+ "router_jitter_noise": 0.0,
77
+ "tie_word_embeddings": false,
78
+ "torch_dtype": "bfloat16",
79
+ "transformers_version": "4.51.0",
80
+ "use_cache": true,
81
+ "use_qk_norm": false,
82
+ "vocab_size": 202048
83
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 200000,
4
+ "eos_token_id": 200001,
5
+ "pad_token_id": 200018,
6
+ "transformers_version": "4.51.0"
7
+ }
model-00001-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9a13110f59602845defca4898dac0703c01c2619ffd206c216b97c2338cb65d
3
+ size 4990289311
model-00002-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db9535255b9bf2d039d13bea3bc718517844e5eec1b8f6bb9381478d092e76d7
3
+ size 4998657065
model-00003-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc89ba38a15e90c37dc2029d01466e2c4fbe16459aa119930611703794697280
3
+ size 4999042575
model-00004-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8a770529bdd0673f497d19230628a32dbbd46741d4397ac7083e7d961c2641f
3
+ size 4999042613
model-00005-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee043017a34fb2e5e643885350d12bf3cd37ca09bbc0bca9b6033fa0a35b6347
3
+ size 4998657261
model-00006-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a340c957cd75b9bafcddb24d40ebb97856cb67e6550c18fc19d41bf9097393c
3
+ size 4999043213
model-00007-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9d48f39b16086bf857f821a65c8e36dcc8fc010d476bb3211ba26935d01a056
3
+ size 4998657217
model-00008-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff27415ac0f2254273c7c3c3016372026ffea0614ead7b9fd4cba20b6c1e4a00
3
+ size 4999042994
model-00009-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76083dbe9f3d327777da4667ec6151d7c5dbe58a7ebc67bb38272a1929ac396e
3
+ size 4966564401
model-00010-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a6bcb9fd97fad0b00fe58c0ddeb69f510bd857719ea2ba9b2461207730b4755
3
+ size 4987858255
model-00011-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cb754c44232e6443a4dc7fa7f7e9c833f45d07db55a845603b6f5dbb1bd00a3
3
+ size 4999044384
model-00012-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5acf4a89594b8ab78521e925f487423303c7d7426983c67d925aa54ae0f6b43b
3
+ size 4998658594
model-00013-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67a3e4abe6493908c96e36e744d3b4fa226a2cc544feb832c2af24f6cb63e085
3
+ size 4999044817
model-00014-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be599e20500a2c032aa3082aa43aee4fd4b03ed747fe14303ffefa8d990d51af
3
+ size 4998658454
model-00015-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9045c54df0afbad6f3f2720a41a1bb2571595b74ed3c2bf575ef51e677281f62
3
+ size 4999044022
model-00016-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab9ecb62fb47b2244022aa60f0c449086ad9312a31c3d9ad09ae7dfcf2def722
3
+ size 4999043993
model-00017-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2130b465e514cd3b3682f0bbdc83a2dd3e4bd11524ae74fc963504f7bf730b54
3
+ size 4998658670
model-00018-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7e8e5e2252b00ccfca43b2406a88237e4ad0f0b58b1990076fc1926c1066bb8
3
+ size 4999044638
model-00019-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:100f37312e61b8d02629386544f8ae1544beb2a1206e8d58ed08df0050fd743d
3
+ size 4998658613
model-00020-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f4a6f6ee5dc66c52af55d1ce7d2947dbfaefa382954d3abfadc07568ba1f672
3
+ size 4999044422
model-00021-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edb1cafd1d8bac2ffe8b29998e8504d3dcf2025eecff10c54b90ab55871c27ac
3
+ size 4996319067
model-00022-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b41963defe627efba36062d07791730e9f027ce620b220122a3c8a3596fcf9bb
3
+ size 4979744240
model-00023-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc909b808e1c944be33822b5b364d05f06e910158c38d247f8db253e6b7a8f64
3
+ size 4999044392
model-00024-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1731b723bc23918f4ba85cc992afc9588ababa5d5c95810bc19253e777f9633c
3
+ size 4998658602
model-00025-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c68fdc1aaa291921b14dab0cc0cda02a1dc22b98d7e0ce9b09b5bc16364fed4
3
+ size 4999044794
model-00026-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cd7d20331c37c059a2d3ce4bc42c120e9b902036b9d1450a37c8d44cef2434e
3
+ size 4998658469
model-00027-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1778fa8485c9bb1854935139921d984c0a73008738be87c7b71125090e9094e4
3
+ size 4999044033
model-00028-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e4f7962fecf648ee4abbe901f7fada853e407b716eccfe3bec5f9884816644a
3
+ size 4999043968
model-00029-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f19c9f2e70ed7b8836dcfbb65ce56b4c3cc24be1ad561a8e71134e067b6d0290
3
+ size 4998658664
model-00030-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2db00eb3a75534e473a6e168f7c23fdb0dbf8db36931878dc2b5d407388f966f
3
+ size 4999044626
model-00031-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:034d767cdd37e40f49dc5019558dd1a3d04a22d8dd37d4c9da8f4099a1e1d65c
3
+ size 4998658592
model-00032-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6fc9a26a3cb425777abc0ff789c49ec5699b9dbb8a2298b4c7e67b4e8ef08d4
3
+ size 4999044464
model-00033-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8dbea0c3ecaa21ffdf5127d9c368de4b43bd39a85b3ad7582fa474ff2a8b128
3
+ size 4999019807
model-00034-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0080540f863dc4c831cbaf95a2ce8939d19cff2853a60e6e358aa482c9cd4242
3
+ size 4998682670
model-00035-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e01b6ac5932bf3b7e7944ec9a97bfd8e184f6373264cac27e84ed86808945e7a
3
+ size 4999044358
model-00036-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca588e9745123f6c68eec89a24b18d6bcdf0dda08ec186a02d03804a5f1d56b5
3
+ size 4998658606
model-00037-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47a93bd3f9c82c5a8b400a5f7239de9074a2964ffbd4fb3a28fffca20874541c
3
+ size 4999044816
model-00038-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0242a73372482b179c216d157e07116290e4c5c127639177e2c7cc99a1a9cd7e
3
+ size 4998658462
model-00039-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e51a7107fcb97dbcd8af7914d04093ad2e937bb0b13dac02f9ca74596c685c3
3
+ size 4999044046
model-00040-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:616d10f389fe63716ba76779bc8341777e25b81e9baf385e920133ca968787d8
3
+ size 4999043966
model-00041-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d598534eb86640f7abcba394c19d97fdab18df13781ca24a27c128d38be6d16
3
+ size 4998658660
model-00042-of-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13a9241e0658adfd259210b6f9d21769b92554d87757514e46b8dea093cb25cb
3
+ size 4925719795
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
preprocessor_config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": null,
3
+ "data_format": "channels_first",
4
+ "default_to_square": true,
5
+ "device": null,
6
+ "do_center_crop": null,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "image_processor_type": "Llama4ImageProcessorFast",
17
+ "image_std": [
18
+ 0.5,
19
+ 0.5,
20
+ 0.5
21
+ ],
22
+ "input_data_format": null,
23
+ "max_patches": 16,
24
+ "processor_class": "Llama4Processor",
25
+ "resample": 2,
26
+ "rescale_factor": 0.00392156862745098,
27
+ "resize_to_max_canvas": false,
28
+ "return_tensors": null,
29
+ "size": {
30
+ "height": 336,
31
+ "width": 336
32
+ }
33
+ }
processor_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "fake_image_token": "<|image|>",
3
+ "image_token": "<|image|>",
4
+ "patch_size": 14,
5
+ "processor_class": "Llama4Processor"
6
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|begin_of_text|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|end_of_text|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|finetune_right_pad_id|>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }