Upload folder using huggingface_hub

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +1 -0
README.md +189 -0
chat_template.json +3 -0
config.json +330 -0
generation_config.json +13 -0
model-00001-of-00072.safetensors +3 -0
model-00002-of-00072.safetensors +3 -0
model-00003-of-00072.safetensors +3 -0
model-00004-of-00072.safetensors +3 -0
model-00005-of-00072.safetensors +3 -0
model-00006-of-00072.safetensors +3 -0
model-00007-of-00072.safetensors +3 -0
model-00008-of-00072.safetensors +3 -0
model-00009-of-00072.safetensors +3 -0
model-00010-of-00072.safetensors +3 -0
model-00011-of-00072.safetensors +3 -0
model-00012-of-00072.safetensors +3 -0
model-00013-of-00072.safetensors +3 -0
model-00014-of-00072.safetensors +3 -0
model-00015-of-00072.safetensors +3 -0
model-00016-of-00072.safetensors +3 -0
model-00017-of-00072.safetensors +3 -0
model-00018-of-00072.safetensors +3 -0
model-00019-of-00072.safetensors +3 -0
model-00020-of-00072.safetensors +3 -0
model-00021-of-00072.safetensors +3 -0
model-00022-of-00072.safetensors +3 -0
model-00023-of-00072.safetensors +3 -0
model-00024-of-00072.safetensors +3 -0
model-00025-of-00072.safetensors +3 -0
model-00026-of-00072.safetensors +3 -0
model-00027-of-00072.safetensors +3 -0
model-00028-of-00072.safetensors +3 -0
model-00029-of-00072.safetensors +3 -0
model-00030-of-00072.safetensors +3 -0
model-00031-of-00072.safetensors +3 -0
model-00032-of-00072.safetensors +3 -0
model-00033-of-00072.safetensors +3 -0
model-00034-of-00072.safetensors +3 -0
model-00035-of-00072.safetensors +3 -0
model-00036-of-00072.safetensors +3 -0
model-00037-of-00072.safetensors +3 -0
model-00038-of-00072.safetensors +3 -0
model-00039-of-00072.safetensors +3 -0
model-00040-of-00072.safetensors +3 -0
model-00041-of-00072.safetensors +3 -0
model-00042-of-00072.safetensors +3 -0
model-00043-of-00072.safetensors +3 -0
model-00044-of-00072.safetensors +3 -0
model-00045-of-00072.safetensors +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,189 @@

+---
+library_name: transformers
+language:
+- ar
+- de
+- en
+- es
+- fr
+- hi
+- id
+- it
+- pt
+- th
+- tl
+- vi
+base_model:
+- meta-llama/Llama-4-Maverick-17B-128E
+tags:
+- facebook
+- meta
+- pytorch
+- llama
+- llama-4
+- mlx
+extra_gated_prompt: '**LLAMA 4 COMMUNITY LICENSE AGREEMENT**
+  Llama 4 Version Effective Date: April 5, 2025
+  "**Agreement**" means the terms and conditions for use, reproduction, distribution
+  and modification of the Llama Materials set forth herein.
+  "**Documentation**" means the specifications, manuals and documentation accompanying
+  Llama 4 distributed by Meta at [https://www.llama.com/docs/overview](https://www.llama.com/docs/overview).
+  "**Licensee**" or "**you**" means you, or your employer or any other person or entity
+  (if you are entering into this Agreement on such person or entity’s behalf), of
+  the age required under applicable laws, rules or regulations to provide legal consent
+  and that has legal authority to bind your employer or such other person or entity
+  if you are entering in this Agreement on their behalf.
+  "**Llama 4**" means the foundational large language models and software and algorithms,
+  including machine-learning model code, trained model weights, inference-enabling
+  code, training-enabling code, fine-tuning enabling code and other elements of the
+  foregoing distributed by Meta at [https://www.llama.com/llama-downloads](https://www.llama.com/llama-downloads).
+  "**Llama Materials**" means, collectively, Meta’s proprietary Llama 4 and Documentation
+  (and any portion thereof) made available under this Agreement.
+  "**Meta**" or "**we**" means Meta Platforms Ireland Limited (if you are located
+  in or, if you are an entity, your principal place of business is in the EEA or Switzerland)
+  and Meta Platforms, Inc. (if you are located outside of the EEA or Switzerland).
+  By clicking "I Accept" below or by using or distributing any portion or element
+  of the Llama Materials, you agree to be bound by this Agreement.
+  1\. **License Rights and Redistribution**.
+  a. Grant of Rights. You are granted a non-exclusive, worldwide, non-transferable
+  and royalty-free limited license under Meta’s intellectual property or other rights
+  owned by Meta embodied in the Llama Materials to use, reproduce, distribute, copy,
+  create derivative works of, and make modifications to the Llama Materials.
+  b. Redistribution and Use.
+  i. If you distribute or make available the Llama Materials (or any derivative works
+  thereof), or a product or service (including another AI model) that contains any
+  of them, you shall (A) provide a copy of this Agreement with any such Llama Materials;
+  and (B) prominently display "Built with Llama" on a related website, user interface,
+  blogpost, about page, or product documentation. If you use the Llama Materials or
+  any outputs or results of the Llama Materials to create, train, fine tune, or otherwise
+  improve an AI model, which is distributed or made available, you shall also include
+  "Llama" at the beginning of any such AI model name.
+  ii. If you receive Llama Materials, or any derivative works thereof, from a Licensee
+  as part of an integrated end user product, then Section 2 of this Agreement will
+  not apply to you.
+  iii. You must retain in all copies of the Llama Materials that you distribute the
+  following attribution notice within a "Notice" text file distributed as a part of
+  such copies: "Llama 4 is licensed under the Llama 4 Community License, Copyright
+  © Meta Platforms, Inc. All Rights Reserved."
+  iv. Your use of the Llama Materials must comply with applicable laws and regulations
+  (including trade compliance laws and regulations) and adhere to the Acceptable Use
+  Policy for the Llama Materials (available at [https://www.llama.com/llama4/use-policy](https://www.llama.com/llama4/use-policy)),
+  which is hereby incorporated by reference into this Agreement. 2\. **Additional
+  Commercial Terms**. If, on the Llama 4 version release date, the monthly active
+  users of the products or services made available by or for Licensee, or Licensee’s
+  affiliates, is greater than 700 million monthly active users in the preceding calendar
+  month, you must request a license from Meta, which Meta may grant to you in its
+  sole discretion, and you are not authorized to exercise any of the rights under
+  this Agreement unless or until Meta otherwise expressly grants you such rights.
+  3\. **Disclaimer of Warranty**. UNLESS REQUIRED BY APPLICABLE LAW, THE LLAMA MATERIALS
+  AND ANY OUTPUT AND RESULTS THEREFROM ARE PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES
+  OF ANY KIND, AND META DISCLAIMS ALL WARRANTIES OF ANY KIND, BOTH EXPRESS AND IMPLIED,
+  INCLUDING, WITHOUT LIMITATION, ANY WARRANTIES OF TITLE, NON-INFRINGEMENT, MERCHANTABILITY,
+  OR FITNESS FOR A PARTICULAR PURPOSE. YOU ARE SOLELY RESPONSIBLE FOR DETERMINING
+  THE APPROPRIATENESS OF USING OR REDISTRIBUTING THE LLAMA MATERIALS AND ASSUME ANY
+  RISKS ASSOCIATED WITH YOUR USE OF THE LLAMA MATERIALS AND ANY OUTPUT AND RESULTS.
+  4\. **Limitation of Liability**. IN NO EVENT WILL META OR ITS AFFILIATES BE LIABLE
+  UNDER ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, TORT, NEGLIGENCE, PRODUCTS LIABILITY,
+  OR OTHERWISE, ARISING OUT OF THIS AGREEMENT, FOR ANY LOST PROFITS OR ANY INDIRECT,
+  SPECIAL, CONSEQUENTIAL, INCIDENTAL, EXEMPLARY OR PUNITIVE DAMAGES, EVEN IF META
+  OR ITS AFFILIATES HAVE BEEN ADVISED OF THE POSSIBILITY OF ANY OF THE FOREGOING.
+  5\. **Intellectual Property**.
+  a. No trademark licenses are granted under this Agreement, and in connection with
+  the Llama Materials, neither Meta nor Licensee may use any name or mark owned by
+  or associated with the other or any of its affiliates, except as required for reasonable
+  and customary use in describing and redistributing the Llama Materials or as set
+  forth in this Section 5(a). Meta hereby grants you a license to use "Llama" (the
+  "Mark") solely as required to comply with the last sentence of Section 1.b.i. You
+  will comply with Meta’s brand guidelines (currently accessible at [https://about.meta.com/brand/resources/meta/company-brand/](https://about.meta.com/brand/resources/meta/company-brand/)).
+  All goodwill arising out of your use of the Mark will inure to the benefit of Meta.
+  b. Subject to Meta’s ownership of Llama Materials and derivatives made by or for
+  Meta, with respect to any derivative works and modifications of the Llama Materials
+  that are made by you, as between you and Meta, you are and will be the owner of
+  such derivative works and modifications.
+  c. If you institute litigation or other proceedings against Meta or any entity (including
+  a cross-claim or counterclaim in a lawsuit) alleging that the Llama Materials or
+  Llama 4 outputs or results, or any portion of any of the foregoing, constitutes
+  infringement of intellectual property or other rights owned or licensable by you,
+  then any licenses granted to you under this Agreement shall terminate as of the
+  date such litigation or claim is filed or instituted. You will indemnify and hold
+  harmless Meta from and against any claim by any third party arising out of or related
+  to your use or distribution of the Llama Materials.
+  6\. **Term and Termination**. The term of this Agreement will commence upon your
+  acceptance of this Agreement or access to the Llama Materials and will continue
+  in full force and effect until terminated in accordance with the terms and conditions
+  herein. Meta may terminate this Agreement if you are in breach of any term or condition
+  of this Agreement. Upon termination of this Agreement, you shall delete and cease
+  use of the Llama Materials. Sections 3, 4 and 7 shall survive the termination of
+  this Agreement.
+  7\. **Governing Law and Jurisdiction**. This Agreement will be governed and construed
+  under the laws of the State of California without regard to choice of law principles,
+  and the UN Convention on Contracts for the International Sale of Goods does not
+  apply to this Agreement. The courts of California shall have exclusive jurisdiction
+  of any dispute arising out of this Agreement.'
+extra_gated_fields:
+  First Name: text
+  Last Name: text
+  Date of birth: date_picker
+  Country: country
+  Affiliation: text
+  Job title:
+    type: select
+    options:
+    - Student
+    - Research Graduate
+    - AI researcher
+    - AI developer/engineer
+    - Reporter
+    - Other
+  geo: ip_location
+  ? By clicking Submit below I accept the terms of the license and acknowledge that
+    the information I provide will be collected stored processed and shared in accordance
+    with the Meta Privacy Policy
+  : checkbox
+extra_gated_description: The information you provide will be collected, stored, processed
+  and shared in accordance with the [Meta Privacy Policy](https://www.facebook.com/privacy/policy/).
+extra_gated_button_content: Submit
+extra_gated_heading: Please be sure to provide your full legal name, date of birth,
+  and full organization name with all corporate identifiers. Avoid the use of acronyms
+  and special characters. Failure to follow these instructions may prevent you from
+  accessing this model and others on Hugging Face. You will not have the ability to
+  edit this form after submission, so please ensure all information is accurate.
+license: other
+license_name: llama4
+---
+# mlx-community/Llama-4-Maverick-17B-128E-Instruct-4bit
+This model was converted to MLX format from [`meta-llama/Llama-4-Maverick-17B-128E-Instruct`](https://huggingface.co/meta-llama/Llama-4-Maverick-17B-128E-Instruct) using mlx-vlm version **0.1.21**.
+Refer to the [original model card](https://huggingface.co/meta-llama/Llama-4-Maverick-17B-128E-Instruct) for more details on the model.
+## Use with mlx
+```bash
+pip install -U mlx-vlm
+```
+```bash
+python -m mlx_vlm.generate --model mlx-community/Llama-4-Maverick-17B-128E-Instruct-4bit --max-tokens 100 --temperature 0.0 --prompt "Describe this image." --image <path_to_image>
+```

chat_template.json ADDED Viewed

	@@ -0,0 +1,3 @@

+{
+  "chat_template": "{{- bos_token }}\n{%- if custom_tools is defined %}\n    {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n    {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n    {%- if strftime_now is defined %}\n        {%- set date_string = strftime_now(\"%d %b %Y\") %}\n    {%- else %}\n        {%- set date_string = \"26 Jul 2024\" %}\n    {%- endif %}\n{%- endif %}\n{%- if not tools is defined %}\n    {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}    \n    {%- if messages[0]['content'] is string %}\n        {%- set system_message = messages[0]['content']|trim %}\n    {%- else %}\n        {#- FIXME: The processor requires an array, always. #}\n        {%- set system_message = messages[0]['content'][0]['text']|trim %}\n    {%- endif %}\n    {%- set messages = messages[1:] %}\n    {%- set user_supplied_system_message = true %}\n{%- else %}\n    {%- set system_message = \"\" %}\n    {%- set user_supplied_system_message = false %}\n{%- endif %}\n\n{#- System message if the user supplied one #}\n{%- if user_supplied_system_message %}\n    {{- \"<|header_start|>system<|header_end|>\\n\\n\" }}\n    {%- if tools is not none %}\n        {{- \"Environment: ipython\\n\" }}\n    {%- endif %}\n    {%- if tools is not none and not tools_in_user_message %}\n        {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n        {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n        {{- \"Do not use variables.\\n\\n\" }}\n        {%- for t in tools %}\n            {{- t | tojson(indent=4) }}\n            {{- \"\\n\\n\" }}\n        {%- endfor %}\n    {%- endif %}\n    {{- system_message }}\n    {{- \"<|eot|>\" }}\n{%- endif %}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n    {#- Extract the first user message so we can plug it in here #}\n    {%- if messages | length != 0 %}\n        {%- set first_user_message = messages[0]['content']|trim %}\n        {%- set messages = messages[1:] %}\n    {%- else %}\n        {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n    {{- '<|header_start|>user<|header_end|>\\n\\n' -}}\n    {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n    {{- \"with its proper arguments that best answers the given prompt.\\n\\n\" }}\n    {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n    {{- \"Do not use variables.\\n\\n\" }}\n    {%- for t in tools %}\n        {{- t | tojson(indent=4) }}\n        {{- \"\\n\\n\" }}\n    {%- endfor %}\n    {{- first_user_message + \"<|eot|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n    {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n    {{- '<|header_start|>' + message['role'] + '<|header_end|>\\n\\n' }}\n        {%- if message['content'] is string %}\n            {{- message['content'] }}\n        {%- else %}\n            {%- for content in message['content'] %}\n                {%- if content['type'] == 'image' %}\n                    {{- '<|image|>' }}\n                {%- elif content['type'] == 'text' %}\n                    {{- content['text'] }}\n                {%- endif %}\n            {%- endfor %}\n        {%- endif %}\n        {{- \"<|eot|>\" }}\n    {%- elif 'tool_calls' in message and message.tool_calls|length > 0 %}\n       {{- '<|header_start|>assistant<|header_end|>\\n\\n' -}}\n       {{- '<|python_start|>' }}\n        {%- if message['content'] is string %}\n            {{- message['content'] }}\n        {%- else %}\n            {%- for content in message['content'] %}\n                {%- if content['type'] == 'image' %}\n                    {{- '<|image|>' }}\n                {%- elif content['type'] == 'text' %}\n                    {{- content['text'] }}\n                {%- endif %}\n            {%- endfor %}\n        {%- endif %}\n       {{- '<|python_end|>' }}\n        {%- for tool_call in message.tool_calls %}\n           {{- '{\"name\": \"' + tool_call.function.name + '\", ' }}\n           {{- '\"parameters\": ' }}\n           {{- tool_call.function.arguments | tojson }}\n           {{- \"}\" }}\n        {%- endfor %}\n       {{- \"<|eot|>\" }}\n    {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n        {{- \"<|header_start|>ipython<|header_end|>\\n\\n\" }}\n        {%- if message.content is mapping or 
message.content is iterable %}\n            {{- message.content | tojson }}\n        {%- else %}\n            {{- message.content }}\n        {%- endif %}\n        {{- \"<|eot|>\" }}\n    {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n    {{- '<|header_start|>assistant<|header_end|>\\n\\n' }}\n{%- endif %}\n"
+}

config.json ADDED Viewed

	@@ -0,0 +1,330 @@

+{
+    "_attn_implementation_autoset": false,
+    "add_cross_attention": false,
+    "architectures": [
+        "Llama4ForConditionalGeneration"
+    ],
+    "bad_words_ids": null,
+    "begin_suppress_tokens": null,
+    "boi_token_index": 200080,
+    "bos_token_id": null,
+    "chunk_size_feed_forward": 0,
+    "cross_attention_hidden_size": null,
+    "decoder_start_token_id": null,
+    "diversity_penalty": 0.0,
+    "do_sample": false,
+    "early_stopping": false,
+    "encoder_no_repeat_ngram_size": 0,
+    "eoi_token_index": 200081,
+    "eos_token_id": null,
+    "exponential_decay_length_penalty": null,
+    "finetuning_task": null,
+    "forced_bos_token_id": null,
+    "forced_eos_token_id": null,
+    "id2label": {
+        "0": "LABEL_0",
+        "1": "LABEL_1"
+    },
+    "image_token_index": 200092,
+    "is_decoder": false,
+    "is_encoder_decoder": false,
+    "label2id": {
+        "LABEL_0": 0,
+        "LABEL_1": 1
+    },
+    "length_penalty": 1.0,
+    "max_length": 20,
+    "min_length": 0,
+    "model_type": "llama4",
+    "no_repeat_ngram_size": 0,
+    "num_beam_groups": 1,
+    "num_beams": 1,
+    "num_return_sequences": 1,
+    "output_attentions": false,
+    "output_hidden_states": false,
+    "output_scores": false,
+    "pad_token_id": null,
+    "prefix": null,
+    "problem_type": null,
+    "pruned_heads": {},
+    "quantization": {
+        "group_size": 64,
+        "bits": 4
+    },
+    "remove_invalid_values": false,
+    "repetition_penalty": 1.0,
+    "return_dict": true,
+    "return_dict_in_generate": false,
+    "sep_token_id": null,
+    "suppress_tokens": null,
+    "task_specific_params": null,
+    "temperature": 1.0,
+    "text_config": {
+        "return_dict": true,
+        "output_hidden_states": false,
+        "output_attentions": false,
+        "torchscript": false,
+        "torch_dtype": "bfloat16",
+        "use_bfloat16": false,
+        "tf_legacy_loss": false,
+        "pruned_heads": {},
+        "tie_word_embeddings": false,
+        "chunk_size_feed_forward": 0,
+        "is_encoder_decoder": false,
+        "is_decoder": false,
+        "cross_attention_hidden_size": null,
+        "add_cross_attention": false,
+        "tie_encoder_decoder": false,
+        "max_length": 20,
+        "min_length": 0,
+        "do_sample": false,
+        "early_stopping": false,
+        "num_beams": 1,
+        "num_beam_groups": 1,
+        "diversity_penalty": 0.0,
+        "temperature": 1.0,
+        "top_k": 50,
+        "top_p": 1.0,
+        "typical_p": 1.0,
+        "repetition_penalty": 1.0,
+        "length_penalty": 1.0,
+        "no_repeat_ngram_size": 0,
+        "encoder_no_repeat_ngram_size": 0,
+        "bad_words_ids": null,
+        "num_return_sequences": 1,
+        "output_scores": false,
+        "return_dict_in_generate": false,
+        "forced_bos_token_id": null,
+        "forced_eos_token_id": null,
+        "remove_invalid_values": false,
+        "exponential_decay_length_penalty": null,
+        "suppress_tokens": null,
+        "begin_suppress_tokens": null,
+        "architectures": null,
+        "finetuning_task": null,
+        "id2label": {
+            "0": "LABEL_0",
+            "1": "LABEL_1"
+        },
+        "label2id": {
+            "LABEL_0": 0,
+            "LABEL_1": 1
+        },
+        "tokenizer_class": null,
+        "prefix": null,
+        "bos_token_id": 200000,
+        "pad_token_id": 200018,
+        "eos_token_id": [
+            200001,
+            200007,
+            200008
+        ],
+        "sep_token_id": null,
+        "decoder_start_token_id": null,
+        "task_specific_params": null,
+        "problem_type": null,
+        "_name_or_path": "",
+        "_attn_implementation_autoset": true,
+        "attention_bias": false,
+        "for_llm_compressor": false,
+        "model_type": "llama4_text",
+        "attn_temperature_tuning": 4,
+        "attn_scale": 0.1,
+        "floor_scale": 8192,
+        "vocab_size": 202048,
+        "max_position_embeddings": 1048576,
+        "hidden_size": 5120,
+        "intermediate_size": 8192,
+        "intermediate_size_mlp": 16384,
+        "num_hidden_layers": 48,
+        "num_attention_heads": 40,
+        "rope_scaling": null,
+        "num_key_value_heads": 8,
+        "hidden_act": "silu",
+        "initializer_range": 0.02,
+        "rms_norm_eps": 1e-05,
+        "use_cache": true,
+        "rope_theta": 500000.0,
+        "attention_dropout": 0.0,
+        "head_dim": 128,
+        "use_qk_norm": false,
+        "num_experts_per_tok": 1,
+        "num_local_experts": 128,
+        "output_router_logits": false,
+        "router_aux_loss_coef": 0.001,
+        "router_jitter_noise": 0.0,
+        "no_rope_layers": [
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0,
+            1,
+            1,
+            1,
+            0
+        ],
+        "interleave_moe_layer_step": 2,
+        "moe_layers": [
+            1,
+            3,
+            5,
+            7,
+            9,
+            11,
+            13,
+            15,
+            17,
+            19,
+            21,
+            23,
+            25,
+            27,
+            29,
+            31,
+            33,
+            35,
+            37,
+            39,
+            41,
+            43,
+            45,
+            47
+        ],
+        "attention_chunk_size": 8192
+    },
+    "tf_legacy_loss": false,
+    "tie_encoder_decoder": false,
+    "tie_word_embeddings": false,
+    "tokenizer_class": null,
+    "top_k": 50,
+    "top_p": 1.0,
+    "torch_dtype": "bfloat16",
+    "torchscript": false,
+    "transformers_version": "4.51.0",
+    "typical_p": 1.0,
+    "use_bfloat16": false,
+    "vision_config": {
+        "hidden_size": 1408,
+        "hidden_act": "gelu",
+        "num_hidden_layers": 34,
+        "num_channels": 3,
+        "intermediate_size": 5632,
+        "image_size": 336,
+        "vision_output_dim": 4096,
+        "patch_size": 14,
+        "norm_eps": 1e-05,
+        "num_attention_heads": 16,
+        "initializer_range": 0.02,
+        "pixel_shuffle_ratio": 0.5,
+        "projector_input_dim": 4096,
+        "projector_output_dim": 4096,
+        "multi_modal_projector_bias": false,
+        "projector_dropout": 0.0,
+        "attention_dropout": 0.0,
+        "vision_feature_layer": -1,
+        "vision_feature_select_strategy": "default",
+        "rope_theta": 10000,
+        "return_dict": true,
+        "output_hidden_states": false,
+        "output_attentions": false,
+        "torchscript": false,
+        "torch_dtype": null,
+        "use_bfloat16": false,
+        "tf_legacy_loss": false,
+        "pruned_heads": {},
+        "tie_word_embeddings": true,
+        "chunk_size_feed_forward": 0,
+        "is_encoder_decoder": false,
+        "is_decoder": false,
+        "cross_attention_hidden_size": null,
+        "add_cross_attention": false,
+        "tie_encoder_decoder": false,
+        "max_length": 20,
+        "min_length": 0,
+        "do_sample": false,
+        "early_stopping": false,
+        "num_beams": 1,
+        "num_beam_groups": 1,
+        "diversity_penalty": 0.0,
+        "temperature": 1.0,
+        "top_k": 50,
+        "top_p": 1.0,
+        "typical_p": 1.0,
+        "repetition_penalty": 1.0,
+        "length_penalty": 1.0,
+        "no_repeat_ngram_size": 0,
+        "encoder_no_repeat_ngram_size": 0,
+        "bad_words_ids": null,
+        "num_return_sequences": 1,
+        "output_scores": false,
+        "return_dict_in_generate": false,
+        "forced_bos_token_id": null,
+        "forced_eos_token_id": null,
+        "remove_invalid_values": false,
+        "exponential_decay_length_penalty": null,
+        "suppress_tokens": null,
+        "begin_suppress_tokens": null,
+        "architectures": null,
+        "finetuning_task": null,
+        "id2label": {
+            "0": "LABEL_0",
+            "1": "LABEL_1"
+        },
+        "label2id": {
+            "LABEL_0": 0,
+            "LABEL_1": 1
+        },
+        "tokenizer_class": null,
+        "prefix": null,
+        "bos_token_id": null,
+        "pad_token_id": null,
+        "eos_token_id": null,
+        "sep_token_id": null,
+        "decoder_start_token_id": null,
+        "task_specific_params": null,
+        "problem_type": null,
+        "_name_or_path": "",
+        "_attn_implementation_autoset": true,
+        "model_type": "llama4_vision_model"
+    }
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "bos_token_id": 200000,
+  "do_sample": true,
+  "eos_token_id": [
+    200001,
+    200007,
+    200008
+  ],
+  "pad_token_id": 200018,
+  "temperature": 0.6,
+  "top_p": 0.9,
+  "transformers_version": "4.51.0.dev0"
+}

model-00001-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:96a4ce933080317f696016a1adf5ee4053574b5d40427ba5eb353db9fbe8db54
+size 4308004373

model-00002-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c070297a0d3d79f7655b59e169c3d2014803c2cae42ac8f8726a76b19868f993
+size 3019899344

model-00003-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99508aacb146412d365b70b5547dba0912b237216ddc801722451ee3cd9708c1
+size 3303430951

model-00004-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a15125fa2807b83130bcb6e761c9d3337c7fb2c6f2646698151896f5aa45418f
+size 3019899350

model-00005-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:31b4f2e5594ebdbe1135f941ab42f21d9dd065de0b8adcd811f4ec79cb44fa73
+size 3019899344

model-00006-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b068ecf623f86405c8537b14a439eb0dfc4cb46b000b884a7de7c1928548d7e
+size 3303430927

model-00007-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:86aa984c6d32ec4780d133245d2dbbdf10dc603acd3c0d08e11abfafaa03c756
+size 3019899350

model-00008-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e16ca3814f602001a337f110ed17fe254eeaaadc3a631f63e5868071080a6fd9
+size 3019899344

model-00009-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4c7e7565090f1a98335ab6f4c3f65ce2686dea69ed8cd95226332fbc99b7ce8b
+size 3303430951

model-00010-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f7492de0813043da7cdb80e01ce7d0e2aa6c92a897dc232b4a9e310eb24c859
+size 3019899350

model-00011-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6741aef63f058c727708609f99b96282595c97123d4e7b59c5712122e1f65bcc
+size 3019899344

model-00012-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0524ea28c7c8eb9e6bcb95e32b8cd9d12ae490a7798fbe31d68ef25974491190
+size 3303430947

model-00013-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:85f87d3921074aadc41ee045943e05667ccce6abad0a0c9c804b46b4989a64d5
+size 3019899350

model-00014-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3f89fb34e7ce0a88fde4c3faeb49fa297b895f89f08d490964a6e3401ce68686
+size 3019899344

model-00015-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d3ecbc36b215a281601d6fea8c4b6d9ba82a04195cbfb401af9aeb9fb701839a
+size 3303430970

model-00016-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c34d1d8ad9e4d75c53246061088e7930b32a44d7d3d280e69a61c1198865dffc
+size 3019899353

model-00017-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6454995111aa5f43a5b28b11530cd4774cfa526df592dccc1602b1851f6a4cfe
+size 3019899347

model-00018-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aadfa21ef4fdf115bda4a6bdd22a0d50b340d4cbd6a50f6c2d0f52a92751f8fa
+size 3303430973

model-00019-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d6171ad882cad20fd67477cea85b6c36a21c6d87fd1fb7b8c6ee036e424045d8
+size 3019899353

model-00020-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:07f89288d8ab988ae05e5c264559e2482a77589c22e75f24dcfb8b5d91bc6757
+size 3019899347

model-00021-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc4dce8f0bb164d10b256daf1fa7ba22559e22e2ccf2f64fa278ce77c4d08378
+size 3303430983

model-00022-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:00c0cfe6e70a407042d7d542961eb59c49b665daa8e42b6904e2dad3966fc4fc
+size 3019899353

model-00023-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:330fa98b8c4e1f24a056e09d71fc6e4fd7dae60667c0b0a11795b876319432eb
+size 3019899347

model-00024-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c48329c9acb150da52f2d9c3d15309bbd9fcaa3a21cf3c9d8c8bec26a802cbbc
+size 3303431003

model-00025-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ed4578168ff4ad11762f1598e5e4d0fe81964cdbcef786d510af3f5276106a6
+size 3019899353

model-00026-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6c1db4858193b41d6082adb8742c2e7d93e9920d85dc16027de92cacb1889029
+size 3019899347

model-00027-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:428cb579ec999fd9f7d061b824fa53a1fa2e4b31c8eba870128870d7b746ba4a
+size 3303431019

model-00028-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:183692aba6fe3bd78138ab66dad6bd3ea48abfd396db47d1c2fea59351b77123
+size 3019899353

model-00029-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c0d9f52705a2ffbedbda440800701ead33d1791f4db7f0de4aab145833102c4
+size 3019899347

model-00030-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d9d244d7175ce8394fbfdb09d8c974e5769701a0ec9c5687133f8625ac72b39
+size 3303431017

model-00031-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e07467a79080294282e20eed310841c2e8c40ee9297ea9263a80de2aa49abca6
+size 3019899353

model-00032-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a3634e7f77aa7453b01cf817300c443ab58c084af487744496d442be4c8429b6
+size 3019899347

model-00033-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7322e1fa2530f401e5da5fe876e6aa1fd2e72342b44b0a72dabe9c7b9754cc1b
+size 3303430987

model-00034-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:98b2e1855bc6865d863e35e5fa128486bcd12ea4cbd5d85bf1fce98bbde5fb62
+size 3019899353

model-00035-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0ecd65c0d326f6eff44805f3424000573867613d9ad980cd84d8e777ef684ab
+size 3019899347

model-00036-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b3499357293285c49c13eace190f62cbdb8859d43218c236aa55560dcc460542
+size 3303431003

model-00037-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:81bcc430a822ddb51346cff92f3715df4331a2c6cac48d6d9c244d132259c821
+size 3019899353

model-00038-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d801e366330b523a6e227b411e570d9b04373b3a705bf8a24fc90793e9004991
+size 3019899347

model-00039-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:170249a943340b4d10015fb2171330306aa888f02e19e18662bc0d15a325c483
+size 3303430997

model-00040-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6be027228b540138827fe255d2a042e1abc5eb0b453d603d64b533d6576cdb6
+size 3019899353

model-00041-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:74af69c97d246e0dfa068762cfeff681d168a15ead52868b4ef00d9685b4d76f
+size 3019899347

model-00042-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6e0b2e3a1c2068ff917b61c8704a489ffe4bff9c6084728b041c41a45b68a9c2
+size 3303431023

model-00043-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:60284ae2d175666b013d7285efba3b6f686ce3ffa9e5e39b020ae469dc3d2be2
+size 3019899353

model-00044-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7a3acfbecd71b7d6f89fb144a87682cfeb6e03ddbaa1d171ad3035b116e775d0
+size 3019899347

model-00045-of-00072.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9afa236ee407b0a9f8d12e8759a0c6e0eb41866dd8b86aed2f26c51d402e5d57
+size 3303430993