aipib committed 9 days ago

Commit

db29e4e

verified ·

1 Parent(s): d87f43c

Add files using upload-large-folder tool

Browse files

Files changed (23) hide show

README.md +54 -0
config.json +41 -0
generation_config.json +6 -0
model-00001-of-00016.safetensors +3 -0
model-00002-of-00016.safetensors +3 -0
model-00003-of-00016.safetensors +3 -0
model-00004-of-00016.safetensors +3 -0
model-00005-of-00016.safetensors +3 -0
model-00006-of-00016.safetensors +3 -0
model-00007-of-00016.safetensors +3 -0
model-00008-of-00016.safetensors +3 -0
model-00009-of-00016.safetensors +3 -0
model-00010-of-00016.safetensors +3 -0
model-00011-of-00016.safetensors +3 -0
model-00012-of-00016.safetensors +3 -0
model-00013-of-00016.safetensors +3 -0
model-00014-of-00016.safetensors +3 -0
model-00015-of-00016.safetensors +3 -0
model-00016-of-00016.safetensors +3 -0
model.safetensors.index.json +0 -0
special_tokens_map.json +51 -0
tokenizer.json +0 -0
tokenizer_config.json +85 -0

README.md ADDED Viewed

	@@ -0,0 +1,54 @@

+---
+license: apache-2.0
+language:
+- en
+- ja
+programming_language:
+- C
+- C++
+- C#
+- Go
+- Java
+- JavaScript
+- Lua
+- PHP
+- Python
+- Ruby
+- Rust
+- Scala
+- TypeScript
+pipeline_tag: text-generation
+library_name: mlx
+inference: false
+base_model: llm-jp/llm-jp-3.1-8x13b-instruct4
+tags:
+- mlx
+---
+# mlx-community/llm-jp-3.1-8x13b-instruct4-8bit
+This model, [mlx-community/llm-jp-3.1-8x13b-instruct4-8bit](https://huggingface.co/mlx-community/llm-jp-3.1-8x13b-instruct4-8bit), was
+converted to MLX format (8-bit quantization, group size 64) from [llm-jp/llm-jp-3.1-8x13b-instruct4](https://huggingface.co/llm-jp/llm-jp-3.1-8x13b-instruct4)
+using mlx-lm version **0.24.1**.
+## Use with mlx
+```bash
+pip install mlx-lm
+```
+```python
+from mlx_lm import load, generate
+model, tokenizer = load("mlx-community/llm-jp-3.1-8x13b-instruct4-8bit")
+prompt = "hello"
+if tokenizer.chat_template is not None:
+    messages = [{"role": "user", "content": prompt}]
+    prompt = tokenizer.apply_chat_template(
+        messages, add_generation_prompt=True
+    )
+response = generate(model, tokenizer, prompt=prompt, verbose=True)
+```

config.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+    "architectures": [
+        "MixtralForCausalLM"
+    ],
+    "attention_bias": false,
+    "attention_dropout": 0.0,
+    "bos_token_id": 1,
+    "eos_token_id": 2,
+    "head_dim": 128,
+    "hidden_act": "silu",
+    "hidden_size": 5120,
+    "initializer_range": 0.02,
+    "intermediate_size": 13824,
+    "max_position_embeddings": 4096,
+    "mlp_bias": false,
+    "model_type": "mixtral",
+    "num_attention_heads": 40,
+    "num_experts_per_tok": 2,
+    "num_hidden_layers": 40,
+    "num_key_value_heads": 40,
+    "num_local_experts": 8,
+    "output_router_logits": false,
+    "quantization": {
+        "group_size": 64,
+        "bits": 8
+    },
+    "quantization_config": {
+        "group_size": 64,
+        "bits": 8
+    },
+    "rms_norm_eps": 1e-05,
+    "rope_theta": 10000,
+    "router_aux_loss_coef": 0.01,
+    "router_jitter_noise": 0.0,
+    "sliding_window": null,
+    "tie_word_embeddings": false,
+    "torch_dtype": "bfloat16",
+    "transformers_version": "4.47.0",
+    "use_cache": true,
+    "vocab_size": 99584
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "transformers_version": "4.47.0"
+}

model-00001-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d01be6c15f9aafde0c23d7c3cebb43fa68ef61cc21865913b81b8194360834f8
+size 5087494332

model-00002-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ed8b36de36dfe1c4a8ac11ae8a83a87a1cfc8eb81f1e33df7f32bddc3c7a5fd6
+size 5147398606

model-00003-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d376feac92613c403b9b624e05ab698784f7c8d273b96ad626e73ee80a6f142
+size 5035921484

model-00004-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:542212659f62efe3faae0b560f3eb2f02e1bf4ec8c2bc7b065ecf0dec49a72ca
+size 5147398686

model-00005-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2da92c3247a12c07bda9a944c07d85191e9a87b439b24e78554b4b47481c8e88
+size 5147398689

model-00006-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b50ff0361d4bb2fce32346ecfa51af9aec9c399229f11e7212e3475e336e5372
+size 5035921556

model-00007-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6408d40bf65c751075f34cd41df8fe0e029fc204ec1ad5c430037479ed75373
+size 5147398693

model-00008-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8d8d2ffab7fe28fa60e481b66bb5822f6ac814aace401debd0692040a55a7df5
+size 5147398743

model-00009-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:01c39e59d1ad04fe629e1069c9d8ff4336e71165e66e235ad546759d6b3c6be5
+size 5035921548

model-00010-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:32b2fc41f6c5455a1ea2638acf393986a2f84bf682d9ff90edaf463f900aca0d
+size 5147398737

model-00011-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:28f4fb4355ea483196f99d20741d67fbc0348e83259ef2a982e3de08b60b31de
+size 5147398703

model-00012-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc563f21d0fa45b57c7ebd00b5093022904d112b51cb50b2aef3451db3324779
+size 5035921576

model-00013-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:48a8229b70c7b9cd13a8b66f84d7171450e35fe8a5c652920528a53f9ec19a8f
+size 5147398723

model-00014-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84a4b2a0304338013b13637e8fdb2eca99732b4a6b612a70727a4215a9ffcdb7
+size 5147398703

model-00015-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:277e906ba1b5897750a4f2fbeb66cef99e7aea9b3b4329f38c88899058db18e6
+size 5035921578

model-00016-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ff196d20cab0e92254ffca5f0872aea73a20a3b4195548199ffde4e0eb06306
+size 1143389197

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,51 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "cls_token": {
+    "content": "<CLS|LLM-jp>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "<MASK|LLM-jp>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<PAD|LLM-jp>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "<SEP|LLM-jp>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<MASK|LLM-jp>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "<PAD|LLM-jp>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "<CLS|LLM-jp>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "6": {
+      "content": "<SEP|LLM-jp>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "7": {
+      "content": "<EOD|LLM-jp>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "chat_template": "{{bos_token}}{% for message in messages %}{% if message['role'] == 'user' %}{{ '\\n\\n### 指示:\\n' + message['content'] }}{% elif message['role'] == 'system' %}{{ '以下は、タスクを説明する指示です。要求を適切に満たす応答を書きなさい。' }}{% elif message['role'] == 'assistant' %}{{ '\\n\\n### 応答:\\n' + message['content'] + eos_token }}{% endif %}{% if loop.last and add_generation_prompt %}{{ '\\n\\n### 応答:\\n' }}{% endif %}{% endfor %}",
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "<CLS|LLM-jp>",
+  "eod_token": "</s>",
+  "eos_token": "</s>",
+  "extra_ids": 0,
+  "extra_special_tokens": {},
+  "mask_token": "<MASK|LLM-jp>",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<PAD|LLM-jp>",
+  "sep_token": "<SEP|LLM-jp>",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "PreTrainedTokenizer",
+  "unk_token": "<unk>"
+}