Update README.md
README.md (changed)
@@ -149,7 +149,7 @@ ilab model download --repository docker://registry.redhat.io/rhelai1/mistral-sma
 
 ```bash
 # Serve model via ilab
-ilab model serve --model-path ~/.cache/instructlab/models/mistral-small-24b-instruct-2501
+ilab model serve --model-path ~/.cache/instructlab/models/mistral-small-24b-instruct-2501 --gpu 1 -- --tokenizer-mode "mistral" --config-format "mistral" --load-format "mistral" --tool-call-parser "mistral" --enable-auto-tool-choice --limit-mm-per-prompt "image=10" --max-model-len 16384 --uvicorn-log-level "debug" --trust-remote-code
 
 # Chat with model
 ilab model chat --model ~/.cache/instructlab/models/mistral-small-24b-instruct-2501

@@ -216,6 +216,17 @@ spec:
   maxReplicas: 1
   minReplicas: 1
   model:
+    args:
+      - "--tokenizer-mode=mistral"
+      - "--config-format=mistral"
+      - "--load-format=mistral"
+      - "--tool-call-parser=mistral"
+      - "--enable-auto-tool-choice"
+      - "--limit-mm-per-prompt=image=10"
+      - "--max-model-len=16384"
+      - "--uvicorn-log-level=debug"
+      - "--trust-remote-code"
+
     modelFormat:
       name: vLLM
     name: ''
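For a quick sanity check of the locally served model, you can query the OpenAI-compatible API that the vLLM backend exposes. The sketch below assumes the default `ilab` serve address of `127.0.0.1:8000` (adjust host and port to your configuration); the registered model id can be confirmed via the `/v1/models` endpoint before sending a chat request.

```bash
# List the models registered by the running server (OpenAI-compatible API).
curl -s http://127.0.0.1:8000/v1/models

# Send a simple chat completion; set "model" to the id returned above
# (typically the served model path).
curl -s http://127.0.0.1:8000/v1/chat/completions \
  -H "Content-Type: application/json" \
  -d '{
        "model": "mistral-small-24b-instruct-2501",
        "messages": [{"role": "user", "content": "Say hello in one short sentence."}]
      }'
```

The `args` added to the Kubernetes spec pass the same vLLM flags to the serving runtime, so the in-cluster deployment should behave like the local `ilab model serve` invocation above.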