May need `--override-kv tokenizer.ggml.eot_token_id=int:151336` when launching `llama-server`
Browse files
README.md
CHANGED
@@ -157,6 +157,7 @@ $ ./build/bin/llama-server \
|
|
157 |
-fa -fmoe \
|
158 |
-ctk q8_0 -ctv q8_0 \
|
159 |
--chat-template chatglm4 \
|
|
|
160 |
-ub 4096 -b 4096 \
|
161 |
-ngl 99 \
|
162 |
-ot exps=CPU \
|
|
|
157 |
-fa -fmoe \
|
158 |
-ctk q8_0 -ctv q8_0 \
|
159 |
--chat-template chatglm4 \
|
160 |
+
--override-kv tokenizer.ggml.eot_token_id=int:151336 \
|
161 |
-ub 4096 -b 4096 \
|
162 |
-ngl 99 \
|
163 |
-ot exps=CPU \
|