Update README.md
Browse files
README.md
CHANGED
@@ -187,7 +187,7 @@ vLLM also supports OpenAI-compatible serving. See the [documentation](https://do
|
|
187 |
|
188 |
# Configure the quantization algorithm and scheme
|
189 |
recipe = [
|
190 |
-
SmoothQuantModifier(),
|
191 |
GPTQModifier(
|
192 |
ignore=["language_model.lm_head", "re:vision_tower.*", "re:multi_modal_projector.*"]
|
193 |
sequential_targets=["MistralDecoderLayer"]
|
|
|
187 |
|
188 |
# Configure the quantization algorithm and scheme
|
189 |
recipe = [
|
190 |
+
SmoothQuantModifier(smoothing_strength=0.8),
|
191 |
GPTQModifier(
|
192 |
ignore=["language_model.lm_head", "re:vision_tower.*", "re:multi_modal_projector.*"]
|
193 |
sequential_targets=["MistralDecoderLayer"]
|