Update README.md
Browse files
README.md
CHANGED
|
@@ -187,7 +187,7 @@ vLLM also supports OpenAI-compatible serving. See the [documentation](https://do
|
|
| 187 |
|
| 188 |
# Configure the quantization algorithm and scheme
|
| 189 |
recipe = [
|
| 190 |
-
SmoothQuantModifier(),
|
| 191 |
GPTQModifier(
|
| 192 |
ignore=["language_model.lm_head", "re:vision_tower.*", "re:multi_modal_projector.*"]
|
| 193 |
sequential_targets=["MistralDecoderLayer"]
|
|
|
|
| 187 |
|
| 188 |
# Configure the quantization algorithm and scheme
|
| 189 |
recipe = [
|
| 190 |
+
SmoothQuantModifier(smoothing_strength=0.8),
|
| 191 |
GPTQModifier(
|
| 192 |
ignore=["language_model.lm_head", "re:vision_tower.*", "re:multi_modal_projector.*"]
|
| 193 |
sequential_targets=["MistralDecoderLayer"]
|