Update README.md
Browse files
README.md
CHANGED
@@ -130,9 +130,7 @@ The model was evaluated on the [OpenLLM](https://huggingface.co/spaces/open-llm-
|
|
130 |
```
|
131 |
lm_eval \
|
132 |
--model vllm \
|
133 |
-
--model_args pretrained="neuralmagic/Qwen2.5-7B-quantized.w4a16",dtype=auto,gpu_memory_utilization=0.
|
134 |
-
--apply_chat_template \
|
135 |
-
--fewshot_as_multiturn \
|
136 |
--tasks openllm \
|
137 |
--batch_size auto
|
138 |
```
|
|
|
130 |
```
|
131 |
lm_eval \
|
132 |
--model vllm \
|
133 |
+
--model_args pretrained="neuralmagic/Qwen2.5-7B-quantized.w4a16",dtype=auto,gpu_memory_utilization=0.9,add_bos_token=True,max_model_len=4096,enable_chunked_prefill=True,tensor_parallel_size=1 \
|
|
|
|
|
134 |
--tasks openllm \
|
135 |
--batch_size auto
|
136 |
```
|