Update README.md
README.md CHANGED
@@ -233,7 +233,7 @@ The results were obtained using the following commands:
 ```
 lm_eval \
   --model vllm \
-  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.…
+  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",dtype=auto,add_bos_token=True,max_model_len=3850,max_gen_toks=10,tensor_parallel_size=1 \
   --tasks mmlu_llama_3.1_instruct \
   --fewshot_as_multiturn \
   --apply_chat_template \
@@ -245,7 +245,7 @@ lm_eval \
 ```
 lm_eval \
   --model vllm \
-  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.…
+  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",dtype=auto,add_bos_token=True,max_model_len=4064,max_gen_toks=1024,tensor_parallel_size=1 \
   --tasks mmlu_cot_0shot_llama_3.1_instruct \
   --apply_chat_template \
   --num_fewshot 0 \
@@ -256,7 +256,7 @@ lm_eval \
 ```
 lm_eval \
   --model vllm \
-  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.…
+  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",dtype=auto,add_bos_token=True,max_model_len=3940,max_gen_toks=100,tensor_parallel_size=1 \
   --tasks arc_challenge_llama_3.1_instruct \
   --apply_chat_template \
   --num_fewshot 0 \
@@ -267,7 +267,7 @@ lm_eval \
 ```
 lm_eval \
   --model vllm \
-  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.…
+  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",dtype=auto,add_bos_token=True,max_model_len=4096,max_gen_toks=1024,tensor_parallel_size=1 \
   --tasks gsm8k_cot_llama_3.1_instruct \
   --fewshot_as_multiturn \
   --apply_chat_template \
@@ -279,7 +279,7 @@ lm_eval \
 ```
 lm_eval \
   --model vllm \
-  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.…
+  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",dtype=auto,add_bos_token=True,max_model_len=4096,tensor_parallel_size=1 \
   --tasks hellaswag \
   --num_fewshot 10 \
   --batch_size auto
@@ -289,7 +289,7 @@ lm_eval \
 ```
 lm_eval \
   --model vllm \
-  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.…
+  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",dtype=auto,add_bos_token=True,max_model_len=4096,tensor_parallel_size=1 \
   --tasks winogrande \
   --num_fewshot 5 \
   --batch_size auto
@@ -299,7 +299,7 @@ lm_eval \
 ```
 lm_eval \
   --model vllm \
-  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.…
+  --model_args pretrained="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",dtype=auto,add_bos_token=True,max_model_len=4096,tensor_parallel_size=1 \
   --tasks truthfulqa \
   --num_fewshot 0 \
   --batch_size auto
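As a convenience, the last three benchmarks (hellaswag, winogrande, truthfulqa) use an identical `--model_args` string and differ only in task name and shot count, so they can be driven from a single loop. The sketch below is an assumption, not part of the model card; it reuses only flags and values that appear in the commands above, and the surrounding double quotes on the `pretrained=` value are dropped since the shell would strip them anyway.

```bash
#!/usr/bin/env bash
# Hypothetical wrapper (not from the model card): runs the three tasks that
# share the same --model_args shown in the diff above.
set -euo pipefail

# Same arguments as the updated + lines, minus the shell-stripped quotes.
MODEL_ARGS='pretrained=neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16,dtype=auto,add_bos_token=True,max_model_len=4096,tensor_parallel_size=1'

# task:num_fewshot pairs taken verbatim from the commands above
for spec in hellaswag:10 winogrande:5 truthfulqa:0; do
  task="${spec%%:*}"
  shots="${spec##*:}"
  lm_eval \
    --model vllm \
    --model_args "${MODEL_ARGS}" \
    --tasks "${task}" \
    --num_fewshot "${shots}" \
    --batch_size auto
done
```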