alexmarques committed on
Commit
7a4ffde
·
verified ·
1 Parent(s): d993353

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -3
README.md CHANGED
@@ -89,13 +89,13 @@ model = AutoModelForCausalLM.from_pretrained(
89
  model_stub, torch_dtype="auto", device_map="auto"
90
  )
91
 
 
 
92
  output_dir = f"./{model_name}-FP8-dynamic"
93
 
94
  oneshot(
95
  model=model,
96
  recipe=recipe,
97
- output_dir=output_dir,
98
- tokenizer=AutoTokenizer.from_pretrained(model_stub),
99
  )
100
 
101
  model.save_pretrained(output_dir, save_compressed=True, skip_sparsity_compression_stats=False)
@@ -110,7 +110,7 @@ The model was evaluated on the test split of [trl-lib/tldr](https://huggingface.
110
  One can reproduce these results by using the following command:
111
 
112
  ```bash
113
- lm_eval --model vllm --model_args "pretrained=RedHatAI/Sparse-Llama-3.1-8B-tldr-2of4-FP8-dynamic,dtype=auto,add_bos_token" --batch-size auto --tasks tldr
114
  ```
115
 
116
  <table>
 
89
  model_stub, torch_dtype="auto", device_map="auto"
90
  )
91
 
92
+ tokenizer = AutoTokenizer.from_pretrained(model_stub)
93
+
94
  output_dir = f"./{model_name}-FP8-dynamic"
95
 
96
  oneshot(
97
  model=model,
98
  recipe=recipe,
 
 
99
  )
100
 
101
  model.save_pretrained(output_dir, save_compressed=True, skip_sparsity_compression_stats=False)
 
110
  One can reproduce these results by using the following command:
111
 
112
  ```bash
113
+ lm_eval --model vllm --model_args "pretrained=RedHatAI/Sparse-Llama-3.1-8B-tldr-2of4-FP8-dynamic,dtype=auto,add_bos_token=True" --batch-size auto --tasks tldr
114
  ```
115
 
116
  <table>