nm-research committed on
Commit
4ef76e4
·
verified ·
1 Parent(s): 24b86ed

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -2
README.md CHANGED
@@ -39,7 +39,7 @@ from vllm import LLM, SamplingParams
39
 
40
  # prepare model
41
  llm = LLM(
42
- model="nm-testing/gemma-3-1b-it-quantized.w8a8",
43
  trust_remote_code=True,
44
  max_model_len=4096,
45
  max_num_seqs=2,
@@ -183,7 +183,7 @@ lm_eval \
183
  <th>Category</th>
184
  <th>Metric</th>
185
  <th>google/gemma-3-1b-it</th>
186
- <th>nm-testing/gemma-3-1b-it-quantized.w8a8</th>
187
  <th>Recovery (%)</th>
188
  </tr>
189
  </thead>
 
39
 
40
  # prepare model
41
  llm = LLM(
42
+ model="RedHatAI/gemma-3-1b-it-quantized.w8a8",
43
  trust_remote_code=True,
44
  max_model_len=4096,
45
  max_num_seqs=2,
 
183
  <th>Category</th>
184
  <th>Metric</th>
185
  <th>google/gemma-3-1b-it</th>
186
+ <th>RedHatAI/gemma-3-1b-it-quantized.w8a8</th>
187
  <th>Recovery (%)</th>
188
  </tr>
189
  </thead>