|
140 | 140 | } |
141 | 141 | }, |
142 | 142 | { |
143 | | - "test_name": "latency_gemma3_12b_it_fp8", |
| 143 | + "test_name": "latency_gemma3_12b_it_fp8_torchao", |
144 | 144 | "parameters": { |
145 | 145 | "model": "pytorch/gemma-3-12b-it-FP8", |
146 | 146 | "load_format": "dummy", |
|
149 | 149 | } |
150 | 150 | }, |
151 | 151 | { |
152 | | - "test_name": "latency_gemma3_12b_it_int4", |
| 152 | + "test_name": "latency_gemma3_12b_it_int4_torchao", |
153 | 153 | "parameters": { |
154 | 154 | "model": "pytorch/gemma-3-12b-it-INT4", |
155 | 155 | "load_format": "dummy", |
|
158 | 158 | } |
159 | 159 | }, |
160 | 160 | { |
161 | | - "test_name": "latency_gemma3_12b_it_awq_int4", |
| 161 | + "test_name": "latency_gemma3_12b_it_awq_int4_torchao", |
162 | 162 | "parameters": { |
163 | 163 | "model": "pytorch/gemma-3-12b-it-AWQ-INT4", |
164 | 164 | "load_format": "dummy", |
|
167 | 167 | } |
168 | 168 | }, |
169 | 169 | { |
170 | | - "test_name": "latency_gemma3_27b_it_fp8", |
| 170 | + "test_name": "latency_gemma3_27b_it_fp8_torchao", |
171 | 171 | "parameters": { |
172 | 172 | "model": "pytorch/gemma-3-27b-it-FP8", |
173 | 173 | "load_format": "dummy", |
|
176 | 176 | } |
177 | 177 | }, |
178 | 178 | { |
179 | | - "test_name": "latency_gemma3_27b_it_int4", |
| 179 | + "test_name": "latency_gemma3_27b_it_int4_torchao", |
180 | 180 | "parameters": { |
181 | 181 | "model": "pytorch/gemma-3-27b-it-INT4", |
182 | 182 | "load_format": "dummy", |
|
185 | 185 | } |
186 | 186 | }, |
187 | 187 | { |
188 | | - "test_name": "latency_gemma3_27b_it_awq_int4", |
| 188 | + "test_name": "latency_gemma3_27b_it_awq_int4_torchao", |
189 | 189 | "parameters": { |
190 | 190 | "model": "pytorch/gemma-3-27b-it-AWQ-INT4", |
191 | 191 | "load_format": "dummy", |
|
0 commit comments