File tree Expand file tree Collapse file tree 2 files changed +2
-2
lines changed Expand file tree Collapse file tree 2 files changed +2
-2
lines changed Original file line number Diff line number Diff line change @@ -191,7 +191,7 @@ def gen_eval_wrapper(
191
191
192
192
pt2e_quant_params , quantizers , quant_dtype = get_quantizer_and_quant_params (args )
193
193
# GPTFastEvalWrapper: Create a wrapper around a pre-exported model
194
- manager : LLMEdgeManager = _prepare_for_llama_export (model_name , args )
194
+ manager : LLMEdgeManager = _prepare_for_llama_export (args )
195
195
196
196
if len (quantizers ) != 0 :
197
197
manager = manager .export ().pt2e_quantize (quantizers )
Original file line number Diff line number Diff line change @@ -38,7 +38,7 @@ def __init__(self, args):
38
38
model_args = model_args ,
39
39
device = "cuda" if torch .cuda .is_available () else "cpu" ,
40
40
)
41
- manager : LLMEdgeManager = _prepare_for_llama_export ("llama" , args )
41
+ manager : LLMEdgeManager = _prepare_for_llama_export (args )
42
42
self .model = manager .model .eval ().to (device = self .device )
43
43
44
44
def forward (
You can’t perform that action at this time.
0 commit comments