diff --git a/examples/models/llama/export_llama_lib.py b/examples/models/llama/export_llama_lib.py index 6d4e1de0c09..73e4cc865ff 100644 --- a/examples/models/llama/export_llama_lib.py +++ b/examples/models/llama/export_llama_lib.py @@ -662,7 +662,6 @@ def _validate_args(args): def _export_llama(args) -> LLMEdgeManager: # noqa: C901 _validate_args(args) - pt2e_quant_params, quantizers, quant_dtype = get_quantizer_and_quant_params(args) # export_to_edge builder_exported = _prepare_for_llama_export(args).export() @@ -670,9 +669,16 @@ def _export_llama(args) -> LLMEdgeManager: # noqa: C901 if args.export_only: exit() - builder_exported_to_edge = builder_exported.pt2e_quantize( - quantizers - ).export_to_edge() + if args.pt2e_quantize: + pt2e_quant_params, quantizers, quant_dtype = get_quantizer_and_quant_params( + args + ) + builder_exported_to_edge = builder_exported.pt2e_quantize( + quantizers + ).export_to_edge() + else: + pt2e_quant_params = None + builder_exported_to_edge = builder_exported.export_to_edge() modelname = builder_exported_to_edge.modelname