diff --git a/src/brevitas_examples/llm/main.py b/src/brevitas_examples/llm/main.py index 7a9e6ba4e..5237c31c7 100644 --- a/src/brevitas_examples/llm/main.py +++ b/src/brevitas_examples/llm/main.py @@ -170,7 +170,6 @@ choices=[ None, 'onnx_qcdq', - 'packed_onnx', 'torch_qcdq', 'sharded_torchmlir_group_weight', 'sharded_packed_torchmlir_group_weight'], @@ -191,8 +190,6 @@ def model_export(model, ref_input, args): from brevitas_examples.llm.llm_quant.sharded_mlir_group_export import \ sharded_weight_group_export sharded_weight_group_export(model, no_custom_packed_export=False) - elif args.export_target == 'packed_onnx': - export_packed_onnx(model, ref_input, export_path=f"{args.model.replace('/', '-')}.onnx") elif args.export_target == 'onnx_qcdq': if args.weight_quant_granularity == 'per_group': export_manager = BlockQuantProxyLevelManager