examples/qualcomm/scripts/export_example.py - platform/external/executorch - Git at Google

 import argparse

 import torch
 from backends.qualcomm.serialization.qnn_compile_spec_schema import QcomChipset
 from executorch.backends.qualcomm.partition.qnn_partitioner import QnnPartitioner
 from executorch.backends.qualcomm.quantizer.quantizer import (
     get_default_8bit_qnn_ptq_config,
     QnnQuantizer,
 )
 from executorch.backends.qualcomm.utils.utils import (
     capture_program,
     generate_qnn_executorch_compiler_spec,
 )
 from executorch.examples.models import MODEL_NAME_TO_MODEL
 from executorch.examples.models.model_factory import EagerModelFactory
 from executorch.examples.portable.utils import save_pte_program
 from executorch.exir.backend.backend_api import to_backend, validation_disabled
 from executorch.exir.capture._config import ExecutorchBackendConfig

 from torch.ao.quantization.quantize_pt2e import convert_pt2e, prepare_pt2e

 if __name__ == "__main__":
     # Command line: a single mandatory option naming the example model.
     cli = argparse.ArgumentParser()
     cli.add_argument(
         "-m",
         "--model_name",
         required=True,
         help=f"provide a model name. Valid ones: {list(MODEL_NAME_TO_MODEL.keys())}",
     )
     args = cli.parse_args()

     # Reject names that are missing from the registry before building anything.
     if args.model_name not in MODEL_NAME_TO_MODEL:
         raise RuntimeError(
             f"Model {args.model_name} is not a valid name. "
             f"Available models are {list(MODEL_NAME_TO_MODEL.keys())}."
         )

     # The registry entry is unpacked into create_model's positional arguments;
     # the third element of the returned tuple is not used by this script.
     registry_entry = MODEL_NAME_TO_MODEL[args.model_name]
     eager_model, sample_inputs, _ = EagerModelFactory.create_model(*registry_entry)

     # Quantizer set up with the default 8-bit QNN PTQ config.
     ptq_quantizer = QnnQuantizer()
     ptq_quantizer.set_bit8_op_quant_config(get_default_8bit_qnn_ptq_config())

     # PyTorch 2.0 quantization flow: capture the graph of the model in eval
     # mode, prepare it with the quantizer, run the example inputs once as
     # calibration, then convert to obtain the quantized model.
     captured_graph = torch._export.capture_pre_autograd_graph(
         eager_model.eval(), sample_inputs
     )
     prepared_graph = prepare_pt2e(captured_graph, ptq_quantizer)
     prepared_graph(*sample_inputs)
     quantized_graph = convert_pt2e(prepared_graph)

     # Capture program for edge IR.
     edge_program = capture_program(quantized_graph, sample_inputs)

     # Partitioner for the QNN backend; the compiler spec is fixed to the
     # SM8550 chipset with fp16, debug and saver all switched off.
     compiler_specs = generate_qnn_executorch_compiler_spec(
         is_fp16=False,
         soc_model=QcomChipset.SM8550,
         debug=False,
         saver=False,
     )
     qnn_partitioner = QnnPartitioner(compiler_specs)

     # Delegation happens in place: the exported program held by edge_program
     # is replaced by the result of to_backend while validation is disabled.
     with validation_disabled():
         edge_program.exported_program = to_backend(
             edge_program.exported_program, qnn_partitioner
         )

     # Lower to an ExecuTorch program and hand its buffer, together with the
     # model name, to save_pte_program.
     backend_config = ExecutorchBackendConfig(extract_constant_segment=False)
     executorch_program = edge_program.to_executorch(config=backend_config)
     save_pte_program(executorch_program.buffer, args.model_name)
	import argparse

	import torch
	from backends.qualcomm.serialization.qnn_compile_spec_schema import QcomChipset
	from executorch.backends.qualcomm.partition.qnn_partitioner import QnnPartitioner
	from executorch.backends.qualcomm.quantizer.quantizer import (
	get_default_8bit_qnn_ptq_config,
	QnnQuantizer,
	)
	from executorch.backends.qualcomm.utils.utils import (
	capture_program,
	generate_qnn_executorch_compiler_spec,
	)
	from executorch.examples.models import MODEL_NAME_TO_MODEL
	from executorch.examples.models.model_factory import EagerModelFactory
	from executorch.examples.portable.utils import save_pte_program
	from executorch.exir.backend.backend_api import to_backend, validation_disabled
	from executorch.exir.capture._config import ExecutorchBackendConfig

	from torch.ao.quantization.quantize_pt2e import convert_pt2e, prepare_pt2e

	if __name__ == "__main__":
	    # Script entry point: quantize the example model named on the command
	    # line, delegate it to the QNN backend and save the resulting program.

	    # The only option is the mandatory model name.
	    parser = argparse.ArgumentParser()
	    parser.add_argument(
	        "-m",
	        "--model_name",
	        required=True,
	        help=f"provide a model name. Valid ones: {list(MODEL_NAME_TO_MODEL.keys())}",
	    )

	    args = parser.parse_args()

	    # Fail early, listing the valid names, when the model is not registered.
	    if args.model_name not in MODEL_NAME_TO_MODEL:
	        raise RuntimeError(
	            f"Model {args.model_name} is not a valid name. "
	            f"Available models are {list(MODEL_NAME_TO_MODEL.keys())}."
	        )

	    # The registry entry is unpacked into create_model's positional
	    # arguments; the third returned element is ignored here.
	    model, example_inputs, _ = EagerModelFactory.create_model(
	        *MODEL_NAME_TO_MODEL[args.model_name]
	    )

	    # Get quantizer, configured with the default 8-bit QNN PTQ config.
	    quantizer = QnnQuantizer()
	    quant_config = get_default_8bit_qnn_ptq_config()
	    quantizer.set_bit8_op_quant_config(quant_config)

	    # Typical pytorch 2.0 quantization flow
	    m = torch._export.capture_pre_autograd_graph(model.eval(), example_inputs)
	    m = prepare_pt2e(m, quantizer)
	    # Calibration: a single pass over the example inputs.
	    m(*example_inputs)
	    # Get the quantized model
	    m = convert_pt2e(m)

	    # Capture program for edge IR
	    edge_program = capture_program(m, example_inputs)

	    # Delegate to QNN backend; the compiler spec is fixed to the SM8550
	    # chipset with fp16, debug and saver all switched off.
	    qnn_partitioner = QnnPartitioner(
	        generate_qnn_executorch_compiler_spec(
	            is_fp16=False,
	            soc_model=QcomChipset.SM8550,
	            debug=False,
	            saver=False,
	        )
	    )
	    with validation_disabled():
	        # delegated_program is the same object as edge_program; only its
	        # exported_program attribute is replaced by the to_backend result.
	        delegated_program = edge_program
	        delegated_program.exported_program = to_backend(
	            edge_program.exported_program, qnn_partitioner
	        )

	    # Lower to an ExecuTorch program and pass its buffer, together with the
	    # model name, to save_pte_program.
	    executorch_program = delegated_program.to_executorch(
	        config=ExecutorchBackendConfig(extract_constant_segment=False)
	    )
	    save_pte_program(executorch_program.buffer, args.model_name)