examples/models/llama2/llama_test.py - platform/external/executorch - Git at Google

 # Copyright (c) Meta Platforms, Inc. and affiliates.
 # All rights reserved.
 #
 # This source code is licensed under the BSD-style license found in the
 # LICENSE file in the root directory of this source tree.

 import unittest

 from .export_llama import build_model


 class LlamaTest(unittest.TestCase):
     """Smoke tests that call ``build_model`` with different option strings.

     Neither test inspects the value returned by ``build_model``; a test
     passes when the call completes without raising.
     """

     def _export(self, options):
         """Call ``build_model`` for "model", passing ``options`` as ``extra_opts``."""
         return build_model(
             modelname="model",
             extra_opts=options,
             par_local_output=True,
             resource_pkg_name=__name__,
         )

     def test_quantized_llama(self):
         # Exercise the "-qmode int8" option string; the result is discarded.
         self._export("--fairseq2 -qmode int8")

     def test_half_llama(self):
         # Exercise the "-d fp16" option string; the result is discarded.
         self._export("--fairseq2 -d fp16")


 #    def test_half_xnnpack_llama(self):
 #        output_path = build_model(
 #            modelname="model",
 #            extra_opts="--fairseq2 -d fp16 -X",
 #            par_local_output=True,
 #            resource_pkg_name=__name__,
 #        )
	# Copyright (c) Meta Platforms, Inc. and affiliates.
	# All rights reserved.
	#
	# This source code is licensed under the BSD-style license found in the
	# LICENSE file in the root directory of this source tree.

	import unittest

	from .export_llama import build_model


	class LlamaTest(unittest.TestCase):
	    """Smoke tests that call ``build_model`` with different option strings.

	    Neither test inspects the value returned by ``build_model``; a test
	    passes when the call completes without raising.
	    """

	    def test_quantized_llama(self):
	        # Exercise the "-qmode int8" option string; the result is discarded.
	        _ = build_model(
	            modelname="model",
	            extra_opts="--fairseq2 -qmode int8",
	            par_local_output=True,
	            resource_pkg_name=__name__,
	        )

	    def test_half_llama(self):
	        # Exercise the "-d fp16" option string; the result is discarded.
	        _ = build_model(
	            modelname="model",
	            extra_opts="--fairseq2 -d fp16",
	            par_local_output=True,
	            resource_pkg_name=__name__,
	        )


	#    def test_half_xnnpack_llama(self):
	#        output_path = build_model(
	#            modelname="model",
	#            extra_opts="--fairseq2 -d fp16 -X",
	#            par_local_output=True,
	#            resource_pkg_name=__name__,
	#        )