# Lint as: python3
"""SHARK Importer"""

import os
import sys
import tempfile

# List of the supported frontends.
supported_frontends = {
    "tensorflow",
    "tf",
    "pytorch",
    "torch",
    "tf-lite",
    "tflite",
}

class SharkImporter:
    """
    SharkImporter converts frontend modules into an
    MLIR module. The supported frameworks are TensorFlow,
    PyTorch, and TFLite.

    Attributes
    ----------
    module :
        torch, tensorflow, or tf-lite module.
    inputs :
        inputs to the module; may be required for the shape
        information.
    frontend : str
        frontend to which the module belongs.
    raw_model_file : str
        temporary tflite model path.

    Methods
    -------
    import_mlir(is_dynamic, tracing_required, func_name):
        is_dynamic: whether the input shapes are fully dynamic (PyTorch-specific).
        tracing_required: whether tracing is required (PyTorch-specific).
        func_name: the function to be traced out or imported to MLIR.
    import_debug(is_dynamic, tracing_required, func_name):
        returns the converted (mlir_module, func_name) together with the
        inputs and golden outputs, both converted into numpy arrays.
    """

    def __init__(
        self,
        module,
        inputs: tuple = (),
        frontend: str = "torch",
        raw_model_file: str = "",
    ):
        self.module = module
        self.inputs = None if len(inputs) == 0 else inputs
        self.frontend = frontend
        if self.frontend not in supported_frontends:
            print(
                f"The frontend is not in the supported frontends: {supported_frontends}"
            )
            sys.exit(1)
        self.raw_model_file = raw_model_file

    # NOTE: The default function name is "forward" for torch and "main" for tf-lite.
    def _torch_mlir(self, is_dynamic, tracing_required):
        from shark.torch_mlir_utils import get_torch_mlir_module

        return get_torch_mlir_module(
            self.module, self.inputs, is_dynamic, tracing_required
        )

    def _tf_mlir(self, func_name, save_dir="./shark_tmp/"):
        from iree.compiler import tf as tfc

        return tfc.compile_module(
            self.module,
            exported_names=[func_name],
            import_only=True,
            output_file=save_dir,
        )

    def _tflite_mlir(self, func_name, save_dir="./shark_tmp/"):
        from iree.compiler import tflite as tflitec

        self.mlir_model = tflitec.compile_file(
            # For tflite this is a path to the .tflite file, not a tflite interpreter.
            self.raw_model_file,
            input_type="tosa",
            import_only=True,
            output_file=save_dir,
        )
        return self.mlir_model

    # Dispatches the conversion to the frontend-specific private function.
    def import_mlir(
        self,
        is_dynamic=False,
        tracing_required=False,
        func_name="forward",
        save_dir="./shark_tmp/",
    ):
        if self.frontend in ["torch", "pytorch"]:
            if self.inputs is None:
                print(
                    "Please pass in the inputs; they are required to determine the shape of the mlir_module."
                )
                sys.exit(1)
            return self._torch_mlir(is_dynamic, tracing_required), func_name
        if self.frontend in ["tf", "tensorflow"]:
            return self._tf_mlir(func_name, save_dir), func_name
        if self.frontend in ["tflite", "tf-lite"]:
            func_name = "main"
            return self._tflite_mlir(func_name, save_dir), func_name

    # Converts the frontend-specific tensors into numpy arrays.
    def convert_to_numpy(self, array_tuple: tuple):
        if self.frontend in ["torch", "pytorch"]:
            return [x.detach().cpu().numpy() for x in array_tuple]
        if self.frontend in ["tf", "tensorflow"]:
            return [x.numpy() for x in array_tuple]

    # Saves `function_name.npy`, `inputs.npz`, `golden_out.npz`, and
    # `model_name.mlir` in the directory `dir`.
    def save_data(
        self, dir, model_name, mlir_data, func_name, inputs, outputs
    ):
        import numpy as np

        inputs_name = "inputs.npz"
        outputs_name = "golden_out.npz"
        func_file_name = "function_name"
        model_name_mlir = model_name + "_" + self.frontend + ".mlir"
        try:
            # Torch tensors have to be moved to the CPU and detached first.
            inputs = [x.cpu().detach() for x in inputs]
        except AttributeError:
            try:
                # TensorFlow tensors expose .numpy().
                inputs = [x.numpy() for x in inputs]
            except AttributeError:
                inputs = list(inputs)
        np.savez(os.path.join(dir, inputs_name), *inputs)
        np.savez(os.path.join(dir, outputs_name), *outputs)
        np.save(os.path.join(dir, func_file_name), np.array(func_name))
        if self.frontend == "torch":
            with open(os.path.join(dir, model_name_mlir), "wb") as mlir_file:
                mlir_file.write(mlir_data)
        return
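    # A minimal reload sketch (an assumption based on the default file names
    # used above, not an API this class provides): the saved artifacts can be
    # read back with numpy, e.g.
    #
    #   data = np.load(os.path.join(dir, "inputs.npz"))
    #   inputs = [data[k] for k in data.files]
    #   golden = np.load(os.path.join(dir, "golden_out.npz"))
    #   outputs = [golden[k] for k in golden.files]
    #   func_name = str(np.load(os.path.join(dir, "function_name.npy")))
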
    def import_debug(
        self,
        is_dynamic=False,
        tracing_required=False,
        func_name="forward",
        dir=tempfile.gettempdir(),
        model_name="model",
    ):
        if self.inputs is None:
            print(
                f"No inputs were provided: {self.inputs}; please provide inputs or simply run import_mlir."
            )
            sys.exit(1)
        model_name_mlir = model_name + "_" + self.frontend + ".mlir"
        artifact_path = os.path.join(dir, model_name_mlir)
        imported_mlir = self.import_mlir(
            is_dynamic,
            tracing_required,
            func_name,
            save_dir=artifact_path,
        )
        # TODO: Make sure that any generic function name is accepted.
        # Currently only the default function names are taken in.
        # TODO: Check for multiple outputs.
        if self.frontend in ["torch", "pytorch"]:
            import torch

            golden_out = self.module(*self.inputs)
            if torch.is_tensor(golden_out):
                # Wrap a single tensor output in a one-element tuple.
                golden_out = (golden_out.detach().cpu().numpy(),)
            else:
                golden_out = self.convert_to_numpy(golden_out)
            # Save the artifacts in the directory `dir`.
            self.save_data(
                dir,
                model_name,
                imported_mlir[0],
                imported_mlir[1],
                self.inputs,
                golden_out,
            )
            return (
                imported_mlir,
                self.convert_to_numpy(self.inputs),
                golden_out,
            )
if self.frontend in ["tf", "tensorflow"]: | |
import tensorflow as tf | |
golden_out = self.module.forward(*self.inputs) | |
if tf.is_tensor(golden_out): | |
golden_out = tuple( | |
golden_out.numpy(), | |
) | |
elif golden_out is tuple: | |
golden_out = self.convert_to_numpy(golden_out) | |
elif hasattr(golden_out, "logits"): | |
# from transformers import TFSequenceClassifierOutput | |
golden_out = golden_out.logits | |
else: | |
golden_out = golden_out.last_hidden_state | |
# Save the artifacts in the directory dir. | |
self.save_data( | |
dir, | |
model_name, | |
imported_mlir[0], | |
imported_mlir[1], | |
self.inputs, | |
golden_out, | |
) | |
return ( | |
imported_mlir, | |
self.convert_to_numpy(self.inputs), | |
golden_out, | |
) | |
if self.frontend in ["tflite", "tf-lite"]: | |
# TODO(Chi): Validate it for tflite models. | |
golden_out = self.module.invoke_tflite(self.inputs) | |
self.save_data( | |
dir, | |
model_name, | |
imported_mlir[0], | |
imported_mlir[1], | |
self.inputs, | |
golden_out, | |
) | |
return ( | |
imported_mlir, | |
self.inputs, | |
golden_out, | |
) | |
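# Example usage (a minimal sketch; `MyModule` and the input shape are
# hypothetical and not part of this file):
#
#   import torch
#
#   model = MyModule()
#   example_input = torch.randn(1, 3, 224, 224)
#   importer = SharkImporter(model, (example_input,), frontend="torch")
#   mlir_module, func_name = importer.import_mlir(tracing_required=True)
#   # To also get numpy inputs and golden outputs for verification:
#   (mlir_module, func_name), np_inputs, golden_out = importer.import_debug()
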
# Applies an FX tracing pass to the model and imports the resulting MLIR.
def import_with_fx(model, inputs, debug=False):
    import torch
    from torch.fx.experimental.proxy_tensor import make_fx
    from torch._decomp import get_decompositions

    # TODO: Control the decompositions.
    fx_g = make_fx(
        model,
        decomposition_table=get_decompositions(
            [
                torch.ops.aten.embedding_dense_backward,
                torch.ops.aten.native_layer_norm_backward,
                torch.ops.aten.slice_backward,
                torch.ops.aten.select_backward,
                torch.ops.aten.norm.ScalarOpt_dim,
                torch.ops.aten.native_group_norm,
                torch.ops.aten.upsample_bilinear2d.vec,
                torch.ops.aten.split.Tensor,
                torch.ops.aten.split_with_sizes,
                torch.ops.aten.native_layer_norm,
            ]
        ),
    )(*inputs)
    fx_g.graph.set_codegen(torch.fx.graph.CodeGen())
    fx_g.recompile()

    def strip_overloads(gm):
        """
        Modifies the target of graph nodes in :attr:`gm` to strip overloads.

        Args:
            gm (fx.GraphModule): The input FX graph module to be modified.
        """
        for node in gm.graph.nodes:
            if isinstance(node.target, torch._ops.OpOverload):
                node.target = node.target.overloadpacket
        gm.recompile()

    strip_overloads(fx_g)
    # Cast both the graph module and its inputs to fp16 before scripting.
    fx_g.half()
    scripted = torch.jit.script(fx_g)
    inputs = tuple([x.half() for x in inputs])
    mlir_importer = SharkImporter(
        scripted,
        inputs,
        frontend="torch",
    )
    if debug:
        (mlir_module, func_name), _, _ = mlir_importer.import_debug()
        return mlir_module, func_name
    mlir_module, func_name = mlir_importer.import_mlir()
    return mlir_module, func_name
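
# Example usage (a minimal sketch; the toy model and input are hypothetical.
# Note that import_with_fx casts both the model and the inputs to fp16):
#
#   import torch
#
#   model = torch.nn.Sequential(torch.nn.Linear(4, 4), torch.nn.ReLU())
#   mlir_module, func_name = import_with_fx(model, (torch.randn(1, 4),))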