fusion_nhwc_conv.py 3.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899
  1. # -------------------------------------------------------------------------
  2. # Copyright (c) Microsoft Corporation. All rights reserved.
  3. # Licensed under the MIT License.
  4. # --------------------------------------------------------------------------
  5. from logging import getLogger
  6. from fusion_base import Fusion
  7. from fusion_utils import FusionUtils
  8. from onnx import helper, numpy_helper
  9. from onnx_model import OnnxModel
  10. logger = getLogger(__name__)
  11. class FusionNhwcConv(Fusion):
  12. """Convert Conv to NhwcConv"""
  13. def __init__(self, model: OnnxModel, update_weight=False):
  14. super().__init__(model, "NhwcConv", ["Conv"], "NhwcConv")
  15. self.update_weight = update_weight
  16. self.fusion_utils = FusionUtils(model)
  17. def create_transpose_node(self, input_name: str, perm: list[int], output_name=None):
  18. """Append a Transpose node after an input"""
  19. node_name = self.model.create_node_name("Transpose")
  20. if output_name is None:
  21. output_name = node_name + "_out" + "-" + input_name
  22. transpose_node = helper.make_node("Transpose", inputs=[input_name], outputs=[output_name], name=node_name)
  23. transpose_node.attribute.extend([helper.make_attribute("perm", perm)])
  24. return transpose_node
  25. def fuse(self, conv, input_name_to_nodes, output_name_to_node):
  26. # Add Transpose node to convert input from NCHW to NHWC
  27. input_transpose_node = self.create_transpose_node(conv.input[0], [0, 2, 3, 1])
  28. nhwc_conv_input = input_transpose_node.output[0]
  29. # Create a tensor for transposed weights (already in NHWC format).
  30. node_name = self.model.create_node_name("NhwcConv")
  31. # Make sure the weights is 4D
  32. weight_tensor = self.model.get_initializer(conv.input[1])
  33. if weight_tensor is None:
  34. return
  35. weight = numpy_helper.to_array(weight_tensor)
  36. if len(weight.shape) != 4:
  37. return
  38. dtype = self.model.get_dtype(nhwc_conv_input)
  39. if not (dtype is not None and weight_tensor.data_type == dtype):
  40. cast_node = self.fusion_utils.add_cast_node(
  41. input_name=nhwc_conv_input,
  42. to_type=weight_tensor.data_type,
  43. output_name_to_node=output_name_to_node,
  44. )
  45. nhwc_conv_input = cast_node.output[0]
  46. if self.update_weight:
  47. # Transpose weights from NCHW to NHWC
  48. weight = weight.transpose(0, 2, 3, 1)
  49. weight_name = node_name + "_weight_NHWC"
  50. self.add_initializer(
  51. name=weight_name,
  52. data_type=weight_tensor.data_type,
  53. dims=list(weight.shape),
  54. vals=weight,
  55. )
  56. weight_transpose_node = None
  57. else:
  58. weight_transpose_node = self.create_transpose_node(conv.input[1], [0, 2, 3, 1])
  59. weight_name = weight_transpose_node.output[0]
  60. nhwc_output_name = node_name + "_out" + "-" + conv.output[0]
  61. nhwc_conv = helper.make_node(
  62. "NhwcConv",
  63. inputs=[nhwc_conv_input, weight_name, *conv.input[2:]],
  64. outputs=[nhwc_output_name],
  65. name=node_name + "-" + conv.name,
  66. )
  67. nhwc_conv.attribute.extend(conv.attribute)
  68. nhwc_conv.domain = "com.microsoft"
  69. output_transpose_node = self.create_transpose_node(nhwc_conv.output[0], [0, 3, 1, 2], conv.output[0])
  70. self.nodes_to_remove.append(conv)
  71. nodes_to_add = [input_transpose_node, nhwc_conv, output_transpose_node]
  72. if weight_transpose_node:
  73. nodes_to_add.append(weight_transpose_node)
  74. for node in nodes_to_add:
  75. self.node_name_to_graph_name[node.name] = self.this_graph_name
  76. self.nodes_to_add.extend(nodes_to_add)
  77. self.increase_counter("NhwcConv")