
Commit 2c079e5

Map more elementwise ops to LLGA (#874)
1 parent c31d354 commit 2c079e5
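
This commit maps additional aten elementwise ops (round, exp, clamp, hardswish, log) to oneDNN Graph (LLGA) op kinds so they can join LLGA fusion groups, and it converts hardtanh/clamp bounds through a new Operator::ScalarToFloat helper that accepts integer as well as floating-point scalars. The sketch below is illustrative only and is not part of the commit; it assumes an IPEX build that exposes ipex.enable_onednn_fusion() and the usual trace-and-freeze inference workflow.

import torch
import torch.nn as nn
import intel_extension_for_pytorch as ipex

class ConvRound(nn.Module):
    """conv2d followed by one of the newly mapped eltwise ops (aten::round)."""
    def __init__(self):
        super(ConvRound, self).__init__()
        self.conv = nn.Conv2d(32, 32, 3, padding=1, bias=True)

    def forward(self, x):
        return torch.round(self.conv(x))

ipex.enable_onednn_fusion(True)          # route TorchScript graphs through LLGA
m = ConvRound().eval()
x = torch.rand(1, 32, 28, 28)
with torch.no_grad():
    traced = torch.jit.freeze(torch.jit.trace(m, x))
    traced(x)                            # warm-up runs let the fuser rewrite the graph
    print(traced.graph_for(x))           # conv + round is expected to appear as one LLGA fusion group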

File tree

4 files changed: +101 −5 lines

  intel_extension_for_pytorch/csrc/jit/codegen/onednn/graph_helper.cpp
  intel_extension_for_pytorch/csrc/jit/codegen/onednn/operator.h
  tests/cpu/test_ao_jit_llga_quantization_fuser.py
  tests/cpu/test_jit_llga_fuser.py


intel_extension_for_pytorch/csrc/jit/codegen/onednn/graph_helper.cpp

Lines changed: 25 additions & 2 deletions
@@ -229,16 +229,39 @@ Operator LlgaGraphHelper::createOperator(Node* node) const {
     return makeEltwiseOp(node, opkind::Sigmoid);
   } else if (nodeKind == Symbol::aten("gelu")) {
     return makeEltwiseOp(node, opkind::GELU);
+  } else if (nodeKind == Symbol::aten("round")) {
+    return makeEltwiseOp(node, opkind::Round);
+  } else if (nodeKind == Symbol::aten("exp")) {
+    return makeEltwiseOp(node, opkind::Exp);
   } else if (nodeKind == Symbol::aten("sqrt")) {
     return makeEltwiseOp(node, opkind::Sqrt);
   } else if (nodeKind == Symbol::aten("abs")) {
     return makeEltwiseOp(node, opkind::Abs);
   } else if (nodeKind == Symbol::aten("square")) {
     return makeEltwiseOp(node, opkind::Square);
+  } else if (nodeKind == Symbol::aten("clamp")) {
+    // PyTorch API already checks that both min & max are not None.
+    // But we can check it nevertheless.
+    auto clamp_min = toIValue(node->input(1));
+    auto clamp_max = toIValue(node->input(2));
+    REQ(!(clamp_max->isNone() && clamp_min->isNone()));
+    auto clamp_min_value = (clamp_min->isNone())
+        ? -std::numeric_limits<float>::infinity()
+        : Operator::ScalarToFloat(node, 1);
+    auto clamp_max_value = (clamp_max->isNone())
+        ? std::numeric_limits<float>::infinity()
+        : Operator::ScalarToFloat(node, 2);
+    return makeEltwiseOp(node, opkind::Clamp)
+        .setAttr("min", clamp_min_value)
+        .setAttr("max", clamp_max_value);
   } else if (nodeKind == Symbol::aten("hardtanh")) {
     return makeEltwiseOp(node, opkind::HardTanh)
-        .setAttr("min", Operator::Float, 1)
-        .setAttr("max", Operator::Float, 2);
+        .setAttr("min", Operator::ScalarToFloat, 1)
+        .setAttr("max", Operator::ScalarToFloat, 2);
+  } else if (nodeKind == Symbol::aten("hardswish")) {
+    return makeEltwiseOp(node, opkind::HardSwish);
+  } else if (nodeKind == Symbol::aten("log")) {
+    return makeEltwiseOp(node, opkind::Log);
   } else if (nodeKind == Symbol::aten("leaky_relu")) {
     return makeEltwiseOp(node, opkind::LeakyReLU)
         .setAttr("alpha", Operator::Float, 1);

intel_extension_for_pytorch/csrc/jit/codegen/onednn/operator.h

Lines changed: 4 additions & 0 deletions
@@ -69,6 +69,10 @@ class Operator {
     return static_cast<float>(toIValue(node->input(offset))->toDouble());
   }
 
+  static float ScalarToFloat(const Node* node, size_t offset) {
+    return toIValue(node->input(offset))->toScalar().to<float>();
+  }
+
   static std::vector<float> FloatValueToVector(float value) {
     return {value};
   }
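
The existing Operator::Float helper visible in the surrounding context converts through toDouble(), so it only handles scalars stored as doubles. The new ScalarToFloat converts through toScalar(), which also covers integer scalars such as the int literals used for clamp/hardtanh bounds in the tests below. A minimal illustration (assumed example, not from the commit) of why a bound may arrive as an int rather than a double:

import torch

@torch.jit.script
def clamped(x: torch.Tensor):
    # int literals stay int-typed Scalar constants in the TorchScript graph,
    # so the LLGA bridge cannot assume the min/max IValues are doubles
    return torch.clamp(x, min=-5, max=2)

print(clamped.graph)   # the min/max inputs show up as int constants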

tests/cpu/test_ao_jit_llga_quantization_fuser.py

Lines changed: 36 additions & 1 deletion
@@ -41,6 +41,8 @@ def get_eltwise_fn(name):
     elif hasattr(F, name):
         return getattr(F, name)
     else:
+        if name == 'hardswish_':
+            return torch.nn.Hardswish(inplace=True);
         raise NameError('Eltwise function %s not found' % name)
 
 class TestOp(JitLlgaTestCase):
@@ -350,7 +352,8 @@ def forward(self, x):
                 x = self.conv2(x)
                 return x
 
-        for eltwise in ['relu', 'leaky_relu']: # TODO: ['sigmoid', 'sqrt', 'abs', 'square', 'hardtanh']
+        for eltwise in ['relu', 'leaky_relu', 'sigmoid', 'round', 'abs', 'square',
+                        'abs', 'round', 'exp', 'hardswish', 'tanh', 'hardtanh']:
             for inplace in [False, True]:
                 for memory_format in [torch.contiguous_format, torch.channels_last]:
                     eltwise_fn_name = eltwise + '_' if inplace else eltwise
@@ -369,6 +372,38 @@ def forward(self, x):
                     self.assertFused(graph, ['aten::_convolution', 'aten::' + eltwise, 'aten::quantize_per_channel', 'aten::dequantize'])
                     self.checkPatterns(graph, patterns)
 
+    def test_conv2d_clamp(self):
+        class M(nn.Module):
+            def __init__(self):
+                super(M, self).__init__()
+                self.conv1 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+                self.conv2 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+                self.conv3 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+                self.conv4 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+                self.conv5 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+
+            def forward(self, x):
+                x = self.conv1(x)
+                x = torch.clamp(x, min=float('-inf'))
+                x = self.conv2(x)
+                x = torch.clamp(x, min=-5)
+                x = self.conv3(x)
+                x = torch.clamp(x, min=0, max=float('inf'))
+                x = self.conv4(x)
+                x = torch.clamp(x, min=1, max=5)
+                x = self.conv5(x)
+                x = torch.clamp(x, max=2)
+                return x
+
+        for inplace in [False, True]:
+            for memory_format in [torch.contiguous_format, torch.channels_last]:
+                x = torch.rand(1, 32, 28, 28).to(memory_format=memory_format)
+                m = M()
+                for qconfig in static_qconfig:
+                    graph = self.checkQuantizeTrace(m, [x], atol=2e-1, qconfig=qconfig)
+                    self.assertGraphContainsExactly(graph, LLGA_FUSION_GROUP, 5)
+                    self.assertFused(graph, ['aten::_convolution', 'aten::' + "clamp", 'aten::quantize_per_channel', 'aten::dequantize'])
+
     def test_ensure_tensor_is_rewrapped(self):
         class M(nn.Module):
             def __init__(self, eltwise_fn):

tests/cpu/test_jit_llga_fuser.py

Lines changed: 36 additions & 2 deletions
@@ -22,6 +22,8 @@ def get_eltwise_fn(name):
     elif hasattr(F, name):
         return getattr(F, name)
     else:
+        if name == 'hardswish_':
+            return torch.nn.Hardswish(inplace=True);
         raise NameError('Eltwise function %s not found' % name)
 
 
@@ -414,8 +416,8 @@ def forward(self, x):
                 x = self.eltwise(x)
                 return x
 
-        # for eltwise in ['relu', 'sigmoid', 'sqrt', 'abs', 'square', 'hardtanh']:
-        for eltwise in ['relu']:
+        for eltwise in ['relu', 'leaky_relu', 'sigmoid', 'round', 'abs', 'square',
+                        'abs', 'round', 'exp', 'hardswish', 'tanh', 'hardtanh']:
             for inplace in [True, False]:
                 eltwise_fn_name = eltwise + '_' if inplace else eltwise
                 eltwise_fn = get_eltwise_fn(eltwise_fn_name)
@@ -429,6 +431,38 @@ def forward(self, x):
                # test if relu is fused into the fusion group
                self.assertFused(graph, ['aten::' + eltwise])
 
+    @llga_fp32_bf16_test_env
+    def test_conv2d_clamp(self):
+        class M(nn.Module):
+            def __init__(self):
+                super(M, self).__init__()
+                self.conv1 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+                self.conv2 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+                self.conv3 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+                self.conv4 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+                self.conv5 = nn.Conv2d(32, 32, 3, padding=1, bias=True)
+
+            def forward(self, x):
+                x = self.conv1(x)
+                x = torch.clamp(x, min=float('-inf'))
+                x = self.conv2(x)
+                x = torch.clamp(x, min=-5)
+                x = self.conv3(x)
+                x = torch.clamp(x, min=0, max=float('inf'))
+                x = self.conv4(x)
+                x = torch.clamp(x, min=1, max=5)
+                x = self.conv5(x)
+                x = torch.clamp(x, max=2)
+                return x
+
+        for inplace in [False, True]:
+            for memory_format in [torch.contiguous_format, torch.channels_last]:
+                x = torch.rand(1, 32, 28, 28).to(memory_format=memory_format)
+                m = M()
+                graph, _ = self.checkTrace(m, [x])
+                self.assertGraphContainsExactly(graph, LLGA_FUSION_GROUP, 5)
+                self.assertFused(graph, ['aten::_convolution', "aten::clamp"])
+
     @llga_fp32_bf16_test_env
     def test_ensure_tensor_is_rewrapped(self):
         class M(nn.Module):
