update llga to 0887652, keep oneDNN as v2.7 (#1256)

chunyuan-w · web-flow · commit ac8b947dd10b · 2022-11-02T18:21:53.000+08:00
* add unit test (UT) for int8 bmm with chunked inputs

* update llga to 0887652, keep oneDNN as v2.7
diff --git a/tests/cpu/test_ao_jit_llga_quantization_fuser.py b/tests/cpu/test_ao_jit_llga_quantization_fuser.py
@@ -347,6 +347,24 @@ def forward(self, x, y):
         self.assertFused(graph, ['aten::matmul', 'aten::dequantize', 'aten::quantize_per_tensor'])
         self.checkPatterns(graph, patterns)
 
+    def test_chunk_bmm(self):  # int8 matmul where one operand is a chunk (a view) of a larger tensor
+        class M(nn.Module):
+            def __init__(self):
+                super(M, self).__init__()
+
+            def forward(self, x, y):
+                z = torch.matmul(x, y)
+                return z
+        # Inputs: x is (2, 1, 5, 5); y is (2, 1, 5, 9) before chunking.
+        m = M()        
+        x = torch.randn(2, 1, 5, 5)
+        # Splitting dim 3 (size 9) three ways yields (2, 1, 5, 3) pieces; only the first is used.
+        y = torch.randn(2, 1, 5, 9)
+        y_chunk, _, _ = y.chunk(3, dim=3)  # y_chunk shares y's storage, so it is not contiguous
+        graph = self.checkQuantizeTrace(m, [x, y_chunk], atol=2e-1)  # helper defined outside this hunk; presumably quantizes, traces and compares outputs within atol -- confirm
+        self.assertGraphContainsExactly(graph, LLGA_FUSION_GROUP, 1)  # expect a single LLGA fusion group in the graph
+        self.assertFused(graph, ['aten::matmul', 'aten::dequantize'])  # presumably these ops must be absorbed into the fusion group -- confirm against helper
+
     def test_mixed_precision_softmax(self):
         class M(torch.nn.Module):
             def __init__(self):
diff --git a/third_party/ideep b/third_party/ideep
@@ -1 +1 @@
-Subproject commit 6c55dbb7de4a1195f88772452bee39f042be3dc5
+Subproject commit aecf36e552b1170133f18b331871547844ed6edb