Skip to content

Commit ac8b947

Browse files
authored
update llga to 0887652, keep oneDNN as v2.7 (#1256)
* add ut for int8 bmm with chunked inputs
* update llga to 0887652, keep oneDNN as v2.7
1 parent 730ae93 commit ac8b947

File tree

2 files changed

+19
-1
lines changed

2 files changed

+19
-1
lines changed

tests/cpu/test_ao_jit_llga_quantization_fuser.py

Lines changed: 18 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -347,6 +347,24 @@ def forward(self, x, y):
347347
self.assertFused(graph, ['aten::matmul', 'aten::dequantize', 'aten::quantize_per_tensor'])
348348
self.checkPatterns(graph, patterns)
349349

350+
# Unit test for int8 matmul (bmm) where the second operand is a chunk of a larger tensor.
def test_chunk_bmm(self):
351+
class M(nn.Module):
352+
def __init__(self):
353+
super(M, self).__init__()
354+
355+
def forward(self, x, y):
356+
# The module is a bare matmul of its two inputs; it has no parameters or other ops.
z = torch.matmul(x, y)
357+
return z
358+
359+
m = M()
360+
x = torch.randn(2, 1, 5, 5)
361+
362+
y = torch.randn(2, 1, 5, 9)
363+
# Split y into 3 pieces along dim 3 and keep only the first one, so the matmul
# operand is a slice of a larger tensor (last dim 9 -> 3) rather than a freshly
# allocated tensor.
y_chunk, _, _ = y.chunk(3, dim=3)
364+
# NOTE(review): checkQuantizeTrace is defined outside this view; presumably it
# quantizes/traces m on the given inputs, compares results within atol, and
# returns the traced graph -- confirm against the helper.
graph = self.checkQuantizeTrace(m, [x, y_chunk], atol=2e-1)
365+
# NOTE(review): presumably asserts the graph holds exactly one LLGA fusion group -- confirm.
self.assertGraphContainsExactly(graph, LLGA_FUSION_GROUP, 1)
366+
# NOTE(review): presumably asserts that matmul and dequantize were absorbed into
# the fusion group -- confirm against assertFused.
self.assertFused(graph, ['aten::matmul', 'aten::dequantize'])
367+
350368
def test_mixed_precision_softmax(self):
351369
class M(torch.nn.Module):
352370
def __init__(self):

third_party/ideep

Submodule ideep updated 1 file

0 commit comments

Comments
 (0)