We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent cbfe979 · commit 35f6bb1 · Copy full SHA for 35f6bb1
python/tvm/topi/x86/dense.py
@@ -333,18 +333,18 @@ def split_y(out):
333
334
if C == O:
335
fused = s[O].fuse(a_yo, a_xo)
336
- s[O].parallel(fused)
337
else:
338
a_yo, a_yi = split_y(O)
339
a_xo, a_xi = s[O].split(O.op.axis[1], factor=16)
340
341
s[O].reorder(a_yo, a_xo, a_yi, a_xi)
342
- fused = s[O].fuse(a_yo, a_xo)
343
s[O].vectorize(a_xi)
344
345
-
346
s[C].compute_at(s[O], a_yi)
347
+ fused = s[O].fuse(a_yo, a_xo)
+
+ s[O].parallel(fused)
348
return s
349
350
0 commit comments