Skip to content

Commit 4ad3e63

Browse files
committed
add missing parallelization for dense
1 parent 978158d commit 4ad3e63

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

python/tvm/topi/hexagon/dense.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -88,6 +88,7 @@ def _schedule_dense(s, C, O):
8888

8989
pc = dot_vrmpy("uint8", "uint8")
9090
s[C].tensorize(a_xi, pc)
91+
s[C].parallel(s[C].fuse(a_yo, a_xo))
9192

9293
if C != O:
9394
a_y = O.op.axis[-2]
@@ -97,6 +98,7 @@ def _schedule_dense(s, C, O):
9798
s[O].reorder(a_yo, a_xo, a_yi, a_xi)
9899
s[O].vectorize(a_xi)
99100
s[C].compute_at(s[O], a_yi)
101+
s[O].parallel(s[O].fuse(a_yo, a_xo))
100102

101103
def _callback(op):
102104
if "u8u8i32_vrmpy" in op.tag:

0 commit comments

Comments
 (0)