| 45 | |
| 46 | @T.prim_func(private=True, s_tir=True) |
| 47 | def add(rxplaceholder: T.Buffer((T.int64(1), T.int64(2), T.int64(3)), "float32"), rxplaceholder_1: T.Buffer((T.int64(4), T.int64(3), T.int64(2), T.int64(1)), "float32"), T_add: T.Buffer((T.int64(4), T.int64(3), T.int64(2), T.int64(3)), "float32")): |
| 48 | T.func_attr({"tirx.noalias": True}) |
| 49 | for i0, i1, i2, i3 in T.grid(T.int64(4), T.int64(3), T.int64(2), T.int64(3)): |
| 50 | with T.sblock("T_add"): |
| 51 | ax0, ax1, ax2, ax3 = T.axis.remap("SSSS", [i0, i1, i2, i3]) |
| 52 | T.reads(rxplaceholder[T.int64(0), ax2, ax3], rxplaceholder_1[ax0, ax1, ax2, T.int64(0)]) |
| 53 | T.writes(T_add[ax0, ax1, ax2, ax3]) |
| 54 | T_add[ax0, ax1, ax2, ax3] = rxplaceholder[T.int64(0), ax2, ax3] + rxplaceholder_1[ax0, ax1, ax2, T.int64(0)] |
| 55 | # fmt: on |
| 56 | |
| 57 | mod = LegalizeOps()(Add) |