Skip to content

Commit

Permalink
save
Browse files (browse the repository at this point in the history)
  • Loading branch information
zasdfgbnm committed Oct 31, 2024
1 parent 54e8cde commit 3533b15
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions __tmp_kernel_none_f0_c0_r0_g0.cu
Original file line number Diff line number Diff line change
Expand Up @@ -10929,7 +10929,7 @@ nvfuser_none_f0_c0_r0_g0(Tensor<__half, 3, 3> T0, Tensor<__half, 3, 3> T1, const
mbarrier::arriveExpectTX(toSmem((&T7[i21])), 8192U + 4096U);
#pragma unroll
for(nvfuser_index_t i25 = 0; i25 < 4; ++i25) {
- Hopper::cpAsyncBulkTensorTileG2S((Hopper::CpAsyncBulkTensorTileG2SIndex<2>{ ptr4, (Array<nvfuser_index_t, 2, 1>{(i5 + (64 * i25)), i22}), toSmem((&T7[i21])) }), (i23 + (2048 * i25)));
+ Hopper::cpAsyncBulkTensorTileG2S((Hopper::CpAsyncBulkTensorTileG2SIndex<2>{ ptr4, (Array<nvfuser_index_t, 2, 1>{(i5 + (64 * i25)), i22}), toSmem((&T7[i21])) }), (i23 + (2048 * i25)), 3);
}
#pragma unroll
for(nvfuser_index_t i26 = 0; i26 < 2; ++i26) {
Expand Down Expand Up @@ -10959,7 +10959,7 @@ nvfuser_none_f0_c0_r0_g0(Tensor<__half, 3, 3> T0, Tensor<__half, 3, 3> T1, const
mbarrier::arriveExpectTX(toSmem((&T7[((3 + i27) % 4)])), 8192U + 4096U);
#pragma unroll
for(nvfuser_index_t i25 = 0; i25 < 4; ++i25) {
- Hopper::cpAsyncBulkTensorTileG2S((Hopper::CpAsyncBulkTensorTileG2SIndex<2>{ ptr4, (Array<nvfuser_index_t, 2, 1>{(i5 + (64 * i25)), i28}), toSmem((&T7[((3 + i27) % 4)])) }), (i30 + (2048 * i25)));
+ Hopper::cpAsyncBulkTensorTileG2S((Hopper::CpAsyncBulkTensorTileG2SIndex<2>{ ptr4, (Array<nvfuser_index_t, 2, 1>{(i5 + (64 * i25)), i28}), toSmem((&T7[((3 + i27) % 4)])) }), (i30 + (2048 * i25)), 3);
}
#pragma unroll
for(nvfuser_index_t i26 = 0; i26 < 2; ++i26) {
Expand Down

0 comments on commit 3533b15

Please sign in to comment.