Skip to content

Commit d90ac01

Browse files
committed
Merge remote-tracking branch 'origin/refactor/grp-hadamard-ldmatrix-transpose' into refactor/grp-hadamard-ldmatrix-transpose
Made-with: Cursor
2 parents 6c2818a + 28fb320 commit d90ac01

1 file changed

Lines changed: 1 addition & 2 deletions

File tree

transformer_engine/common/hadamard_transform/group_hadamard_transform.cu

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -90,8 +90,7 @@ __device__ __forceinline__ void ComputeKernel(uint32_t b_frag_i[4], uint32_t b_f
90 90
}
91 91

92 92
if (kReturnIdentityAmax) {
93-
if (kReturnTransposedAmax ||
94-
(!kReturnTransposedAmax && !kReturnPreRhtAmax)) {
93+
if (kReturnTransposedAmax || (!kReturnTransposedAmax && !kReturnPreRhtAmax)) {
95 94
ldmatrix_x4_m8n8_shared_b16<false>(a_frag[0], a_frag[1], a_frag[2], a_frag[3],
96 95
reinterpret_cast<uint4*>(in_sh_ptr) + swizzle_idx);
97 96
}

0 commit comments

Comments
 (0)