Skip to content

Commit 82ace62

Browse files
authored
[Common] Fix "0" literal for compilation (#2934)
1 parent f2e31db commit 82ace62

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

transformer_engine/common/fused_attn/flash_attn.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -311,7 +311,7 @@ __device__ __forceinline__ void permute_vec_loop(const T *__restrict__ in, T *__
311 311
const size_t s_local = w / pad_elems;
312 312
const size_t s_i = s_begin + s_local;
313 313
const size_t d_off = D + (w % pad_elems);
314-
out[out_base + s_i * D_out + d_off] = static_cast<T>(0);
314+
out[out_base + s_i * D_out + d_off] = static_cast<T>(0.f);
315 315
}
316 316
}
317 317
}

0 commit comments

Comments
 (0)