Use F32 sqrtf instead of F64 sqrt
Co-authored-by: Johannes Gäßler <johannesg@5d6.de>
This commit is contained in:
parent
fea1dc98c0
commit
3591f1cc8c
1 changed file with 1 addition and 1 deletion
|
@@ -98,7 +98,7 @@ static __global__ void sqrt_f32(const float * x, float * dst, const int k) {
|
|||
if (i >= k) {
|
||||
return;
|
||||
}
|
||||
- dst[i] = sqrt(x[i]);
|
||||
+ dst[i] = sqrtf(x[i]);
|
||||
}
|
||||
|
||||
static void gelu_f32_cuda(const float * x, float * dst, const int k, cudaStream_t stream) {
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue