From 2c6c38c0dbbb6268ebbb499fb80966c19500e09b Mon Sep 17 00:00:00 2001 From: Praneet Rathi <prrathi10@gmail.com> Date: Fri, 17 Jan 2025 18:33:50 -0600 Subject: [PATCH] cuda nowoprk? --- hercules_cg/src/gpu.rs | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/hercules_cg/src/gpu.rs b/hercules_cg/src/gpu.rs index e7195223..0c69544b 100644 --- a/hercules_cg/src/gpu.rs +++ b/hercules_cg/src/gpu.rs @@ -371,6 +371,7 @@ impl GPUContext<'_> { #include <stddef.h> #include <cuda.h> #include <cuda_runtime.h> +#include <math_constants.h> #include <mma.h> #include <cooperative_groups.h> #include <cooperative_groups/memcpy_async.h> @@ -1906,7 +1907,7 @@ extern \"C\" {} {}(", if ret_primitive { ret_type.clone() } else { "void".to_str _ => "sinh", }, Intrinsic::Sqrt => match ty { - ty if ty.is_float() => "__sqrtf", + Type::Float32 => "__sqrtf", ty if ty.is_signed() || ty.is_unsigned() => "isqrt", _ => "sqrt", }, -- GitLab