Skip to content
Snippets Groups Projects
Commit 2c6c38c0 authored by Praneet Rathi
Browse files

cuda nowoprk?

parent df630f84
No related branches found
No related tags found
1 merge request: !115 "GPU backend"
Checking pipeline status
@@ -371,6 +371,7 @@ impl GPUContext<'_> {
 #include <stddef.h>
 #include <cuda.h>
 #include <cuda_runtime.h>
+#include <math_constants.h>
 #include <mma.h>
 #include <cooperative_groups.h>
 #include <cooperative_groups/memcpy_async.h>
@@ -1906,7 +1907,7 @@ extern \"C\" {} {}(", if ret_primitive { ret_type.clone() } else { "void".to_str
 _ => "sinh",
 },
 Intrinsic::Sqrt => match ty {
-ty if ty.is_float() => "__sqrtf",
+Type::Float32 => "__sqrtf",
 ty if ty.is_signed() || ty.is_unsigned() => "isqrt",
 _ => "sqrt",
 },
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment