Skip to content
Snippets Groups Projects

GPU backend

Merged prathi3 requested to merge gpu-cg into main
1 file
+ 2
- 1
Compare changes
  • Side-by-side
  • Inline
+ 2
- 1
@@ -371,6 +371,7 @@ impl GPUContext<'_> {
#include <stddef.h>
#include <cuda.h>
#include <cuda_runtime.h>
#include <math_constants.h>
#include <mma.h>
#include <cooperative_groups.h>
#include <cooperative_groups/memcpy_async.h>
@@ -1906,7 +1907,7 @@ extern \"C\" {} {}(", if ret_primitive { ret_type.clone() } else { "void".to_str
_ => "sinh",
},
Intrinsic::Sqrt => match ty {
- ty if ty.is_float() => "__sqrtf",
+ Type::Float32 => "__sqrtf",
ty if ty.is_signed() || ty.is_unsigned() => "isqrt",
_ => "sqrt",
},
Loading