Skip to content
Snippets Groups Projects

A whole bunch of optimization

Merged rarbore2 requested to merge more_miranda_optts into main
20 files
+ 246
- 109
Compare changes
  • Side-by-side
  • Inline
Files
20
+ 4
- 2
@@ -1225,11 +1225,13 @@ namespace cg = cooperative_groups;
// because Fork basic block's init section already does gating
  write!(
  w,
- "{}{} = (threadIdx.x % {}) / {};\n",
+ "{}{} = (((threadIdx.x % {}) / {}) / ({})) % ({});\n",
  tabs,
  define_variable,
  use_thread_quota.unwrap(),
- use_thread_quota.unwrap() / parallel_factor.unwrap()
+ use_thread_quota.unwrap() / parallel_factor.unwrap(),
+ divide,
+ modulo,
  )?;
}
}
Loading