Grouped Conv support in tensorHalfConvolution

9bc2ca73 · Hashim Sharif · a9f49265 · 9bc2ca73
Commit 9bc2ca73 authored 5 years ago by Hashim Sharif
--- a/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/half_precision_api.h
+++ b/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/half_precision_api.h
@@ -149,7 +149,7 @@ void* tensorHalfGemmGPU(void* lhs_ptr, void* rhs_ptr){
 void* tensorHalfConvolution(void* input_ptr, void* filter_ptr,
 			    int vertical_pad, int horizontal_pad,
 			    int vertical_stride, int horizontal_stride,
-			    int conv_mode, int compute_precision){
+			    int conv_mode, int conv_groups){

  INFO("*** TensorHConvolution \n");
  profileEvent("tensorHalfConv");
@@ -200,8 +200,17 @@ void* tensorHalfConvolution(void* input_ptr, void* filter_ptr,
  /******* END OF INPUT DATA CONVERSIONS*/


-
  checkCUDNN(cudnnCreateConvolutionDescriptor(&convDesc));
+
+  //FIXME: Current hack to preserve backward compatibility (conv_groups == 0 is treated as 1 group)
+  if(conv_groups == 0){
+    conv_groups = 1;
+  }
+  
+  // NOTE: Adding support for grouped convolution
+  checkCUDNN(cudnnSetConvolutionGroupCount(convDesc, conv_groups));
+
+  
  // FIXIT: Think if upscaling values need to be configurable?
  // IMP-FIXIT:  CUDNN Cross correlation is only used in the Lenet context
  // IMP-FIXIT: Either make mode configurable OR see if CUDNN_CONVOLUTION MODE should be used?