From 9ab7b33283a4ffab97666d4e7ffa42eeacff99ae Mon Sep 17 00:00:00 2001 From: Hashim Sharif <hsharif3@tyler.cs.illinois.edu> Date: Fri, 14 Jun 2019 17:25:26 -0500 Subject: [PATCH] Separating cuda dependencies and adding CPU CMakeLists --- .../hpvm-tensor-rt/CMakeLists_cpu.txt | 19 ++++++++++++++ .../dnn_sources/include/utils_cpu.h | 6 ++--- .../tensor_runtime/include/tensor_cpu.h | 25 +++++++++++++++++++ .../include/tensor_cpu_runtime.h | 7 +++--- .../tensor_runtime/src/tensor_cpu_runtime.cc | 3 ++- 5 files changed, 53 insertions(+), 7 deletions(-) create mode 100644 llvm/projects/hpvm-tensor-rt/CMakeLists_cpu.txt create mode 100644 llvm/projects/hpvm-tensor-rt/tensor_runtime/include/tensor_cpu.h diff --git a/llvm/projects/hpvm-tensor-rt/CMakeLists_cpu.txt b/llvm/projects/hpvm-tensor-rt/CMakeLists_cpu.txt new file mode 100644 index 0000000000..cff0129c2a --- /dev/null +++ b/llvm/projects/hpvm-tensor-rt/CMakeLists_cpu.txt @@ -0,0 +1,19 @@ +cmake_minimum_required (VERSION 2.6) +project (approxhpvm-tensorRt-cpu) + + +# Addresses a bug where code is not compiled as C++11 in non-CUDA code and older g++ versions +set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=c++11 " ) + + +# Adding new rule for building a cuDNN runtime library +add_library(tensor_cpu_runtime tensor_runtime/src/tensor_cpu_runtime.cc) +target_link_libraries(tensor_cpu_runtime) + + +#**** CPU sources +add_executable(fc2_cpu dnn_sources/src/fc2_cpu.cc) +target_link_libraries(fc2_cpu tensor_cpu_runtime) + + + diff --git a/llvm/projects/hpvm-tensor-rt/dnn_sources/include/utils_cpu.h b/llvm/projects/hpvm-tensor-rt/dnn_sources/include/utils_cpu.h index f035855602..c5981d752c 100644 --- a/llvm/projects/hpvm-tensor-rt/dnn_sources/include/utils_cpu.h +++ b/llvm/projects/hpvm-tensor-rt/dnn_sources/include/utils_cpu.h @@ -7,7 +7,7 @@ #include <sstream> #include <vector> #include <bits/stdc++.h> -#include "../../tensor_runtime/include/tensor.h" +#include "../../tensor_runtime/include/tensor_cpu.h" #include "types.h" #include <cmath> @@ -88,10 +88,10 @@ struct Tensor* readTrainedWeightsCPU(const char* file_name, int data_type, printf("size in bytes = %lu, bytes read = %lu \n", size_in_bytes, bytes_read); fclose(file); - + struct Tensor* weights = (struct Tensor*) create4DTensorCPU(data_type, nchw, dim1_size, dim2_size, - dim3_size, dim4_size); + dim3_size, dim4_size); initTensorData(weights, tensor_data, size_in_bytes); //compareValues(weights, tensor_data, num_elems); diff --git a/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/tensor_cpu.h b/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/tensor_cpu.h new file mode 100644 index 0000000000..c812a516ae --- /dev/null +++ b/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/tensor_cpu.h @@ -0,0 +1,25 @@ + + +#ifndef TENSOR_HEADER +#define TENSOR_HEADER + + +struct Dimension{ + int num_dims; + size_t* dim_sizes; +}; + + +struct Tensor{ + int data_type; + int data_format; + void* host_data; + void* gpu_data; // The pointers should not be device specific per se - TODO: Better design needed + size_t num_elems; // Total elements + size_t size_in_bytes; // Total size in bytes + struct Dimension dims; +}; + + +#endif + diff --git a/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/tensor_cpu_runtime.h b/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/tensor_cpu_runtime.h index dfa9511055..cc84094111 100644 --- a/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/tensor_cpu_runtime.h +++ b/llvm/projects/hpvm-tensor-rt/tensor_runtime/include/tensor_cpu_runtime.h @@ -4,7 +4,6 @@ #include <cmath> #include <memory> #include <string> -//#include "runtime_types.h" #ifndef CUDNN_HEADER @@ -41,10 +40,12 @@ extern "C"{ int vertical_stride, int horizontal_stride); void* tensorGemmCPU(void* lhs, void* rhs); - // NOTE: In place operation + void* tensorAddCPU(void* x, void* bias); - // NOTE: In-place operation + void* tensorReluCPU(void* input); + + void* tensorRelu2CPU(void* input); void* tensorTanhCPU(void* input); diff --git a/llvm/projects/hpvm-tensor-rt/tensor_runtime/src/tensor_cpu_runtime.cc b/llvm/projects/hpvm-tensor-rt/tensor_runtime/src/tensor_cpu_runtime.cc index 336c98b767..8d2591372a 100644 --- a/llvm/projects/hpvm-tensor-rt/tensor_runtime/src/tensor_cpu_runtime.cc +++ b/llvm/projects/hpvm-tensor-rt/tensor_runtime/src/tensor_cpu_runtime.cc @@ -23,7 +23,8 @@ // Tensor runtime header files #include "../include/tensor_cpu_runtime.h" -#include "../include/tensor.h" +#include "../include/tensor_cpu.h" + void llvm_hpvm_initTensorRt(int gpuid){ -- GitLab