Skip to content
Snippets Groups Projects
Commit c27cb78c authored by Hashim Sharif's avatar Hashim Sharif
Browse files

Adding CMake template for Keras frontend -- not yet autogenerated

parent 18a09740
No related branches found
No related tags found
No related merge requests found
cmake_minimum_required(VERSION 3.17)
project(hpvm-tensor-rt)

# The nvcc flags appended below ask for compute_60/sm_60 code generation and
# -std=c++14. Those need CUDA 8.0 and CUDA 9.0 respectively, so 9.0 is the
# oldest toolkit that can accept this flag set (the previous minimum of 6.5
# could not).
find_package(CUDA 9.0 REQUIRED)
set(CUDA_SEPARABLE_COMPILATION ON CACHE BOOL "")
# Keep the host CMAKE_CXX_FLAGS from being forwarded to nvcc's host compiler.
set(CUDA_PROPAGATE_HOST_FLAGS OFF)

# Addresses a bug where code is not compiled as C++11 in non-CUDA code and
# older g++ versions.
# Edit: using C++14 now. STANDARD_REQUIRED turns an unsupported standard into
# a configure-time error instead of a silent fallback to an older one.
set(CMAKE_CXX_STANDARD 14)
set(CMAKE_CXX_STANDARD_REQUIRED ON)
# NOTE(review): the explicit -std=c++14 looks redundant with CMAKE_CXX_STANDARD
# above, and -I/ puts the filesystem root on the include path; both are kept
# unchanged here because it is not visible what src.cc relies on -- confirm.
string(APPEND CMAKE_CXX_FLAGS " -std=c++14 -I/")

# Flags handed to nvcc. Each list element is one command-line token.
list(APPEND CUDA_NVCC_FLAGS
  -gencode arch=compute_60,code=sm_60
  -gencode arch=compute_60,code=compute_60
  -std=c++14 --expt-relaxed-constexpr -maxrregcount 32 # These are for image ops
)
# Pick the nvcc flags that depend on the configured build type.
# Every build type other than "Debug" (including an empty one) gets NDEBUG
# defined for both nvcc itself and, via -Xcompiler, its host compiler pass.
if(NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
  list(APPEND CUDA_NVCC_FLAGS -DNDEBUG -Xcompiler -DNDEBUG)
else()
  # Debug: host debug info, device line info, and -ggdb for the host compiler.
  message("Debug mode")
  list(APPEND CUDA_NVCC_FLAGS -g -lineinfo -Xcompiler -ggdb)
endif()
# Default include/link directories.
# These are directory-scoped commands, so they apply to every target declared
# after this point in this file.

# LLVM_SRC_ROOT is read from the environment at configure time. When it is not
# set, the HPVM paths below silently collapse to "/projects/...", so say so
# up front instead of leaving the user with a missing-header error later.
if(NOT DEFINED ENV{LLVM_SRC_ROOT})
  message(WARNING
    "Environment variable LLVM_SRC_ROOT is not set; the HPVM include "
    "directories will resolve relative to the filesystem root.")
endif()

include_directories(${CUDA_TOOLKIT_ROOT_DIR} ${CUDA_TOOLKIT_ROOT_DIR}/include)

# CUDNN_PATH is optional: only add its directories when it is provided, so an
# unset variable does not inject bogus "/include", "/lib" and "/lib64" paths.
if(DEFINED ENV{CUDNN_PATH})
  include_directories($ENV{CUDNN_PATH} $ENV{CUDNN_PATH}/include)
endif()

include_directories(
  $ENV{LLVM_SRC_ROOT}/projects/hpvm-tensor-rt/tensor_runtime/include
  $ENV{LLVM_SRC_ROOT}/projects/hpvm-tensor-rt/dnn_sources/include
  $ENV{LLVM_SRC_ROOT}/projects/gpu_profiler/include
  $ENV{LLVM_SRC_ROOT}/projects/soc_simulator/include
)

link_directories(${CUDA_TOOLKIT_ROOT_DIR}/lib64)
if(DEFINED ENV{CUDNN_PATH})
  link_directories($ENV{CUDNN_PATH} $ENV{CUDNN_PATH}/lib $ENV{CUDNN_PATH}/lib64)
endif()
# Default link libraries.
# Locate the prebuilt static archives under $ENV{LLVM_SRC_ROOT}/projects.
# Each result is stored in a cache variable, so it can also be supplied
# directly on the command line with -D<VAR>=<path>.
find_library(GPU_PROFILER_LIB
  NAMES libgpu_profiler.a
  HINTS $ENV{LLVM_SRC_ROOT}/projects/gpu_profiler/lib
)
find_library(SOC_SIMULATOR_LIB
  NAMES libpromise_profiler.a
  HINTS $ENV{LLVM_SRC_ROOT}/projects/soc_simulator/lib
)
find_library(TENSOR_LIB
  NAMES libtensor_runtime.a
  HINTS $ENV{LLVM_SRC_ROOT}/projects/hpvm-tensor-rt/lib
)

# All three archives are linked into DNN_binary, so a miss is fatal either way.
# Report it here with the name of the missing library rather than letting it
# surface later as a generic "<VAR>-NOTFOUND" error.
# (find_library(... REQUIRED) needs CMake 3.18; this file requires only 3.17.)
foreach(required_lib GPU_PROFILER_LIB SOC_SIMULATOR_LIB TENSOR_LIB)
  if(NOT ${required_lib})
    message(FATAL_ERROR
      "${required_lib} was not found. Check that the LLVM_SRC_ROOT environment "
      "variable points at the HPVM source tree and that the library has been "
      "built, or pass -D${required_lib}=<path to the .a file>.")
  endif()
endforeach()
# System/CUDA libraries linked by name; they are resolved through the linker
# search path.
set(LINK_LIBS cudart cudnn cufft cublas stdc++fs curand)

#### DNN binary
# Single executable built from src.cc.
add_executable(DNN_binary src.cc)
# PRIVATE: an executable has no consumers, and the keyword form avoids the
# legacy keyword-less signature of target_link_libraries.
target_link_libraries(DNN_binary
  PRIVATE
    ${TENSOR_LIB}
    ${GPU_PROFILER_LIB}
    ${SOC_SIMULATOR_LIB}
    ${LINK_LIBS}
)
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment