forked from zhihu/cuBERT
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathCMakeLists.txt
168 lines (143 loc) · 5.68 KB
/
CMakeLists.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
# Top-level build script for cuBERT: project declaration, global compiler
# settings and the user-facing build options.
cmake_minimum_required(VERSION 3.6)
project(cuBERT VERSION 0.0.5 LANGUAGES C CXX)

# Global defaults applied to every target created below.
set(CMAKE_CXX_STANDARD 11)
set(CMAKE_POSITION_INDEPENDENT_CODE ON)

# Make the helper modules in <project>/cmake/ visible to include() and
# find_package(). The project directory is prepended (rather than assigned) so
# that a module path supplied by a parent project or on the command line is
# kept, while the project's own modules still take precedence.
set(CMAKE_MODULE_PATH "${PROJECT_SOURCE_DIR}/cmake/" ${CMAKE_MODULE_PATH})

# Select the pre-C++11 libstdc++ ABI for all translation units.
# NOTE(review): presumably required to link against prebuilt binaries that
# use the old ABI - confirm before changing.
add_definitions(-D_GLIBCXX_USE_CXX11_ABI=0)

# Build options (all default to OFF).
option(cuBERT_ENABLE_GPU "Enable GPU support" OFF)
option(cuBERT_ENABLE_MKL_SUPPORT "Enable Intel MKL support" OFF)
option(cuBERT_SYSTEM_MKL "Use system MKL" OFF)
option(cuBERT_SYSTEM_PROTOBUF "Use system Protobuf" OFF)

find_package(Threads REQUIRED)
# OpenMP support (optional): when FindOpenMP succeeds, append its flags to the
# global C/C++ compiler flags and to the executable linker flags.
find_package(OpenMP)
if(OPENMP_FOUND)
  string(APPEND CMAKE_C_FLAGS " ${OpenMP_C_FLAGS}")
  string(APPEND CMAKE_CXX_FLAGS " ${OpenMP_CXX_FLAGS}")
  # NOTE(review): OpenMP_EXE_LINKER_FLAGS does not appear among the result
  # variables documented for FindOpenMP; it may simply expand to nothing here.
  string(APPEND CMAKE_EXE_LINKER_FLAGS " ${OpenMP_EXE_LINKER_FLAGS}")
endif()
# Third-party components. Each include() loads the module of the same name
# from CMAKE_MODULE_PATH.
# NOTE(review): these modules presumably define the <name>_INCLUDE_DIR(S) and
# <name>_STATIC_LIBRARIES variables consumed below - confirm in cmake/*.cmake.
include(cub)
include(utf8proc)
include(protobuf-c)
include(googletest)

# Targets that must be built before cuBERT (passed to add_dependencies()).
set(cuBERT_EXTERNAL_DEPENDENCIES
  cub
  utf8proc
  protobuf-c
  googletest
)

# Libraries cuBERT links against.
set(cuBERT_EXTERNAL_LIBRARIES
  ${protobuf-c_STATIC_LIBRARIES}
  ${utf8proc_STATIC_LIBRARIES}
)

# Header search path shared by every target in this directory.
include_directories(
  # Source and generated code.
  src
  ${CMAKE_CURRENT_BINARY_DIR}
  # External dependencies.
  ${cub_INCLUDE_DIR}
  ${protobuf-c_INCLUDE_DIRS}
  ${utf8proc_INCLUDE_DIRS}
)
# Intel MKL support (optional). Defines HAVE_MKL for all sources and adds the
# MKL libraries and headers to the build.
if(cuBERT_ENABLE_MKL_SUPPORT)
  add_definitions(-DHAVE_MKL)

  if(NOT cuBERT_SYSTEM_MKL)
    # Use the copy provided by the project's own mkl module and make cuBERT
    # wait for the target that stages it.
    include(mkl)
    list(APPEND cuBERT_EXTERNAL_DEPENDENCIES mkl_copy_shared_to_destination)
  else()
    # Use an MKL installation already present on the system.
    find_package(MKL REQUIRED)
  endif()

  list(APPEND cuBERT_EXTERNAL_LIBRARIES ${MKL_LIBRARIES})
  include_directories(${MKL_INCLUDE_DIR})
endif()
# GPU support (optional), built through the FindCUDA module. Defines HAVE_CUDA
# for all sources and assembles the nvcc command-line flags.
if(cuBERT_ENABLE_GPU)
  # CUDA 9.0 is the minimum supported toolkit version. REQUIRED already stops
  # the configure step with an error when no suitable toolkit is found, so no
  # additional CUDA_FOUND check is needed afterwards.
  find_package(CUDA 9.0 REQUIRED)
  add_definitions(-DHAVE_CUDA)

  # Use CMake's CUDA_ARCH_NAME switch to choose the target architectures, e.g.
  #   CUDA_ARCH_NAME="Auto" will autodetect
  #   CUDA_ARCH_NAME="All"  will use all arches
  cuda_select_nvcc_arch_flags(NVCC_ARCH_FLAGS ${CUDA_ARCH_NAME})
  list(APPEND CUDA_NVCC_FLAGS ${NVCC_ARCH_FLAGS})
  message(STATUS "Using CUDA arch flags: ${NVCC_ARCH_FLAGS_readable}")

  # Language level, optimisation and numerics flags for device code.
  # -ftz=true flushes denormals to zero.
  list(APPEND CUDA_NVCC_FLAGS
    -std=c++11
    --expt-relaxed-constexpr
    -O3
    -use_fast_math
    -Xptxas -O3
    -Xcompiler -O3
    -ftz=true
  )

  include_directories(${CUDA_INCLUDE_DIRS})
endif()
# The cuBERT shared library itself.
# NOTE(review): tf_core_framework presumably defines the tf_protos_cc target
# linked below - confirm in cmake/tf_core_framework.cmake.
include(tf_core_framework)

# All library sources; operators with a GPU kernel list their .cu file right
# after the matching .cpp file.
set(SOURCE_FILES
  src/cuBERT.cpp
  src/cuBERT/common.cpp
  src/cuBERT/tokenization.cpp
  src/cuBERT/Bert.cpp
  src/cuBERT/BertM.cpp
  src/cuBERT/tensorflow/Graph.cpp
  src/cuBERT/op/GELU.cpp
  src/cuBERT/op/GELU.cu
  src/cuBERT/op/Dense.cpp
  src/cuBERT/op/Embedding.cpp
  src/cuBERT/op/Embedding.cu
  src/cuBERT/op/Softmax.cpp
  src/cuBERT/op/Softmax.cu
  src/cuBERT/op/LayerNorm.cpp
  src/cuBERT/op/LayerNorm.cu
  src/cuBERT/op_att/AttentionSelf.cpp
  src/cuBERT/op_att/AttentionMask.cpp
  src/cuBERT/op_att/AttentionMask.cu
  src/cuBERT/op_att/BatchMatMul.cpp
  src/cuBERT/op_att/Transformer.cpp
  src/cuBERT/op_bert/BertEmbeddings.cpp
  src/cuBERT/op_bert/BertPooler.cpp
  src/cuBERT/op_bert/BertPooler.cu
  src/cuBERT/op_out/AdditionalOutputLayer.cpp
)

if(NOT cuBERT_ENABLE_GPU)
  # CPU-only build: a regular shared library.
  add_library(cuBERT SHARED ${SOURCE_FILES})
else()
  # GPU build: let FindCUDA compile the .cu files with nvcc and link cuBLAS.
  cuda_add_library(cuBERT SHARED ${SOURCE_FILES})
  # NOTE(review): FindCUDA documents a CUDA_SEPARABLE_COMPILATION *variable*;
  # confirm that setting the target property has the intended effect here.
  set_target_properties(cuBERT PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
  cuda_add_cublas_to_target(cuBERT)
endif()

# Build the external projects first, then link their libraries.
add_dependencies(cuBERT ${cuBERT_EXTERNAL_DEPENDENCIES})
# NOTE(review): kept in the keyword-less form on purpose - cuda_add_library()
# appears to link with the plain signature unless CUDA_LINK_LIBRARIES_KEYWORD
# is set, and CMake rejects mixing plain and keyword signatures on one target.
target_link_libraries(cuBERT tf_protos_cc ${cuBERT_EXTERNAL_LIBRARIES})
# Benchmark executables.

# cuBERT benchmark: always built.
add_executable(cuBERT_benchmark benchmark/benchmark_cu.cpp)
target_link_libraries(cuBERT_benchmark cuBERT)

# TensorFlow benchmark: built only when a tensorflow package can be located
# (the lookup is optional, so a missing package is not an error).
find_package(tensorflow)
if(tensorflow_FOUND)
  add_executable(tfBERT_benchmark benchmark/benchmark_tf.cpp)
  target_include_directories(tfBERT_benchmark PUBLIC ${tensorflow_INCLUDE_DIR})
  target_link_libraries(tfBERT_benchmark ${tensorflow_LIBRARIES})
endif()

# GEMM benchmark: built only for GPU-enabled builds.
if(cuBERT_ENABLE_GPU)
  add_executable(gemm_benchmark benchmark/benchmark_gemm.cpp)
  target_link_libraries(gemm_benchmark cuBERT)
endif()
# Unit tests: a single googletest executable registered with CTest.
enable_testing()

# Copy the test vocabulary into the build directory, which is also the
# default working directory of the registered test.
# NOTE(review): presumably read by the tests at run time via a relative path -
# confirm against the test sources.
configure_file(
  ${CMAKE_CURRENT_SOURCE_DIR}/test_vocab.txt
  ${CMAKE_CURRENT_BINARY_DIR}/test_vocab.txt
  COPYONLY
)

add_executable(cuBERT_test
  test/unit_test.cpp
  test/cuBERT/common_test.cpp
  test/cuBERT/tokenization_test.cpp
  test/cuBERT/op/DenseTest.cpp
  test/cuBERT/op/LayerNormTest.cpp
  test/cuBERT/op/SoftmaxTest.cpp
  test/cuBERT/op/GELUTest.cpp
  test/cuBERT/op/EmbeddingTest.cpp
  test/cuBERT/op_att/BatchMatMulTest.cpp
  test/cuBERT/op_att/AttentionSelfTest.cpp
  test/cuBERT/op_att/TransformerTest.cpp
  test/cuBERT/op_att/AttentionMaskTest.cpp
  test/cuBERT/op_bert/BertEmbeddingsTest.cpp
  test/cuBERT/op_bert/BertPoolerTest.cpp
  test/cuBERT/op_out/AdditionalOutputLayerTest.cpp
  test/cuBERT/BertTest.cpp
  test/cuBERT/BertMTest.cpp
  test/cuBERT_test.cpp
)
target_link_libraries(cuBERT_test cuBERT ${googletest_STATIC_LIBRARIES})
target_include_directories(cuBERT_test PUBLIC ${googletest_INCLUDE_DIRS})

# Use the NAME/COMMAND signature so that CMake resolves the cuBERT_test target
# to the location of the built executable; the legacy
# add_test(<name> <command>) form performs no target-name resolution and only
# works when the binary happens to be found from the test working directory.
add_test(NAME UnitTest COMMAND cuBERT_test)
# Installation rules: the cuBERT library, its public header and, when the
# bundled (non-system) MKL is in use, the MKL libraries and headers.
install(TARGETS cuBERT
  RUNTIME DESTINATION bin
  LIBRARY DESTINATION lib
  ARCHIVE DESTINATION lib/static
)

# PROJECT_SOURCE_DIR (not CMAKE_SOURCE_DIR) keeps this path correct when
# cuBERT is added as a subdirectory of another project.
install(FILES ${PROJECT_SOURCE_DIR}/src/cuBERT.h DESTINATION include)

# Ship MKL only when MKL support is enabled AND the bundled copy is used.
# Without the first check the MKL install rules would also be registered for
# builds that do not use MKL at all.
if(cuBERT_ENABLE_MKL_SUPPORT AND NOT cuBERT_SYSTEM_MKL)
  install(FILES ${MKL_LIBRARIES} DESTINATION lib)
  install(DIRECTORY ${MKL_INCLUDE_DIR} DESTINATION .)
endif()