forked from a1k0n/a1gpt
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathCMakeLists.txt
66 lines (50 loc) · 1.89 KB
/
CMakeLists.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# Set minimum version of CMake. Version 3.8 introduces CUDA as a first-class language
cmake_minimum_required(VERSION 3.8 FATAL_ERROR)
project(a1gpt LANGUAGES CXX)
include(CheckLanguage)
if(NOT CMAKE_BUILD_TYPE)
set(CMAKE_BUILD_TYPE "RelWithDebInfo" CACHE STRING
"Choose the type of build, options are: None Debug Release RelWithDebInfo MinSizeRel."
FORCE)
endif()
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -march=native")
if (APPLE)
find_library(ACCELERATE Accelerate)
endif()
# Add executable target with source files
add_executable(gpt2 main.cpp
model.h model.cpp model_load_gpt2.cpp
blas.h tensor.h
bpe.h bpe.cpp)
check_language(CUDA)
target_link_libraries(gpt2 PRIVATE ${ACCELERATE})
# Specify the C++ standard
set_target_properties(gpt2 PROPERTIES
CXX_STANDARD 14
CXX_STANDARD_REQUIRED TRUE)
if (CMAKE_CUDA_COMPILER)
enable_language(CUDA)
add_executable(cugpt2 main.cpp
model.h model_cu.cpp model_load_gpt2.cpp
tensor.h bpe.h bpe.cpp kernel.cu)
# Specify the C++ standard
set_target_properties(cugpt2 PROPERTIES
CUDA_SEPARABLE_COMPILATION ON
CXX_STANDARD 14
CXX_STANDARD_REQUIRED TRUE)
# #define CUDA and add include path
target_compile_definitions(cugpt2 PRIVATE CUDA)
target_include_directories(cugpt2 PRIVATE ${CMAKE_CUDA_TOOLKIT_INCLUDE_DIRECTORIES})
else()
message(WARNING "CUDA not found, CUDA targets will be unavailable.")
endif()
enable_testing()
# add bpe_test
add_executable(bpe_test bpe_test.cpp bpe.h bpe.cpp)
set_target_properties(bpe_test PROPERTIES
CXX_STANDARD 14
CXX_STANDARD_REQUIRED TRUE)
add_test(NAME BPETest COMMAND bpe_test)
execute_process(COMMAND ${CMAKE_COMMAND} -E create_symlink
${CMAKE_SOURCE_DIR}/model
${CMAKE_BINARY_DIR}/model)