forked from APWS25/AccelMoE
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathMakefile
More file actions
32 lines (21 loc) · 667 Bytes
/
Makefile
File metadata and controls
32 lines (21 loc) · 667 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Toolchain: host C++ compiler and the CUDA compiler driver.
CXX=g++
CUX=/usr/local/cuda/bin/nvcc

# Flags for host C++ compilation; also reused on the link line.
CFLAGS=-std=c++14 -O3 -Wall -march=native -mavx2 -mfma -mno-avx512f -fopenmp -I/usr/local/cuda/include -Iinclude

# Flags for nvcc: the target architecture is stated once, then every host
# flag from CFLAGS is forwarded to the host compiler as -Xcompiler=<flag>.
# (Keeping -arch outside the foreach avoids repeating it once per host flag.)
CUDA_CFLAGS:=-arch=sm_70 $(foreach option,$(CFLAGS),-Xcompiler=$(option))

# Linker search path and libraries used when linking $(TARGET).
LDFLAGS=-pthread -L/usr/local/cuda/lib64
LDLIBS=-lstdc++ -lcudart -lm

# Final executable and the object files it is linked from.
TARGET=main
OBJECTS=obj/main.o obj/model.o obj/tensor.o obj/layer.o
.PHONY: all

# Default goal: build the final executable.
all: $(TARGET)

# The object directory must exist before any object is compiled. It is an
# order-only prerequisite (after the '|') so that running create_obj never
# marks the objects, and therefore $(TARGET), as out of date.
$(OBJECTS): | create_obj

# Link all objects into the executable. The C++ driver is used because the
# objects are compiled with $(CXX); $(TARGET) is relinked only when an object
# file is newer than it.
$(TARGET): $(OBJECTS)
	$(CXX) $(CFLAGS) -o $(TARGET) $(OBJECTS) $(LDFLAGS) $(LDLIBS)
# Compile a host C++ source file from src/ into the matching object in obj/.
# $< (the first prerequisite, i.e. the source file) is passed to the compiler
# so that any prerequisites added later, such as headers, are not compiled.
obj/%.o: src/%.cpp
	$(CXX) $(CFLAGS) -c -o $@ $<

# Compile a CUDA source file from src/ into the matching object in obj/ using
# the CUDA compiler driver and its own flag set.
obj/%.o: src/%.cu
	$(CUX) $(CUDA_CFLAGS) -c -o $@ $<
# Remove the linked executable and the object files.
# Declared phony so a file named "clean" cannot make this target look up to date.
.PHONY: clean
clean:
	rm -rf $(TARGET) $(OBJECTS)
# Execute the project's run.sh script with sh.
# Declared phony so a file named "run" cannot make this target look up to date.
.PHONY: run
run:
	sh ./run.sh
# Create the obj/ output directory; -p makes this a no-op when it already exists.
# Declared phony because the recipe creates obj/, not a file named "create_obj".
.PHONY: create_obj
create_obj:
	mkdir -p obj