Skip to content

Commit 596277b

Browse files
Move headers for unittest with llm.c to unittest_llmc directory
1 parent 05eede8 commit 596277b

3 files changed

Lines changed: 8 additions & 7 deletions

File tree

experimental/kernels/Makefile

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -11,8 +11,8 @@ else
1111
STDLIB := -stdlib=libc++
1212
endif
1313

14-
CXXFLAGS=-std=c++17 -I$(GPUCPP) -I$(GPUCPP)/third_party/headers
15-
CFLAGS=-Ofast -march=native -I.
14+
CXXFLAGS=-std=c++17 -I$(GPUCPP) -I$(GPUCPP)/third_party/headers -I. -Iunittest_llmc
15+
CFLAGS=-Ofast -march=native -I. -Iunittest_llmc
1616

1717
LDFLAGS=$(STDLIB) -L$(GPUCPP)/third_party/lib -ldl -ldawn
1818
FLAGS=$(CXXFLAGS) $(LDFLAGS)
@@ -39,7 +39,7 @@ gpt2_124M.bin: llm.c
3939
ln -s ./llm.c/gpt2_124M_debug_state.bin ; \
4040
fi
4141

42-
build/test_gpt2: llm.c build/kernels_c.o gpt2_124M.bin
42+
build/test_gpt2: llm.c build/unittest_kernels.o gpt2_124M.bin
4343
mkdir -p build
4444
sed -i -e 's/void encoder_forward(/void ENCODER_FORWARD_CPU(/g' llm.c/train_gpt2.c
4545
sed -i -e 's/void layernorm_forward(/void LAYERNORM_FORWARD_CPU(/g' llm.c/train_gpt2.c
@@ -56,10 +56,10 @@ build/test_gpt2: llm.c build/kernels_c.o gpt2_124M.bin
5656
sed -i -e 's/void gelu_backward(/void GELU_BACKWARD_CPU(/g' llm.c/train_gpt2.c
5757
sed -i -e 's/void residual_backward(/void RESIDUAL_BACKWARD_CPU(/g' llm.c/train_gpt2.c
5858
sed -i -e 's/void crossentropy_softmax_backward(/void CROSSENTROPY_SOFTMAX_BACKWARD_CPU(/g' llm.c/train_gpt2.c
59-
grep -q "^#include \"kernels_c.h\"" llm.c/train_gpt2.c || sed -i '1i#include \"kernels_c.h\"' llm.c/train_gpt2.c
60-
$(CC) $(CFLAGS) $(LDFLAGS) -o $@ llm.c/test_gpt2.c build/kernels_c.o
59+
grep -q "^#include \"unittest_kernels.h\"" llm.c/train_gpt2.c || sed -i '1i#include \"unittest_kernels.h\"' llm.c/train_gpt2.c
60+
$(CC) $(CFLAGS) $(LDFLAGS) -o $@ llm.c/test_gpt2.c build/unittest_kernels.o
6161

62-
build/kernels_c.o: kernels_c.cpp kernels_c.h kernels.h
62+
build/unittest_kernels.o: unittest_llmc/unittest_kernels.cpp unittest_llmc/unittest_kernels.h kernels.h
6363
mkdir -p build && $(CXX) $(CXXFLAGS) -DNDEBUG -c -o $@ $<
6464

6565
dawnlib: $(if $(wildcard $(GPUCPP)/third_party/lib/libdawn.so $(GPUCPP)/third_party/lib/libdawn.dylib),,run_setup)

experimental/kernels/kernels_c.cpp renamed to experimental/kernels/unittest_llmc/unittest_kernels.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
#include <future>
55

66
#include "kernels.h"
7-
#include "kernels_c.h"
7+
#include "unittest_llmc/unittest_kernels.h"
88

99
using namespace gpu; // createContext, createTensor, createKernel,
1010
// createShader, dispatchKernel, wait, toCPU

experimental/kernels/kernels_c.h renamed to experimental/kernels/unittest_llmc/unittest_kernels.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@ extern "C" {
99
#define USE_GPU_FOR_LAYERNORM_FORWARD 1
1010
// -- Note: atomicAdd should be used with i32 or u32 not f32.
1111
// #define USE_GPU_FOR_LAYERNORM_BACKWARD 1
12+
// -- Note: matmul_forward kernel works, but it is too slow.
1213
#define USE_GPU_FOR_MATMUL_FORWARD 1
1314
// #define USE_GPU_FOR_MATMUL_BACKWARD 1
1415
#define USE_GPU_FOR_ATTENTION_FORWARD 1

0 commit comments

Comments (0)