# Mirror of https://github.com/kvcache-ai/ktransformers.git
# Synced 2026-04-20 14:29:22 +00:00
# Makefile (36 lines, 1.4 KiB)
# Compiler and linker settings used by the recipes in this file.
#
# Disabled alternative configuration, kept for reference (hwloc via pkg-config
# plus the KunpengHPCKit KML include path and -lkml_rt on aarch64):
#   CFLAGS += $(shell pkg-config --cflags hwloc)
#   CFLAGS += -march=armv8.2-a+fp16+dotprod+sve+bf16 -I/home/test/kt-code/HPCKit_25.0.0_Linux-aarch64/package/KunpengHPCKit-kml.25.0.0/include
#   LDLIBS += $(shell pkg-config --libs hwloc) -lkml_rt

# -O3, the BLIS headers under /usr/local/include/blis/, and OpenMP.
CFLAGS += -O3 -I/usr/local/include/blis/ -fopenmp

# Link against libblis from /usr/local/lib.
LDLIBS += -L/usr/local/lib -lblis

# C++ compiler invoked by every build recipe.
CXX := /usr/bin/g++
# i8_cal: i8_cal.cpp
# 	$(CXX) i8_cal.cpp $(CFLAGS) -o i8_cal $(LDLIBS)
# run: i8_cal
# 	./i8_cal
# Compile simple_test.cpp into ./simple_test, removing any previous binary first.
# The target name is a command alias (no file called simple_test_build is
# produced), so it is declared phony to keep a stray file of that name from
# masking the rule.
# NOTE(review): BLAS_NUM_THREADS=1 is set only in the environment of the
# compiler invocation, not of later runs of ./simple_test -- confirm intent.
.PHONY: simple_test_build
simple_test_build: simple_test.cpp
	rm -f simple_test
	BLAS_NUM_THREADS=1 $(CXX) $< $(CFLAGS) -o simple_test $(LDLIBS)
# Compile simple_test_aocl.cpp into build/simple_test_aocl.
# The build/ directory is an order-only prerequisite: it must exist before the
# compiler writes into it, but its timestamp is irrelevant to this rule.
# Declared phony because the target name is not a file the recipe creates.
.PHONY: simple_aocl_build
simple_aocl_build: simple_test_aocl.cpp | build
	$(CXX) $< $(CFLAGS) -o build/simple_test_aocl $(LDLIBS)
# Compile fp16-test.cpp into ./fp16-test, removing any previous binary first.
# Declared phony because the target name is a command alias, not a file the
# recipe creates.
.PHONY: fp16_test_build
fp16_test_build: fp16-test.cpp
	rm -f fp16-test
	$(CXX) $< $(CFLAGS) -o fp16-test $(LDLIBS)
# Compile bf16-test.cpp into ./bf16-test, removing any previous binary first.
# Declared phony because the target name is a command alias, not a file the
# recipe creates.
.PHONY: bf16_test_build
bf16_test_build: bf16-test.cpp
	rm -f bf16-test
	$(CXX) $< $(CFLAGS) -o bf16-test $(LDLIBS)
# Create the build/ output directory that recipes writing to build/... rely on.
# This is a real directory target, so it is not phony, and it must not list
# itself as a prerequisite: a self-dependency is circular and GNU Make drops it
# with a warning on every invocation.
build:
	mkdir -p $@
# Compile bench_reorder_bandwidth.cpp into build/bench_reorder_bandwidth.
# The build/ directory is an order-only prerequisite so the output path exists
# on a clean tree; without it the compiler fails to write the binary.
# Declared phony because the target name is not a file the recipe creates.
.PHONY: bandwidth_build
bandwidth_build: bench_reorder_bandwidth.cpp | build
	$(CXX) $< $(CFLAGS) -o build/bench_reorder_bandwidth $(LDLIBS)
# Build (via simple_aocl_build) and then execute build/simple_test_aocl.
# /usr/local/lib is prepended to the shell's LD_LIBRARY_PATH for that one
# command; `$$` passes a literal `$` through Make to the shell.
# Declared phony: `run` is a command, and a file named `run` must not mask it.
.PHONY: run
run: simple_aocl_build
	LD_LIBRARY_PATH=/usr/local/lib:$$LD_LIBRARY_PATH ./build/simple_test_aocl
# Build (via bandwidth_build) and then execute build/bench_reorder_bandwidth.
# /usr/local/lib is prepended to the shell's LD_LIBRARY_PATH for that one
# command; `$$` passes a literal `$` through Make to the shell.
# Declared phony: the target is a command, not a file the recipe creates.
.PHONY: run_bandwidth
run_bandwidth: bandwidth_build
	LD_LIBRARY_PATH=/usr/local/lib:$$LD_LIBRARY_PATH ./build/bench_reorder_bandwidth