2023-04-30 17:51:57 +02:00
# Convenience goal: builds the main CLI together with the bench and quantize
# tools. It is the first rule visible in this file, so it is what a plain
# `make` resolves to. Declared phony so that a stray file named "default" in
# the source tree can never make this goal look up to date.
.PHONY: default
default: main bench quantize
2023-04-30 11:14:33 +02:00
2022-11-02 07:46:49 +01:00
# Host identification. Each value is probed with uname only when the caller has
# not already supplied a non-empty one (environment or command line).

# Kernel / OS name
ifndef UNAME_S
  UNAME_S := $(shell uname -s)
endif

# Processor type
ifndef UNAME_P
  UNAME_P := $(shell uname -p)
endif

# Machine hardware name
ifndef UNAME_M
  UNAME_M := $(shell uname -m)
endif
2022-10-05 19:41:35 +02:00
2023-01-02 12:35:26 +01:00
# First line of each compiler's `--version` output; captured once at parse time
# and shown in the build-information banner.
CCV  := $(shell $(CC) --version | head -n 1)
CXXV := $(shell $(CXX) --version | head -n 1)
2022-10-19 01:01:53 +02:00
# Mac OS + Arm can report x86_64
# ref: https://github.com/ggerganov/whisper.cpp/issues/66#issuecomment-1282546789
#
# When uname does not report an "arm" processor on Darwin, ask sysctl whether
# the hardware is actually ARM64 and, if so, warn the user. The values are only
# reported, not corrected: the overrides below are left commented out.
ifeq ($(UNAME_S),Darwin)
  ifneq ($(UNAME_P),arm)
    # stderr is discarded so that a host without this sysctl key does not
    # print an error on every make invocation; SYSCTL_M is then empty.
    SYSCTL_M := $(shell sysctl -n hw.optional.arm64 2>/dev/null)
    ifeq ($(SYSCTL_M),1)
      # UNAME_P := arm
      # UNAME_M := arm64
      warn := $(warning Your arch is announced as x86_64, but it seems to actually be ARM64. Not fixing that can lead to bad performance. For more info see: https://github.com/ggerganov/whisper.cpp/issues/66\#issuecomment-1282546789)
    endif
  endif
endif
2022-10-05 19:41:35 +02:00
#
# Compile flags
#

# Baseline flags; the OS-, architecture- and feature-specific sections that
# follow append to these with `+=`.
CFLAGS   = -I. -O3 -DNDEBUG -std=c11 -fPIC
CXXFLAGS = -I. -I./examples -O3 -DNDEBUG -std=c++11 -fPIC
LDFLAGS  =
2022-10-05 19:41:35 +02:00
2023-03-22 19:51:42 +01:00
# ref: https://github.com/ggerganov/whisper.cpp/issues/37
# If anything exists under /usr/include/musl, add the POSIX/GNU feature-test
# macros to both the C and C++ flags.
ifneq ($(wildcard /usr/include/musl/*),)
  CFLAGS   += -D_POSIX_SOURCE -D_GNU_SOURCE
  CXXFLAGS += -D_POSIX_SOURCE -D_GNU_SOURCE
endif
2022-10-05 19:41:35 +02:00
# OS specific
# TODO: support Windows
#
# Linux, Darwin, FreeBSD and Haiku all receive the same threading flag, so the
# supported systems are matched with a single filter.
ifneq ($(filter Linux Darwin FreeBSD Haiku,$(UNAME_S)),)
  CFLAGS   += -pthread
  CXXFLAGS += -pthread
endif
2022-10-05 19:41:35 +02:00
# Architecture specific
# TODO: probably these flags need to be tweaked on some architectures
#       feel free to update the Makefile for your architecture and send a pull request or issue
#
# x86_64 / i686: add SIMD options to CFLAGS according to what the host reports.
#   Darwin : -mf16c always; FMA / AVX / AVX2 probed through sysctl
#   Linux  : probed through /proc/cpuinfo
#   Haiku  : probed through `sysinfo -cpu`
#   other  : all of -mfma -mf16c -mavx -mavx2 are assumed
# On Linux and Haiku, -mavx is only considered when F16C was detected.
ifeq ($(UNAME_M),$(filter $(UNAME_M),x86_64 i686))
  ifeq ($(UNAME_S),Darwin)
    CFLAGS += -mf16c
    AVX1_M := $(shell sysctl machdep.cpu.features)
    ifneq (,$(findstring FMA,$(AVX1_M)))
      CFLAGS += -mfma
    endif
    ifneq (,$(findstring AVX1.0,$(AVX1_M)))
      CFLAGS += -mavx
    endif
    AVX2_M := $(shell sysctl machdep.cpu.leaf7_features)
    ifneq (,$(findstring AVX2,$(AVX2_M)))
      CFLAGS += -mavx2
    endif
  else ifeq ($(UNAME_S),Linux)
    AVX2_M := $(shell grep "avx2 " /proc/cpuinfo)
    ifneq (,$(findstring avx2,$(AVX2_M)))
      CFLAGS += -mavx2
    endif
    FMA_M := $(shell grep "fma " /proc/cpuinfo)
    ifneq (,$(findstring fma,$(FMA_M)))
      CFLAGS += -mfma
    endif
    F16C_M := $(shell grep "f16c " /proc/cpuinfo)
    ifneq (,$(findstring f16c,$(F16C_M)))
      CFLAGS += -mf16c

      AVX1_M := $(shell grep "avx " /proc/cpuinfo)
      ifneq (,$(findstring avx,$(AVX1_M)))
        CFLAGS += -mavx
      endif
    endif
    SSE3_M := $(shell grep "sse3 " /proc/cpuinfo)
    ifneq (,$(findstring sse3,$(SSE3_M)))
      CFLAGS += -msse3
    endif
  else ifeq ($(UNAME_S),Haiku)
    # The grep patterns here are upper-case, and findstring is case-sensitive,
    # so the needles must be upper-case as well. With lower-case needles none
    # of these flags was ever enabled on Haiku.
    AVX2_M := $(shell sysinfo -cpu | grep "AVX2 ")
    ifneq (,$(findstring AVX2,$(AVX2_M)))
      CFLAGS += -mavx2
    endif
    FMA_M := $(shell sysinfo -cpu | grep "FMA ")
    ifneq (,$(findstring FMA,$(FMA_M)))
      CFLAGS += -mfma
    endif
    F16C_M := $(shell sysinfo -cpu | grep "F16C ")
    ifneq (,$(findstring F16C,$(F16C_M)))
      CFLAGS += -mf16c

      AVX1_M := $(shell sysinfo -cpu | grep "AVX ")
      ifneq (,$(findstring AVX,$(AVX1_M)))
        CFLAGS += -mavx
      endif
    endif
  else
    CFLAGS += -mfma -mf16c -mavx -mavx2
  endif
endif
2022-10-17 17:09:17 +02:00
# Hosts whose machine name is reported as "amd64": no probing, the full
# AVX/AVX2/FMA/F16C set is enabled.
ifeq ($(UNAME_M),amd64)
  CFLAGS += -mavx -mavx2 -mfma -mf16c
endif
2023-04-29 09:55:24 +02:00
2023-01-23 19:48:10 +01:00
# PowerPC 64 (any machine name starting with "ppc64")
ifneq (,$(filter ppc64%,$(UNAME_M)))
  # Enable POWER9 vector instructions when /proc/cpuinfo mentions POWER9.
  POWER9_M := $(shell grep "POWER9" /proc/cpuinfo)
  ifneq ($(findstring POWER9,$(POWER9_M)),)
    CFLAGS += -mpower9-vector
  endif

  # Require c++23's std::byteswap for big-endian support.
  # Applied only when the machine name is exactly "ppc64".
  ifeq (ppc64,$(UNAME_M))
    CXXFLAGS += -std=c++23 -DGGML_BIG_ENDIAN
  endif
endif
2023-04-29 09:55:24 +02:00
2022-11-02 17:00:19 +01:00
# Apple Accelerate framework: used on every Darwin host unless the caller opts
# out by defining WHISPER_NO_ACCELERATE.
ifndef WHISPER_NO_ACCELERATE
  ifeq ($(UNAME_S),Darwin)
    CFLAGS  += -DGGML_USE_ACCELERATE
    LDFLAGS += -framework Accelerate
  endif
endif
2023-04-29 09:55:24 +02:00
2023-04-15 12:21:27 +02:00
# Optional Core ML support, enabled by defining WHISPER_COREML.
# WHISPER_COREML_ALLOW_FALLBACK is only looked at when Core ML is enabled and
# adds one more preprocessor define.
ifdef WHISPER_COREML
  CXXFLAGS += -DWHISPER_USE_COREML
  LDFLAGS  += -framework Foundation -framework CoreML

  ifdef WHISPER_COREML_ALLOW_FALLBACK
    CXXFLAGS += -DWHISPER_COREML_ALLOW_FALLBACK
  endif
endif
2023-04-29 09:55:24 +02:00
2022-11-23 12:23:35 +01:00
# Optional OpenBLAS backend, enabled by defining WHISPER_OPENBLAS.
# Headers are expected under /usr/local/include/openblas.
ifdef WHISPER_OPENBLAS
  CFLAGS  += -DGGML_USE_OPENBLAS -I/usr/local/include/openblas
  LDFLAGS += -lopenblas
endif
2023-04-29 09:55:24 +02:00
2023-04-30 11:14:33 +02:00
# Optional cuBLAS backend, enabled by defining WHISPER_CUBLAS.
#
# Adds the CUDA include/library search paths, links the CUDA runtime and
# cuBLAS, and registers ggml-cuda.o as part of the library objects.
#
# Tunables (all overridable from the command line or environment):
#   NVCC            CUDA compiler driver (default: nvcc)
#   CUDA_ARCH_FLAG  value passed to nvcc's -arch option (default: any)
#   CUDA_PATH       CUDA install prefix used for the targets/<arch>-linux paths
#
# NOTE(review): CUDA_PATH is not assigned anywhere in the visible file; when it
# is unset the targets/... search paths start at "/".
# NOTE(review): confirm that the installed nvcc accepts "-arch=any"; otherwise
# pass e.g. CUDA_ARCH_FLAG=native or CUDA_ARCH_FLAG=all.
ifdef WHISPER_CUBLAS
  CFLAGS      += -DGGML_USE_CUBLAS -I/usr/local/cuda/include -I/opt/cuda/include -I$(CUDA_PATH)/targets/$(UNAME_M)-linux/include
  CXXFLAGS    += -DGGML_USE_CUBLAS -I/usr/local/cuda/include -I/opt/cuda/include -I$(CUDA_PATH)/targets/$(UNAME_M)-linux/include
  LDFLAGS     += -lcublas -lculibos -lcudart -lcublasLt -lpthread -ldl -lrt -L/usr/local/cuda/lib64 -L/opt/cuda/lib64 -L$(CUDA_PATH)/targets/$(UNAME_M)-linux/lib
  WHISPER_OBJ += ggml-cuda.o
  NVCC         = nvcc
  CUDA_ARCH_FLAG ?= any
  NVCCFLAGS    = --forward-unknown-to-host-compiler -arch=$(CUDA_ARCH_FLAG)

# The host-compiler flags in CXXFLAGS are forwarded through nvcc.
ggml-cuda.o: ggml-cuda.cu ggml-cuda.h
	$(NVCC) $(NVCCFLAGS) $(CXXFLAGS) -Wno-pedantic -c $< -o $@
endif
2023-05-02 21:50:32 +02:00
# Optional CLBlast (OpenCL) backend, enabled by defining WHISPER_CLBLAST.
# Only CFLAGS receives the preprocessor define; ggml-opencl.o joins the library
# objects.
ifdef WHISPER_CLBLAST
  CFLAGS      += -DGGML_USE_CLBLAST
  LDFLAGS     += -lclblast -lOpenCL
  WHISPER_OBJ += ggml-opencl.o

ggml-opencl.o: ggml-opencl.c ggml-opencl.h
	$(CC) $(CFLAGS) -o $@ -c $<
endif
2022-11-23 13:31:05 +01:00
# Profiling build: define WHISPER_GPROF to compile C and C++ sources with -pg.
ifdef WHISPER_GPROF
  CFLAGS   += -pg
  CXXFLAGS += -pg
endif
2023-04-29 09:55:24 +02:00
2022-10-08 16:35:55 +02:00
# 64-bit ARM (machine name starting with "aarch64"): tune for the build host.
ifneq (,$(filter aarch64%,$(UNAME_M)))
  CFLAGS   += -mcpu=native
  CXXFLAGS += -mcpu=native
endif
2023-04-29 09:55:24 +02:00
2022-10-08 16:35:55 +02:00
# ARMv6 (machine name starting with "armv6"); only CFLAGS is extended here.
ifneq (,$(filter armv6%,$(UNAME_M)))
  # 32-bit Raspberry Pi 1, 2, 3
  CFLAGS += -mfpu=neon -mfp16-format=ieee -mno-unaligned-access
endif
2023-04-29 09:55:24 +02:00
2022-10-05 20:34:41 +02:00
# ARMv7 (machine name starting with "armv7"). Two flag sets exist; the plain
# NEON one is kept below as a commented-out alternative and the armv8 FPU
# variant is the one in effect.
ifneq (,$(filter armv7%,$(UNAME_M)))
  # 32-bit ARM, for example on Armbian or possibly raspbian
  #CFLAGS   += -mfpu=neon -mfp16-format=ieee -funsafe-math-optimizations -mno-unaligned-access
  #CXXFLAGS += -mfpu=neon -mfp16-format=ieee -funsafe-math-optimizations -mno-unaligned-access

  # 64-bit ARM on 32-bit OS, use these (TODO: auto-detect 64-bit)
  CFLAGS   += -mfpu=neon-fp-armv8 -mfp16-format=ieee -funsafe-math-optimizations -mno-unaligned-access
  CXXFLAGS += -mfpu=neon-fp-armv8 -mfp16-format=ieee -funsafe-math-optimizations -mno-unaligned-access
endif
2023-04-29 09:55:24 +02:00
2022-10-05 20:34:41 +02:00
# ARMv8 reported by a 32-bit userland (machine name starting with "armv8").
ifneq (,$(filter armv8%,$(UNAME_M)))
  # Raspberry Pi 4
  CFLAGS   += -mfpu=neon-fp-armv8 -mfp16-format=ieee -funsafe-math-optimizations -mno-unaligned-access
  CXXFLAGS += -mfpu=neon-fp-armv8 -mfp16-format=ieee -funsafe-math-optimizations -mno-unaligned-access
endif
2023-01-02 12:35:26 +01:00
#
# Print build information
#

# $(info ...) runs while the makefile is being read, so this banner is printed
# on every invocation, before any target is built. The trailing empty $(info )
# emits a blank separator line.
$(info I whisper.cpp build info: )
$(info I UNAME_S:  $(UNAME_S))
$(info I UNAME_P:  $(UNAME_P))
$(info I UNAME_M:  $(UNAME_M))
$(info I CFLAGS:   $(CFLAGS))
$(info I CXXFLAGS: $(CXXFLAGS))
$(info I LDFLAGS:  $(LDFLAGS))
$(info I CC:       $(CCV))
$(info I CXX:      $(CXXV))
$(info )
2022-10-05 19:41:35 +02:00
#
# Build library
#

# C core. ggml-cuda.h is a prerequisite regardless of whether cuBLAS is
# enabled, so touching that header always rebuilds this object.
ggml.o: ggml.c ggml.h ggml-cuda.h
	$(CC) $(CFLAGS) -o $@ -c $<

# C++ front end; only the first prerequisite (the .cpp) is compiled, the
# headers are listed purely for rebuild tracking.
whisper.o: whisper.cpp whisper.h ggml.h ggml-cuda.h
	$(CXX) $(CXXFLAGS) -o $@ -c $<
2022-10-04 19:35:01 +02:00
2023-04-15 12:21:27 +02:00
# whisper.o is part of the library in every configuration; the two Core ML
# encoder objects are appended after it only when WHISPER_COREML is defined.
WHISPER_OBJ += whisper.o

ifdef WHISPER_COREML
# Both Core ML sources are compiled with $(CXX) and a fixed flag set
# (-O3 -I . -fobjc-arc); CXXFLAGS is not applied to them.
whisper-encoder.o: coreml/whisper-encoder.mm coreml/whisper-encoder.h
	$(CXX) -O3 -I . -fobjc-arc -c $< -o $@

whisper-encoder-impl.o: coreml/whisper-encoder-impl.m coreml/whisper-encoder-impl.h
	$(CXX) -O3 -I . -fobjc-arc -c $< -o $@

WHISPER_OBJ += whisper-encoder.o whisper-encoder-impl.o
endif
# Static library: archive ggml.o together with every object in WHISPER_OBJ.
libwhisper.a: ggml.o $(WHISPER_OBJ)
	$(AR) rcs $@ $^

# Shared library built from the same objects; LDFLAGS goes last on the line.
libwhisper.so: ggml.o $(WHISPER_OBJ)
	$(CXX) $(CXXFLAGS) -shared -o $@ $^ $(LDFLAGS)
2022-11-13 08:08:33 +01:00
2022-09-25 20:23:15 +02:00
# Remove every object file, the example binaries and both library flavours.
# Declared phony so the recipe still runs when a file named "clean" exists in
# the source tree; without the declaration make would consider the target up
# to date and do nothing.
.PHONY: clean
clean:
	rm -f *.o main stream command talk talk-llama bench quantize libwhisper.a libwhisper.so
2022-09-25 20:23:15 +02:00
2022-10-05 19:41:35 +02:00
#
# Examples
#

# SDL2 compile and link flags. The backticks are kept literal in the variable,
# so sdl2-config is run by the shell only when a recipe that uses $(CC_SDL)
# executes, not while the makefile is parsed.
CC_SDL = `sdl2-config --cflags --libs`

# Helper sources compiled directly into the example binaries.
SRC_COMMON     = examples/common.cpp examples/common-ggml.cpp
SRC_COMMON_SDL = examples/common-sdl.cpp
2023-04-15 12:21:27 +02:00
# Main command-line tool. Sources and objects are handed to the compiler in
# prerequisite order; once linked, the binary is run with -h.
main: examples/main/main.cpp $(SRC_COMMON) ggml.o $(WHISPER_OBJ)
	$(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
	./main -h
2023-04-15 12:21:27 +02:00
# Benchmark tool; built without the shared example helper sources.
bench: examples/bench/bench.cpp ggml.o $(WHISPER_OBJ)
	$(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
2023-03-27 20:00:32 +02:00
2023-04-30 17:51:57 +02:00
# Model quantization tool. The prerequisites are listed in the order the
# original command line passed them to the compiler, so $^ reproduces it.
quantize: examples/quantize/quantize.cpp $(SRC_COMMON) ggml.o $(WHISPER_OBJ)
	$(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
2023-04-15 12:21:27 +02:00
# SDL-based example; $(CC_SDL) supplies the SDL2 compile/link flags.
stream: examples/stream/stream.cpp $(SRC_COMMON) $(SRC_COMMON_SDL) ggml.o $(WHISPER_OBJ)
	$(CXX) $(CXXFLAGS) $^ -o $@ $(CC_SDL) $(LDFLAGS)
2022-10-25 18:13:08 +02:00
2023-04-15 12:21:27 +02:00
# SDL-based example; $(CC_SDL) supplies the SDL2 compile/link flags.
command: examples/command/command.cpp $(SRC_COMMON) $(SRC_COMMON_SDL) ggml.o $(WHISPER_OBJ)
	$(CXX) $(CXXFLAGS) $^ -o $@ $(CC_SDL) $(LDFLAGS)
2022-11-25 18:06:56 +01:00
2023-04-15 12:21:27 +02:00
# SDL-based example that additionally compiles the bundled gpt-2.cpp source.
talk: examples/talk/talk.cpp examples/talk/gpt-2.cpp $(SRC_COMMON) $(SRC_COMMON_SDL) ggml.o $(WHISPER_OBJ)
	$(CXX) $(CXXFLAGS) $^ -o $@ $(CC_SDL) $(LDFLAGS)
2022-12-09 19:38:10 +01:00
2023-04-15 12:21:27 +02:00
# SDL-based example that additionally compiles the bundled llama.cpp source.
talk-llama: examples/talk-llama/talk-llama.cpp examples/talk-llama/llama.cpp $(SRC_COMMON) $(SRC_COMMON_SDL) ggml.o $(WHISPER_OBJ)
	$(CXX) $(CXXFLAGS) $^ -o $@ $(CC_SDL) $(LDFLAGS)
2022-10-05 19:41:35 +02:00
#
# Audio samples
#

# Download a few audio samples into the folder "./samples" and convert each of
# them to 16 kHz, mono, 16-bit PCM WAV. Requires wget and ffmpeg.
# mm1.wav is only a temporary download: it is converted to mm0.wav and removed.
.PHONY: samples
samples:
	@echo "Downloading samples..."
	@mkdir -p samples
	@wget --quiet --show-progress -O samples/gb0.ogg https://upload.wikimedia.org/wikipedia/commons/2/22/George_W._Bush%27s_weekly_radio_address_%28November_1%2C_2008%29.oga
	@wget --quiet --show-progress -O samples/gb1.ogg https://upload.wikimedia.org/wikipedia/commons/1/1f/George_W_Bush_Columbia_FINAL.ogg
	@wget --quiet --show-progress -O samples/hp0.ogg https://upload.wikimedia.org/wikipedia/en/d/d4/En.henryfphillips.ogg
	@wget --quiet --show-progress -O samples/mm1.wav https://cdn.openai.com/whisper/draft-20220913a/micro-machines.wav
	@echo "Converting to 16-bit WAV ..."
	@ffmpeg -loglevel -0 -y -i samples/gb0.ogg -ar 16000 -ac 1 -c:a pcm_s16le samples/gb0.wav
	@ffmpeg -loglevel -0 -y -i samples/gb1.ogg -ar 16000 -ac 1 -c:a pcm_s16le samples/gb1.wav
	@ffmpeg -loglevel -0 -y -i samples/hp0.ogg -ar 16000 -ac 1 -c:a pcm_s16le samples/hp0.wav
	@ffmpeg -loglevel -0 -y -i samples/mm1.wav -ar 16000 -ac 1 -c:a pcm_s16le samples/mm0.wav
	@rm samples/mm1.wav
2022-09-25 20:23:15 +02:00
2022-10-05 19:41:35 +02:00
#
# Models
#

# Each target below is named after a model. Building one calls the download
# script with that name and then runs ./main with the model on every WAV file
# in the folder "./samples". The targets are commands rather than files, hence
# phony; all of them need the main binary first.
.PHONY: tiny.en tiny base.en base small.en small medium.en medium large-v1 large

tiny.en tiny base.en base small.en small medium.en medium large-v1 large: main
	bash ./models/download-ggml-model.sh $@
	@echo ""
	@echo "==============================================="
	@echo "Running $@ on all samples in ./samples ..."
	@echo "==============================================="
	@echo ""
	@for f in samples/*.wav; do \
		echo "----------------------------------------------" ; \
		echo "[+] Running $@ on $$f ... (run 'ffplay $$f' to listen)" ; \
		echo "----------------------------------------------" ; \
		echo "" ; \
		./main -m models/ggml-$@.bin -f $$f ; \
		echo "" ; \
	done
2022-11-28 21:44:01 +01:00
#
# Tests
#

# Delegates to the test driver script; phony because no file named "tests" is
# produced by the recipe.
.PHONY: tests
tests:
	bash ./tests/run-tests.sh