mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2025-01-24 14:58:43 +01:00
Initial C-style interface for whisper.cpp
This commit is contained in:
parent
be8ba034f6
commit
6b77124e01
9
Makefile
9
Makefile
@ -1,17 +1,20 @@
|
||||
CC_SDL=`sdl2-config --cflags --libs`
|
||||
|
||||
main: ggml.o main.o
|
||||
g++ -pthread -o main ggml.o main.o
|
||||
main: ggml.o whisper.o main.o
|
||||
g++ -pthread -o main ggml.o whisper.o main.o
|
||||
./main -h
|
||||
|
||||
ggml.o: ggml.c ggml.h
|
||||
gcc -pthread -O3 -mavx -mavx2 -mfma -mf16c -c ggml.c
|
||||
|
||||
whisper.o: whisper.cpp whisper.h
|
||||
gcc -pthread -O3 -std=c++11 -c whisper.cpp
|
||||
|
||||
main.o: main.cpp ggml.h
|
||||
g++ -pthread -O3 -std=c++11 -c main.cpp
|
||||
|
||||
stream: stream.cpp
|
||||
g++ -pthread -O3 -std=c++11 -o stream stream.cpp ggml.o $(CC_SDL)
|
||||
g++ -pthread -O3 -std=c++11 -o stream stream.cpp ggml.o whisper.o $(CC_SDL)
|
||||
|
||||
# clean up the directory
|
||||
clean:
|
||||
|
2203
stream.cpp
2203
stream.cpp
File diff suppressed because it is too large
Load Diff
2221
whisper.cpp
Normal file
2221
whisper.cpp
Normal file
File diff suppressed because it is too large
Load Diff
133
whisper.h
Normal file
133
whisper.h
Normal file
@ -0,0 +1,133 @@
|
||||
#ifndef WHISPER_H
|
||||
#define WHISPER_H
|
||||
|
||||
#ifdef WHISPER_SHARED
|
||||
# ifdef _WIN32
|
||||
# ifdef WHISPER_BUILD
|
||||
# define WHISPER_API __declspec(dllexport)
|
||||
# else
|
||||
# define WHISPER_API __declspec(dllimport)
|
||||
# endif
|
||||
# else
|
||||
# define WHISPER_API __attribute__ ((visibility ("default")))
|
||||
# endif
|
||||
#else
|
||||
# define WHISPER_API
|
||||
#endif
|
||||
|
||||
#ifdef __cplusplus
|
||||
extern "C" {
|
||||
#endif
|
||||
|
||||
//
|
||||
// C interface
|
||||
//
|
||||
|
||||
#define SAMPLE_RATE 16000
|
||||
#define N_FFT 400
|
||||
#define N_MEL 80
|
||||
#define HOP_LENGTH 160
|
||||
#define CHUNK_SIZE 30
|
||||
|
||||
// TODO: documentation will come soon
|
||||
|
||||
struct whisper_context;
|
||||
|
||||
typedef int whisper_token;
|
||||
|
||||
WHISPER_API struct whisper_context * whisper_init(const char * path_model);
|
||||
WHISPER_API void whisper_free(struct whisper_context * ctx);
|
||||
|
||||
WHISPER_API int whisper_pcm_to_mel(
|
||||
struct whisper_context * ctx,
|
||||
const float * samples,
|
||||
int n_samples,
|
||||
int n_threads);
|
||||
|
||||
// n_mel must be 80
|
||||
WHISPER_API int whisper_set_mel(
|
||||
struct whisper_context * ctx,
|
||||
const float * data,
|
||||
int n_len,
|
||||
int n_mel);
|
||||
|
||||
WHISPER_API int whisper_encode(
|
||||
struct whisper_context * ctx,
|
||||
int offset,
|
||||
int n_threads);
|
||||
|
||||
WHISPER_API int whisper_decode(
|
||||
struct whisper_context * ctx,
|
||||
const whisper_token * tokens,
|
||||
int n_tokens,
|
||||
int n_past,
|
||||
int n_threads);
|
||||
|
||||
WHISPER_API whisper_token whisper_sample_best(struct whisper_context * ctx, bool need_timestamp);
|
||||
WHISPER_API whisper_token whisper_sample_timestamp(struct whisper_context * ctx);
|
||||
|
||||
// return the id of the specified language, returns -1 if not found
|
||||
WHISPER_API int whisper_lang_id(const char * lang);
|
||||
|
||||
WHISPER_API int whisper_n_len (struct whisper_context * ctx); // mel length
|
||||
WHISPER_API int whisper_n_vocab (struct whisper_context * ctx);
|
||||
WHISPER_API int whisper_n_text_ctx (struct whisper_context * ctx);
|
||||
WHISPER_API int whisper_is_multilingual(struct whisper_context * ctx);
|
||||
WHISPER_API float * whisper_get_probs (struct whisper_context * ctx);
|
||||
|
||||
WHISPER_API const char * whisper_token_to_str(struct whisper_context * ctx, whisper_token token);
|
||||
|
||||
WHISPER_API whisper_token whisper_token_eot (struct whisper_context * ctx);
|
||||
WHISPER_API whisper_token whisper_token_sot (struct whisper_context * ctx);
|
||||
WHISPER_API whisper_token whisper_token_prev(struct whisper_context * ctx);
|
||||
WHISPER_API whisper_token whisper_token_solm(struct whisper_context * ctx);
|
||||
WHISPER_API whisper_token whisper_token_not (struct whisper_context * ctx);
|
||||
WHISPER_API whisper_token whisper_token_beg (struct whisper_context * ctx);
|
||||
|
||||
WHISPER_API whisper_token whisper_token_translate ();
|
||||
WHISPER_API whisper_token whisper_token_transcribe();
|
||||
|
||||
WHISPER_API void whisper_print_timings(struct whisper_context * ctx);
|
||||
|
||||
////////////////////////////////////////////////////////////////////////////
|
||||
|
||||
enum whisper_decode_strategy {
|
||||
WHISPER_DECODE_GREEDY,
|
||||
WHISPER_DECODE_BEAM_SEARCH,
|
||||
};
|
||||
|
||||
struct whisper_full_params {
|
||||
enum whisper_decode_strategy strategy;
|
||||
|
||||
int n_threads;
|
||||
|
||||
bool transcribe;
|
||||
|
||||
const char * language;
|
||||
|
||||
union {
|
||||
struct {
|
||||
int n_past;
|
||||
} greedy;
|
||||
|
||||
struct {
|
||||
int n_past;
|
||||
int beam_width;
|
||||
int n_best;
|
||||
} beam_search;
|
||||
};
|
||||
};
|
||||
|
||||
// full whisper run - encode + decode
|
||||
// TODO: implement
|
||||
WHISPER_API int whisper_full(
|
||||
struct whisper_context * ctx,
|
||||
struct whisper_full_params * params,
|
||||
const float * samples,
|
||||
int n_samples);
|
||||
|
||||
#ifdef __cplusplus
|
||||
}
|
||||
#endif
|
||||
|
||||
#endif
|
Loading…
Reference in New Issue
Block a user