server : fix server temperature + add temperature_inc (#1729)

* server : fix server temperature + add temperature_inc

* server : change dashes to underscores in parameter names
This commit is contained in:
Georgi Gerganov 2024-01-07 13:35:14 +02:00 committed by GitHub
parent 3b8c2dff57
commit 022756a872
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
2 changed files with 36 additions and 30 deletions

View File

@@ -56,8 +56,9 @@ options:
curl 127.0.0.1:8080/inference \ curl 127.0.0.1:8080/inference \
-H "Content-Type: multipart/form-data" \ -H "Content-Type: multipart/form-data" \
-F file="@<file-path>" \ -F file="@<file-path>" \
-F temperature="0.2" \ -F temperature="0.0" \
-F response-format="json" -F temperature_inc="0.2" \
-F response_format="json"
``` ```
**/load** **/load**

View File

@@ -63,7 +63,8 @@ struct whisper_params {
float word_thold = 0.01f; float word_thold = 0.01f;
float entropy_thold = 2.40f; float entropy_thold = 2.40f;
float logprob_thold = -1.00f; float logprob_thold = -1.00f;
float userdef_temp = 0.20f; float temperature = 0.00f;
float temperature_inc = 0.20f;
bool speed_up = false; bool speed_up = false;
bool debug_mode = false; bool debug_mode = false;
@@ -395,34 +396,37 @@ std::string output_str(struct whisper_context * ctx, const whisper_params & para
void get_req_parameters(const Request & req, whisper_params & params) void get_req_parameters(const Request & req, whisper_params & params)
{ {
// user model configuration if (req.has_file("offset_t"))
if (req.has_file("offset-t"))
{ {
params.offset_t_ms = std::stoi(req.get_file_value("offset-t").content); params.offset_t_ms = std::stoi(req.get_file_value("offset_t").content);
} }
if (req.has_file("offset-n")) if (req.has_file("offset_n"))
{ {
params.offset_n = std::stoi(req.get_file_value("offset-n").content); params.offset_n = std::stoi(req.get_file_value("offset_n").content);
} }
if (req.has_file("duration")) if (req.has_file("duration"))
{ {
params.duration_ms = std::stoi(req.get_file_value("duration").content); params.duration_ms = std::stoi(req.get_file_value("duration").content);
} }
if (req.has_file("max-context")) if (req.has_file("max_context"))
{ {
params.max_context = std::stoi(req.get_file_value("max-context").content); params.max_context = std::stoi(req.get_file_value("max_context").content);
} }
if (req.has_file("prompt")) if (req.has_file("prompt"))
{ {
params.prompt = req.get_file_value("prompt").content; params.prompt = req.get_file_value("prompt").content;
} }
if (req.has_file("response-format")) if (req.has_file("response_format"))
{ {
params.response_format = req.get_file_value("response-format").content; params.response_format = req.get_file_value("response_format").content;
} }
if (req.has_file("temperature")) if (req.has_file("temperature"))
{ {
params.userdef_temp = std::stof(req.get_file_value("temperature").content); params.temperature = std::stof(req.get_file_value("temperature").content);
}
if (req.has_file("temperature_inc"))
{
params.temperature_inc = std::stof(req.get_file_value("temperature_inc").content);
} }
} }
@@ -602,7 +606,8 @@ int main(int argc, char ** argv) {
wparams.greedy.best_of = params.best_of; wparams.greedy.best_of = params.best_of;
wparams.beam_search.beam_size = params.beam_size; wparams.beam_search.beam_size = params.beam_size;
wparams.temperature_inc = params.userdef_temp; wparams.temperature = params.temperature;
wparams.temperature_inc = params.temperature_inc;
wparams.entropy_thold = params.entropy_thold; wparams.entropy_thold = params.entropy_thold;
wparams.logprob_thold = params.logprob_thold; wparams.logprob_thold = params.logprob_thold;