Mirror of https://github.com/ggerganov/whisper.cpp.git (synced 2025-02-05 02:19:09 +00:00)
whisper : fix logit reading
This commit is contained in:
parent 659757329d
commit 7e01486b61
@@ -2461,11 +2461,12 @@ static bool whisper_decode_internal(
|
|||||||
// extract logits for all N tokens
|
// extract logits for all N tokens
|
||||||
//logits_out.resize(n_tokens*n_vocab);
|
//logits_out.resize(n_tokens*n_vocab);
|
||||||
//memcpy(logits_out.data(), ggml_get_data(logits), sizeof(float)*n_tokens*n_vocab);
|
//memcpy(logits_out.data(), ggml_get_data(logits), sizeof(float)*n_tokens*n_vocab);
|
||||||
|
//ggml_backend_tensor_get(logits, logits_out.data(), (n_vocab*(n_tokens - 1))*sizeof(float), sizeof(float)*n_vocab);
|
||||||
|
|
||||||
// extract logits only for the last token
|
// extract logits only for the last token
|
||||||
logits_out.resize(n_vocab);
|
logits_out.resize(n_vocab);
|
||||||
//memcpy(logits_out.data(), ggml_get_data(logits), sizeof(float)*n_vocab);
|
//memcpy(logits_out.data(), ggml_get_data(logits), sizeof(float)*n_vocab);
|
||||||
ggml_backend_tensor_get(logits, logits_out.data(), (n_vocab*(n_tokens - 1))*sizeof(float), sizeof(float)*n_vocab);
|
ggml_backend_tensor_get(logits, logits_out.data(), 0, sizeof(float)*n_vocab);
|
||||||
|
|
||||||
if (n_tokens > 1) {
|
if (n_tokens > 1) {
|
||||||
//printf("%s: used_mem = %f MB, %f MB, %f MB %f MB %f MB\n", __func__,
|
//printf("%s: used_mem = %f MB, %f MB, %f MB %f MB %f MB\n", __func__,
|
||||||
|
Loading…
x
Reference in New Issue
Block a user