whisper : fix incorrect timestamps, usually near silences (#2279)

* Incorrect timetstamps

Fixes #2271

- Adds consecutive timestamps after end of last segment as the new starting ts
- Add these timestamp to output when "print-special" enabled
- Fixes fflush usage in live reporting

I was not able to test this with the special "token_timestamps" option.

* Skip initial timestamp
This commit is contained in:
Bjarke Viksøe 2026-05-10 16:24:12 +02:00 committed by GitHub
parent c81b2dabbc
commit c33c5618b7
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
1 changed files with 8 additions and 5 deletions

View File

@ -7659,11 +7659,14 @@ int whisper_full_with_state(
}
}
text = "";
while (i < (int) tokens_cur.size() && tokens_cur[i].id > whisper_token_beg(ctx)) {
i++;
}
i--;
t0 = t1;
while (i + 1 < (int) tokens_cur.size() && tokens_cur[i + 1].id > whisper_token_beg(ctx)) {
i++;
if (params.print_special) {
text += whisper_token_to_str(ctx, tokens_cur[i].id);
}
t0 = seek + 2 * (tokens_cur[i].tid - whisper_token_beg(ctx));
}
i0 = i + 1;
speaker_turn_next = false;
}
@ -7680,8 +7683,8 @@ int whisper_full_with_state(
printf("[%s --> %s] %s\n", to_timestamp(tt0).c_str(), to_timestamp(tt1).c_str(), text.c_str());
} else {
printf("%s", text.c_str());
fflush(stdout);
}
fflush(stdout);
}
result_all.push_back({ tt0, tt1, text, state->no_speech_prob, {}, speaker_turn_next });