mirror of
https://github.com/ggerganov/whisper.cpp
synced 2026-03-27 17:15:25 +01:00
* bindings.ruby : fix test failures in test_whisper
This commit updates the parallel tests to use 2 processors instead of
the number of processors on the system. It also comments out the setting
of the log callback to an empty lambda as this causes a segfault when
enabled.
The motivation for the change to the number of processors is that if one
has a large number of processors, for example I have 16 on the machine I
used to test this, this would cause the following warning to be printed:
```console
whisper_full_with_state: input is too short - 680 ms < 1000 ms. consider padding the input audio with silence
```
This is logged from:
```c++
int whisper_full_with_state(
struct whisper_context * ctx,
struct whisper_state * state,
struct whisper_full_params params,
const float * samples,
int n_samples) {
...
if (seek_end < seek_start + 100) {
WHISPER_LOG_WARN("%s: input is too short - %d ms < 1000 ms. consider padding the input audio with silence\n", __func__, (seek_end - seek_start)*10);
return 0;
}
```
This will return early and there will be segment callbacks to be invoked
which in turn will cause the tests to fail.
* bindings.ruby : fix warnings in tests
This commit fixes the following warnings in the Ruby tests:
```console
/whisper/bindings/ruby/tests/test_segment.rb:52:
warning: ambiguity between regexp and two divisions:
wrap regexp in parentheses or add a space after `/' operator
```
And also adds a '_' prefix to some unused variables to avoid warnings.
* bindings.ruby : enable Wisper.log_set in tests
The commit reverts the commenting out of the Whisper.log_set call in
the test_whisper.rb tests.
I'm no longer getting segfaults when running the tests with this
which was the case earlier. One theory could be that I rebased this to
include the latest ggml sync to master to make sure things still worked.
With the latest changes in ggml, I can't reproduce the segfaults.
75 lines
1.8 KiB
Ruby
75 lines
1.8 KiB
Ruby
require_relative "helper"
|
|
|
|
class TestSegment < TestBase
|
|
def test_iteration
|
|
whisper.each_segment do |segment|
|
|
assert_instance_of Whisper::Segment, segment
|
|
end
|
|
end
|
|
|
|
def test_enumerator
|
|
enum = whisper.each_segment
|
|
assert_instance_of Enumerator, enum
|
|
enum.to_a.each_with_index do |segment, index|
|
|
assert_instance_of Whisper::Segment, segment
|
|
assert_kind_of Integer, index
|
|
end
|
|
end
|
|
|
|
def test_start_time
|
|
i = 0
|
|
whisper.each_segment do |segment|
|
|
assert_equal 0, segment.start_time if i == 0
|
|
i += 1
|
|
end
|
|
end
|
|
|
|
def test_end_time
|
|
i = 0
|
|
whisper.each_segment do |segment|
|
|
assert_equal whisper.full_get_segment_t1(i) * 10, segment.end_time
|
|
i += 1
|
|
end
|
|
end
|
|
|
|
def test_no_speech_prob
|
|
no_speech_prob = nil
|
|
whisper.each_segment do |segment|
|
|
no_speech_prob = segment.no_speech_prob
|
|
end
|
|
assert no_speech_prob > 0.0
|
|
end
|
|
|
|
def test_on_new_segment
|
|
params = Whisper::Params.new
|
|
seg = nil
|
|
index = 0
|
|
params.on_new_segment do |segment|
|
|
assert_instance_of Whisper::Segment, segment
|
|
if index == 0
|
|
seg = segment
|
|
assert_equal 0, segment.start_time
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, segment.text)
|
|
end
|
|
index += 1
|
|
end
|
|
whisper.transcribe(AUDIO, params)
|
|
assert_equal 0, seg.start_time
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, seg.text)
|
|
end
|
|
|
|
def test_on_new_segment_twice
|
|
params = Whisper::Params.new
|
|
seg = nil
|
|
params.on_new_segment do |segment|
|
|
seg = segment
|
|
return
|
|
end
|
|
params.on_new_segment do |segment|
|
|
assert_same seg, segment
|
|
return
|
|
end
|
|
whisper.transcribe(AUDIO, params)
|
|
end
|
|
end
|