2024-11-13 19:52:56 +00:00
|
|
|
require_relative "helper"
|
|
|
|
require "stringio"
|
2024-11-28 08:33:07 +00:00
|
|
|
require "etc"
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-11-13 19:52:56 +00:00
|
|
|
# Exists to detect memory-related bug
|
|
|
|
Whisper.log_set ->(level, buffer, user_data) {}, nil
|
2024-10-28 13:43:27 +00:00
|
|
|
|
2024-11-13 19:52:56 +00:00
|
|
|
class TestWhisper < TestBase
|
2023-02-15 17:46:55 +00:00
|
|
|
def setup
|
|
|
|
@params = Whisper::Params.new
|
|
|
|
end
|
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_whisper
|
2024-11-13 19:52:56 +00:00
|
|
|
@whisper = Whisper::Context.new(MODEL)
|
2024-10-28 13:43:27 +00:00
|
|
|
params = Whisper::Params.new
|
|
|
|
params.print_timestamps = false
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-11-13 19:52:56 +00:00
|
|
|
@whisper.transcribe(AUDIO, params) {|text|
|
2024-10-28 13:43:27 +00:00
|
|
|
assert_match /ask not what your country can do for you, ask what you can do for your country/, text
|
|
|
|
}
|
2023-02-15 17:46:55 +00:00
|
|
|
end
|
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
sub_test_case "After transcription" do
|
|
|
|
class << self
|
|
|
|
attr_reader :whisper
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def startup
|
2024-11-13 19:52:56 +00:00
|
|
|
@whisper = Whisper::Context.new(TestBase::MODEL)
|
2024-10-28 13:43:27 +00:00
|
|
|
params = Whisper::Params.new
|
|
|
|
params.print_timestamps = false
|
2024-11-13 19:52:56 +00:00
|
|
|
@whisper.transcribe(TestBase::AUDIO, params)
|
2024-10-28 13:43:27 +00:00
|
|
|
end
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def whisper
|
|
|
|
self.class.whisper
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_full_n_segments
|
|
|
|
assert_equal 1, whisper.full_n_segments
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_full_lang_id
|
|
|
|
assert_equal 0, whisper.full_lang_id
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_full_get_segment_t0
|
|
|
|
assert_equal 0, whisper.full_get_segment_t0(0)
|
|
|
|
assert_raise IndexError do
|
|
|
|
whisper.full_get_segment_t0(whisper.full_n_segments)
|
|
|
|
end
|
|
|
|
assert_raise IndexError do
|
|
|
|
whisper.full_get_segment_t0(-1)
|
|
|
|
end
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_full_get_segment_t1
|
|
|
|
t1 = whisper.full_get_segment_t1(0)
|
|
|
|
assert_kind_of Integer, t1
|
|
|
|
assert t1 > 0
|
|
|
|
assert_raise IndexError do
|
|
|
|
whisper.full_get_segment_t1(whisper.full_n_segments)
|
|
|
|
end
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_full_get_segment_speaker_turn_next
|
|
|
|
assert_false whisper.full_get_segment_speaker_turn_next(0)
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_full_get_segment_text
|
|
|
|
assert_match /ask not what your country can do for you, ask what you can do for your country/, whisper.full_get_segment_text(0)
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
end
|
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_lang_max_id
|
|
|
|
assert_kind_of Integer, Whisper.lang_max_id
|
2023-02-15 17:46:55 +00:00
|
|
|
end
|
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_lang_id
|
|
|
|
assert_equal 0, Whisper.lang_id("en")
|
|
|
|
assert_raise ArgumentError do
|
|
|
|
Whisper.lang_id("non existing language")
|
2024-10-16 15:44:04 +00:00
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_lang_str
|
|
|
|
assert_equal "en", Whisper.lang_str(0)
|
|
|
|
assert_raise IndexError do
|
|
|
|
Whisper.lang_str(Whisper.lang_max_id + 1)
|
2024-10-16 15:44:04 +00:00
|
|
|
end
|
2024-10-28 13:43:27 +00:00
|
|
|
end
|
2024-10-16 15:44:04 +00:00
|
|
|
|
2024-10-28 13:43:27 +00:00
|
|
|
def test_lang_str_full
|
|
|
|
assert_equal "english", Whisper.lang_str_full(0)
|
|
|
|
assert_raise IndexError do
|
|
|
|
Whisper.lang_str_full(Whisper.lang_max_id + 1)
|
2024-10-16 15:44:04 +00:00
|
|
|
end
|
|
|
|
end
|
2024-11-13 19:52:56 +00:00
|
|
|
|
|
|
|
def test_log_set
|
|
|
|
user_data = Object.new
|
|
|
|
logs = []
|
|
|
|
log_callback = ->(level, buffer, udata) {
|
|
|
|
logs << [level, buffer, udata]
|
|
|
|
}
|
|
|
|
Whisper.log_set log_callback, user_data
|
|
|
|
Whisper::Context.new(MODEL)
|
|
|
|
|
|
|
|
assert logs.length > 30
|
|
|
|
logs.each do |log|
|
2024-11-21 15:04:29 +00:00
|
|
|
assert_include [Whisper::LOG_LEVEL_DEBUG, Whisper::LOG_LEVEL_INFO, Whisper::LOG_LEVEL_WARN], log[0]
|
2024-11-13 19:52:56 +00:00
|
|
|
assert_same user_data, log[2]
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_log_suppress
|
|
|
|
stderr = $stderr
|
|
|
|
Whisper.log_set ->(level, buffer, user_data) {
|
|
|
|
# do nothing
|
|
|
|
}, nil
|
|
|
|
dev = StringIO.new("")
|
|
|
|
$stderr = dev
|
|
|
|
Whisper::Context.new(MODEL)
|
|
|
|
assert_empty dev.string
|
|
|
|
ensure
|
|
|
|
$stderr = stderr
|
|
|
|
end
|
2024-11-28 08:33:07 +00:00
|
|
|
|
|
|
|
sub_test_case "full" do
|
|
|
|
def setup
|
|
|
|
super
|
|
|
|
@whisper = Whisper::Context.new(MODEL)
|
|
|
|
@samples = File.read(AUDIO, nil, 78).unpack("s<*").collect {|i| i.to_f / 2**15}
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full
|
|
|
|
@whisper.full(@params, @samples, @samples.length)
|
|
|
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments
|
|
|
|
assert_match /ask not what your country can do for you, ask what you can do for your country/, @whisper.each_segment.first.text
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_without_length
|
|
|
|
@whisper.full(@params, @samples)
|
|
|
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments
|
|
|
|
assert_match /ask not what your country can do for you, ask what you can do for your country/, @whisper.each_segment.first.text
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_enumerator
|
|
|
|
samples = @samples.each
|
|
|
|
@whisper.full(@params, samples, @samples.length)
|
|
|
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments
|
|
|
|
assert_match /ask not what your country can do for you, ask what you can do for your country/, @whisper.each_segment.first.text
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_enumerator_without_length
|
|
|
|
samples = @samples.each
|
|
|
|
assert_raise ArgumentError do
|
|
|
|
@whisper.full(@params, samples)
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_enumerator_with_too_large_length
|
|
|
|
samples = @samples.each.take(10).to_enum
|
|
|
|
assert_raise StopIteration do
|
|
|
|
@whisper.full(@params, samples, 11)
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_with_memory_view
|
|
|
|
samples = JFKReader.new(AUDIO)
|
|
|
|
@whisper.full(@params, samples)
|
|
|
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments
|
|
|
|
assert_match /ask not what your country can do for you, ask what you can do for your country/, @whisper.each_segment.first.text
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_parallel
|
|
|
|
@whisper.full_parallel(@params, @samples, @samples.length, Etc.nprocessors)
|
|
|
|
|
|
|
|
assert_equal Etc.nprocessors, @whisper.full_n_segments
|
|
|
|
text = @whisper.each_segment.collect(&:text).join
|
|
|
|
assert_match /ask what you can do/i, text
|
|
|
|
assert_match /for your country/i, text
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_parallel_with_memory_view
|
|
|
|
samples = JFKReader.new(AUDIO)
|
|
|
|
@whisper.full_parallel(@params, samples, nil, Etc.nprocessors)
|
|
|
|
|
|
|
|
assert_equal Etc.nprocessors, @whisper.full_n_segments
|
|
|
|
text = @whisper.each_segment.collect(&:text).join
|
|
|
|
assert_match /ask what you can do/i, text
|
|
|
|
assert_match /for your country/i, text
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_parallel_without_length_and_n_processors
|
|
|
|
@whisper.full_parallel(@params, @samples)
|
|
|
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments
|
|
|
|
text = @whisper.each_segment.collect(&:text).join
|
|
|
|
assert_match /ask what you can do/i, text
|
|
|
|
assert_match /for your country/i, text
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_parallel_without_length
|
|
|
|
@whisper.full_parallel(@params, @samples, nil, Etc.nprocessors)
|
|
|
|
|
|
|
|
assert_equal Etc.nprocessors, @whisper.full_n_segments
|
|
|
|
text = @whisper.each_segment.collect(&:text).join
|
|
|
|
assert_match /ask what you can do/i, text
|
|
|
|
assert_match /for your country/i, text
|
|
|
|
end
|
|
|
|
|
|
|
|
def test_full_parallel_without_n_processors
|
|
|
|
@whisper.full_parallel(@params, @samples, @samples.length)
|
|
|
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments
|
|
|
|
text = @whisper.each_segment.collect(&:text).join
|
|
|
|
assert_match /ask what you can do/i, text
|
|
|
|
assert_match /for your country/i, text
|
|
|
|
end
|
|
|
|
end
|
2023-02-15 17:46:55 +00:00
|
|
|
end
|