|
|
require_relative "helper" |
|
|
require "stringio" |
|
|
require "etc" |
|
|
|
|
|
|
|
|
Whisper.log_set ->(level, buffer, user_data) {}, nil |
|
|
|
|
|
class TestWhisper < TestBase |
|
|
def setup |
|
|
@params = Whisper::Params.new |
|
|
end |
|
|
|
|
|
def test_whisper |
|
|
@whisper = Whisper::Context.new("base.en") |
|
|
params = Whisper::Params.new |
|
|
params.print_timestamps = false |
|
|
|
|
|
@whisper.transcribe(AUDIO, params) {|text| |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, text) |
|
|
} |
|
|
end |
|
|
|
|
|
def test_transcribe_non_parallel |
|
|
@whisper = Whisper::Context.new("base.en") |
|
|
params = Whisper::Params.new |
|
|
|
|
|
@whisper.transcribe(AUDIO, params, n_processors: 1) {|text| |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, text) |
|
|
} |
|
|
end |
|
|
|
|
|
def test_transcribe_n_processors |
|
|
@whisper = Whisper::Context.new("base.en") |
|
|
params = Whisper::Params.new |
|
|
|
|
|
@whisper.transcribe(AUDIO, params, n_processors: 4) {|text| |
|
|
assert_match(/what you can do for your country/i, text) |
|
|
} |
|
|
end |
|
|
|
|
|
sub_test_case "After transcription" do |
|
|
def test_full_n_segments |
|
|
assert_equal 1, whisper.full_n_segments |
|
|
end |
|
|
|
|
|
def test_full_lang_id |
|
|
assert_equal 0, whisper.full_lang_id |
|
|
end |
|
|
|
|
|
def test_full_get_segment |
|
|
segment = whisper.full_get_segment(0) |
|
|
assert_equal 0, segment.start_time |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, segment.text) |
|
|
end |
|
|
|
|
|
def test_full_get_segment_t0 |
|
|
assert_equal 0, whisper.full_get_segment_t0(0) |
|
|
assert_raise IndexError do |
|
|
whisper.full_get_segment_t0(whisper.full_n_segments) |
|
|
end |
|
|
assert_raise IndexError do |
|
|
whisper.full_get_segment_t0(-1) |
|
|
end |
|
|
end |
|
|
|
|
|
def test_full_get_segment_t1 |
|
|
t1 = whisper.full_get_segment_t1(0) |
|
|
assert_kind_of Integer, t1 |
|
|
assert t1 > 0 |
|
|
assert_raise IndexError do |
|
|
whisper.full_get_segment_t1(whisper.full_n_segments) |
|
|
end |
|
|
end |
|
|
|
|
|
def test_full_get_segment_speaker_turn_next |
|
|
assert_false whisper.full_get_segment_speaker_turn_next(0) |
|
|
end |
|
|
|
|
|
def test_full_get_segment_text |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, whisper.full_get_segment_text(0)) |
|
|
end |
|
|
|
|
|
def test_full_get_segment_no_speech_prob |
|
|
prob = whisper.full_get_segment_no_speech_prob(0) |
|
|
assert prob > 0.0 |
|
|
assert prob < 1.0 |
|
|
end |
|
|
end |
|
|
|
|
|
def test_lang_max_id |
|
|
assert_kind_of Integer, Whisper.lang_max_id |
|
|
end |
|
|
|
|
|
def test_lang_id |
|
|
assert_equal 0, Whisper.lang_id("en") |
|
|
assert_raise ArgumentError do |
|
|
Whisper.lang_id("non existing language") |
|
|
end |
|
|
end |
|
|
|
|
|
def test_lang_str |
|
|
assert_equal "en", Whisper.lang_str(0) |
|
|
assert_raise IndexError do |
|
|
Whisper.lang_str(Whisper.lang_max_id + 1) |
|
|
end |
|
|
end |
|
|
|
|
|
def test_lang_str_full |
|
|
assert_equal "english", Whisper.lang_str_full(0) |
|
|
assert_raise IndexError do |
|
|
Whisper.lang_str_full(Whisper.lang_max_id + 1) |
|
|
end |
|
|
end |
|
|
|
|
|
def test_system_info_str |
|
|
assert_match(/\AWHISPER : COREML = \d | OPENVINO = \d |/, Whisper.system_info_str) |
|
|
end |
|
|
|
|
|
def test_version |
|
|
assert_kind_of String, Whisper::VERSION |
|
|
end |
|
|
|
|
|
def test_log_set |
|
|
user_data = Object.new |
|
|
logs = [] |
|
|
log_callback = ->(level, buffer, udata) { |
|
|
logs << [level, buffer, udata] |
|
|
} |
|
|
Whisper.log_set log_callback, user_data |
|
|
Whisper::Context.new("base.en") |
|
|
|
|
|
assert logs.length > 30 |
|
|
logs.each do |log| |
|
|
assert_include [Whisper::LOG_LEVEL_DEBUG, Whisper::LOG_LEVEL_INFO, Whisper::LOG_LEVEL_WARN], log[0] |
|
|
assert_same user_data, log[2] |
|
|
end |
|
|
end |
|
|
|
|
|
def test_log_suppress |
|
|
stderr = $stderr |
|
|
Whisper.log_set ->(level, buffer, user_data) { |
|
|
|
|
|
}, nil |
|
|
dev = StringIO.new("") |
|
|
$stderr = dev |
|
|
Whisper::Context.new("base.en") |
|
|
assert_empty dev.string |
|
|
ensure |
|
|
$stderr = stderr |
|
|
end |
|
|
|
|
|
def test_access_attribute_without_initialization |
|
|
whisper = Whisper::Context.allocate |
|
|
assert_raise do |
|
|
whisper.model_type |
|
|
end |
|
|
end |
|
|
|
|
|
sub_test_case "full" do |
|
|
def setup |
|
|
super |
|
|
@whisper = Whisper::Context.new("base.en") |
|
|
@samples = File.read(AUDIO, nil, 78).unpack("s<*").collect {|i| i.to_f / 2**15} |
|
|
end |
|
|
|
|
|
def test_full |
|
|
@whisper.full(@params, @samples, @samples.length) |
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, @whisper.each_segment.first.text) |
|
|
end |
|
|
|
|
|
def test_full_without_length |
|
|
@whisper.full(@params, @samples) |
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, @whisper.each_segment.first.text) |
|
|
end |
|
|
|
|
|
def test_full_enumerator |
|
|
samples = @samples.each |
|
|
@whisper.full(@params, samples, @samples.length) |
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, @whisper.each_segment.first.text) |
|
|
end |
|
|
|
|
|
def test_full_enumerator_without_length |
|
|
samples = @samples.each |
|
|
assert_raise ArgumentError do |
|
|
@whisper.full(@params, samples) |
|
|
end |
|
|
end |
|
|
|
|
|
def test_full_enumerator_with_too_large_length |
|
|
samples = @samples.each.take(10).to_enum |
|
|
assert_raise StopIteration do |
|
|
@whisper.full(@params, samples, 11) |
|
|
end |
|
|
end |
|
|
|
|
|
def test_full_with_memory_view |
|
|
samples = JFKReader.new(AUDIO) |
|
|
@whisper.full(@params, samples) |
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, @whisper.each_segment.first.text) |
|
|
end |
|
|
|
|
|
def test_full_parallel |
|
|
nprocessors = 2 |
|
|
@whisper.full_parallel(@params, @samples, @samples.length, nprocessors) |
|
|
|
|
|
assert_equal nprocessors, @whisper.full_n_segments |
|
|
text = @whisper.each_segment.collect(&:text).join |
|
|
assert_match(/ask what you can do/i, text) |
|
|
assert_match(/for your country/i, text) |
|
|
end |
|
|
|
|
|
def test_full_parallel_with_memory_view |
|
|
nprocessors = 2 |
|
|
samples = JFKReader.new(AUDIO) |
|
|
@whisper.full_parallel(@params, samples, nil, nprocessors) |
|
|
|
|
|
assert_equal nprocessors, @whisper.full_n_segments |
|
|
text = @whisper.each_segment.collect(&:text).join |
|
|
assert_match(/ask what you can do/i, text) |
|
|
assert_match(/for your country/i, text) |
|
|
end |
|
|
|
|
|
def test_full_parallel_without_length_and_n_processors |
|
|
@whisper.full_parallel(@params, @samples) |
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments |
|
|
text = @whisper.each_segment.collect(&:text).join |
|
|
assert_match(/ask what you can do/i, text) |
|
|
assert_match(/for your country/i, text) |
|
|
end |
|
|
|
|
|
def test_full_parallel_without_length |
|
|
nprocessors = 2 |
|
|
@whisper.full_parallel(@params, @samples, nil, nprocessors) |
|
|
|
|
|
assert_equal nprocessors, @whisper.full_n_segments |
|
|
text = @whisper.each_segment.collect(&:text).join |
|
|
assert_match(/ask what you can do/i, text) |
|
|
assert_match(/for your country/i, text) |
|
|
end |
|
|
|
|
|
def test_full_parallel_without_n_processors |
|
|
@whisper.full_parallel(@params, @samples, @samples.length) |
|
|
|
|
|
assert_equal 1, @whisper.full_n_segments |
|
|
text = @whisper.each_segment.collect(&:text).join |
|
|
assert_match(/ask what you can do/i, text) |
|
|
assert_match(/for your country/i, text) |
|
|
end |
|
|
end |
|
|
|
|
|
def test_to_srt |
|
|
whisper = Whisper::Context.new("base.en") |
|
|
whisper.transcribe AUDIO, @params |
|
|
|
|
|
lines = whisper.to_srt.lines |
|
|
assert_match(/\A\d+\n/, lines[0]) |
|
|
assert_match(/\d{2}:\d{2}:\d{2},\d{3} --> \d{2}:\d{2}:\d{2},\d{3}\n/, lines[1]) |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, lines[2]) |
|
|
end |
|
|
|
|
|
def test_to_webvtt |
|
|
whisper = Whisper::Context.new("base.en") |
|
|
whisper.transcribe AUDIO, @params |
|
|
|
|
|
lines = whisper.to_webvtt.lines |
|
|
assert_equal "WEBVTT\n", lines[0] |
|
|
assert_equal "\n", lines[1] |
|
|
assert_match(/\A\d+\n/, lines[2]) |
|
|
assert_match(/\d{2}:\d{2}:\d{2}\.\d{3} --> \d{2}:\d{2}:\d{2}\.\d{3}\n/, lines[3]) |
|
|
assert_match(/ask not what your country can do for you, ask what you can do for your country/, lines[4]) |
|
|
end |
|
|
|
|
|
sub_test_case "Format needs escape" do |
|
|
def setup |
|
|
@whisper = Whisper::Context.new("base.en") |
|
|
@whisper.transcribe AUDIO, Whisper::Params.new |
|
|
segment = @whisper.each_segment.first |
|
|
segment.define_singleton_method :text do |
|
|
"& so my fellow Americans --> ask not what your country can do for you <-- ask what you can do for your country." |
|
|
end |
|
|
@whisper.define_singleton_method :each_segment do |
|
|
Enumerator.new(3) {|yielder| 3.times {yielder << segment}} |
|
|
end |
|
|
end |
|
|
|
|
|
def test_to_srt_escape |
|
|
assert_equal "& so my fellow Americans --> ask not what your country can do for you <-- ask what you can do for your country.\n", @whisper.to_srt.lines[2] |
|
|
end |
|
|
|
|
|
def test_to_webvtt_escape |
|
|
assert_equal "& so my fellow Americans --> ask not what your country can do for you <-- ask what you can do for your country.\n", @whisper.to_webvtt.lines[4] |
|
|
end |
|
|
end |
|
|
end |
|
|
|