mirror of
https://github.com/ggerganov/whisper.cpp
synced 2026-03-07 23:49:29 +01:00
* ruby : Bump version to 1.3.6 * Fix code in example * Add sample code to transcribe from MemoryView * Define GetVADContext macro * Use GetVADContext * Extract parse_full_args function * Use parse_full_args in ruby_whisper_full_parallel * Free samples after use * Check return value of parse_full_args() * Define GetVADParams macro * Add VAD::Context#segments_from_samples * Add tests for VAD::Context#segments_from_samples * Add signature for VAD::Context#segments_from_samples * Add sample code for VAD::Context#segments_from_samples * Add test for Whisper::Context#transcribe with Pathname * Make Whisper::Context#transcribe and Whisper::VAD::Context#detect accept Pathname * Update signature of Whisper::Context#transcribe * Fix variable name * Don't free memory view * Make parse_full_args return struct * Fallback when failed to get MemoryView * Add num of samples when too long * Check members of MemoryView * Fix a typo * Remove unnecessary include * Fix a typo * Fix a typo * Care the case of MemoryView doesn't fit spec * Add TODO comment * Add optimazation option to compiler flags * Use ALLOC_N instead of malloc * Add description to sample code * Rename and change args: parse_full_args -> parse_samples * Free samples when exception raised * Assign type check result to a variable * Define wrapper function of whisper_full * Change signature of parse_samples for rb_ensure * Ensure release MemoryView * Extract fill_samples function * Free samples memory when filling it failed * Free samples memory when transcription failed * Prepare transcription in wrapper funciton * Change function name * Simplify function boundary
123 lines
3.5 KiB
C
123 lines
3.5 KiB
C
#include "ruby_whisper.h"
|
|
|
|
extern ID id_to_s;
|
|
|
|
extern VALUE cVADContext;
|
|
|
|
extern const rb_data_type_t ruby_whisper_vad_params_type;
|
|
extern VALUE ruby_whisper_vad_detect(VALUE self, VALUE file_path, VALUE params);
|
|
extern VALUE ruby_whisper_normalize_model_path(VALUE model_path);
|
|
extern parsed_samples_t parse_samples(VALUE *samples, VALUE *n_samples);
|
|
extern VALUE release_samples(VALUE parsed);
|
|
|
|
extern VALUE ruby_whisper_vad_segments_s_init(struct whisper_vad_segments *segments);
|
|
|
|
typedef struct segments_from_samples_args {
|
|
VALUE *context;
|
|
VALUE *params;
|
|
float *samples;
|
|
int n_samples;
|
|
} segments_from_samples_args;
|
|
|
|
static size_t
|
|
ruby_whisper_vad_context_memsize(const void *p)
|
|
{
|
|
const ruby_whisper_vad_context *rwvc = p;
|
|
size_t size = sizeof(rwvc);
|
|
if (!rwvc) {
|
|
return 0;
|
|
}
|
|
if (rwvc->context) {
|
|
size += sizeof(rwvc->context);
|
|
}
|
|
return size;
|
|
}
|
|
|
|
static void
|
|
ruby_whisper_vad_context_free(void *p)
|
|
{
|
|
ruby_whisper_vad_context *rwvc = (ruby_whisper_vad_context *)p;
|
|
if (rwvc->context) {
|
|
whisper_vad_free(rwvc->context);
|
|
rwvc->context = NULL;
|
|
}
|
|
xfree(rwvc);
|
|
}
|
|
|
|
const rb_data_type_t ruby_whisper_vad_context_type = {
|
|
"ruby_whisper_vad_context",
|
|
{0, ruby_whisper_vad_context_free, ruby_whisper_vad_context_memsize,},
|
|
0, 0,
|
|
0
|
|
};
|
|
|
|
static VALUE
|
|
ruby_whisper_vad_context_s_allocate(VALUE klass)
|
|
{
|
|
ruby_whisper_vad_context *rwvc;
|
|
VALUE obj = TypedData_Make_Struct(klass, ruby_whisper_vad_context, &ruby_whisper_vad_context_type, rwvc);
|
|
rwvc->context = NULL;
|
|
return obj;
|
|
}
|
|
|
|
static VALUE
|
|
ruby_whisper_vad_context_initialize(VALUE self, VALUE model_path)
|
|
{
|
|
ruby_whisper_vad_context *rwvc;
|
|
struct whisper_vad_context *context;
|
|
|
|
model_path = ruby_whisper_normalize_model_path(model_path);
|
|
context = whisper_vad_init_from_file_with_params(StringValueCStr(model_path), whisper_vad_default_context_params());
|
|
if (context == NULL) {
|
|
rb_raise(rb_eRuntimeError, "Failed to initialize whisper VAD context");
|
|
}
|
|
TypedData_Get_Struct(self, ruby_whisper_vad_context, &ruby_whisper_vad_context_type, rwvc);
|
|
rwvc->context = context;
|
|
|
|
return Qnil;
|
|
}
|
|
|
|
static VALUE
|
|
segments_from_samples_body(VALUE rb_args)
|
|
{
|
|
segments_from_samples_args *args = (segments_from_samples_args *)rb_args;
|
|
|
|
ruby_whisper_vad_context *rwvc;
|
|
ruby_whisper_vad_params *rwvp;
|
|
GetVADContext(*args->context, rwvc);
|
|
GetVADParams(*args->params, rwvp);
|
|
|
|
struct whisper_vad_segments *segments = whisper_vad_segments_from_samples(rwvc->context, rwvp->params, args->samples, args->n_samples);
|
|
|
|
return ruby_whisper_vad_segments_s_init(segments);
|
|
}
|
|
|
|
static VALUE
|
|
ruby_whisper_vad_segments_from_samples(int argc, VALUE *argv, VALUE self)
|
|
{
|
|
if (argc < 2 || argc > 3) {
|
|
rb_raise(rb_eArgError, "wrong number of arguments (given %d, expected 2..3)", argc);
|
|
}
|
|
|
|
VALUE n_samples = argc == 2 ? Qnil : argv[2];
|
|
struct parsed_samples_t parsed = parse_samples(&argv[1], &n_samples);
|
|
segments_from_samples_args args = {
|
|
&self,
|
|
&argv[0],
|
|
parsed.samples,
|
|
parsed.n_samples,
|
|
};
|
|
VALUE segments = rb_ensure(segments_from_samples_body, (VALUE)&args, release_samples, (VALUE)&parsed);
|
|
|
|
return segments;
|
|
}
|
|
|
|
void init_ruby_whisper_vad_context(VALUE *mVAD)
|
|
{
|
|
cVADContext = rb_define_class_under(*mVAD, "Context", rb_cObject);
|
|
rb_define_alloc_func(cVADContext, ruby_whisper_vad_context_s_allocate);
|
|
rb_define_method(cVADContext, "initialize", ruby_whisper_vad_context_initialize, 1);
|
|
rb_define_method(cVADContext, "segments_from_samples", ruby_whisper_vad_segments_from_samples, -1);
|
|
rb_define_method(cVADContext, "detect", ruby_whisper_vad_detect, 2);
|
|
}
|