mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2025-02-22 17:42:38 +00:00
* Fix type signature for Whisper.log_set * Use cache file for model when offline * Extract ruby_whisper_transcribe() into a file * Extract Whisper::Error * Use FileList for ext/*.{c,cpp,h} * Extract Whisper::Segment * Extract Whisper::Model * Extract Whisper::Params * Extract Whisper::Context * Extract log_callback function * Write base code in C rather than C++ * Use chdir instead of Dir.chdir in Rakefile * Define alloc func for Whisper::Model * Define Whisper::Params' calback and user data reader * Add test for Whisper::Params.new with keyword arguments * Make Whisper::Params.new accept keyword arguments * Update type signatures * Update README * Update CLEAN targets * Fix document comment for Whisper::Params#new_segment_callback= * Use macro to define params * Fix dependency of build task * Set Whisper.finalize_log_callback visibility to private * Make Whisper::Context#full and full_parallel return self * Add test for Whisper::Context#full_get_segment * Add Whisper::Context#full_get_segment * Update signatures * Update README * Fix signature * Resplace #initialize with .new in signature file [skip ci] * Fix potential overflow
211 lines
5.3 KiB
C
211 lines
5.3 KiB
C
#include <ruby.h>
|
|
#include "ruby_whisper.h"
|
|
|
|
extern VALUE cModel;
|
|
|
|
static void rb_whisper_model_mark(ruby_whisper_model *rwm) {
|
|
rb_gc_mark(rwm->context);
|
|
}
|
|
|
|
static VALUE ruby_whisper_model_allocate(VALUE klass) {
|
|
ruby_whisper_model *rwm;
|
|
rwm = ALLOC(ruby_whisper_model);
|
|
return Data_Wrap_Struct(klass, rb_whisper_model_mark, RUBY_DEFAULT_FREE, rwm);
|
|
}
|
|
|
|
VALUE rb_whisper_model_initialize(VALUE context) {
|
|
ruby_whisper_model *rwm;
|
|
const VALUE model = ruby_whisper_model_allocate(cModel);
|
|
Data_Get_Struct(model, ruby_whisper_model, rwm);
|
|
rwm->context = context;
|
|
return model;
|
|
};
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_vocab -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_vocab(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_vocab(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_audio_ctx -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_audio_ctx(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_audio_ctx(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_audio_state -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_audio_state(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_audio_state(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_audio_head -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_audio_head(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_audio_head(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_audio_layer -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_audio_layer(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_audio_layer(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_text_ctx -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_text_ctx(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_text_ctx(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_text_state -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_text_state(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_text_state(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_text_head -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_text_head(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_text_head(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_text_layer -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_text_layer(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_text_layer(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* n_mels -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_n_mels(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_n_mels(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* ftype -> Integer
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_ftype(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return INT2NUM(whisper_model_ftype(rw->context));
|
|
}
|
|
|
|
/*
|
|
* call-seq:
|
|
* type -> String
|
|
*/
|
|
static VALUE
|
|
ruby_whisper_model_type(VALUE self)
|
|
{
|
|
ruby_whisper_model *rwm;
|
|
Data_Get_Struct(self, ruby_whisper_model, rwm);
|
|
ruby_whisper *rw;
|
|
Data_Get_Struct(rwm->context, ruby_whisper, rw);
|
|
return rb_str_new2(whisper_model_type_readable(rw->context));
|
|
}
|
|
|
|
void
|
|
init_ruby_whisper_model(VALUE *mWhisper)
|
|
{
|
|
cModel = rb_define_class_under(*mWhisper, "Model", rb_cObject);
|
|
|
|
rb_define_alloc_func(cModel, ruby_whisper_model_allocate);
|
|
rb_define_method(cModel, "n_vocab", ruby_whisper_model_n_vocab, 0);
|
|
rb_define_method(cModel, "n_audio_ctx", ruby_whisper_model_n_audio_ctx, 0);
|
|
rb_define_method(cModel, "n_audio_state", ruby_whisper_model_n_audio_state, 0);
|
|
rb_define_method(cModel, "n_audio_head", ruby_whisper_model_n_audio_head, 0);
|
|
rb_define_method(cModel, "n_audio_layer", ruby_whisper_model_n_audio_layer, 0);
|
|
rb_define_method(cModel, "n_text_ctx", ruby_whisper_model_n_text_ctx, 0);
|
|
rb_define_method(cModel, "n_text_state", ruby_whisper_model_n_text_state, 0);
|
|
rb_define_method(cModel, "n_text_head", ruby_whisper_model_n_text_head, 0);
|
|
rb_define_method(cModel, "n_text_layer", ruby_whisper_model_n_text_layer, 0);
|
|
rb_define_method(cModel, "n_mels", ruby_whisper_model_n_mels, 0);
|
|
rb_define_method(cModel, "ftype", ruby_whisper_model_ftype, 0);
|
|
rb_define_method(cModel, "type", ruby_whisper_model_type, 0);
|
|
}
|