You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
93 lines
3.2 KiB
93 lines
3.2 KiB
#include <jni.h>
|
|
#include <android/log.h>
|
|
#include <stdlib.h>
|
|
#include <sys/sysinfo.h>
|
|
#include "whisper.h"
|
|
|
|
#define UNUSED(x) (void)(x)
|
|
#define TAG "JNI"
|
|
|
|
#define LOGI(...) __android_log_print(ANDROID_LOG_INFO, TAG, __VA_ARGS__)
|
|
|
|
static inline int min(int a, int b) {
|
|
return (a < b) ? a : b;
|
|
}
|
|
|
|
static inline int max(int a, int b) {
|
|
return (a > b) ? a : b;
|
|
}
|
|
|
|
JNIEXPORT jlong JNICALL
|
|
Java_com_whispercppdemo_whisper_WhisperLib_00024Companion_initContext(
|
|
JNIEnv *env, jobject thiz, jstring model_path_str) {
|
|
UNUSED(thiz);
|
|
struct whisper_context *context = NULL;
|
|
const char *model_path_chars = (*env)->GetStringUTFChars(env, model_path_str, NULL);
|
|
context = whisper_init(model_path_chars);
|
|
(*env)->ReleaseStringUTFChars(env, model_path_str, model_path_chars);
|
|
return (jlong) context;
|
|
}
|
|
|
|
JNIEXPORT void JNICALL
|
|
Java_com_whispercppdemo_whisper_WhisperLib_00024Companion_freeContext(
|
|
JNIEnv *env, jobject thiz, jlong context_ptr) {
|
|
UNUSED(env);
|
|
UNUSED(thiz);
|
|
struct whisper_context *context = (struct whisper_context *) context_ptr;
|
|
whisper_free(context);
|
|
}
|
|
|
|
JNIEXPORT void JNICALL
|
|
Java_com_whispercppdemo_whisper_WhisperLib_00024Companion_fullTranscribe(
|
|
JNIEnv *env, jobject thiz, jlong context_ptr, jfloatArray audio_data) {
|
|
UNUSED(thiz);
|
|
struct whisper_context *context = (struct whisper_context *) context_ptr;
|
|
jfloat *audio_data_arr = (*env)->GetFloatArrayElements(env, audio_data, NULL);
|
|
const jsize audio_data_length = (*env)->GetArrayLength(env, audio_data);
|
|
|
|
// Leave 2 processors free (i.e. the high-efficiency cores).
|
|
int max_threads = max(1, min(8, get_nprocs() - 2));
|
|
LOGI("Selecting %d threads", max_threads);
|
|
|
|
// The below adapted from the Objective-C iOS sample
|
|
struct whisper_full_params params = whisper_full_default_params(WHISPER_SAMPLING_GREEDY);
|
|
params.print_realtime = true;
|
|
params.print_progress = false;
|
|
params.print_timestamps = true;
|
|
params.print_special = false;
|
|
params.translate = false;
|
|
params.language = "en";
|
|
params.n_threads = max_threads;
|
|
params.offset_ms = 0;
|
|
params.no_context = true;
|
|
params.single_segment = false;
|
|
|
|
whisper_reset_timings(context);
|
|
|
|
LOGI("About to run whisper_full");
|
|
if (whisper_full(context, params, audio_data_arr, audio_data_length) != 0) {
|
|
LOGI("Failed to run the model");
|
|
} else {
|
|
whisper_print_timings(context);
|
|
}
|
|
(*env)->ReleaseFloatArrayElements(env, audio_data, audio_data_arr, JNI_ABORT);
|
|
}
|
|
|
|
JNIEXPORT jint JNICALL
|
|
Java_com_whispercppdemo_whisper_WhisperLib_00024Companion_getTextSegmentCount(
|
|
JNIEnv *env, jobject thiz, jlong context_ptr) {
|
|
UNUSED(env);
|
|
UNUSED(thiz);
|
|
struct whisper_context *context = (struct whisper_context *) context_ptr;
|
|
return whisper_full_n_segments(context);
|
|
}
|
|
|
|
JNIEXPORT jstring JNICALL
|
|
Java_com_whispercppdemo_whisper_WhisperLib_00024Companion_getTextSegment(
|
|
JNIEnv *env, jobject thiz, jlong context_ptr, jint index) {
|
|
UNUSED(thiz);
|
|
struct whisper_context *context = (struct whisper_context *) context_ptr;
|
|
const char *text = whisper_full_get_segment_text(context, index);
|
|
jstring string = (*env)->NewStringUTF(env, text);
|
|
return string;
|
|
} |