|
|
@ -43,7 +43,7 @@
|
|
|
|
<b>Important:</b>
|
|
|
|
<b>Important:</b>
|
|
|
|
<ul>
|
|
|
|
<ul>
|
|
|
|
<li>your browser must support WASM SIMD instructions for this to work</li>
|
|
|
|
<li>your browser must support WASM SIMD instructions for this to work</li>
|
|
|
|
<li>quantized models are still in experimental stage</li>
|
|
|
|
<li>quantized models are still in experimental stage (<a href="https://github.com/ggerganov/ggml/pull/27">more info</a>)</li>
|
|
|
|
<li>Firefox cannot load files larger than 256 MB - use Chrome instead</li>
|
|
|
|
<li>Firefox cannot load files larger than 256 MB - use Chrome instead</li>
|
|
|
|
</ul>
|
|
|
|
</ul>
|
|
|
|
|
|
|
|
|
|
|
@ -174,6 +174,12 @@
|
|
|
|
<option value="yi">Yiddish</option>
|
|
|
|
<option value="yi">Yiddish</option>
|
|
|
|
</select>
|
|
|
|
</select>
|
|
|
|
</td>
|
|
|
|
</td>
|
|
|
|
|
|
|
|
<!-- Slider to select number of threads between 1 and 16 -->
|
|
|
|
|
|
|
|
<td>
|
|
|
|
|
|
|
|
Threads:
|
|
|
|
|
|
|
|
<input type="range" id="threads" name="threads" min="1" max="16" value="8" onchange="changeThreads(this.value)" />
|
|
|
|
|
|
|
|
<span id="threads-value">8</span>
|
|
|
|
|
|
|
|
</td>
|
|
|
|
<td>
|
|
|
|
<td>
|
|
|
|
<button onclick="onProcess(false);">Transcribe</button>
|
|
|
|
<button onclick="onProcess(false);">Transcribe</button>
|
|
|
|
</td>
|
|
|
|
</td>
|
|
|
@ -281,6 +287,8 @@
|
|
|
|
document.getElementById('model-whisper-status').innerHTML = 'loaded "' + model_whisper + '"!';
|
|
|
|
document.getElementById('model-whisper-status').innerHTML = 'loaded "' + model_whisper + '"!';
|
|
|
|
|
|
|
|
|
|
|
|
printTextarea('storeFS: stored model: ' + fname + ' size: ' + buf.length);
|
|
|
|
printTextarea('storeFS: stored model: ' + fname + ' size: ' + buf.length);
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
document.getElementById('model').innerHTML = 'Model fetched: ' + model_whisper;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
function loadFile(event, fname) {
|
|
|
|
function loadFile(event, fname) {
|
|
|
@ -384,6 +392,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
cbCancel = function() {
|
|
|
|
cbCancel = function() {
|
|
|
|
var el;
|
|
|
|
var el;
|
|
|
|
|
|
|
|
|
|
|
|
el = document.getElementById('fetch-whisper-tiny-en' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-tiny-en' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-base-en' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-base-en' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-small-en'); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-small-en'); if (el) el.style.display = 'inline-block';
|
|
|
@ -391,7 +400,13 @@
|
|
|
|
el = document.getElementById('fetch-whisper-base' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-base' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-small' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-small' ); if (el) el.style.display = 'inline-block';
|
|
|
|
|
|
|
|
|
|
|
|
el = document.getElementById('fetch-whisper-large-q4_0'); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('fetch-whisper-base-en-q4_0' ); if (el) el.style.display = 'inline-block';
|
|
|
|
|
|
|
|
el = document.getElementById('fetch-whisper-base-q4_0' ); if (el) el.style.display = 'inline-block';
|
|
|
|
|
|
|
|
el = document.getElementById('fetch-whisper-small-en-q4_0' ); if (el) el.style.display = 'inline-block';
|
|
|
|
|
|
|
|
el = document.getElementById('fetch-whisper-small-q4_0' ); if (el) el.style.display = 'inline-block';
|
|
|
|
|
|
|
|
el = document.getElementById('fetch-whisper-medium-en-q4_0'); if (el) el.style.display = 'inline-block';
|
|
|
|
|
|
|
|
el = document.getElementById('fetch-whisper-medium-q4_0' ); if (el) el.style.display = 'inline-block';
|
|
|
|
|
|
|
|
el = document.getElementById('fetch-whisper-large-q4_0' ); if (el) el.style.display = 'inline-block';
|
|
|
|
|
|
|
|
|
|
|
|
el = document.getElementById('whisper-file' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('whisper-file' ); if (el) el.style.display = 'inline-block';
|
|
|
|
el = document.getElementById('model-whisper-status' ); if (el) el.innerHTML = '';
|
|
|
|
el = document.getElementById('model-whisper-status' ); if (el) el.innerHTML = '';
|
|
|
@ -405,6 +420,7 @@
|
|
|
|
//
|
|
|
|
//
|
|
|
|
|
|
|
|
|
|
|
|
const kMaxAudio_s = 30*60;
|
|
|
|
const kMaxAudio_s = 30*60;
|
|
|
|
|
|
|
|
const kMaxRecording_s = 2*60;
|
|
|
|
const kSampleRate = 16000;
|
|
|
|
const kSampleRate = 16000;
|
|
|
|
|
|
|
|
|
|
|
|
window.AudioContext = window.AudioContext || window.webkitAudioContext;
|
|
|
|
window.AudioContext = window.AudioContext || window.webkitAudioContext;
|
|
|
@ -473,7 +489,7 @@
|
|
|
|
doRecording = false;
|
|
|
|
doRecording = false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// record up to kMaxAudio_s seconds of audio from the microphone
|
|
|
|
// record up to kMaxRecording_s seconds of audio from the microphone
|
|
|
|
// check if doRecording is false every 1000 ms and stop recording if so
|
|
|
|
// check if doRecording is false every 1000 ms and stop recording if so
|
|
|
|
// update progress information
|
|
|
|
// update progress information
|
|
|
|
function startRecording() {
|
|
|
|
function startRecording() {
|
|
|
@ -529,9 +545,9 @@
|
|
|
|
printTextarea('js: audio recorded, size: ' + audio.length);
|
|
|
|
printTextarea('js: audio recorded, size: ' + audio.length);
|
|
|
|
|
|
|
|
|
|
|
|
// truncate to first 30 seconds
|
|
|
|
// truncate to first 30 seconds
|
|
|
|
if (audio.length > kMaxAudio_s*kSampleRate) {
|
|
|
|
if (audio.length > kMaxRecording_s*kSampleRate) {
|
|
|
|
audio = audio.slice(0, kMaxAudio_s*kSampleRate);
|
|
|
|
audio = audio.slice(0, kMaxRecording_s*kSampleRate);
|
|
|
|
printTextarea('js: truncated audio to first ' + kMaxAudio_s + ' seconds');
|
|
|
|
printTextarea('js: truncated audio to first ' + kMaxRecording_s + ' seconds');
|
|
|
|
}
|
|
|
|
}
|
|
|
|
setAudio(audio);
|
|
|
|
setAudio(audio);
|
|
|
|
});
|
|
|
|
});
|
|
|
@ -559,24 +575,31 @@
|
|
|
|
});
|
|
|
|
});
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
document.getElementById('progress-bar').style.width = (100*(Date.now() - startTime)/1000/kMaxAudio_s) + '%';
|
|
|
|
document.getElementById('progress-bar').style.width = (100*(Date.now() - startTime)/1000/kMaxRecording_s) + '%';
|
|
|
|
document.getElementById('progress-text').innerHTML = (100*(Date.now() - startTime)/1000/kMaxAudio_s).toFixed(0) + '%';
|
|
|
|
document.getElementById('progress-text').innerHTML = (100*(Date.now() - startTime)/1000/kMaxRecording_s).toFixed(0) + '%';
|
|
|
|
}, 1000);
|
|
|
|
}, 1000);
|
|
|
|
|
|
|
|
|
|
|
|
printTextarea('js: recording ...');
|
|
|
|
printTextarea('js: recording ...');
|
|
|
|
|
|
|
|
|
|
|
|
setTimeout(function() {
|
|
|
|
setTimeout(function() {
|
|
|
|
if (doRecording) {
|
|
|
|
if (doRecording) {
|
|
|
|
printTextarea('js: recording stopped after ' + kMaxAudio_s + ' seconds');
|
|
|
|
printTextarea('js: recording stopped after ' + kMaxRecording_s + ' seconds');
|
|
|
|
stopRecording();
|
|
|
|
stopRecording();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}, kMaxAudio_s*1000);
|
|
|
|
}, kMaxRecording_s*1000);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
//
|
|
|
|
//
|
|
|
|
// transcribe
|
|
|
|
// transcribe
|
|
|
|
//
|
|
|
|
//
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
var nthreads = 8;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
function changeThreads(value) {
|
|
|
|
|
|
|
|
nthreads = value;
|
|
|
|
|
|
|
|
document.getElementById('threads-value').innerHTML = nthreads;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
function onProcess(translate) {
|
|
|
|
function onProcess(translate) {
|
|
|
|
if (!instance) {
|
|
|
|
if (!instance) {
|
|
|
|
instance = Module.init('whisper.bin');
|
|
|
|
instance = Module.init('whisper.bin');
|
|
|
@ -603,7 +626,7 @@
|
|
|
|
printTextarea('');
|
|
|
|
printTextarea('');
|
|
|
|
|
|
|
|
|
|
|
|
setTimeout(function() {
|
|
|
|
setTimeout(function() {
|
|
|
|
var ret = Module.full_default(instance, audio, document.getElementById('language').value, translate);
|
|
|
|
var ret = Module.full_default(instance, audio, document.getElementById('language').value, nthreads, translate);
|
|
|
|
console.log('js: full_default returned: ' + ret);
|
|
|
|
console.log('js: full_default returned: ' + ret);
|
|
|
|
if (ret) {
|
|
|
|
if (ret) {
|
|
|
|
printTextarea("js: whisper returned: " + ret);
|
|
|
|
printTextarea("js: whisper returned: " + ret);
|
|
|
|