Non-working draft

This commit is contained in:
msqr1
2024-01-24 23:00:29 -08:00
parent 43b54fd1f6
commit 48b54295f3
7 changed files with 61 additions and 54 deletions

View File

@@ -81,4 +81,4 @@ em++ -pthread -O3 -flto -Wno-deprecated -I. -I$KALDI/src -I$OPENFST/include $VOS
emar -rcs vosk.a ${VOSK_FILES//.cc/.o} && emar -rcs vosk.a ${VOSK_FILES//.cc/.o} &&
cd $SRC && cd $SRC &&
em++ -O3 genericModel.cc model.cc spkModel.cc recognizer.cc bindings.cc -sWASMFS -sWASM_BIGINT -sSINGLE_FILE -sEMBIND_STD_STRING_IS_UTF8 -sSUPPORT_LONGJMP=0 -sMODULARIZE -sEXPORT_NAME=loadBR -sENVIRONMENT=web,worker -sINITIAL_MAX_MEMORY=$MAX_MEMORY -sASYNCIFY -sPTHREAD_POOL_SIZE=$MAX_THREAD -sPTHREAD_POOL_SIZE_STRICT -sPTHREAD_POOL_DELAY_LOAD -sASYNCIFY_ONLY=['emscripten_wget'] -sALLOW_BLOCKING_ON_MAIN_THREAD=0 -sPOLYFILL=0 --pre-js pre.js -I. -I$LIBARCHIVE/include -I$VOSK/src -L$LIBARCHIVE/lib -larchive -L$ZSTD/lib -lzstd -L$KALDI/src -l:online2/kaldi-online2.a -l:decoder/kaldi-decoder.a -l:ivector/kaldi-ivector.a -l:gmm/kaldi-gmm.a -l:tree/kaldi-tree.a -l:feat/kaldi-feat.a -l:cudamatrix/kaldi-cudamatrix.a -l:lat/kaldi-lat.a -l:lm/kaldi-lm.a -l:rnnlm/kaldi-rnnlm.a -l:hmm/kaldi-hmm.a -l:nnet3/kaldi-nnet3.a -l:transform/kaldi-transform.a -l:matrix/kaldi-matrix.a -l:fstext/kaldi-fstext.a -l:util/kaldi-util.a -l:base/kaldi-base.a -L$OPENFST/lib -l:libfst.a -l:libfstngram.a -L$CLAPACK_WASM -l:CBLAS/lib/cblas.a -l:CLAPACK-3.2.1/lapack.a -l:CLAPACK-3.2.1/libcblaswr.a -l:f2c_BLAS-3.8.0/blas.a -l:libf2c/libf2c.a -L$VOSK/src -l:vosk.a -lopfs.js -lembind -pthread -flto -o BrowserRecognizer.js em++ -O3 genericModel.cc model.cc spkModel.cc recognizer.cc bindings.cc -sWASMFS -sWASM_BIGINT -sSINGLE_FILE -sEMBIND_STD_STRING_IS_UTF8 -sSUPPORT_LONGJMP=0 -sMODULARIZE -sEXPORT_NAME=loadBR -sENVIRONMENT=web,worker -sINITIAL_MAX_MEMORY=$MAX_MEMORY -sASYNCIFY -sPTHREAD_POOL_SIZE=$MAX_THREAD -sPTHREAD_POOL_SIZE_STRICT -sPTHREAD_POOL_DELAY_LOAD -sASYNCIFY_ONLY=['emscripten_wget'] -sALLOW_BLOCKING_ON_MAIN_THREAD=0 -sPOLYFILL=0 --pre-js preBefore.js --pre-js preMiddle.js --pre-js preAfter.js -I. 
-I$LIBARCHIVE/include -I$VOSK/src -L$LIBARCHIVE/lib -larchive -L$ZSTD/lib -lzstd -L$KALDI/src -l:online2/kaldi-online2.a -l:decoder/kaldi-decoder.a -l:ivector/kaldi-ivector.a -l:gmm/kaldi-gmm.a -l:tree/kaldi-tree.a -l:feat/kaldi-feat.a -l:cudamatrix/kaldi-cudamatrix.a -l:lat/kaldi-lat.a -l:lm/kaldi-lm.a -l:rnnlm/kaldi-rnnlm.a -l:hmm/kaldi-hmm.a -l:nnet3/kaldi-nnet3.a -l:transform/kaldi-transform.a -l:matrix/kaldi-matrix.a -l:fstext/kaldi-fstext.a -l:util/kaldi-util.a -l:base/kaldi-base.a -L$OPENFST/lib -l:libfst.a -l:libfstngram.a -L$CLAPACK_WASM -l:CBLAS/lib/cblas.a -l:CLAPACK-3.2.1/lapack.a -l:CLAPACK-3.2.1/libcblaswr.a -l:f2c_BLAS-3.8.0/blas.a -l:libf2c/libf2c.a -L$VOSK/src -l:vosk.a -lopfs.js -lembind -pthread -flto -o BrowserRecognizer.js

3
src/preAfter.js Normal file
View File

@@ -0,0 +1,3 @@
`])))
return new recognizer(rec,ctx)
}

View File

@@ -1,17 +1,21 @@
let objs = [] let objs = []
class recognizer extends EventTarget { class recognizer extends EventTarget {
constructor(rec) { constructor(rec,ctx) {
super() super()
this.obj = rec this.obj = rec
objs.push(this) this.ptr = Module._malloc(512)
let channel = new MessageChannel()
this.copier = new AudioWorkletNode(ctx, 'BRCopier', { channelCount: 1, numberOfInputs: 1, numberOfOutputs: 0 })
this.copier.port.postMessage({cmd : "init", ptr: this.ptr},[channel.port1])
channel.port1.onmessage = (ev) => {
this.obj.acceptWaveForm(this.ptr, 512)
} }
processAudio(ctx) { objs.push(this)
let ptr = Module._malloc(512);
this.obj.acceptWaveForm(ptr)
} }
delete() { delete() {
this.obj.delete() this.obj.delete()
this.copier.port.postMessage({cmd : "deinit"})
Module.free(this.ptr)
} }
setWords(words) { setWords(words) {
this.obj.setWords(words) this.obj.setWords(words)
@@ -59,15 +63,14 @@ Module.makeSpkModel = async (url, path, id) => {
} }
objs.push(mdl) objs.push(mdl)
return mdl return mdl
} }, ctx.AudioWorklet
Module.makeRecognizer = async (model, sampleRate, ctx) => { Module.makeRecognizer = async (model, ctx) => {
let rec let rec
try { try {
rec = new Module.recognizer(model,sampleRate, objs.length) rec = new Module.recognizer(model, ctx.sampleRate, objs.length)
} }
catch(e) { catch(e) {
rec.delete() rec.delete()
return Promise.reject(e) return Promise.reject(e)
} }
return new recognizer(rec) await ctx.AudioWorklet.addModule(URL.createObjectURL(new Blob([`
}

23
src/preMiddle.js Normal file
View File

@@ -0,0 +1,23 @@
// AudioWorklet processor "BRCopier": copies every block of input samples into
// a fixed region of the WebAssembly heap, then tells the recognizer (through a
// transferred MessagePort) that a fresh block is ready.
//
// NOTE(review): the build lists this file between preBefore.js and preAfter.js,
// which appear to wrap it in a template literal. Keep backticks, dollar-brace
// sequences and backslashes out of this file -- TODO confirm.
//
// Messages accepted on this.port (the payload lives in ev.data):
//   { cmd: "init", ptr, wasmMem } plus one transferred MessagePort
//       ptr     - byte address of the destination buffer inside the wasm heap
//       wasmMem - the wasm heap itself: a WebAssembly.Memory or its
//                 ArrayBuffer / SharedArrayBuffer. The worklet scope cannot
//                 reach the Module, so the sender has to supply it; without it
//                 the processor stays idle instead of throwing.
//   { cmd: "deinit" } - stop processing; process() returns false afterwards.
registerProcessor("BRCopier", class extends AudioWorkletProcessor {
  constructor(options) {
    super(options)
    this.ret = true
    // The destination buffer is 512 bytes, i.e. 128 float samples.
    // NOTE(review): 512 mirrors the size used by the sender's allocation -- confirm.
    this.capacity = 512 / Float32Array.BYTES_PER_ELEMENT
    this.port.onmessage = (ev) => {
      // The posted object is in ev.data; transferred ports are in ev.ports.
      const msg = ev.data || {}
      switch (msg.cmd) {
        case "init": {
          this.recognizerPort = ev.ports[0]
          const mem = msg.wasmMem
          if (mem) {
            // Accept either a WebAssembly.Memory (has .buffer) or a raw buffer.
            const heap = mem.buffer || mem
            // ptr is a byte offset, so build the view with byteOffset + length
            // rather than subarray(), which counts in elements.
            this.wasmMem = new Float32Array(heap, msg.ptr, this.capacity)
          }
          break
        }
        case "deinit":
          this.ret = false
          break
      }
    }
  }

  // Called by the audio engine for every render quantum.
  // Returns false once "deinit" was received so the node can be collected.
  process(inputs, outputs, params) {
    if (!this.ret) return false
    // inputs[0] is the list of channels of the first input; it is empty while
    // nothing is connected. Each channel is a Float32Array of samples.
    const channel = inputs[0] && inputs[0][0]
    // Stay alive but do nothing until "init" has delivered both port and heap.
    if (!channel || !this.wasmMem || !this.recognizerPort) return true
    // Never write past the destination buffer.
    const block = channel.length > this.wasmMem.length
      ? channel.subarray(0, this.wasmMem.length)
      : channel
    this.wasmMem.set(block)
    this.recognizerPort.postMessage("done")
    return true
  }
})

View File

@@ -1,23 +0,0 @@
// AudioWorklet processor "wasmMemCpy": after an "init" message it notifies the
// recognizer, through the transferred MessagePort, once per processed block.
//
// Messages accepted on this.port (the payload lives in ev.data):
//   { cmd: "init", ptr, wasmMem } plus one transferred MessagePort
//       ptr and wasmMem are stored as received; this processor does not yet
//       copy any samples into them.
//   { cmd: "deinit" } - make process() return false from now on.
registerProcessor("wasmMemCpy", class extends AudioWorkletProcessor {
  constructor(options) {
    super(options)
    this.retval = true
    this.port.onmessage = (ev) => {
      // The posted object is in ev.data; transferred ports are in ev.ports.
      const msg = ev.data || {}
      switch (msg.cmd) {
        case "init":
          this.ptr = msg.ptr
          this.wasmMem = msg.wasmMem
          this.recognizerPort = ev.ports[0]
          break
        case "deinit":
          this.retval = false
          break
      }
    }
  }

  // Called by the audio engine for every block of audio.
  // Returns false after "deinit" so the node can be released.
  process(input, output, param) {
    // process() may run before "init" arrives; only signal once a port exists.
    if (this.recognizerPort) this.recognizerPort.postMessage("done")
    return this.retval
  }
})

View File

@@ -1,16 +1,16 @@
#include "recognizer.h" #include "recognizer.h"
audioData::audioData(int addr, int len) : addr(reinterpret_cast<float*>(addr)), len(len) {}
recognizer::recognizer(model* mdl, float sampleRate, int index) : index(index) { recognizer::recognizer(model* mdl, float sampleRate, int index) : index(index) {
rec = vosk_recognizer_new(mdl->mdl,sampleRate); rec = vosk_recognizer_new(mdl->mdl,sampleRate);
if(rec == nullptr) { if(rec == nullptr) {
throwJS("Unable to initialize recognizer"); throwJS("Unable to initialize recognizer");
return; return;
} }
controller.lock();
std::thread t{[this](){ std::thread t{[this](){
while(!queue.empty()) { while(!done.test()) {
audioData data {queue.front()}; controller.lock();
queue.pop(); if(!done.test()) {
switch(vosk_recognizer_accept_waveform_f(rec, data.addr, data.len)) { switch(vosk_recognizer_accept_waveform_f(rec, dataPtr, 512)) {
case 0: case 0:
fireEv("result", vosk_recognizer_result(rec)); fireEv("result", vosk_recognizer_result(rec));
break; break;
@@ -18,10 +18,13 @@ recognizer::recognizer(model* mdl, float sampleRate, int index) : index(index) {
fireEv("partialResult", vosk_recognizer_partial_result(rec)); fireEv("partialResult", vosk_recognizer_partial_result(rec));
} }
} }
}
}}; }};
t.detach(); t.detach();
} }
recognizer::~recognizer() { recognizer::~recognizer() {
done.test_and_set(std::memory_order_relaxed);
controller.unlock();
vosk_recognizer_free(rec); vosk_recognizer_free(rec);
} }
void recognizer::fireEv(const char *type, const char *content) { void recognizer::fireEv(const char *type, const char *content) {
@@ -29,8 +32,9 @@ void recognizer::fireEv(const char *type, const char *content) {
recognizers[$0].dispatchEvent(new CustomEvent(UTF8ToString($1), {"details" : UTF8ToString($2)})); recognizers[$0].dispatchEvent(new CustomEvent(UTF8ToString($1), {"details" : UTF8ToString($2)}));
},this->index, type, content); },this->index, type, content);
} }
void recognizer::acceptWaveForm(int addr, int len) { void recognizer::acceptWaveForm() {
queue.emplace(addr, len); controller.unlock();
controller.lock();
} }
void recognizer::setGrm(const std::string& grm) { void recognizer::setGrm(const std::string& grm) {
vosk_recognizer_set_grm(rec, grm.c_str()); vosk_recognizer_set_grm(rec, grm.c_str());

View File

@@ -5,7 +5,6 @@
#include <filesystem> #include <filesystem>
#include <atomic> #include <atomic>
#include <thread> #include <thread>
#include <queue>
#include <emscripten/wasmfs.h> #include <emscripten/wasmfs.h>
#include <emscripten/webaudio.h> #include <emscripten/webaudio.h>
@@ -16,17 +15,15 @@
extern void throwJS(const char* msg, bool err = false); extern void throwJS(const char* msg, bool err = false);
namespace fs = std::filesystem; namespace fs = std::filesystem;
struct audioData {
float* addr{};
int len{};
audioData(int addr, int len);
};
struct recognizer { struct recognizer {
std::atomic_flag done{};
std::mutex controller{};
float* dataPtr{};
int index{}; int index{};
VoskRecognizer* rec{}; VoskRecognizer* rec{};
recognizer(model* model, float sampleRate, int index); recognizer(model* model, float sampleRate, int index);
~recognizer(); ~recognizer();
void acceptWaveForm(int addr, int len); void acceptWaveForm();
void fireEv(const char* type, const char* content); void fireEv(const char* type, const char* content);
void setSpkModel(spkModel* model); void setSpkModel(spkModel* model);
void setGrm(const std::string& grm); void setGrm(const std::string& grm);