-
Notifications
You must be signed in to change notification settings - Fork 473
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
1 parent
677bc1d
commit eee5d8a
Showing
15 changed files
with
914 additions
and
10 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1 @@ | ||
crash.log |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,88 @@ | ||
// Copyright (c) 2023-2024 Xiaomi Corporation (authors: Fangjun Kuang) | ||
|
||
const portAudio = require('naudiodon2'); | ||
// console.log(portAudio.getDevices()); | ||
|
||
const sherpa_onnx = require('sherpa-onnx-node'); | ||
|
||
/**
 * Build the voice activity detector used by this example.
 *
 * The detector is configured for the silero VAD model. Please download
 * silero_vad.onnx from
 * https://github.com/k2-fsa/sherpa-onnx/releases/download/asr-models/silero_vad.onnx
 * so that the './silero_vad.onnx' path below resolves.
 *
 * @returns {object} A new `sherpa_onnx.Vad` instance; the configuration is
 *     passed to its constructor together with a buffer size of 60 seconds.
 */
function createVad() {
  // Model-specific options.
  const sileroVad = {
    model: './silero_vad.onnx',
    threshold: 0.5,
    minSpeechDuration: 0.25,
    minSilenceDuration: 0.5,
    windowSize: 512,
  };

  // Detector-wide options; `sileroVad` is nested under its own key.
  const vadConfig = {
    sileroVad,
    sampleRate: 16000,
    debug: true,
    numThreads: 1,
  };

  const vadBufferSeconds = 60;
  return new sherpa_onnx.Vad(vadConfig, vadBufferSeconds);
}
|
||
// Declared with `const`: a bare `vad = ...` assignment creates an implicit
// global and throws a ReferenceError in strict mode / ES modules.
const vad = createVad();

// Staging buffer for microphone samples; they are handed to the detector in
// chunks of exactly `windowSize` samples.
const bufferSizeInSeconds = 30;
const buffer =
    new sherpa_onnx.CircularBuffer(bufferSizeInSeconds * vad.config.sampleRate);

/**
 * View the bytes of one audio chunk as 32-bit float samples.
 *
 * A Node.js Buffer may be a slice of a larger ArrayBuffer, so the view has to
 * honour `byteOffset` and `byteLength` rather than wrapping `chunk.buffer` as a
 * whole.
 *
 * @param {Buffer} chunk Raw bytes delivered by the audio stream.
 * @returns {Float32Array} The samples contained in `chunk`.
 */
function toFloat32Array(chunk) {
  const bytesPerSample = Float32Array.BYTES_PER_ELEMENT;
  const numSamples = Math.floor(chunk.byteLength / bytesPerSample);
  if (chunk.byteOffset % bytesPerSample === 0) {
    return new Float32Array(chunk.buffer, chunk.byteOffset, numSamples);
  }

  // A typed-array view requires an aligned offset; copy the bytes otherwise.
  const begin = chunk.byteOffset;
  const end = begin + numSamples * bytesPerSample;
  return new Float32Array(chunk.buffer.slice(begin, end));
}

const ai = new portAudio.AudioIO({
  inOptions: {
    channelCount: 1,
    closeOnError: true,  // Close the stream if an audio error is detected, if
                         // set false then just log the error
    deviceId: -1,  // Use -1 or omit the deviceId to select the default device
    sampleFormat: portAudio.SampleFormatFloat32,
    sampleRate: vad.config.sampleRate,
  },
});

// `printed` makes sure "Detected speech" is logged once per stretch of speech;
// `index` numbers the saved segments.
let printed = false;
let index = 0;

ai.on('data', (data) => {
  const windowSize = vad.config.sileroVad.windowSize;
  buffer.push(toFloat32Array(data));

  // `>=` so that a buffer holding exactly one full window is processed too.
  while (buffer.size() >= windowSize) {
    const samples = buffer.get(buffer.head(), windowSize);
    buffer.pop(windowSize);
    vad.acceptWaveform(samples);

    const isSpeech = vad.isDetected();
    if (isSpeech && !printed) {
      console.log(`${index}: Detected speech`);
      printed = true;
    }

    if (!isSpeech) {
      printed = false;
    }

    // Drain every finished speech segment and save each one to its own file.
    while (!vad.isEmpty()) {
      const segment = vad.front();
      vad.pop();

      // NOTE(review): the time part contains ':' characters, which are not
      // allowed in file names on Windows - confirm the target platforms.
      const timestamp = new Date()
                            .toLocaleTimeString('en-US', {hour12: false})
                            .split(' ')[0];
      const filename = `${index}-${timestamp}.wav`;
      sherpa_onnx.writeWave(
          filename,
          {samples: segment.samples, sampleRate: vad.config.sampleRate});

      const duration = segment.samples.length / vad.config.sampleRate;
      console.log(`${index} End of speech. Duration: ${duration} seconds`);
      console.log(`Saved to ${filename}`);
      index += 1;
    }
  }
});

ai.on('close', () => {
  console.log('Free resources');
});

ai.start();
console.log('Started! Please speak');
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,8 +1,12 @@ | ||
const addon = require('./addon.js') | ||
const streaming_asr = require('./streaming-asr.js'); | ||
const vad = require('./vad.js'); | ||
|
||
module.exports = { | ||
OnlineRecognizer: streaming_asr.OnlineRecognizer, | ||
readWave: addon.readWave, | ||
writeWave: addon.writeWave, | ||
Display: streaming_asr.Display, | ||
Vad: vad.Vad, | ||
CircularBuffer: vad.CircularBuffer, | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,88 @@ | ||
const addon = require('./addon.js'); | ||
|
||
/**
 * Thin wrapper around the addon's circular buffer. Every method forwards to
 * the matching `addon.circularBuffer*` function, passing the handle created
 * in the constructor.
 */
class CircularBuffer {
  /**
   * @param {number} capacity Forwarded to `addon.createCircularBuffer`.
   */
  constructor(capacity) {
    const handle = addon.createCircularBuffer(capacity);
    this.handle = handle;
  }

  /**
   * Append samples to the buffer.
   * @param {Float32Array} samples A float32 array.
   */
  push(samples) {
    const {handle} = this;
    addon.circularBufferPush(handle, samples);
  }

  /**
   * Read `n` samples starting at `startIndex`.
   * @param {number} startIndex
   * @param {number} n
   * @returns {Float32Array} A float32 array.
   */
  get(startIndex, n) {
    const {handle} = this;
    const samples = addon.circularBufferGet(handle, startIndex, n);
    return samples;
  }

  /**
   * Forward to `addon.circularBufferPop` and return its result.
   * @param {number} n
   */
  pop(n) {
    const {handle} = this;
    return addon.circularBufferPop(handle, n);
  }

  /** @returns The result of `addon.circularBufferSize`. */
  size() {
    const {handle} = this;
    return addon.circularBufferSize(handle);
  }

  /** @returns The result of `addon.circularBufferHead`. */
  head() {
    const {handle} = this;
    return addon.circularBufferHead(handle);
  }

  /** Forward to `addon.circularBufferReset` and return its result. */
  reset() {
    const {handle} = this;
    return addon.circularBufferReset(handle);
  }
}
|
||
/**
 * Voice activity detector. Every method forwards to the matching
 * `addon.voiceActivityDetector*` function, passing the handle created in the
 * constructor.
 */
class Vad {
  /**
   * Example config:
   *
   *   config = {
   *     sileroVad: {
   *       model: "./silero_vad.onnx",
   *       threshold: 0.5,
   *     }
   *   }
   *
   * @param {object} config Detector configuration; also kept on `this.config`
   *     so callers can read it back.
   * @param {number} bufferSizeInSeconds Forwarded to
   *     `addon.createVoiceActivityDetector`.
   */
  constructor(config, bufferSizeInSeconds) {
    this.handle =
        addon.createVoiceActivityDetector(config, bufferSizeInSeconds);
    this.config = config;
  }

  /**
   * Feed samples to the detector.
   * @param {Float32Array} samples
   */
  acceptWaveform(samples) {
    addon.voiceActivityDetectorAcceptWaveform(this.handle, samples);
  }

  /** @returns The result of `addon.voiceActivityDetectorIsEmpty`. */
  isEmpty() {
    return addon.voiceActivityDetectorIsEmpty(this.handle);
  }

  /** @returns The result of `addon.voiceActivityDetectorIsDetected`. */
  isDetected() {
    return addon.voiceActivityDetectorIsDetected(this.handle);
  }

  /** Forward to `addon.voiceActivityDetectorPop`. */
  pop() {
    addon.voiceActivityDetectorPop(this.handle);
  }

  /**
   * Forward to `addon.voiceActivityDetectorClear`.
   *
   * NOTE(review): uses the camelCase `voiceActivityDetector*` naming shared by
   * every other addon call in this class instead of the former
   * `VoiceActivityDetectorClearWrapper` - confirm against the addon's export
   * table.
   */
  clear() {
    addon.voiceActivityDetectorClear(this.handle);
  }

  /**
   * @returns {{samples: Float32Array, start: number}} An object of the form
   *   {
   *     samples: a 1-d float32 array,
   *     start: a int32
   *   }
   */
  front() {
    return addon.voiceActivityDetectorFront(this.handle);
  }

  /**
   * Forward to `addon.voiceActivityDetectorReset` and return its result.
   *
   * NOTE(review): renamed from `VoiceActivityDetectorResetWrapper` for the
   * same reason as in `clear()` - confirm against the addon's export table.
   */
  reset() {
    return addon.voiceActivityDetectorReset(this.handle);
  }
}
|
||
// Classes made available to the package entry point.
module.exports = {Vad, CircularBuffer};
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.