-
Notifications
You must be signed in to change notification settings - Fork 13
/
Copy pathfile.js
executable file
·95 lines (80 loc) · 2.64 KB
/
file.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
#! /usr/bin/env node
//
// Copyright 2024 Picovoice Inc.
//
// You may not use this file except in compliance with the license. A copy of the license is located in the "LICENSE"
// file accompanying this source.
//
// Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
// an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
// specific language governing permissions and limitations under the License.
//
"use strict";
const { program } = require("commander");
const fs = require("fs");
const WaveFile = require("wavefile").WaveFile;
const {
Cobra,
getInt16Frames,
checkWaveFile,
} = require("@picovoice/cobra-node");
// Command-line interface of the demo: the AccessKey and the input wav file are
// mandatory; the dynamic library path and the detection threshold are optional.
program
  .requiredOption(
    "-a, --access_key <string>",
    "AccessKey obtain from the Picovoice Console (https://console.picovoice.ai/)"
  )
  .requiredOption("-i, --input_audio_file_path <string>", "input wav file")
  .option(
    "-l, --library_file_path <string>",
    "absolute path to cobra dynamic library"
  )
  .option(
    "-t --threshold <string>",
    "Threshold for the probability of voice activity"
  );

// process.argv always starts with the node executable and the script path, so
// an invocation without any arguments has length 2. Comparing against 3 makes
// the usage text reachable in that case (the previous `< 2` check never fired).
if (process.argv.length < 3) {
  program.help();
}

program.parse(process.argv);
/**
 * Runs the Cobra engine over every frame of the wav file given on the command
 * line and prints one line for each distinct timestamp (rounded to a tenth of a
 * second) at which the engine's result reaches the threshold.
 *
 * Reads the parsed command-line values from `program`:
 *   - `input_audio_file_path`: path of the wav file to analyse
 *   - `access_key`: passed to the `Cobra` constructor
 *   - `library_file_path`: optional, forwarded as `libraryPath`
 *   - `threshold`: optional, defaults to 0.8
 *
 * Problems with the arguments or the audio file are reported on stderr and the
 * function returns without processing. The engine instance is always released,
 * including when processing throws.
 *
 * @returns {void}
 */
function fileDemo() {
  // `opts()` yields the parsed values regardless of whether commander also
  // mirrors them as properties on `program` (newer releases do not by default).
  const options = program.opts();
  const audioPath = options["input_audio_file_path"];
  const accessKey = options["access_key"];
  const libraryFilePath = options["library_file_path"];

  // Command-line values are strings; convert once so the comparison in the
  // loop is numeric, and reject values that could never match meaningfully.
  const threshold = Number(options["threshold"] ?? 0.8);
  if (!Number.isFinite(threshold) || threshold < 0 || threshold > 1) {
    console.error(
      `--threshold must be a number between 0 and 1: ${options["threshold"]}`
    );
    return;
  }

  const engineInstance = new Cobra(accessKey, {
    libraryPath: libraryFilePath,
  });

  try {
    if (!fs.existsSync(audioPath)) {
      console.error(`--input_audio_file_path file not found: ${audioPath}`);
      return;
    }

    const waveBuffer = fs.readFileSync(audioPath);
    let inputWaveFile;
    try {
      inputWaveFile = new WaveFile(waveBuffer);
    } catch (error) {
      console.error(`Exception trying to read file as wave format: ${audioPath}`);
      console.error(error);
      return;
    }

    if (!checkWaveFile(inputWaveFile, engineInstance.sampleRate)) {
      console.error(
        "Audio file did not meet requirements. Wave file must be 16KHz, 16-bit, linear PCM (mono)."
      );
      // Stop here: feeding an unsupported file to the engine is meaningless.
      return;
    }

    const frames = getInt16Frames(inputWaveFile, engineInstance.frameLength);

    // Several consecutive frames round to the same tenth of a second; remember
    // what was already reported so each timestamp is printed only once.
    const reportedTimestamps = new Set();
    for (let i = 0; i < frames.length; i++) {
      const result = engineInstance.process(frames[i]);
      const timestamp = (
        (i * engineInstance.frameLength) /
        engineInstance.sampleRate
      ).toFixed(1);
      if (result >= threshold && !reportedTimestamps.has(timestamp)) {
        console.log(`Detected voice activity at ${timestamp} sec`);
        reportedTimestamps.add(timestamp);
      }
    }
  } finally {
    // Release the engine on every exit path, including early returns and
    // exceptions thrown while reading or processing the audio.
    engineInstance.release();
  }
}
// Entry point: run the demo once the command-line arguments have been parsed.
fileDemo();