Add initial project files including Vosk model and audio recognition script

This commit is contained in:
2024-11-30 20:42:31 +01:00
parent 20cdafb2bf
commit 7c416c5f85
21 changed files with 407 additions and 0 deletions
+10
View File
@@ -0,0 +1,10 @@
Copyright 2022-2050 AC Technologies LLC
Small Spanish model for Vosk
WER
%WER 42.63 [ 52779 / 123813, 4570 ins, 22135 del, 26074 sub ] exp/chain/tdnn/decode_test_call/wer_10_0.0
%WER 16.02 [ 24405 / 152364, 3121 ins, 5007 del, 16277 sub ] exp/chain/tdnn/decode_test_cv/wer_11_0.0
%WER 11.21 [ 9922 / 88499, 1811 ins, 1675 del, 6436 sub ] exp/chain/tdnn/decode_test_mls/wer_10_0.0
%WER 16.72 [ 2410 / 14416, 445 ins, 696 del, 1269 sub ] exp/chain/tdnn/decode_test_mtedx/wer_10_0.0
Binary file not shown.
+8
View File
@@ -0,0 +1,8 @@
--sample-frequency=16000.0
--use-energy=false
--num-mel-bins=40
--num-ceps=40
--low-freq=20
--high-freq=7600
--allow-upsample=true
--allow-downsample=true
+10
View File
@@ -0,0 +1,10 @@
--min-active=200
--max-active=4000
--beam=11.0
--lattice-beam=4.0
--acoustic-scale=1.0
--frame-subsampling-factor=3
--endpoint.silence-phones=1:2:3:4:5:6:7:8:9:10
--endpoint.rule2.min-trailing-silence=0.5
--endpoint.rule3.min-trailing-silence=1.0
--endpoint.rule4.min-trailing-silence=2.0
Binary file not shown.
Binary file not shown.
@@ -0,0 +1,10 @@
7601
7602
7603
7604
7605
7606
7607
7608
7609
7610
@@ -0,0 +1,110 @@
1 nonword
2 begin
3 end
4 internal
5 singleton
6 nonword
7 begin
8 end
9 internal
10 singleton
11 begin
12 end
13 internal
14 singleton
15 begin
16 end
17 internal
18 singleton
19 begin
20 end
21 internal
22 singleton
23 begin
24 end
25 internal
26 singleton
27 begin
28 end
29 internal
30 singleton
31 begin
32 end
33 internal
34 singleton
35 begin
36 end
37 internal
38 singleton
39 begin
40 end
41 internal
42 singleton
43 begin
44 end
45 internal
46 singleton
47 begin
48 end
49 internal
50 singleton
51 begin
52 end
53 internal
54 singleton
55 begin
56 end
57 internal
58 singleton
59 begin
60 end
61 internal
62 singleton
63 begin
64 end
65 internal
66 singleton
67 begin
68 end
69 internal
70 singleton
71 begin
72 end
73 internal
74 singleton
75 begin
76 end
77 internal
78 singleton
79 begin
80 end
81 internal
82 singleton
83 begin
84 end
85 internal
86 singleton
87 begin
88 end
89 internal
90 singleton
91 begin
92 end
93 internal
94 singleton
95 begin
96 end
97 internal
98 singleton
99 begin
100 end
101 internal
102 singleton
103 begin
104 end
105 internal
106 singleton
107 begin
108 end
109 internal
110 singleton
Binary file not shown.
Binary file not shown.
Binary file not shown.
@@ -0,0 +1,3 @@
[
8.46276e+10 7.072285e+08 -1.289904e+10 5.671974e+09 -1.209136e+10 -2.034736e+10 -6.875634e+09 -1.557388e+10 -2.806233e+09 -3.674485e+09 -6.921794e+09 6.946679e+08 -8.52497e+09 -7.260168e+08 -4.343575e+09 -5.486674e+09 -1.710502e+09 -1.996049e+09 -2.165263e+09 -6.832425e+07 -9.641756e+08 5.967002e+07 -1.110601e+08 4.368464e+07 -1.341292e+07 5.138013e+08 1.807307e+08 -1.273191e+08 9.086873e+08 -7.03787e+08 6.228164e+08 2.102328e+08 4.091046e+07 1.103751e+09 1.753195e+07 6.810451e+08 3.860742e+08 -6.252538e+08 2.375626e+08 -4.708622e+08 8.625583e+08
8.661931e+12 5.440279e+11 7.661625e+11 5.86159e+11 5.687293e+11 1.020851e+12 6.045613e+11 8.250028e+11 4.274593e+11 3.851017e+11 4.398129e+11 4.172123e+11 3.736421e+11 2.438057e+11 2.363456e+11 2.023758e+11 1.314776e+11 8.931146e+10 5.928187e+10 3.395453e+10 1.88439e+10 6.181701e+09 7.988108e+08 2.281808e+08 3.149188e+09 8.009975e+09 1.215929e+10 1.646801e+10 2.218979e+10 2.492957e+10 2.43543e+10 2.243619e+10 2.445217e+10 2.796862e+10 2.215869e+10 1.68782e+10 1.565755e+10 1.461083e+10 1.140419e+10 7.335776e+09 0 ]
@@ -0,0 +1 @@
# configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh
@@ -0,0 +1,2 @@
--left-context=3
--right-context=3