
Commit 21ae411

Merge pull request #4847 from sendream/master
Add recipe of Tibetan Amdo dialect
2 parents: 545b1f1 + cbc7284

28 files changed, +1418 −0 lines changed

egs/xbmu_amdo31/README.txt

Lines changed: 11 additions & 0 deletions
@@ -0,0 +1,11 @@
About the XBMU-AMDO31 corpus

XBMU-AMDO31 is an open-source Amdo Tibetan speech corpus published by Northwest Minzu University.

The XBMU-AMDO31 dataset is a speech recognition corpus of the Amdo dialect of Tibetan. The open-source corpus contains 31 hours of speech data and resources for building speech recognition systems, including transcribed texts and a Tibetan pronunciation lexicon. (The lexicon is a Lhasa-dialect Tibetan lexicon, reused for the Amdo dialect because of the uniformity of the Tibetan language.) The dataset can be used to train models for Amdo Tibetan automatic speech recognition (ASR).

The database can be downloaded from OpenSLR:
http://www.openslr.org/133/

For more details, please visit:
https://huggingface.co/datasets/syzym/xbmu_amdo31

This recipe includes several different ASR models trained on XBMU-AMDO31.

egs/xbmu_amdo31/s5/RESULTS

Lines changed: 8 additions & 0 deletions
@@ -0,0 +1,8 @@
%WER 46.16 [ 15522 / 33628, 380 ins, 2208 del, 12934 sub ] exp/mono/decode_test/wer_10_0.0
%WER 24.60 [ 8274 / 33628, 330 ins, 860 del, 7084 sub ] exp/tri1/decode_test/wer_13_0.0
%WER 24.42 [ 8213 / 33628, 323 ins, 847 del, 7043 sub ] exp/tri2/decode_test/wer_13_0.0
%WER 22.93 [ 7712 / 33628, 336 ins, 814 del, 6562 sub ] exp/tri3a/decode_test/wer_12_0.0
%WER 20.17 [ 6783 / 33628, 275 ins, 764 del, 5744 sub ] exp/tri4a/decode_test/wer_15_0.0
%WER 19.03 [ 6400 / 33628, 292 ins, 667 del, 5441 sub ] exp/tri5a/decode_test/wer_14_0.0
%WER 15.45 [ 5196 / 33628, 229 ins, 646 del, 4321 sub ] exp/nnet3/tdnn_sp/decode_test/wer_16_0.0
%WER 15.57 [ 5235 / 33628, 244 ins, 575 del, 4416 sub ] exp/chain/tdnn_1a_sp/decode_test/wer_11_0.0
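
These are the usual Kaldi best-WER lines. A minimal sketch of how such a RESULTS file is typically regenerated, assuming the standard utils/best_wer.sh helper and the exp/ decode directories listed above (this loop is not part of the committed recipe):

#!/usr/bin/env bash
# Collect the best WER from each test decode directory (sketch; assumes the
# standard Kaldi utils/best_wer.sh helper and the exp/ layout shown above).
for x in exp/*/decode_test exp/*/*/decode_test; do
  [ -d "$x" ] && grep WER "$x"/wer_* 2>/dev/null | utils/best_wer.sh
done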

egs/xbmu_amdo31/s5/cmd.sh

Lines changed: 15 additions & 0 deletions
@@ -0,0 +1,15 @@
# you can change cmd.sh depending on what type of queue you are using.
# If you have no queueing system and want to run on a local machine, you
# can change all instances of 'queue.pl' to 'run.pl' (but be careful and run
# commands one by one: most recipes will exhaust the memory on your
# machine).  queue.pl works with GridEngine (qsub).  slurm.pl works
# with slurm.  Different queues are configured differently, with different
# queue names and different ways of specifying things like memory;
# to account for these differences you can create and edit the file
# conf/queue.conf to match your queue's configuration.  Search for
# conf/queue.conf in http://kaldi-asr.org/doc/queue.html for more information,
# or search for the string 'default_config' in utils/queue.pl or utils/slurm.pl.

export train_cmd="queue.pl --mem 2G"
export decode_cmd="queue.pl --mem 4G"
export mkgraph_cmd="queue.pl --mem 8G"
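
As the comments note, on a single machine with no queueing system you would swap queue.pl for run.pl. A minimal local-machine variant of these exports (a sketch, not part of the committed file):

# Local-machine alternative: run.pl executes jobs directly on this host,
# so keep parallelism low to avoid exhausting memory.
export train_cmd="run.pl --mem 2G"
export decode_cmd="run.pl --mem 4G"
export mkgraph_cmd="run.pl --mem 8G"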
Lines changed: 5 additions & 0 deletions
@@ -0,0 +1,5 @@
beam=11.0        # beam for decoding.  Was 13.0 in the scripts.
first_beam=8.0   # beam for 1st-pass decoding in SAT.

egs/xbmu_amdo31/s5/conf/mfcc.conf

Lines changed: 2 additions & 0 deletions
@@ -0,0 +1,2 @@
--use-energy=false   # only non-default option.
--sample-frequency=16000
Lines changed: 10 additions & 0 deletions
@@ -0,0 +1,10 @@
# config for high-resolution MFCC features, intended for neural network training.
# Note: we keep all cepstra, so it has the same info as filterbank features,
# but MFCC is more easily compressible (because less correlated), which is why
# we prefer this method.
--use-energy=false       # use average of log energy, not energy.
--sample-frequency=16000
--num-mel-bins=40        # similar to Google's setup.
--num-ceps=40            # there is no dimensionality reduction.
--low-freq=40            # low cutoff frequency for mel bins
--high-freq=-200         # high cutoff frequency, relative to Nyquist of 8000 (=7800)
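
In Kaldi recipes a config like this is consumed by the feature-extraction wrapper scripts rather than read directly. A hedged sketch of the usual invocation, assuming this file lives at conf/mfcc_hires.conf; the data-directory names are illustrative, not taken from this recipe's run.sh:

# Sketch: extract 40-dim high-resolution MFCCs for nnet training.
utils/copy_data_dir.sh data/train data/train_hires
steps/make_mfcc.sh --nj 10 --cmd "$train_cmd" \
  --mfcc-config conf/mfcc_hires.conf data/train_hires
steps/compute_cmvn_stats.sh data/train_hires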
Lines changed: 1 addition & 0 deletions
@@ -0,0 +1 @@
# configuration file for apply-cmvn-online, used when invoking online2-wav-nnet3-latgen-faster.
Lines changed: 4 additions & 0 deletions
@@ -0,0 +1,4 @@
--sample-frequency=16000
--simulate-first-pass-online=true
--normalization-right-context=25
--frames-per-chunk=10

egs/xbmu_amdo31/s5/conf/pitch.conf

Lines changed: 1 addition & 0 deletions
@@ -0,0 +1 @@
--sample-frequency=16000
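
A pitch config like this is typically paired with conf/mfcc.conf when features are extracted with Kaldi's combined MFCC+pitch wrapper. A sketch of how such a config is usually consumed, assuming the config paths above; the data directory is illustrative:

# Sketch: MFCC + pitch extraction using the configs above.
steps/make_mfcc_pitch.sh --nj 10 --cmd "$train_cmd" \
  --mfcc-config conf/mfcc.conf --pitch-config conf/pitch.conf data/train
steps/compute_cmvn_stats.sh data/train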
Lines changed: 1 addition & 0 deletions
@@ -0,0 +1 @@
tuning/run_tdnn_1a.sh
