From 119f9091ea60d81efabd7d20ff2490b9e7084778 Mon Sep 17 00:00:00 2001 From: Eric Bi Date: Tue, 1 Dec 2015 17:03:39 +0800 Subject: add detection of utterances without alignment, and skip them --- kaldi_io/init.lua | 8 ++++++++ 1 file changed, 8 insertions(+) (limited to 'kaldi_io/init.lua') diff --git a/kaldi_io/init.lua b/kaldi_io/init.lua index e538ee5..5193504 100644 --- a/kaldi_io/init.lua +++ b/kaldi_io/init.lua @@ -36,6 +36,7 @@ function KaldiReader:__init(global_conf, reader_conf) end function KaldiReader:get_data() + local fail_to_read_alignment = false if self.feat_repo:is_end() then return nil end @@ -75,6 +76,9 @@ function KaldiReader:get_data() local lab_utter = repo:get_utter(self.feat_repo, feat_utter:nrow(), self.debug) + if lab_utter == nil then + fail_to_read_alignment = true + end res[id] = lab_utter end -- add corresponding lookup features @@ -98,5 +102,9 @@ function KaldiReader:get_data() -- move the pointer to next self.feat_repo:next() collectgarbage("collect") + if fail_to_read_alignment then + nerv.info("[Kaldi IO] utterance %s alignment not found, skip it.", self.feat_repo:key()) + res = self:get_data() + end return res end -- cgit v1.2.3-70-g09d2 From 24d56605428467e604afded423ba2ff49f2644e3 Mon Sep 17 00:00:00 2001 From: Eric Bi Date: Thu, 3 Dec 2015 20:12:59 +0800 Subject: fix last commit that broke decoding --- kaldi_io/init.lua | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) (limited to 'kaldi_io/init.lua') diff --git a/kaldi_io/init.lua b/kaldi_io/init.lua index 5193504..9f3ad55 100644 --- a/kaldi_io/init.lua +++ b/kaldi_io/init.lua @@ -76,7 +76,8 @@ function KaldiReader:get_data() local lab_utter = repo:get_utter(self.feat_repo, feat_utter:nrow(), self.debug) - if lab_utter == nil then + -- need provide 'gconf.decoding = true' while decoding + if not self.gconf.decoding and lab_utter == nil then fail_to_read_alignment = true end res[id] = lab_utter -- cgit v1.2.3-70-g09d2