blob: 9fdb0807f70b87ea86cb9dc0138fd90b49cab5ee (
plain) (
tree)
|
|
require 'libkaldiio'
require 'speech_utils'
local KaldiReader = nerv.class("nerv.KaldiReader", "nerv.DataReader")
function KaldiReader:__init(global_conf, reader_conf)
self.feat_id = reader_conf.id
self.frm_ext = reader_conf.frm_ext
self.gconf = global_conf
self.global_transf = reader_conf.global_transf
self.debug = global_conf.debug
if self.debug == nil then
self.debug = false
end
self.feat_repo = nerv.KaldiFeatureRepo(reader_conf.feature_rspecifier)
self.lab_repo = {}
for id, mlf_spec in pairs(reader_conf.mlfs) do
self.lab_repo[id] = nerv.KaldiLabelRepo(mlf_spec.targets_rspecifier,
mlf_spec.format)
end
end
function KaldiReader:get_data()
if self.feat_repo:is_end() then
return nil
end
local res = {}
-- read Kaldi feature
local feat_utter = self.feat_repo:cur_utter(self.debug)
-- global transf
local transformed = nerv.speech_utils.global_transf(feat_utter,
self.global_transf, self.frm_ext, 0, self.gconf)
res[self.feat_id] = transformed
-- add corresponding labels
for id, repo in pairs(self.lab_repo) do
local lab_utter = repo:get_utter(self.feat_repo,
self.frm_ext,
transformed:nrow(),
self.debug)
res[id] = lab_utter
end
-- move the pointer to next
self.feat_repo:next()
collectgarbage("collect")
return res
end
|