blob: 3d1a470f5ffea250269206003dead9359d62fdfb (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
|
-- Namespace table that holds the speech utility functions.
-- Indexing `nerv` here requires the global `nerv` table to exist already;
-- any previous value of `nerv.speech_utils` is replaced by a fresh table.
nerv.speech_utils = {}
-- Run the global transformation over the features of one utterance.
--
-- Steps performed:
--   1. Convert `feat_utter` into a `gconf.cumat_type` matrix via
--      `new_from_host`.
--   2. If `frm_ext > 0`, expand it with `expand_frm` into a matrix that has
--      `ncol * (2 * frm_ext + 1)` columns, then reorder it with
--      `rearrange_frm`.
--   3. Initialise `global_transf` with the number of rows and propagate the
--      matrix through it.
--   4. Copy the result into a new `gconf.mmat_type` matrix that has
--      `2 * frm_ext` fewer rows than the transformed output.
--
-- Parameters:
--   feat_utter    - feature matrix accepted by `gconf.cumat_type.new_from_host`
--                   (presumably a host matrix with one frame per row; confirm
--                   against the caller).
--   global_transf - object exposing `init(nrow)` and `propagate(input, output)`.
--   frm_ext       - number; context width used for the expansion and for the
--                   number of rows dropped at each end of the result.
--   gconf         - configuration table providing `cumat_type` and `mmat_type`.
--
-- Returns:
--   A `gconf.mmat_type` matrix with `nrow - 2 * frm_ext` rows and the same
--   number of columns as the transformed output.
function nerv.speech_utils.global_transf(feat_utter, global_transf, frm_ext, gconf)
    local rearranged
    feat_utter = gconf.cumat_type.new_from_host(feat_utter)
    if frm_ext > 0 then
        local step = frm_ext * 2 + 1
        -- expand the feature
        local expanded = gconf.cumat_type(feat_utter:nrow(), feat_utter:ncol() * step)
        expanded:expand_frm(feat_utter, frm_ext)
        -- rearrange the feature (``transpose'' operation in TNet)
        rearranged = expanded:create()
        rearranged:rearrange_frm(expanded, step)
    else
        -- no context expansion requested: transform the features as they are
        rearranged = feat_utter
    end
    -- prepare for transf: propagate() takes lists of input/output matrices
    local input = {rearranged}
    local output = {rearranged:create()}
    -- do transf
    global_transf:init(input[1]:nrow())
    global_transf:propagate(input, output)
    -- trim frames
    -- The result lives in its own local. The `expanded` local above is scoped
    -- to the `if` block, so reusing that name here would create a global.
    local trimmed = gconf.mmat_type(output[1]:nrow() - frm_ext * 2, output[1]:ncol())
    -- presumably copies the row range [frm_ext, nrow - frm_ext) to the host
    -- matrix; confirm against the copy_toh implementation
    output[1]:copy_toh(trimmed, frm_ext, feat_utter:nrow() - frm_ext)
    -- explicit full collection, kept from the original implementation
    -- (presumably to release the temporary matrices promptly)
    collectgarbage("collect")
    return trimmed
end
|