Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
DeepSpeech
提交
0d7d8712
D
DeepSpeech
项目概览
PaddlePaddle
/
DeepSpeech
大约 2 年前同步成功
通知
210
Star
8425
Fork
1598
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
245
列表
看板
标记
里程碑
合并请求
3
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
D
DeepSpeech
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
245
Issue
245
列表
看板
标记
里程碑
合并请求
3
合并请求
3
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
0d7d8712
编写于
9月 14, 2022
作者:
H
Hui Zhang
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
simplify feature pipeline graph
上级
8690a00b
变更
1
隐藏空白更改
内联
并排
Showing
1 changed file
with
9 additions
and
5 deletions
+9
-5
paddlespeech/audio/compliance/kaldi.py
paddlespeech/audio/compliance/kaldi.py
+9
-5
未找到文件。
paddlespeech/audio/compliance/kaldi.py
浏览文件 @
0d7d8712
...
@@ -357,10 +357,13 @@ def _get_mel_banks(num_bins: int,
...
@@ -357,10 +357,13 @@ def _get_mel_banks(num_bins: int,
(
'Bad values in options: vtln-low {} and vtln-high {}, versus '
(
'Bad values in options: vtln-low {} and vtln-high {}, versus '
'low-freq {} and high-freq {}'
.
format
(
vtln_low
,
vtln_high
,
low_freq
,
high_freq
))
'low-freq {} and high-freq {}'
.
format
(
vtln_low
,
vtln_high
,
low_freq
,
high_freq
))
bin
=
paddle
.
arange
(
num_bins
).
unsqueeze
(
1
)
bin
=
paddle
.
arange
(
num_bins
,
dtype
=
paddle
.
float32
).
unsqueeze
(
1
)
# left_mel = mel_low_freq + bin * mel_freq_delta # (num_bins, 1)
# center_mel = mel_low_freq + (bin + 1.0) * mel_freq_delta # (num_bins, 1)
# right_mel = mel_low_freq + (bin + 2.0) * mel_freq_delta # (num_bins, 1)
left_mel
=
mel_low_freq
+
bin
*
mel_freq_delta
# (num_bins, 1)
left_mel
=
mel_low_freq
+
bin
*
mel_freq_delta
# (num_bins, 1)
center_mel
=
mel_low_freq
+
(
bin
+
1.0
)
*
mel_freq_delta
# (num_bins, 1)
center_mel
=
left_mel
+
mel_freq_delta
right_mel
=
mel_low_freq
+
(
bin
+
2.0
)
*
mel_freq_delta
# (num_bins, 1)
right_mel
=
center_mel
+
mel_freq_delta
if
vtln_warp_factor
!=
1.0
:
if
vtln_warp_factor
!=
1.0
:
left_mel
=
_vtln_warp_mel_freq
(
vtln_low
,
vtln_high
,
low_freq
,
high_freq
,
left_mel
=
_vtln_warp_mel_freq
(
vtln_low
,
vtln_high
,
low_freq
,
high_freq
,
...
@@ -373,7 +376,7 @@ def _get_mel_banks(num_bins: int,
...
@@ -373,7 +376,7 @@ def _get_mel_banks(num_bins: int,
center_freqs
=
_inverse_mel_scale
(
center_mel
)
# (num_bins)
center_freqs
=
_inverse_mel_scale
(
center_mel
)
# (num_bins)
# (1, num_fft_bins)
# (1, num_fft_bins)
mel
=
_mel_scale
(
fft_bin_width
*
paddle
.
arange
(
num_fft_bins
)).
unsqueeze
(
0
)
mel
=
_mel_scale
(
fft_bin_width
*
paddle
.
arange
(
num_fft_bins
,
dtype
=
paddle
.
float32
)).
unsqueeze
(
0
)
# (num_bins, num_fft_bins)
# (num_bins, num_fft_bins)
up_slope
=
(
mel
-
left_mel
)
/
(
center_mel
-
left_mel
)
up_slope
=
(
mel
-
left_mel
)
/
(
center_mel
-
left_mel
)
...
@@ -472,7 +475,8 @@ def fbank(waveform: Tensor,
...
@@ -472,7 +475,8 @@ def fbank(waveform: Tensor,
# (n_mels, padded_window_size // 2)
# (n_mels, padded_window_size // 2)
mel_energies
,
_
=
_get_mel_banks
(
n_mels
,
padded_window_size
,
sr
,
low_freq
,
mel_energies
,
_
=
_get_mel_banks
(
n_mels
,
padded_window_size
,
sr
,
low_freq
,
high_freq
,
vtln_low
,
vtln_high
,
vtln_warp
)
high_freq
,
vtln_low
,
vtln_high
,
vtln_warp
)
mel_energies
=
mel_energies
.
astype
(
dtype
)
# mel_energies = mel_energies.astype(dtype)
assert
mel_energies
.
dtype
==
dtype
# (n_mels, padded_window_size // 2 + 1)
# (n_mels, padded_window_size // 2 + 1)
mel_energies
=
paddle
.
nn
.
functional
.
pad
(
mel_energies
=
paddle
.
nn
.
functional
.
pad
(
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录