Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
DeepSpeech
提交
caa8eb4d
D
DeepSpeech
项目概览
PaddlePaddle
/
DeepSpeech
大约 2 年 前同步成功
通知
210
Star
8425
Fork
1598
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
245
列表
看板
标记
里程碑
合并请求
3
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
D
DeepSpeech
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
245
Issue
245
列表
看板
标记
里程碑
合并请求
3
合并请求
3
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
caa8eb4d
编写于
4月 24, 2022
作者:
K
KP
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
Add KWS example.
上级
43659b98
变更
4
显示空白变更内容
内联
并排
Showing
4 changed file
with
28 addition
and
18 deletion
+28
-18
examples/hey_snips/kws0/local/train.sh
examples/hey_snips/kws0/local/train.sh
+1
-0
examples/hey_snips/kws0/run.sh
examples/hey_snips/kws0/run.sh
+5
-0
paddlespeech/kws/exps/mdtc/compute_det.py
paddlespeech/kws/exps/mdtc/compute_det.py
+12
-9
paddlespeech/kws/models/loss.py
paddlespeech/kws/models/loss.py
+10
-9
未找到文件。
examples/hey_snips/kws0/local/train.sh
浏览文件 @
caa8eb4d
...
@@ -7,6 +7,7 @@ if [ ${ngpu} -gt 0 ]; then
...
@@ -7,6 +7,7 @@ if [ ${ngpu} -gt 0 ]; then
python3
-m
paddle.distributed.launch
--gpus
$CUDA_VISIBLE_DEVICES
${
BIN_DIR
}
/train.py
\
python3
-m
paddle.distributed.launch
--gpus
$CUDA_VISIBLE_DEVICES
${
BIN_DIR
}
/train.py
\
--cfg_path
${
cfg_path
}
--cfg_path
${
cfg_path
}
else
else
echo
"set CUDA_VISIBLE_DEVICES to enable multi-gpus trainning."
python3
${
BIN_DIR
}
/train.py
\
python3
${
BIN_DIR
}
/train.py
\
--cfg_path
${
cfg_path
}
--cfg_path
${
cfg_path
}
fi
fi
examples/hey_snips/kws0/run.sh
浏览文件 @
caa8eb4d
...
@@ -18,6 +18,11 @@ source path.sh
...
@@ -18,6 +18,11 @@ source path.sh
ngpu
=
$(
echo
$CUDA_VISIBLE_DEVICES
|
awk
-F
","
'{print NF}'
)
ngpu
=
$(
echo
$CUDA_VISIBLE_DEVICES
|
awk
-F
","
'{print NF}'
)
if
[
$#
!=
1
]
;
then
echo
"usage: CUDA_VISIBLE_DEVICES=0
${
0
}
config_path"
exit
-1
fi
stage
=
1
stage
=
1
stop_stage
=
3
stop_stage
=
3
...
...
paddlespeech/kws/exps/mdtc/compute_det.py
浏览文件 @
caa8eb4d
...
@@ -15,6 +15,7 @@
...
@@ -15,6 +15,7 @@
import
argparse
import
argparse
import
os
import
os
import
paddle
import
yaml
import
yaml
from
tqdm
import
tqdm
from
tqdm
import
tqdm
...
@@ -23,32 +24,34 @@ from paddlespeech.s2t.utils.dynamic_import import dynamic_import
...
@@ -23,32 +24,34 @@ from paddlespeech.s2t.utils.dynamic_import import dynamic_import
# yapf: disable
# yapf: disable
parser
=
argparse
.
ArgumentParser
(
__doc__
)
parser
=
argparse
.
ArgumentParser
(
__doc__
)
parser
.
add_argument
(
"--cfg_path"
,
type
=
str
,
required
=
True
)
parser
.
add_argument
(
"--cfg_path"
,
type
=
str
,
required
=
True
)
parser
.
add_argument
(
'--keyword
'
,
type
=
int
,
default
=
0
,
help
=
'keyword label
'
)
parser
.
add_argument
(
'--keyword
_index'
,
type
=
int
,
default
=
0
,
help
=
'keyword index
'
)
parser
.
add_argument
(
'--step'
,
type
=
float
,
default
=
0.01
,
help
=
'threshold step'
)
parser
.
add_argument
(
'--step'
,
type
=
float
,
default
=
0.01
,
help
=
'threshold step
of trigger score
'
)
parser
.
add_argument
(
'--window_shift'
,
type
=
int
,
default
=
50
,
help
=
'window_shift is used to skip the frames after triggered'
)
parser
.
add_argument
(
'--window_shift'
,
type
=
int
,
default
=
50
,
help
=
'window_shift is used to skip the frames after triggered'
)
args
=
parser
.
parse_args
()
args
=
parser
.
parse_args
()
# yapf: enable
# yapf: enable
def
load_label_and_score
(
keyword
,
ds
,
score_file
):
def
load_label_and_score
(
keyword_index
:
int
,
score_table
=
{}
ds
:
paddle
.
io
.
Dataset
,
score_file
:
os
.
PathLike
):
score_table
=
{}
# {utt_id: scores_over_frames}
with
open
(
score_file
,
'r'
,
encoding
=
'utf8'
)
as
fin
:
with
open
(
score_file
,
'r'
,
encoding
=
'utf8'
)
as
fin
:
for
line
in
fin
:
for
line
in
fin
:
arr
=
line
.
strip
().
split
()
arr
=
line
.
strip
().
split
()
key
=
arr
[
0
]
key
=
arr
[
0
]
current_keyword
=
arr
[
1
]
current_keyword
=
arr
[
1
]
str_list
=
arr
[
2
:]
str_list
=
arr
[
2
:]
if
int
(
current_keyword
)
==
keyword
:
if
int
(
current_keyword
)
==
keyword
_index
:
scores
=
list
(
map
(
float
,
str_list
))
scores
=
list
(
map
(
float
,
str_list
))
if
key
not
in
score_table
:
if
key
not
in
score_table
:
score_table
.
update
({
key
:
scores
})
score_table
.
update
({
key
:
scores
})
keyword_table
=
{}
keyword_table
=
{}
# scores of keyword utt_id
filler_table
=
{}
filler_table
=
{}
# scores of non-keyword utt_id
filler_duration
=
0.0
filler_duration
=
0.0
for
key
,
index
,
duration
in
zip
(
ds
.
keys
,
ds
.
labels
,
ds
.
durations
):
for
key
,
index
,
duration
in
zip
(
ds
.
keys
,
ds
.
labels
,
ds
.
durations
):
assert
key
in
score_table
assert
key
in
score_table
if
index
==
keyword
:
if
index
==
keyword
_index
:
keyword_table
[
key
]
=
score_table
[
key
]
keyword_table
[
key
]
=
score_table
[
key
]
else
:
else
:
filler_table
[
key
]
=
score_table
[
key
]
filler_table
[
key
]
=
score_table
[
key
]
...
@@ -78,7 +81,7 @@ if __name__ == '__main__':
...
@@ -78,7 +81,7 @@ if __name__ == '__main__':
print
(
'Filler total duration Hours: {}'
.
format
(
filler_duration
/
3600.0
))
print
(
'Filler total duration Hours: {}'
.
format
(
filler_duration
/
3600.0
))
pbar
=
tqdm
(
total
=
int
(
1.0
/
args
.
step
))
pbar
=
tqdm
(
total
=
int
(
1.0
/
args
.
step
))
with
open
(
stats_file
,
'w'
,
encoding
=
'utf8'
)
as
fout
:
with
open
(
stats_file
,
'w'
,
encoding
=
'utf8'
)
as
fout
:
keyword_index
=
args
.
keyword
keyword_index
=
args
.
keyword
_index
threshold
=
0.0
threshold
=
0.0
while
threshold
<=
1.0
:
while
threshold
<=
1.0
:
num_false_reject
=
0
num_false_reject
=
0
...
...
paddlespeech/kws/models/loss.py
浏览文件 @
caa8eb4d
...
@@ -15,7 +15,16 @@
...
@@ -15,7 +15,16 @@
import
paddle
import
paddle
def
fill_mask_elements
(
condition
,
value
,
x
):
def
padding_mask
(
lengths
:
paddle
.
Tensor
)
->
paddle
.
Tensor
:
batch_size
=
lengths
.
shape
[
0
]
max_len
=
int
(
lengths
.
max
().
item
())
seq
=
paddle
.
arange
(
max_len
,
dtype
=
paddle
.
int64
)
seq
=
seq
.
expand
((
batch_size
,
max_len
))
return
seq
>=
lengths
.
unsqueeze
(
1
)
def
fill_mask_elements
(
condition
:
paddle
.
Tensor
,
value
:
float
,
x
:
paddle
.
Tensor
)
->
paddle
.
Tensor
:
assert
condition
.
shape
==
x
.
shape
assert
condition
.
shape
==
x
.
shape
values
=
paddle
.
ones_like
(
x
,
dtype
=
x
.
dtype
)
*
value
values
=
paddle
.
ones_like
(
x
,
dtype
=
x
.
dtype
)
*
value
return
paddle
.
where
(
condition
,
values
,
x
)
return
paddle
.
where
(
condition
,
values
,
x
)
...
@@ -70,11 +79,3 @@ def max_pooling_loss(logits: paddle.Tensor,
...
@@ -70,11 +79,3 @@ def max_pooling_loss(logits: paddle.Tensor,
acc
=
num_correct
/
num_utts
acc
=
num_correct
/
num_utts
# acc = 0.0
# acc = 0.0
return
loss
,
num_correct
,
acc
return
loss
,
num_correct
,
acc
def
padding_mask
(
lengths
:
paddle
.
Tensor
)
->
paddle
.
Tensor
:
batch_size
=
lengths
.
shape
[
0
]
max_len
=
int
(
lengths
.
max
().
item
())
seq
=
paddle
.
arange
(
max_len
,
dtype
=
paddle
.
int64
)
seq
=
seq
.
expand
((
batch_size
,
max_len
))
return
seq
>=
lengths
.
unsqueeze
(
1
)
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录