Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
DeepSpeech
提交
622d3883
D
DeepSpeech
项目概览
PaddlePaddle
/
DeepSpeech
大约 1 年 前同步成功
通知
206
Star
8425
Fork
1598
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
245
列表
看板
标记
里程碑
合并请求
3
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
D
DeepSpeech
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
245
Issue
245
列表
看板
标记
里程碑
合并请求
3
合并请求
3
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
体验新版 GitCode,发现更多精彩内容 >>
提交
622d3883
编写于
8月 17, 2022
作者:
Y
YangZhou
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
make soundfile compatible
上级
91ce0d87
变更
13
隐藏空白更改
内联
并排
Showing
13 changed file
with
21 addition
and
17 deletion
+21
-17
examples/voxceleb/sv0/local/make_rirs_noise_csv_dataset_from_json.py
...xceleb/sv0/local/make_rirs_noise_csv_dataset_from_json.py
+1
-1
examples/voxceleb/sv0/local/make_vox_csv_dataset_from_json.py
...ples/voxceleb/sv0/local/make_vox_csv_dataset_from_json.py
+1
-1
paddlespeech/audio/__init__.py
paddlespeech/audio/__init__.py
+2
-0
paddlespeech/audio/backends/soundfile_backend.py
paddlespeech/audio/backends/soundfile_backend.py
+6
-5
paddlespeech/cli/cls/infer.py
paddlespeech/cli/cls/infer.py
+1
-1
paddlespeech/cli/kws/infer.py
paddlespeech/cli/kws/infer.py
+1
-1
paddlespeech/cli/vector/infer.py
paddlespeech/cli/vector/infer.py
+1
-1
paddlespeech/cls/exps/panns/deploy/predict.py
paddlespeech/cls/exps/panns/deploy/predict.py
+2
-2
paddlespeech/server/engine/vector/python/vector_engine.py
paddlespeech/server/engine/vector/python/vector_engine.py
+1
-1
paddlespeech/vector/exps/ecapa_tdnn/extract_emb.py
paddlespeech/vector/exps/ecapa_tdnn/extract_emb.py
+1
-1
paddlespeech/vector/io/dataset.py
paddlespeech/vector/io/dataset.py
+2
-1
paddlespeech/vector/io/dataset_from_json.py
paddlespeech/vector/io/dataset_from_json.py
+1
-1
tests/unit/audio/features/base.py
tests/unit/audio/features/base.py
+1
-1
未找到文件。
examples/voxceleb/sv0/local/make_rirs_noise_csv_dataset_from_json.py
浏览文件 @
622d3883
...
...
@@ -23,7 +23,7 @@ from typing import List
import
tqdm
from
yacs.config
import
CfgNode
from
paddlespeech.audio
import
load
as
load_audio
from
paddlespeech.audio
.soundfile_backend
import
soundfile_
load
as
load_audio
from
paddlespeech.s2t.utils.log
import
Log
from
paddlespeech.vector.utils.vector_utils
import
get_chunks
...
...
examples/voxceleb/sv0/local/make_vox_csv_dataset_from_json.py
浏览文件 @
622d3883
...
...
@@ -24,7 +24,7 @@ import random
import
tqdm
from
yacs.config
import
CfgNode
from
paddlespeech.audio
import
load
as
load_audio
from
paddlespeech.audio
.soundfile_backend
import
soundfile_
load
as
load_audio
from
paddlespeech.s2t.utils.log
import
Log
from
paddlespeech.vector.utils.vector_utils
import
get_chunks
...
...
paddlespeech/audio/__init__.py
浏览文件 @
622d3883
...
...
@@ -26,6 +26,7 @@ from . import utils
from
paddlespeech.audio.backends
import
get_audio_backend
from
paddlespeech.audio.backends
import
list_audio_backends
from
paddlespeech.audio.backends
import
set_audio_backend
from
paddlespeech.audio.backends
import
soundfile_backend
__all__
=
[
"io"
,
...
...
@@ -37,4 +38,5 @@ __all__ = [
"list_audio_backends"
,
"get_audio_backend"
,
"set_audio_backend"
,
"soudfile_backend"
,
]
paddlespeech/audio/backends/soundfile_backend.py
浏览文件 @
622d3883
...
...
@@ -34,8 +34,9 @@ __all__ = [
'save'
,
'soudfile_save'
,
'load'
,
'soundfile_load'
,
'info'
'load_old'
,
'info'
,
'to_mono'
]
NORMALMIZE_TYPES
=
[
'linear'
,
'gaussian'
]
MERGE_TYPES
=
[
'ch0'
,
'ch1'
,
'random'
,
'average'
]
...
...
@@ -122,7 +123,7 @@ def to_mono(y: np.ndarray, merge_type: str='average') -> np.ndarray:
return
y_out
def
soundfile_load
(
file
:
os
.
PathLike
,
def
soundfile_load
_
(
file
:
os
.
PathLike
,
offset
:
Optional
[
float
]
=
None
,
dtype
:
str
=
'int16'
,
duration
:
Optional
[
int
]
=
None
)
->
Tuple
[
np
.
ndarray
,
int
]:
...
...
@@ -204,7 +205,7 @@ def soundfile_save(y: np.ndarray, sr: int, file: os.PathLike) -> None:
wavfile
.
write
(
file
,
sr
,
y_out
)
def
soudfile_load
(
def
sou
n
dfile_load
(
file
:
os
.
PathLike
,
sr
:
Optional
[
int
]
=
None
,
mono
:
bool
=
True
,
...
...
@@ -235,7 +236,7 @@ def soudfile_load(
Tuple[np.ndarray, int]: Waveform in ndarray and its samplerate.
"""
y
,
r
=
sound
_file_load
(
file
,
offset
=
offset
,
dtype
=
dtype
,
duration
=
duration
)
y
,
r
=
sound
file_load_
(
file
,
offset
=
offset
,
dtype
=
dtype
,
duration
=
duration
)
if
not
((
y
.
ndim
==
1
and
len
(
y
)
>
0
)
or
(
y
.
ndim
==
2
and
len
(
y
[
0
])
>
0
)):
raise
ParameterError
(
f
'audio file
{
file
}
looks empty'
)
...
...
paddlespeech/cli/cls/infer.py
浏览文件 @
622d3883
...
...
@@ -25,7 +25,7 @@ import yaml
from
..executor
import
BaseExecutor
from
..log
import
logger
from
..utils
import
stats_wrapper
from
paddlespeech.audio
import
load
from
paddlespeech.audio
.soundfile_backend
import
soundfile_load
as
load
from
paddlespeech.audio.features
import
LogMelSpectrogram
__all__
=
[
'CLSExecutor'
]
...
...
paddlespeech/cli/kws/infer.py
浏览文件 @
622d3883
...
...
@@ -24,7 +24,7 @@ import yaml
from
..executor
import
BaseExecutor
from
..log
import
logger
from
..utils
import
stats_wrapper
from
paddlespeech.audio
import
load
from
paddlespeech.audio
.soundfile_backend
import
soundfile_load
as
load_audio
from
paddlespeech.audio.compliance.kaldi
import
fbank
as
kaldi_fbank
__all__
=
[
'KWSExecutor'
]
...
...
paddlespeech/cli/vector/infer.py
浏览文件 @
622d3883
...
...
@@ -27,7 +27,7 @@ from yacs.config import CfgNode
from
..executor
import
BaseExecutor
from
..log
import
logger
from
..utils
import
stats_wrapper
from
paddlespeech.audio
import
load
as
load_audio
from
paddlespeech.audio
.soundfile_backend
import
soundfile_
load
as
load_audio
from
paddlespeech.audio.compliance.librosa
import
melspectrogram
from
paddlespeech.vector.io.batch
import
feature_normalize
from
paddlespeech.vector.modules.sid_model
import
SpeakerIdetification
...
...
paddlespeech/cls/exps/panns/deploy/predict.py
浏览文件 @
622d3883
...
...
@@ -18,7 +18,7 @@ import numpy as np
from
paddle
import
inference
from
scipy.special
import
softmax
from
paddlespeech.audio
import
load
as
load_audio
from
paddlespeech.audio
.soundfile_backend
import
soundfile_
load
as
load_audio
from
paddlespeech.audio.datasets
import
ESC50
from
paddlespeech.audio.features
import
melspectrogram
...
...
@@ -42,7 +42,7 @@ def extract_features(files: str, **kwargs):
srs
=
[]
max_length
=
float
(
'-inf'
)
for
file
in
files
:
waveform
,
sr
=
load_audio
(
file
,
sr
=
None
)
waveform
,
sr
=
load_audio
(
file
)
max_length
=
max
(
max_length
,
len
(
waveform
))
waveforms
.
append
(
waveform
)
srs
.
append
(
sr
)
...
...
paddlespeech/server/engine/vector/python/vector_engine.py
浏览文件 @
622d3883
...
...
@@ -17,7 +17,7 @@ from collections import OrderedDict
import
numpy
as
np
import
paddle
from
paddlespeech.audio
import
load
as
load_audio
from
paddlespeech.audio
.soundfile_backend
import
soundfile_
load
as
load_audio
from
paddlespeech.audio.compliance.librosa
import
melspectrogram
from
paddlespeech.cli.log
import
logger
from
paddlespeech.cli.vector.infer
import
VectorExecutor
...
...
paddlespeech/vector/exps/ecapa_tdnn/extract_emb.py
浏览文件 @
622d3883
...
...
@@ -18,7 +18,7 @@ import time
import
paddle
from
yacs.config
import
CfgNode
from
paddlespeech.audio
import
load
as
load_audio
from
paddlespeech.audio
.soundfile_backend
import
soundfile_
load
as
load_audio
from
paddlespeech.audio.compliance.librosa
import
melspectrogram
from
paddlespeech.s2t.utils.log
import
Log
from
paddlespeech.vector.io.batch
import
feature_normalize
...
...
paddlespeech/vector/io/dataset.py
浏览文件 @
622d3883
...
...
@@ -16,7 +16,8 @@ from dataclasses import fields
from
paddle.io
import
Dataset
from
paddlespeech.audio
import
load
as
load_audio
from
paddlespeech.audio.soundfile_backend
import
soundfile_load
as
load_audio
from
paddlespeech.audio.compliance.librosa
import
melspectrogram
from
paddlespeech.s2t.utils.log
import
Log
logger
=
Log
(
__name__
).
getlog
()
...
...
paddlespeech/vector/io/dataset_from_json.py
浏览文件 @
622d3883
...
...
@@ -17,7 +17,7 @@ from dataclasses import fields
from
paddle.io
import
Dataset
from
paddlespeech.audio
import
load
as
load_audio
from
paddlespeech.audio
.soundfile_backend
import
soundfile_
load
as
load_audio
from
paddlespeech.audio.compliance.librosa
import
melspectrogram
from
paddlespeech.audio.compliance.librosa
import
mfcc
...
...
tests/unit/audio/features/base.py
浏览文件 @
622d3883
...
...
@@ -18,7 +18,7 @@ import urllib.request
import
numpy
as
np
import
paddle
from
paddlespeech.audio
import
load
from
paddlespeech.audio
.soundfile_backend
import
soundfile_load
as
load
wav_url
=
'https://paddlespeech.bj.bcebos.com/PaddleAudio/zh.wav'
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录