Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
DeepSpeech
提交
38c55e44
D
DeepSpeech
项目概览
PaddlePaddle
/
DeepSpeech
大约 2 年 前同步成功
通知
210
Star
8425
Fork
1598
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
245
列表
看板
标记
里程碑
合并请求
3
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
D
DeepSpeech
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
245
Issue
245
列表
看板
标记
里程碑
合并请求
3
合并请求
3
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
38c55e44
编写于
7月 18, 2022
作者:
Y
Yang Zhou
浏览文件
操作
浏览文件
下载
差异文件
merge audio
上级
cffe555c
a2e8b76a
变更
9
显示空白变更内容
内联
并排
Showing
9 changed file
with
73 addition
and
58 deletion
+73
-58
CMakeLists.txt
CMakeLists.txt
+1
-1
cmake/summary.cmake
cmake/summary.cmake
+5
-1
paddlespeech/audio/_internal/module_utils.py
paddlespeech/audio/_internal/module_utils.py
+1
-0
paddlespeech/audio/backends/no_backend.py
paddlespeech/audio/backends/no_backend.py
+14
-10
paddlespeech/audio/backends/sox_io_backend.py
paddlespeech/audio/backends/sox_io_backend.py
+12
-10
paddlespeech/audio/backends/utils.py
paddlespeech/audio/backends/utils.py
+4
-2
paddlespeech/audio/kaldi/kaldi.py
paddlespeech/audio/kaldi/kaldi.py
+33
-31
paddlespeech/audio/src/CMakeLists.txt
paddlespeech/audio/src/CMakeLists.txt
+1
-1
paddlespeech/audio/src/pybind/kaldi/feature_common.h
paddlespeech/audio/src/pybind/kaldi/feature_common.h
+2
-2
未找到文件。
CMakeLists.txt
浏览文件 @
38c55e44
...
@@ -57,7 +57,7 @@ include(openblas)
...
@@ -57,7 +57,7 @@ include(openblas)
# packages
# packages
find_package
(
Python3 COMPONENTS Interpreter Development
)
find_package
(
Python3 COMPONENTS Interpreter Development
)
find_package
(
pybind11 CONFIG
)
find_package
(
pybind11 CONFIG
REQUIRED
)
# set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -pthread -O0 -Wall -g")
# set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -pthread -O0 -Wall -g")
...
...
cmake/summary.cmake
浏览文件 @
38c55e44
...
@@ -37,5 +37,9 @@ function (onnx_print_configuration_summary)
...
@@ -37,5 +37,9 @@ function (onnx_print_configuration_summary)
message
(
STATUS
" Python executable :
${
Python_EXECUTABLE
}
"
)
message
(
STATUS
" Python executable :
${
Python_EXECUTABLE
}
"
)
message
(
STATUS
" Python includes :
${
Python_INCLUDE_DIR
}
"
)
message
(
STATUS
" Python includes :
${
Python_INCLUDE_DIR
}
"
)
message
(
STATUS
" Python libraries :
${
Python_LIBRARY
}
"
)
message
(
STATUS
" Python libraries :
${
Python_LIBRARY
}
"
)
message
(
STATUS
" PYBIND11 :
${
pybind11_FOUND
}
"
)
message
(
STATUS
" Pybind11 version :
${
pybind11_VERSION
}
"
)
message
(
STATUS
" Pybind11 include :
${
pybind11_INCLUDE_DIR
}
"
)
message
(
STATUS
" Pybind11 includes :
${
pybind11_INCLUDE_DIRS
}
"
)
message
(
STATUS
" Pybind11 libraries :
${
pybind11_LIBRARIES
}
"
)
endfunction
()
endfunction
()
\ No newline at end of file
paddlespeech/audio/_internal/module_utils.py
浏览文件 @
38c55e44
...
@@ -5,6 +5,7 @@ from typing import Optional
...
@@ -5,6 +5,7 @@ from typing import Optional
#code is from https://github.com/pytorch/audio/blob/main/torchaudio/_internal/module_utils.py
#code is from https://github.com/pytorch/audio/blob/main/torchaudio/_internal/module_utils.py
def
is_module_available
(
*
modules
:
str
)
->
bool
:
def
is_module_available
(
*
modules
:
str
)
->
bool
:
r
"""Returns if a top-level module with :attr:`name` exists *without**
r
"""Returns if a top-level module with :attr:`name` exists *without**
importing it. This is generally safer than try-catch block around a
importing it. This is generally safer than try-catch block around a
...
...
paddlespeech/audio/backends/no_backend.py
浏览文件 @
38c55e44
...
@@ -8,19 +8,23 @@ from paddle import Tensor
...
@@ -8,19 +8,23 @@ from paddle import Tensor
#code is from: https://github.com/pytorch/audio/blob/main/torchaudio/backend/no_backend.py
#code is from: https://github.com/pytorch/audio/blob/main/torchaudio/backend/no_backend.py
def
load
(
def
load
(
filepath
:
Union
[
str
,
Path
],
filepath
:
Union
[
str
,
Path
],
out
:
Optional
[
Tensor
]
=
None
,
out
:
Optional
[
Tensor
]
=
None
,
normalization
:
Union
[
bool
,
float
,
Callable
]
=
True
,
normalization
:
Union
[
bool
,
float
,
Callable
]
=
True
,
channels_first
:
bool
=
True
,
channels_first
:
bool
=
True
,
num_frames
:
int
=
0
,
num_frames
:
int
=
0
,
offset
:
int
=
0
,
offset
:
int
=
0
,
filetype
:
Optional
[
str
]
=
None
,
filetype
:
Optional
[
str
]
=
None
,
)
->
Tuple
[
Tensor
,
int
]:
)
->
Tuple
[
Tensor
,
int
]:
raise
RuntimeError
(
"No audio I/O backend is available."
)
raise
RuntimeError
(
"No audio I/O backend is available."
)
def
save
(
filepath
:
str
,
src
:
Tensor
,
sample_rate
:
int
,
precision
:
int
=
16
,
channels_first
:
bool
=
True
)
->
None
:
def
save
(
filepath
:
str
,
src
:
Tensor
,
sample_rate
:
int
,
precision
:
int
=
16
,
channels_first
:
bool
=
True
)
->
None
:
raise
RuntimeError
(
"No audio I/O backend is available."
)
raise
RuntimeError
(
"No audio I/O backend is available."
)
...
...
paddlespeech/audio/backends/sox_io_backend.py
浏览文件 @
38c55e44
from
pathlib
import
Path
from
pathlib
import
Path
from
typing
import
Callable
from
typing
import
Callable
from
typing
import
Optional
from
typing
import
Optional
...
@@ -44,16 +43,19 @@ _fallback_load_filebj = _fail_load_fileobj
...
@@ -44,16 +43,19 @@ _fallback_load_filebj = _fail_load_fileobj
def
load
(
def
load
(
filepath
:
Union
[
str
,
Path
],
filepath
:
Union
[
str
,
Path
],
out
:
Optional
[
Tensor
]
=
None
,
out
:
Optional
[
Tensor
]
=
None
,
normalization
:
Union
[
bool
,
float
,
Callable
]
=
True
,
normalization
:
Union
[
bool
,
float
,
Callable
]
=
True
,
channels_first
:
bool
=
True
,
channels_first
:
bool
=
True
,
num_frames
:
int
=
0
,
num_frames
:
int
=
0
,
offset
:
int
=
0
,
offset
:
int
=
0
,
filetype
:
Optional
[
str
]
=
None
,
filetype
:
Optional
[
str
]
=
None
,
)
->
Tuple
[
Tensor
,
int
]:
)
->
Tuple
[
Tensor
,
int
]:
raise
RuntimeError
(
"No audio I/O backend is available."
)
raise
RuntimeError
(
"No audio I/O backend is available."
)
def
save
(
filepath
:
str
,
src
:
Tensor
,
sample_rate
:
int
,
precision
:
int
=
16
,
channels_first
:
bool
=
True
)
->
None
:
def
save
(
filepath
:
str
,
src
:
Tensor
,
sample_rate
:
int
,
precision
:
int
=
16
,
channels_first
:
bool
=
True
)
->
None
:
raise
RuntimeError
(
"No audio I/O backend is available."
)
raise
RuntimeError
(
"No audio I/O backend is available."
)
@
_mod_utils
.
requires_sox
()
@
_mod_utils
.
requires_sox
()
...
...
paddlespeech/audio/backends/utils.py
浏览文件 @
38c55e44
...
@@ -40,7 +40,8 @@ def set_audio_backend(backend: Optional[str]):
...
@@ -40,7 +40,8 @@ def set_audio_backend(backend: Optional[str]):
of the system. If ``None`` is provided the current backend is unassigned.
of the system. If ``None`` is provided the current backend is unassigned.
"""
"""
if
backend
is
not
None
and
backend
not
in
list_audio_backends
():
if
backend
is
not
None
and
backend
not
in
list_audio_backends
():
raise
RuntimeError
(
f
'Backend "
{
backend
}
" is not one of '
f
"available backends:
{
list_audio_backends
()
}
."
)
raise
RuntimeError
(
f
'Backend "
{
backend
}
" is not one of '
f
"available backends:
{
list_audio_backends
()
}
."
)
if
backend
is
None
:
if
backend
is
None
:
module
=
no_backend
module
=
no_backend
...
@@ -76,6 +77,7 @@ def _init_audio_backend():
...
@@ -76,6 +77,7 @@ def _init_audio_backend():
warnings
.
warn
(
"No audio backend is available."
)
warnings
.
warn
(
"No audio backend is available."
)
set_audio_backend
(
None
)
set_audio_backend
(
None
)
def
get_audio_backend
()
->
Optional
[
str
]:
def
get_audio_backend
()
->
Optional
[
str
]:
"""Get the name of the current backend
"""Get the name of the current backend
...
...
paddlespeech/audio/kaldi/kaldi.py
浏览文件 @
38c55e44
...
@@ -27,7 +27,8 @@ __all__ = [
...
@@ -27,7 +27,8 @@ __all__ = [
@
module_utils
.
requires_kaldi
()
@
module_utils
.
requires_kaldi
()
def
fbank
(
wav
,
def
fbank
(
wav
,
samp_freq
:
int
=
16000
,
samp_freq
:
int
=
16000
,
frame_shift_ms
:
float
=
10.0
,
frame_shift_ms
:
float
=
10.0
,
frame_length_ms
:
float
=
25.0
,
frame_length_ms
:
float
=
25.0
,
...
@@ -88,6 +89,7 @@ def fbank(wav,
...
@@ -88,6 +89,7 @@ def fbank(wav,
feat
=
ComputeFbank
(
frame_opts
,
mel_opts
,
fbank_opts
,
wav
)
feat
=
ComputeFbank
(
frame_opts
,
mel_opts
,
fbank_opts
,
wav
)
return
feat
return
feat
@
module_utils
.
requires_kaldi
()
@
module_utils
.
requires_kaldi
()
def
pitch
(
wav
,
def
pitch
(
wav
,
samp_freq
:
int
=
16000
,
samp_freq
:
int
=
16000
,
...
...
paddlespeech/audio/src/CMakeLists.txt
浏览文件 @
38c55e44
...
@@ -105,7 +105,7 @@ function(define_extension name sources include_dirs libraries definitions)
...
@@ -105,7 +105,7 @@ function(define_extension name sources include_dirs libraries definitions)
add_library
(
${
name
}
SHARED
${
sources
}
)
add_library
(
${
name
}
SHARED
${
sources
}
)
target_compile_definitions
(
${
name
}
PRIVATE
"
${
definitions
}
"
)
target_compile_definitions
(
${
name
}
PRIVATE
"
${
definitions
}
"
)
target_include_directories
(
target_include_directories
(
${
name
}
PRIVATE
${
PROJECT_SOURCE_DIR
}
${
Python_INCLUDE_DIR
}
${
include_dirs
}
)
${
name
}
PRIVATE
${
PROJECT_SOURCE_DIR
}
${
Python_INCLUDE_DIR
}
${
pybind11_INCLUDE_DIR
}
${
include_dirs
}
)
target_link_libraries
(
target_link_libraries
(
${
name
}
${
name
}
${
libraries
}
${
libraries
}
...
...
paddlespeech/audio/src/pybind/kaldi/feature_common.h
浏览文件 @
38c55e44
...
@@ -14,8 +14,8 @@
...
@@ -14,8 +14,8 @@
#pragma once
#pragma once
#include
<pybind11/numpy.h>
#include
"pybind11/pybind11.h"
#include
<pybind11/pybind11.h>
#include
"pybind11/numpy.h"
#include "feat/feature-window.h"
#include "feat/feature-window.h"
namespace
paddleaudio
{
namespace
paddleaudio
{
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录