Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
PaddlePaddle
DeepSpeech
提交
42c7537c
D
DeepSpeech
项目概览
PaddlePaddle
/
DeepSpeech
大约 2 年 前同步成功
通知
210
Star
8425
Fork
1598
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
245
列表
看板
标记
里程碑
合并请求
3
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
D
DeepSpeech
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
245
Issue
245
列表
看板
标记
里程碑
合并请求
3
合并请求
3
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
42c7537c
编写于
4月 01, 2022
作者:
H
Hui Zhang
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
frontend to audio dir
上级
8d66a254
变更
23
隐藏空白更改
内联
并排
Showing
23 changed files
with
36 additions
and
51 deletions
+36
-51
speechx/examples/decoder/offline_decoder_main.cc
speechx/examples/decoder/offline_decoder_main.cc
+1
-1
speechx/examples/decoder/offline_decoder_sliding_chunk_main.cc
...hx/examples/decoder/offline_decoder_sliding_chunk_main.cc
+1
-1
speechx/examples/feat/linear_spectrogram_main.cc
speechx/examples/feat/linear_spectrogram_main.cc
+6
-7
speechx/speechx/frontend/CMakeLists.txt
speechx/speechx/frontend/CMakeLists.txt
+1
-10
speechx/speechx/frontend/audio/CMakeLists.txt
speechx/speechx/frontend/audio/CMakeLists.txt
+11
-0
speechx/speechx/frontend/audio/audio_cache.cc
speechx/speechx/frontend/audio/audio_cache.cc
+1
-1
speechx/speechx/frontend/audio/audio_cache.h
speechx/speechx/frontend/audio/audio_cache.h
+1
-1
speechx/speechx/frontend/audio/cmvn.cc
speechx/speechx/frontend/audio/cmvn.cc
+1
-2
speechx/speechx/frontend/audio/cmvn.h
speechx/speechx/frontend/audio/cmvn.h
+1
-1
speechx/speechx/frontend/audio/data_cache.h
speechx/speechx/frontend/audio/data_cache.h
+1
-1
speechx/speechx/frontend/audio/db_norm.cc
speechx/speechx/frontend/audio/db_norm.cc
+1
-1
speechx/speechx/frontend/audio/db_norm.h
speechx/speechx/frontend/audio/db_norm.h
+1
-1
speechx/speechx/frontend/audio/fbank.h
speechx/speechx/frontend/audio/fbank.h
+0
-0
speechx/speechx/frontend/audio/feature_cache.cc
speechx/speechx/frontend/audio/feature_cache.cc
+1
-1
speechx/speechx/frontend/audio/feature_cache.h
speechx/speechx/frontend/audio/feature_cache.h
+1
-1
speechx/speechx/frontend/audio/frontend_itf.h
speechx/speechx/frontend/audio/frontend_itf.h
+0
-0
speechx/speechx/frontend/audio/linear_spectrogram.cc
speechx/speechx/frontend/audio/linear_spectrogram.cc
+1
-1
speechx/speechx/frontend/audio/linear_spectrogram.h
speechx/speechx/frontend/audio/linear_spectrogram.h
+1
-1
speechx/speechx/frontend/audio/mfcc.h
speechx/speechx/frontend/audio/mfcc.h
+0
-0
speechx/speechx/frontend/audio/normalizer.h
speechx/speechx/frontend/audio/normalizer.h
+4
-0
speechx/speechx/frontend/normalizer.h
speechx/speechx/frontend/normalizer.h
+0
-4
speechx/speechx/frontend/window.h
speechx/speechx/frontend/window.h
+0
-15
speechx/speechx/nnet/decodable.h
speechx/speechx/nnet/decodable.h
+1
-1
未找到文件。
speechx/examples/decoder/offline_decoder_main.cc
浏览文件 @
42c7537c
...
...
@@ -17,7 +17,7 @@
#include "base/flags.h"
#include "base/log.h"
#include "decoder/ctc_beam_search_decoder.h"
#include "frontend/data_cache.h"
#include "frontend/audio/data_cache.h"
#include "kaldi/util/table-types.h"
#include "nnet/decodable.h"
#include "nnet/paddle_nnet.h"
...
...
speechx/examples/decoder/offline_decoder_sliding_chunk_main.cc
浏览文件 @
42c7537c
...
...
@@ -17,7 +17,7 @@
#include "base/flags.h"
#include "base/log.h"
#include "decoder/ctc_beam_search_decoder.h"
#include "frontend/data_cache.h"
#include "frontend/audio/data_cache.h"
#include "kaldi/util/table-types.h"
#include "nnet/decodable.h"
#include "nnet/paddle_nnet.h"
...
...
speechx/examples/feat/linear_spectrogram_main.cc
浏览文件 @
42c7537c
...
...
@@ -14,19 +14,18 @@
// todo refactor, replace with gtest
#include "frontend/linear_spectrogram.h"
#include "base/flags.h"
#include "base/log.h"
#include "frontend/audio_cache.h"
#include "frontend/data_cache.h"
#include "frontend/feature_cache.h"
#include "frontend/frontend_itf.h"
#include "frontend/normalizer.h"
#include "kaldi/feat/wave-reader.h"
#include "kaldi/util/kaldi-io.h"
#include "kaldi/util/table-types.h"
#include <glog/logging.h>
#include "frontend/audio/linear_spectrogram.h"
#include "frontend/audio/audio_cache.h"
#include "frontend/audio/data_cache.h"
#include "frontend/audio/feature_cache.h"
#include "frontend/audio/frontend_itf.h"
#include "frontend/audio/normalizer.h"
DEFINE_string
(
wav_rspecifier
,
""
,
"test wav scp path"
);
DEFINE_string
(
feature_wspecifier
,
""
,
"output feats wspecifier"
);
...
...
speechx/speechx/frontend/CMakeLists.txt
浏览文件 @
42c7537c
project
(
frontend
)
add_library
(
frontend STATIC
cmvn.cc
db_norm.cc
linear_spectrogram.cc
audio_cache.cc
feature_cache.cc
)
target_link_libraries
(
frontend PUBLIC kaldi-matrix
)
\ No newline at end of file
add_subdirectory
(
audio
)
\ No newline at end of file
speechx/speechx/frontend/audio/CMakeLists.txt
浏览文件 @
42c7537c
project
(
frontend
)
add_library
(
frontend STATIC
cmvn.cc
db_norm.cc
linear_spectrogram.cc
audio_cache.cc
feature_cache.cc
)
target_link_libraries
(
frontend PUBLIC kaldi-matrix
)
\ No newline at end of file
speechx/speechx/frontend/audio_cache.cc
→
speechx/speechx/frontend/audio
/audio
_cache.cc
浏览文件 @
42c7537c
...
...
@@ -12,7 +12,7 @@
// See the License for the specific language governing permissions and
// limitations under the License.
#include "frontend/audio_cache.h"
#include "frontend/audio/audio_cache.h"
#include "kaldi/base/timer.h"
namespace
ppspeech
{
...
...
speechx/speechx/frontend/audio_cache.h
→
speechx/speechx/frontend/audio
/audio
_cache.h
浏览文件 @
42c7537c
...
...
@@ -16,7 +16,7 @@
#pragma once
#include "base/common.h"
#include "frontend/frontend_itf.h"
#include "frontend/audio/frontend_itf.h"
namespace
ppspeech
{
...
...
speechx/speechx/frontend/cmvn.cc
→
speechx/speechx/frontend/
audio/
cmvn.cc
浏览文件 @
42c7537c
#include "frontend/normalizer.h"
#include "frontend/audio/cmvn.h"
#include "kaldi/feat/cmvn.h"
#include "kaldi/util/kaldi-io.h"
...
...
@@ -13,7 +13,6 @@ using kaldi::SubVector;
using
std
::
unique_ptr
;
CMVN
::
CMVN
(
std
::
string
cmvn_file
,
unique_ptr
<
FrontendInterface
>
base_extractor
)
:
var_norm_
(
true
)
{
...
...
speechx/speechx/frontend/cmvn.h
→
speechx/speechx/frontend/
audio/
cmvn.h
浏览文件 @
42c7537c
#pragma once
#include "base/common.h"
#include "frontend/frontend_itf.h"
#include "frontend/audio/frontend_itf.h"
#include "kaldi/matrix/kaldi-matrix.h"
#include "kaldi/util/options-itf.h"
...
...
speechx/speechx/frontend/data_cache.h
→
speechx/speechx/frontend/
audio/
data_cache.h
浏览文件 @
42c7537c
...
...
@@ -17,7 +17,7 @@
#include "base/common.h"
#include "frontend/frontend_itf.h"
#include "frontend/audio/frontend_itf.h"
namespace
ppspeech
{
...
...
speechx/speechx/frontend/db_norm.cc
→
speechx/speechx/frontend/
audio/
db_norm.cc
浏览文件 @
42c7537c
...
...
@@ -13,7 +13,7 @@
// limitations under the License.
#include "frontend/normalizer.h"
#include "frontend/audio/db_norm.h"
#include "kaldi/feat/cmvn.h"
#include "kaldi/util/kaldi-io.h"
...
...
speechx/speechx/frontend/db_norm.h
→
speechx/speechx/frontend/
audio/
db_norm.h
浏览文件 @
42c7537c
...
...
@@ -16,7 +16,7 @@
#pragma once
#include "base/common.h"
#include "frontend/frontend_itf.h"
#include "frontend/audio/frontend_itf.h"
#include "kaldi/matrix/kaldi-matrix.h"
#include "kaldi/util/options-itf.h"
...
...
speechx/speechx/frontend/fbank.h
→
speechx/speechx/frontend/
audio/
fbank.h
浏览文件 @
42c7537c
文件已移动
speechx/speechx/frontend/feature_cache.cc
→
speechx/speechx/frontend/
audio/
feature_cache.cc
浏览文件 @
42c7537c
...
...
@@ -12,7 +12,7 @@
// See the License for the specific language governing permissions and
// limitations under the License.
#include "frontend/feature_cache.h"
#include "frontend/audio/feature_cache.h"
namespace
ppspeech
{
...
...
speechx/speechx/frontend/feature_cache.h
→
speechx/speechx/frontend/
audio/
feature_cache.h
浏览文件 @
42c7537c
...
...
@@ -15,7 +15,7 @@
#pragma once
#include "base/common.h"
#include "frontend/frontend_itf.h"
#include "frontend/audio/frontend_itf.h"
namespace
ppspeech
{
...
...
speechx/speechx/frontend/frontend_itf.h
→
speechx/speechx/frontend/
audio/
frontend_itf.h
浏览文件 @
42c7537c
文件已移动
speechx/speechx/frontend/linear_spectrogram.cc
→
speechx/speechx/frontend/
audio/
linear_spectrogram.cc
浏览文件 @
42c7537c
...
...
@@ -12,7 +12,7 @@
// See the License for the specific language governing permissions and
// limitations under the License.
#include "frontend/linear_spectrogram.h"
#include "frontend/audio/linear_spectrogram.h"
#include "kaldi/base/kaldi-math.h"
#include "kaldi/matrix/matrix-functions.h"
...
...
speechx/speechx/frontend/linear_spectrogram.h
→
speechx/speechx/frontend/
audio/
linear_spectrogram.h
浏览文件 @
42c7537c
...
...
@@ -16,7 +16,7 @@
#pragma once
#include "base/common.h"
#include "frontend/frontend_itf.h"
#include "frontend/audio/frontend_itf.h"
#include "kaldi/feat/feature-window.h"
namespace
ppspeech
{
...
...
speechx/speechx/frontend/mfcc.h
→
speechx/speechx/frontend/
audio/
mfcc.h
浏览文件 @
42c7537c
文件已移动
speechx/speechx/frontend/audio/normalizer.h
0 → 100644
浏览文件 @
42c7537c
#pragma once
#include "frontend/audio/cmvn.h"
#include "frontend/audio/db_norm.h"
\ No newline at end of file
speechx/speechx/frontend/normalizer.h
已删除
100644 → 0
浏览文件 @
8d66a254
#pragma once
#include "frontend/cmvn.h"
#include "frontend/db_norm.h"
\ No newline at end of file
speechx/speechx/frontend/window.h
已删除
100644 → 0
浏览文件 @
8d66a254
// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// extract the window of kaldi feat.
speechx/speechx/nnet/decodable.h
浏览文件 @
42c7537c
...
...
@@ -13,7 +13,7 @@
// limitations under the License.
#include "base/common.h"
#include "frontend/frontend_itf.h"
#include "frontend/audio/frontend_itf.h"
#include "kaldi/matrix/kaldi-matrix.h"
#include "nnet/decodable-itf.h"
#include "nnet/nnet_interface.h"
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录