PaddleSpeech/runtime/engine/common/frontend/feature_cache.cc

// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "frontend/feature_cache.h"

namespace ppspeech {

using kaldi::BaseFloat;
using std::unique_ptr;
using std::vector;

FeatureCache::FeatureCache(size_t max_size,
                           unique_ptr<FrontendInterface> base_extractor) {
    // Take ownership of the upstream extractor first: the feature dimension
    // is queried from it right below.
    base_extractor_ = std::move(base_extractor);
    dim_ = base_extractor_->Dim();

    // Remember the configured cache size.
    max_size_ = max_size;
}

void FeatureCache::Accept(const std::vector<kaldi::BaseFloat>& inputs) {
    // Nothing is cached at this point: the samples are simply handed on to
    // the wrapped extractor.
    FrontendInterface& upstream = *base_extractor_;
    upstream.Accept(inputs);
}

// Pop the oldest cached feature frame into *feats.
//
// If the cache is empty on entry, it is refilled first by calling Compute()
// repeatedly until Compute() returns false.
//
// Returns true when a frame was written to *feats. Returns false when the
// cache is still empty after the refill attempt; *feats is not modified in
// that case. The whole operation runs while holding mutex_.
bool FeatureCache::Read(std::vector<kaldi::BaseFloat>* feats) {
    kaldi::Timer timer;
    std::unique_lock<std::mutex> lock(mutex_);

    // feed current data: keep pulling until Compute() has nothing more
    if (cache_.empty()) {
        while (Compute()) {
        }
    }

    if (cache_.empty()) return false;

    // read from cache. The front element is popped immediately afterwards,
    // so hand its buffer over instead of deep-copying it.
    *feats = std::move(cache_.front());
    cache_.pop();
    VLOG(1) << "FeatureCache::Read cost: " << timer.Elapsed() << " sec.";
    return true;
}

// read all data from base_feature_extractor_ into cache_
bool FeatureCache::Compute() {
    // compute and feed
    vector<BaseFloat> feature;
    bool result = base_extractor_->Read(&feature);
    if (result == false || feature.size() == 0) return false;

    kaldi::Timer timer;

    int32 num_chunk = feature.size() / dim_;
    VLOG(3) << "nframe computed: " << nframe_;

    for (int chunk_idx = 0; chunk_idx < num_chunk; ++chunk_idx) {
        int32 start = chunk_idx * dim_;
        vector<BaseFloat> feature_chunk(feature.data() + start,
                                        feature.data() + start + dim_);
        // feed cache
        cache_.push(feature_chunk);
        ++nframe_;
    }

    VLOG(1) << "FeatureCache::Compute cost: " << timer.Elapsed() << " sec. "
            << num_chunk << " feats.";
    return true;
}

}  // namespace ppspeech
make feature cache& raw audio work 3 years ago			`// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.`
			`//`
			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`//`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`//`
			`// Unless required by applicable law or agreed to in writing, software`
			`// distributed under the License is distributed on an "AS IS" BASIS,`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`// See the License for the specific language governing permissions and`
			`// limitations under the License.`

[speechx] rm openblas && refactor kaldi-matrix, kaldi-vector (#2824) * rm openblas && refactor kaldi-matrix kaldi-vector 2 years ago			`#include "frontend/feature_cache.h"`
add raw_audio & feature_cache 3 years ago
make feature cache& raw audio work 3 years ago			`namespace ppspeech {`

			`using kaldi::BaseFloat;`
			`using std::unique_ptr;`
format code 2 years ago			`using std::vector;`
make feature cache& raw audio work 3 years ago
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`FeatureCache::FeatureCache(size_t max_size,`
format code 3 years ago			`unique_ptr<FrontendInterface> base_extractor) {`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`max_size_ = max_size;`
make feature cache& raw audio work 3 years ago			`base_extractor_ = std::move(base_extractor);`
add websocket 3 years ago			`dim_ = base_extractor_->Dim();`
make feature cache& raw audio work 3 years ago			`}`

[speechx]add kaldi-native-fbank && refactor frontend (#2794) * replace kaldi-fbank with kaldi-native-fbank * make kaldi-native-fbank work 2 years ago			`void FeatureCache::Accept(const std::vector<kaldi::BaseFloat>& inputs) {`
to_float32, fix shell script 3 years ago			`// read inputs`
rename interface & add comment to Dim() 3 years ago			`base_extractor_->Accept(inputs);`
add raw_audio & feature_cache 3 years ago			`}`

make feature cache& raw audio work 3 years ago			`// pop feature chunk`
[speechx]add kaldi-native-fbank && refactor frontend (#2794) * replace kaldi-fbank with kaldi-native-fbank * make kaldi-native-fbank work 2 years ago			`bool FeatureCache::Read(std::vector<kaldi::BaseFloat>* feats) {`
make feature cache& raw audio work 3 years ago			`kaldi::Timer timer;`
			`std::unique_lock<std::mutex> lock(mutex_);`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`// feed current data`
			`if (cache_.empty()) {`
			`bool result = false;`
			`do {`
			`result = Compute();`
			`} while (result);`
add raw_audio & feature_cache 3 years ago			`}`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago
make feature cache& raw audio work 3 years ago			`if (cache_.empty()) return false;`
config param for nnet 3 years ago
			`// read from cache`
[speechx]add kaldi-native-fbank && refactor frontend (#2794) * replace kaldi-fbank with kaldi-native-fbank * make kaldi-native-fbank work 2 years ago			`*feats = cache_.front();`
add raw_audio & feature_cache 3 years ago			`cache_.pop();`
[speechx] fix compile and add more doc (#2591) * update u2pp latest static graph * add requirement * add utils * update doc * update result * update result * update result * fix cmake * imporove scripts * update result * add quant model and script * add profiling timer 2 years ago			`VLOG(1) << "FeatureCache::Read cost: " << timer.Elapsed() << " sec.";`
make feature cache& raw audio work 3 years ago			`return true;`
add raw_audio & feature_cache 3 years ago			`}`

			`// read all data from base_feature_extractor_ into cache_`
make feature cache& raw audio work 3 years ago			`bool FeatureCache::Compute() {`
add raw_audio & feature_cache 3 years ago			`// compute and feed`
[speechx]add kaldi-native-fbank && refactor frontend (#2794) * replace kaldi-fbank with kaldi-native-fbank * make kaldi-native-fbank work 2 years ago			`vector<BaseFloat> feature;`
add websocket 3 years ago			`bool result = base_extractor_->Read(&feature);`
[speechx]add kaldi-native-fbank && refactor frontend (#2794) * replace kaldi-fbank with kaldi-native-fbank * make kaldi-native-fbank work 2 years ago			`if (result == false \|\| feature.size() == 0) return false;`
to_float32, fix shell script 3 years ago
[speechx] fix compile and add more doc (#2591) * update u2pp latest static graph * add requirement * add utils * update doc * update result * update result * update result * fix cmake * imporove scripts * update result * add quant model and script * add profiling timer 2 years ago			`kaldi::Timer timer;`

[speechx]add kaldi-native-fbank && refactor frontend (#2794) * replace kaldi-fbank with kaldi-native-fbank * make kaldi-native-fbank work 2 years ago			`int32 num_chunk = feature.size() / dim_;`
[speechx] fix compile and add more doc (#2591) * update u2pp latest static graph * add requirement * add utils * update doc * update result * update result * update result * fix cmake * imporove scripts * update result * add quant model and script * add profiling timer 2 years ago			`VLOG(3) << "nframe computed: " << nframe_;`
fix assembler buf, which not clear cache, and fill zero default 2 years ago
add websocket 3 years ago			`for (int chunk_idx = 0; chunk_idx < num_chunk; ++chunk_idx) {`
fix #2013; and format 2 years ago			`int32 start = chunk_idx * dim_;`
[engine] rename speechx (#2892) * rename speechx * fix wfst decode error * replace reset with make_unique 2 years ago			`vector<BaseFloat> feature_chunk(feature.data() + start,`
[speechx]add kaldi-native-fbank && refactor frontend (#2794) * replace kaldi-fbank with kaldi-native-fbank * make kaldi-native-fbank work 2 years ago			`feature.data() + start + dim_);`
add websocket 3 years ago			`// feed cache`
make feature cache& raw audio work 3 years ago			`cache_.push(feature_chunk);`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`++nframe_;`
make feature cache& raw audio work 3 years ago			`}`
[speechx] fix compile and add more doc (#2591) * update u2pp latest static graph * add requirement * add utils * update doc * update result * update result * update result * fix cmake * imporove scripts * update result * add quant model and script * add profiling timer 2 years ago
			`VLOG(1) << "FeatureCache::Compute cost: " << timer.Elapsed() << " sec. "`
			`<< num_chunk << " feats.";`
			`return true;`
add raw_audio & feature_cache 3 years ago			`}`

[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`} // namespace ppspeech`