PaddleSpeech/runtime/engine/asr/recognizer/u2_recognizer.cc

// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "recognizer/u2_recognizer.h"

#include "nnet/u2_nnet.h"
#ifdef USE_ONNX
#include "nnet/u2_onnx_nnet.h"
#endif

namespace ppspeech {

using kaldi::BaseFloat;
using std::unique_ptr;
using std::vector;

U2Recognizer::U2Recognizer(const U2RecognizerResource& resource)
    : opts_(resource) {
    BaseFloat am_scale = resource.acoustic_scale;
    const FeaturePipelineOptions& feature_opts = resource.feature_pipeline_opts;
    std::shared_ptr<FeaturePipeline> feature_pipeline(
        new FeaturePipeline(feature_opts));
    std::shared_ptr<NnetBase> nnet;
#ifndef USE_ONNX
    nnet.reset(new U2Nnet(resource.model_opts));
#else
    if (resource.model_opts.with_onnx_model){
        nnet.reset(new U2OnnxNnet(resource.model_opts));
    } else {
        nnet.reset(new U2Nnet(resource.model_opts));
    }
#endif
    nnet_producer_.reset(new NnetProducer(nnet, feature_pipeline));
    decodable_.reset(new Decodable(nnet_producer_, am_scale));

    CHECK_NE(resource.vocab_path, "");
    if (resource.decoder_opts.tlg_decoder_opts.fst_path.empty()) {
        LOG(INFO) << resource.decoder_opts.tlg_decoder_opts.fst_path;
        decoder_ = std::make_unique<CTCPrefixBeamSearch>(
            resource.vocab_path, resource.decoder_opts.ctc_prefix_search_opts);
    } else {
        decoder_ = std::make_unique<TLGDecoder>(
            resource.decoder_opts.tlg_decoder_opts);
    }

    symbol_table_ = decoder_->WordSymbolTable();

    global_frame_offset_ = 0;
    input_finished_ = false;
    num_frames_ = 0;
    result_.clear();
}

U2Recognizer::U2Recognizer(const U2RecognizerResource& resource,
                           std::shared_ptr<NnetBase> nnet)
    : opts_(resource) {
    BaseFloat am_scale = resource.acoustic_scale;
    const FeaturePipelineOptions& feature_opts = resource.feature_pipeline_opts;
    std::shared_ptr<FeaturePipeline> feature_pipeline =
        std::make_shared<FeaturePipeline>(feature_opts);
    nnet_producer_.reset(new NnetProducer(nnet, feature_pipeline));
    decodable_.reset(new Decodable(nnet_producer_, am_scale));

    CHECK_NE(resource.vocab_path, "");
    if (resource.decoder_opts.tlg_decoder_opts.fst_path == "") {
        decoder_.reset(new CTCPrefixBeamSearch(
            resource.vocab_path, resource.decoder_opts.ctc_prefix_search_opts));
    } else {
        decoder_.reset(new TLGDecoder(resource.decoder_opts.tlg_decoder_opts));
    }

    symbol_table_ = decoder_->WordSymbolTable();

    global_frame_offset_ = 0;
    input_finished_ = false;
    num_frames_ = 0;
    result_.clear();
}

U2Recognizer::~U2Recognizer() {
    SetInputFinished();
    WaitDecodeFinished();
}

void U2Recognizer::WaitDecodeFinished() {
    if (thread_.joinable()) thread_.join();
}

void U2Recognizer::WaitFinished() {
    if (thread_.joinable()) thread_.join();
    nnet_producer_->Wait();
}

void U2Recognizer::InitDecoder() {
    global_frame_offset_ = 0;
    input_finished_ = false;
    num_frames_ = 0;
    result_.clear();

    decodable_->Reset();
    decoder_->Reset();
    thread_ = std::thread(RunDecoderSearch, this);
}

void U2Recognizer::ResetContinuousDecoding() {
    global_frame_offset_ = num_frames_;
    num_frames_ = 0;
    result_.clear();

    decodable_->Reset();
    decoder_->Reset();
}

void U2Recognizer::RunDecoderSearch(U2Recognizer* me) {
    me->RunDecoderSearchInternal();
}

void U2Recognizer::RunDecoderSearchInternal() {
    LOG(INFO) << "DecoderSearchInteral begin";
    while (!nnet_producer_->IsFinished()) {
        nnet_producer_->WaitProduce();
        decoder_->AdvanceDecode(decodable_);
    }
    decoder_->AdvanceDecode(decodable_);
    UpdateResult(false);
    LOG(INFO) << "DecoderSearchInteral exit";
}

void U2Recognizer::Accept(const vector<BaseFloat>& waves) {
    kaldi::Timer timer;
    nnet_producer_->Accept(waves);
    VLOG(1) << "feed waves cost: " << timer.Elapsed() << " sec. "
            << waves.size() << " samples.";
}

void U2Recognizer::Decode() {
    decoder_->AdvanceDecode(decodable_);
    UpdateResult(false);
}

void U2Recognizer::Rescoring() {
    // Do attention Rescoring
    AttentionRescoring();
}

void U2Recognizer::UpdateResult(bool finish) {
    const auto& hypotheses = decoder_->Outputs();
    const auto& inputs = decoder_->Inputs();
    const auto& likelihood = decoder_->Likelihood();
    const auto& times = decoder_->Times();
    result_.clear();

    CHECK_EQ(inputs.size(), likelihood.size());
    for (size_t i = 0; i < hypotheses.size(); i++) {
        const std::vector<int>& hypothesis = hypotheses[i];

        DecodeResult path;
        path.score = likelihood[i];
        for (size_t j = 0; j < hypothesis.size(); j++) {
            std::string word = symbol_table_->Find(hypothesis[j]);
            // path.sentence += (" " + word); // todo SmileGoat: add blank
            // processor
            path.sentence += word;  // todo SmileGoat: add blank processor
        }

        // TimeStamp is only supported in final result
        // TimeStamp of the output of CtcWfstBeamSearch may be inaccurate due to
        // various FST operations when building the decoding graph. So here we
        // use time stamp of the input(e2e model unit), which is more accurate,
        // and it requires the symbol table of the e2e model used in training.
        if (symbol_table_ != nullptr && finish) {
            int offset = global_frame_offset_ * FrameShiftInMs();

            const std::vector<int>& input = inputs[i];
            const std::vector<int> time_stamp = times[i];
            CHECK_EQ(input.size(), time_stamp.size());

            for (size_t j = 0; j < input.size(); j++) {
                std::string word = symbol_table_->Find(input[j]);

                int start =
                    time_stamp[j] * FrameShiftInMs() - time_stamp_gap_ > 0
                        ? time_stamp[j] * FrameShiftInMs() - time_stamp_gap_
                        : 0;
                if (j > 0) {
                    start =
                        (time_stamp[j] - time_stamp[j - 1]) * FrameShiftInMs() <
                                time_stamp_gap_
                            ? (time_stamp[j - 1] + time_stamp[j]) / 2 *
                                  FrameShiftInMs()
                            : start;
                }

                int end = time_stamp[j] * FrameShiftInMs();
                if (j < input.size() - 1) {
                    end =
                        (time_stamp[j + 1] - time_stamp[j]) * FrameShiftInMs() <
                                time_stamp_gap_
                            ? (time_stamp[j + 1] + time_stamp[j]) / 2 *
                                  FrameShiftInMs()
                            : end;
                }

                WordPiece word_piece(word, offset + start, offset + end);
                path.word_pieces.emplace_back(word_piece);
            }
        }

        // if (post_processor_ != nullptr) {
        //   path.sentence = post_processor_->Process(path.sentence, finish);
        // }

        result_.emplace_back(path);
    }

    if (DecodedSomething()) {
        VLOG(1) << "Partial CTC result " << result_[0].sentence;
    }
}

void U2Recognizer::AttentionRescoring() {
    decoder_->FinalizeSearch();
    UpdateResult(false);

    // No need to do rescoring
    if (0.0 == opts_.decoder_opts.rescoring_weight) {
        LOG_EVERY_N(WARNING, 3) << "Not do AttentionRescoring!";
        return;
    }
    LOG_EVERY_N(WARNING, 3) << "Do AttentionRescoring!";

    // Inputs() returns N-best input ids, which is the basic unit for rescoring
    // In CtcPrefixBeamSearch, inputs are the same to outputs
    const auto& hypotheses = decoder_->Inputs();
    int num_hyps = hypotheses.size();
    if (num_hyps <= 0) {
        return;
    }

    std::vector<float> rescoring_score;
    decodable_->AttentionRescoring(
        hypotheses, opts_.decoder_opts.reverse_weight, &rescoring_score);

    // combine ctc score and rescoring score
    for (size_t i = 0; i < num_hyps; i++) {
        VLOG(3) << "hyp " << i << " rescoring_score: " << rescoring_score[i]
                << " ctc_score: " << result_[i].score
                << " rescoring_weight: " << opts_.decoder_opts.rescoring_weight
                << " ctc_weight: " << opts_.decoder_opts.ctc_weight;
        result_[i].score =
            opts_.decoder_opts.rescoring_weight * rescoring_score[i] +
            opts_.decoder_opts.ctc_weight * result_[i].score;

        VLOG(3) << "hyp: " << result_[0].sentence
                << " score: " << result_[0].score;
    }

    std::sort(result_.begin(), result_.end(), DecodeResult::CompareFunc);
    VLOG(3) << "result: " << result_[0].sentence
            << " score: " << result_[0].score;
}

std::string U2Recognizer::GetFinalResult() { return result_[0].sentence; }

std::string U2Recognizer::GetPartialResult() { return result_[0].sentence; }

void U2Recognizer::SetInputFinished() {
    nnet_producer_->SetInputFinished();
    input_finished_ = true;
}


}  // namespace ppspeech
add u2 recg 2 years ago			`// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.`
			`//`
			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`//`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`//`
			`// Unless required by applicable law or agreed to in writing, software`
			`// distributed under the License is distributed on an "AS IS" BASIS,`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`// See the License for the specific language governing permissions and`
			`// limitations under the License.`

seprate recognizer; NnetBase as base class 2 years ago			`#include "recognizer/u2_recognizer.h"`
format 2 years ago
add u2 recg 2 years ago			`#include "nnet/u2_nnet.h"`
[runtime] support onnx runtime && support ios compile (#3101) * support vad ios compile * support onnx model recognize * add build ios sh 2 years ago			`#ifdef USE_ONNX`
			`#include "nnet/u2_onnx_nnet.h"`
			`#endif`
add u2 recg 2 years ago
			`namespace ppspeech {`

			`using kaldi::BaseFloat;`
			`using std::unique_ptr;`
format 2 years ago			`using std::vector;`
add u2 recg 2 years ago
format 2 years ago			`U2Recognizer::U2Recognizer(const U2RecognizerResource& resource)`
			`: opts_(resource) {`
[Speechx] add nnet prob cache && make 2 thread decode work (#2769) * add nnet cache && make 2 thread work * do not compile websocket 2 years ago			`BaseFloat am_scale = resource.acoustic_scale;`
add u2 recg 2 years ago			`const FeaturePipelineOptions& feature_opts = resource.feature_pipeline_opts;`
[Speechx] add nnet prob cache && make 2 thread decode work (#2769) * add nnet cache && make 2 thread work * do not compile websocket 2 years ago			`std::shared_ptr<FeaturePipeline> feature_pipeline(`
			`new FeaturePipeline(feature_opts));`
[runtime] support onnx runtime && support ios compile (#3101) * support vad ios compile * support onnx model recognize * add build ios sh 2 years ago			`std::shared_ptr<NnetBase> nnet;`
			`#ifndef USE_ONNX`
			`nnet.reset(new U2Nnet(resource.model_opts));`
			`#else`
			`if (resource.model_opts.with_onnx_model){`
			`nnet.reset(new U2OnnxNnet(resource.model_opts));`
			`} else {`
			`nnet.reset(new U2Nnet(resource.model_opts));`
			`}`
			`#endif`
[Speechx] add nnet prob cache && make 2 thread decode work (#2769) * add nnet cache && make 2 thread work * do not compile websocket 2 years ago			`nnet_producer_.reset(new NnetProducer(nnet, feature_pipeline));`
			`decodable_.reset(new Decodable(nnet_producer_, am_scale));`
add u2 recg 2 years ago
cpplint 2 years ago			`CHECK_NE(resource.vocab_path, "");`
[engine] rename speechx (#2892) * rename speechx * fix wfst decode error * replace reset with make_unique 2 years ago			`if (resource.decoder_opts.tlg_decoder_opts.fst_path.empty()) {`
add wfst decoder (#2886) 2 years ago			`LOG(INFO) << resource.decoder_opts.tlg_decoder_opts.fst_path;`
[engine] rename speechx (#2892) * rename speechx * fix wfst decode error * replace reset with make_unique 2 years ago			`decoder_ = std::make_unique<CTCPrefixBeamSearch>(`
			`resource.vocab_path, resource.decoder_opts.ctc_prefix_search_opts);`
add wfst decoder (#2886) 2 years ago			`} else {`
opt to compile asr,cls,vad; add vad; format code (#2968) 2 years ago			`decoder_ = std::make_unique<TLGDecoder>(`
			`resource.decoder_opts.tlg_decoder_opts);`
add wfst decoder (#2886) 2 years ago			`}`
add u2 recg 2 years ago
add wfst decoder (#2886) 2 years ago			`symbol_table_ = decoder_->WordSymbolTable();`
add u2 recg 2 years ago
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`global_frame_offset_ = 0;`
add u2 recg 2 years ago			`input_finished_ = false;`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`num_frames_ = 0;`
			`result_.clear();`
[speechx] add batch recognizer decode. (#2866) * add recognizer_batch 2 years ago			`}`

			`U2Recognizer::U2Recognizer(const U2RecognizerResource& resource,`
			`std::shared_ptr<NnetBase> nnet)`
			`: opts_(resource) {`
			`BaseFloat am_scale = resource.acoustic_scale;`
			`const FeaturePipelineOptions& feature_opts = resource.feature_pipeline_opts;`
			`std::shared_ptr<FeaturePipeline> feature_pipeline =`
			`std::make_shared<FeaturePipeline>(feature_opts);`
			`nnet_producer_.reset(new NnetProducer(nnet, feature_pipeline));`
			`decodable_.reset(new Decodable(nnet_producer_, am_scale));`

			`CHECK_NE(resource.vocab_path, "");`
add wfst decoder (#2886) 2 years ago			`if (resource.decoder_opts.tlg_decoder_opts.fst_path == "") {`
			`decoder_.reset(new CTCPrefixBeamSearch(`
			`resource.vocab_path, resource.decoder_opts.ctc_prefix_search_opts));`
			`} else {`
			`decoder_.reset(new TLGDecoder(resource.decoder_opts.tlg_decoder_opts));`
			`}`
[speechx] add batch recognizer decode. (#2866) * add recognizer_batch 2 years ago
add wfst decoder (#2886) 2 years ago			`symbol_table_ = decoder_->WordSymbolTable();`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago
[speechx] add batch recognizer decode. (#2866) * add recognizer_batch 2 years ago			`global_frame_offset_ = 0;`
			`input_finished_ = false;`
			`num_frames_ = 0;`
			`result_.clear();`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`}`

			`U2Recognizer::~U2Recognizer() {`
[speechx] add batch recognizer decode. (#2866) * add recognizer_batch 2 years ago			`SetInputFinished();`
			`WaitDecodeFinished();`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`}`
u2 recog test main ok 2 years ago
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`void U2Recognizer::WaitDecodeFinished() {`
			`if (thread_.joinable()) thread_.join();`
add u2 recg 2 years ago			`}`

[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`void U2Recognizer::WaitFinished() {`
			`if (thread_.joinable()) thread_.join();`
			`nnet_producer_->Wait();`
			`}`

			`void U2Recognizer::InitDecoder() {`
add u2 recg 2 years ago			`global_frame_offset_ = 0;`
[Speechx] add nnet prob cache && make 2 thread decode work (#2769) * add nnet cache && make 2 thread work * do not compile websocket 2 years ago			`input_finished_ = false;`
add u2 recg 2 years ago			`num_frames_ = 0;`
			`result_.clear();`

			`decodable_->Reset();`
			`decoder_->Reset();`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`thread_ = std::thread(RunDecoderSearch, this);`
add u2 recg 2 years ago			`}`

			`void U2Recognizer::ResetContinuousDecoding() {`
			`global_frame_offset_ = num_frames_;`
			`num_frames_ = 0;`
			`result_.clear();`

			`decodable_->Reset();`
			`decoder_->Reset();`
			`}`

[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`void U2Recognizer::RunDecoderSearch(U2Recognizer* me) {`
			`me->RunDecoderSearchInternal();`
			`}`

			`void U2Recognizer::RunDecoderSearchInternal() {`
			`LOG(INFO) << "DecoderSearchInteral begin";`
			`while (!nnet_producer_->IsFinished()) {`
add wfst decoder (#2886) 2 years ago			`nnet_producer_->WaitProduce();`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`decoder_->AdvanceDecode(decodable_);`
			`}`
add wfst decoder (#2886) 2 years ago			`decoder_->AdvanceDecode(decodable_);`
			`UpdateResult(false);`
[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`LOG(INFO) << "DecoderSearchInteral exit";`
			`}`
add u2 recg 2 years ago
[speechx]add kaldi-native-fbank && refactor frontend (#2794) * replace kaldi-fbank with kaldi-native-fbank * make kaldi-native-fbank work 2 years ago			`void U2Recognizer::Accept(const vector<BaseFloat>& waves) {`
[speechx] fix compile and add more doc (#2591) * update u2pp latest static graph * add requirement * add utils * update doc * update result * update result * update result * fix cmake * imporove scripts * update result * add quant model and script * add profiling timer 2 years ago			`kaldi::Timer timer;`
[Speechx] add nnet prob cache && make 2 thread decode work (#2769) * add nnet cache && make 2 thread work * do not compile websocket 2 years ago			`nnet_producer_->Accept(waves);`
[speechx] add batch recognizer decode. (#2866) * add recognizer_batch 2 years ago			`VLOG(1) << "feed waves cost: " << timer.Elapsed() << " sec. "`
			`<< waves.size() << " samples.";`
add u2 recg 2 years ago			`}`

format 2 years ago			`void U2Recognizer::Decode() {`
			`decoder_->AdvanceDecode(decodable_);`
u2 recog test main ok 2 years ago			`UpdateResult(false);`
add u2 recg 2 years ago			`}`

			`void U2Recognizer::Rescoring() {`
format 2 years ago			`// Do attention Rescoring`
			`AttentionRescoring();`
add u2 recg 2 years ago			`}`

			`void U2Recognizer::UpdateResult(bool finish) {`
format 2 years ago			`const auto& hypotheses = decoder_->Outputs();`
			`const auto& inputs = decoder_->Inputs();`
			`const auto& likelihood = decoder_->Likelihood();`
			`const auto& times = decoder_->Times();`
			`result_.clear();`
add u2 recg 2 years ago
add wfst decoder (#2886) 2 years ago			`CHECK_EQ(inputs.size(), likelihood.size());`
format 2 years ago			`for (size_t i = 0; i < hypotheses.size(); i++) {`
			`const std::vector<int>& hypothesis = hypotheses[i];`

			`DecodeResult path;`
			`path.score = likelihood[i];`
			`for (size_t j = 0; j < hypothesis.size(); j++) {`
			`std::string word = symbol_table_->Find(hypothesis[j]);`
add wfst decoder (#2886) 2 years ago			`// path.sentence += (" " + word); // todo SmileGoat: add blank`
			`// processor`
			`path.sentence += word; // todo SmileGoat: add blank processor`
format 2 years ago			`}`

			`// TimeStamp is only supported in final result`
			`// TimeStamp of the output of CtcWfstBeamSearch may be inaccurate due to`
			`// various FST operations when building the decoding graph. So here we`
			`// use time stamp of the input(e2e model unit), which is more accurate,`
			`// and it requires the symbol table of the e2e model used in training.`
add wfst decoder (#2886) 2 years ago			`if (symbol_table_ != nullptr && finish) {`
format 2 years ago			`int offset = global_frame_offset_ * FrameShiftInMs();`
add u2 recg 2 years ago
format 2 years ago			`const std::vector<int>& input = inputs[i];`
			`const std::vector<int> time_stamp = times[i];`
			`CHECK_EQ(input.size(), time_stamp.size());`
add u2 recg 2 years ago
format 2 years ago			`for (size_t j = 0; j < input.size(); j++) {`
add wfst decoder (#2886) 2 years ago			`std::string word = symbol_table_->Find(input[j]);`
add u2 recg 2 years ago
format 2 years ago			`int start =`
			`time_stamp[j] * FrameShiftInMs() - time_stamp_gap_ > 0`
add u2 recg 2 years ago			`? time_stamp[j] * FrameShiftInMs() - time_stamp_gap_`
			`: 0;`
format 2 years ago			`if (j > 0) {`
			`start =`
			`(time_stamp[j] - time_stamp[j - 1]) * FrameShiftInMs() <`
			`time_stamp_gap_`
			`? (time_stamp[j - 1] + time_stamp[j]) / 2 *`
			`FrameShiftInMs()`
			`: start;`
			`}`

			`int end = time_stamp[j] * FrameShiftInMs();`
			`if (j < input.size() - 1) {`
			`end =`
			`(time_stamp[j + 1] - time_stamp[j]) * FrameShiftInMs() <`
			`time_stamp_gap_`
			`? (time_stamp[j + 1] + time_stamp[j]) / 2 *`
			`FrameShiftInMs()`
			`: end;`
			`}`

			`WordPiece word_piece(word, offset + start, offset + end);`
			`path.word_pieces.emplace_back(word_piece);`
			`}`
add u2 recg 2 years ago			`}`

format 2 years ago			`// if (post_processor_ != nullptr) {`
			`// path.sentence = post_processor_->Process(path.sentence, finish);`
			`// }`
add u2 recg 2 years ago
format 2 years ago			`result_.emplace_back(path);`
add u2 recg 2 years ago			`}`

format 2 years ago			`if (DecodedSomething()) {`
			`VLOG(1) << "Partial CTC result " << result_[0].sentence;`
			`}`
add u2 recg 2 years ago			`}`

			`void U2Recognizer::AttentionRescoring() {`
format 2 years ago			`decoder_->FinalizeSearch();`
add wfst decoder (#2886) 2 years ago			`UpdateResult(false);`
add u2 recg 2 years ago
format 2 years ago			`// No need to do rescoring`
			`if (0.0 == opts_.decoder_opts.rescoring_weight) {`
			`LOG_EVERY_N(WARNING, 3) << "Not do AttentionRescoring!";`
			`return;`
			`}`
			`LOG_EVERY_N(WARNING, 3) << "Do AttentionRescoring!";`

			`// Inputs() returns N-best input ids, which is the basic unit for rescoring`
			`// In CtcPrefixBeamSearch, inputs are the same to outputs`
			`const auto& hypotheses = decoder_->Inputs();`
			`int num_hyps = hypotheses.size();`
			`if (num_hyps <= 0) {`
			`return;`
			`}`

			`std::vector<float> rescoring_score;`
			`decodable_->AttentionRescoring(`
			`hypotheses, opts_.decoder_opts.reverse_weight, &rescoring_score);`

			`// combine ctc score and rescoring score`
			`for (size_t i = 0; i < num_hyps; i++) {`
[speechx] fix compile and add more doc (#2591) * update u2pp latest static graph * add requirement * add utils * update doc * update result * update result * update result * fix cmake * imporove scripts * update result * add quant model and script * add profiling timer 2 years ago			`VLOG(3) << "hyp " << i << " rescoring_score: " << rescoring_score[i]`
format code 2 years ago			`<< " ctc_score: " << result_[i].score`
			`<< " rescoring_weight: " << opts_.decoder_opts.rescoring_weight`
			`<< " ctc_weight: " << opts_.decoder_opts.ctc_weight;`
format 2 years ago			`result_[i].score =`
			`opts_.decoder_opts.rescoring_weight * rescoring_score[i] +`
			`opts_.decoder_opts.ctc_weight * result_[i].score;`
more debug info 2 years ago
[speechx] fix compile and add more doc (#2591) * update u2pp latest static graph * add requirement * add utils * update doc * update result * update result * update result * fix cmake * imporove scripts * update result * add quant model and script * add profiling timer 2 years ago			`VLOG(3) << "hyp: " << result_[0].sentence`
format code 2 years ago			`<< " score: " << result_[0].score;`
format 2 years ago			`}`
add u2 recg 2 years ago
format 2 years ago			`std::sort(result_.begin(), result_.end(), DecodeResult::CompareFunc);`
[speechx] fix compile and add more doc (#2591) * update u2pp latest static graph * add requirement * add utils * update doc * update result * update result * update result * fix cmake * imporove scripts * update result * add quant model and script * add profiling timer 2 years ago			`VLOG(3) << "result: " << result_[0].sentence`
format 2 years ago			`<< " score: " << result_[0].score;`
add u2 recg 2 years ago			`}`

format 2 years ago			`std::string U2Recognizer::GetFinalResult() { return result_[0].sentence; }`

			`std::string U2Recognizer::GetPartialResult() { return result_[0].sentence; }`

[speechx] thread decode (#2839) * fix nnet thread crash && rescore cost time * add nnet thread main 2 years ago			`void U2Recognizer::SetInputFinished() {`
			`nnet_producer_->SetInputFinished();`
add u2 recg 2 years ago			`input_finished_ = true;`
			`}`


[engine] rename speechx (#2892) * rename speechx * fix wfst decode error * replace reset with make_unique 2 years ago			`} // namespace ppspeech`