Support clang-tidy (#1034)

Fangjun Kuang · GitHub
Commit a11c8599710dbbd2484e93b452acf2bb7196354f a11c8599 1 parent 656b9fa1
.clang-tidy
.github/workflows/clang-tidy.yaml
.github/workflows/flutter-macos.yaml
.github/workflows/flutter-windows-x64.yaml
CMakeLists.txt
cmake/openfst.cmake
sherpa-onnx/csrc/CMakeLists.txt
sherpa-onnx/csrc/audio-tagging-label-file.cc
sherpa-onnx/csrc/base64-decode.cc
sherpa-onnx/csrc/cat.cc
sherpa-onnx/csrc/circular-buffer.cc
sherpa-onnx/csrc/context-graph.cc
sherpa-onnx/csrc/endpoint.cc
sherpa-onnx/csrc/endpoint.h
sherpa-onnx/csrc/jieba-lexicon.cc
sherpa-onnx/csrc/keyword-spotter.cc
sherpa-onnx/csrc/lexicon.cc
sherpa-onnx/csrc/lexicon.h
sherpa-onnx/csrc/offline-ct-transformer-model.cc
sherpa-onnx/csrc/offline-ctc-model.cc
--- a/.clang-tidy 0 → 100644
查看文件 @a11c859
+++ b/.clang-tidy 0 → 100644
查看文件 @a11c859
+ ---
+ # NOTE there must be no spaces before the '-', so put the comma last.
+ # The check bugprone-unchecked-optional-access is also turned off atm
+ # because it causes clang-tidy to hang randomly. The tracking issue
+ # can be found at https://github.com/llvm/llvm-project/issues/69369.
+ #
+ # Modified from
+ # https://github.com/pytorch/pytorch/blob/main/.clang-tidy
+ InheritParentConfig: true
+ Checks: '
+ bugprone-*,
+ -bugprone-easily-swappable-parameters,
+ -bugprone-forward-declaration-namespace,
+ -bugprone-implicit-widening-of-multiplication-result,
+ -bugprone-macro-parentheses,
+ -bugprone-lambda-function-name,
+ -bugprone-narrowing-conversions,
+ -bugprone-reserved-identifier,
+ -bugprone-swapped-arguments,
+ -bugprone-unchecked-optional-access,
+ clang-diagnostic-missing-prototypes,
+ cppcoreguidelines-*,
+ -cppcoreguidelines-avoid-const-or-ref-data-members,
+ -cppcoreguidelines-avoid-do-while,
+ -cppcoreguidelines-avoid-magic-numbers,
+ -cppcoreguidelines-avoid-non-const-global-variables,
+ -cppcoreguidelines-interfaces-global-init,
+ -cppcoreguidelines-macro-usage,
+ -cppcoreguidelines-narrowing-conversions,
+ -cppcoreguidelines-owning-memory,
+ -cppcoreguidelines-pro-bounds-array-to-pointer-decay,
+ -cppcoreguidelines-pro-bounds-constant-array-index,
+ -cppcoreguidelines-pro-bounds-pointer-arithmetic,
+ -cppcoreguidelines-pro-type-const-cast,
+ -cppcoreguidelines-pro-type-cstyle-cast,
+ -cppcoreguidelines-pro-type-reinterpret-cast,
+ -cppcoreguidelines-pro-type-static-cast-downcast,
+ -cppcoreguidelines-pro-type-union-access,
+ -cppcoreguidelines-pro-type-vararg,
+ -cppcoreguidelines-special-member-functions,
+ -cppcoreguidelines-non-private-member-variables-in-classes,
+ -facebook-hte-RelativeInclude,
+ hicpp-exception-baseclass,
+ hicpp-avoid-goto,
+ misc-*,
+ -misc-const-correctness,
+ -misc-include-cleaner,
+ -misc-use-anonymous-namespace,
+ -misc-unused-parameters,
+ -misc-no-recursion,
+ -misc-non-private-member-variables-in-classes,
+ -misc-confusable-identifiers,
+ modernize-*,
+ -modernize-macro-to-enum,
+ -modernize-pass-by-value,
+ -modernize-return-braced-init-list,
+ -modernize-use-auto,
+ -modernize-use-default-member-init,
+ -modernize-use-using,
+ -modernize-use-trailing-return-type,
+ -modernize-use-nodiscard,
+ performance-*,
+ readability-container-size-empty,
+ readability-delete-null-pointer,
+ readability-duplicate-include
+ readability-misplaced-array-index,
+ readability-redundant-function-ptr-dereference,
+ readability-redundant-smartptr-get,
+ readability-simplify-subscript-expr,
+ readability-string-compare,
+ '
+ WarningsAsErrors: '*'
+ ...
--- a/.github/workflows/clang-tidy.yaml 0 → 100644
查看文件 @a11c859
+++ b/.github/workflows/clang-tidy.yaml 0 → 100644
查看文件 @a11c859
+ name: clang-tidy
+ 
+ on:
+   push:
+     branches:
+       - master
+       - clang-tidy
+     paths:
+       - 'sherpa-onnx/csrc/**'
+ 
+   pull_request:
+     branches:
+       - master
+     paths:
+       - 'sherpa-onnx/csrc/**'
+ 
+   workflow_dispatch:
+ 
+ concurrency:
+   group: clang-tidy-${{ github.ref }}
+   cancel-in-progress: true
+ 
+ jobs:
+   clang-tidy:
+     runs-on: ubuntu-latest
+     strategy:
+       matrix:
+         python-version: [3.8]
+       fail-fast: false
+ 
+     steps:
+       - uses: actions/checkout@v4
+         with:
+           fetch-depth: 0
+ 
+       - name: Setup Python ${{ matrix.python-version }}
+         uses: actions/setup-python@v5
+         with:
+           python-version: ${{ matrix.python-version }}
+ 
+       - name: Install clang-tidy
+         shell: bash
+         run: |
+           pip install clang-tidy
+ 
+       - name: Configure
+         shell: bash
+         run: |
+           mkdir build
+           cd build
+           cmake -DSHERPA_ONNX_ENABLE_PYTHON=ON -DCMAKE_EXPORT_COMPILE_COMMANDS=ON ..
+ 
+       - name: Check with clang-tidy
+         shell: bash
+         run: |
+           cd build
+           make check
--- a/.github/workflows/flutter-macos.yaml
查看文件 @a11c859
+++ b/.github/workflows/flutter-macos.yaml
查看文件 @a11c859
@@ -184,6 +184,7 @@ jobs:
           path: ./*.tar.bz2
 
       - name: Publish to huggingface
+         if: (github.repository_owner == 'csukuangfj' || github.repository_owner == 'k2-fsa') && github.event_name == 'push' && contains(github.ref, 'refs/tags/') && matrix.build_type == 'Release'
         env:
           HF_TOKEN: ${{ secrets.HF_TOKEN }}
         uses: nick-fields/retry@v3
--- a/.github/workflows/flutter-windows-x64.yaml
查看文件 @a11c859
+++ b/.github/workflows/flutter-windows-x64.yaml
查看文件 @a11c859
@@ -133,6 +133,7 @@ jobs:
         shell: bash
         run: |
           d=$PWD
+           SHERPA_ONNX_VERSION=v$(grep "SHERPA_ONNX_VERSION" ./CMakeLists.txt  | cut -d " " -f 2  | cut -d '"' -f 2)
 
           pushd sherpa-onnx/flutter
           dart pub get
@@ -159,6 +160,7 @@ jobs:
           path: ./*.tar.bz2
 
       - name: Publish to huggingface
+         if: (github.repository_owner == 'csukuangfj' || github.repository_owner == 'k2-fsa') && github.event_name == 'push' && contains(github.ref, 'refs/tags/') && matrix.build_type == 'Release'
         env:
           HF_TOKEN: ${{ secrets.HF_TOKEN }}
         uses: nick-fields/retry@v3
--- a/CMakeLists.txt
查看文件 @a11c859
+++ b/CMakeLists.txt
查看文件 @a11c859
@@ -167,7 +167,7 @@ if(SHERPA_ONNX_ENABLE_WASM_KWS)
 endif()
 
 if(NOT CMAKE_CXX_STANDARD)
-   set(CMAKE_CXX_STANDARD 14 CACHE STRING "The C++ version to be used.")
+   set(CMAKE_CXX_STANDARD 17 CACHE STRING "The C++ version to be used.")
 endif()
 set(CMAKE_CXX_EXTENSIONS OFF)
 message(STATUS "C++ Standard version: ${CMAKE_CXX_STANDARD}")
--- a/cmake/openfst.cmake
查看文件 @a11c859
+++ b/cmake/openfst.cmake
查看文件 @a11c859
@@ -3,18 +3,18 @@
 function(download_openfst)
   include(FetchContent)
 
-   set(openfst_URL  "https://github.com/csukuangfj/openfst/archive/refs/tags/sherpa-onnx-2024-06-13.tar.gz")
-   set(openfst_URL2 "https://hub.nuaa.cf/csukuangfj/openfst/archive/refs/tags/sherpa-onnx-2024-06-13.tar.gz")
-   set(openfst_HASH "SHA256=f10a71c6b64d89eabdc316d372b956c30c825c7c298e2f20c780320e8181ffb6")
+   set(openfst_URL  "https://github.com/csukuangfj/openfst/archive/refs/tags/sherpa-onnx-2024-06-19.tar.gz")
+   set(openfst_URL2 "https://hub.nuaa.cf/csukuangfj/openfst/archive/refs/tags/sherpa-onnx-2024-06-19.tar.gz")
+   set(openfst_HASH "SHA256=5c98e82cc509c5618502dde4860b8ea04d843850ed57e6d6b590b644b268853d")
 
   # If you don't have access to the Internet,
   # please pre-download it
   set(possible_file_locations
-     $ENV{HOME}/Downloads/openfst-sherpa-onnx-2024-06-13.tar.gz
-     ${CMAKE_SOURCE_DIR}/openfst-sherpa-onnx-2024-06-13.tar.gz
-     ${CMAKE_BINARY_DIR}/openfst-sherpa-onnx-2024-06-13.tar.gz
-     /tmp/openfst-sherpa-onnx-2024-06-13.tar.gz
-     /star-fj/fangjun/download/github/openfst-sherpa-onnx-2024-06-13.tar.gz
+     $ENV{HOME}/Downloads/openfst-sherpa-onnx-2024-06-19.tar.gz
+     ${CMAKE_SOURCE_DIR}/openfst-sherpa-onnx-2024-06-19.tar.gz
+     ${CMAKE_BINARY_DIR}/openfst-sherpa-onnx-2024-06-19.tar.gz
+     /tmp/openfst-sherpa-onnx-2024-06-19.tar.gz
+     /star-fj/fangjun/download/github/openfst-sherpa-onnx-2024-06-19.tar.gz
   )
 
   foreach(f IN LISTS possible_file_locations)
--- a/sherpa-onnx/csrc/CMakeLists.txt
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/CMakeLists.txt
查看文件 @a11c859
@@ -534,3 +534,17 @@ if(SHERPA_ONNX_ENABLE_TESTS)
     sherpa_onnx_add_test(${source})
   endforeach()
 endif()
+ 
+ set(srcs_to_check)
+ foreach(s IN LISTS sources)
+   list(APPEND srcs_to_check ${CMAKE_CURRENT_LIST_DIR}/${s})
+ endforeach()
+ 
+ # For clang-tidy
+ add_custom_target(
+   clang-tidy-check
+   clang-tidy -p ${CMAKE_BINARY_DIR}/compile_commands.json --config-file ${CMAKE_SOURCE_DIR}/.clang-tidy ${srcs_to_check}
+   DEPENDS ${sources})
+ 
+ add_custom_target(check DEPENDS clang-tidy-check)
+ 
--- a/sherpa-onnx/csrc/audio-tagging-label-file.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/audio-tagging-label-file.cc
查看文件 @a11c859
@@ -60,7 +60,7 @@ void AudioTaggingLabels::Init(std::istream &is) {
 
     std::size_t pos{};
     int32_t i = std::stoi(index, &pos);
-     if (index.size() == 0 || pos != index.size()) {
+     if (index.empty() || pos != index.size()) {
       SHERPA_ONNX_LOGE("Invalid line: %s", line.c_str());
       exit(-1);
     }
--- a/sherpa-onnx/csrc/base64-decode.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/base64-decode.cc
查看文件 @a11c859
@@ -34,7 +34,7 @@ std::string Base64Decode(const std::string &s) {
     exit(-1);
   }
 
-   int32_t n = s.size() / 4 * 3;
+   int32_t n = static_cast<int32_t>(s.size()) / 4 * 3;
 
   std::string ans;
   ans.reserve(n);
@@ -46,16 +46,16 @@ std::string Base64Decode(const std::string &s) {
     }
 
     int32_t first = (Ord(s[i]) << 2) + ((Ord(s[i + 1]) & 0x30) >> 4);
-     ans.push_back(first);
+     ans.push_back(static_cast<char>(first));
 
     if (i + 2 < static_cast<int32_t>(s.size()) && s[i + 2] != '=') {
       int32_t second =
           ((Ord(s[i + 1]) & 0x0f) << 4) + ((Ord(s[i + 2]) & 0x3c) >> 2);
-       ans.push_back(second);
+       ans.push_back(static_cast<char>(second));
 
       if (i + 3 < static_cast<int32_t>(s.size()) && s[i + 3] != '=') {
         int32_t third = ((Ord(s[i + 2]) & 0x03) << 6) + Ord(s[i + 3]);
-         ans.push_back(third);
+         ans.push_back(static_cast<char>(third));
       }
     }
     i += 4;
--- a/sherpa-onnx/csrc/cat.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/cat.cc
查看文件 @a11c859
@@ -82,9 +82,9 @@ Ort::Value Cat(OrtAllocator *allocator,
   T *dst = ans.GetTensorMutableData<T>();
 
   for (int32_t i = 0; i != leading_size; ++i) {
-     for (int32_t n = 0; n != static_cast<int32_t>(values.size()); ++n) {
-       auto this_dim = values[n]->GetTensorTypeAndShapeInfo().GetShape()[dim];
-       const T *src = values[n]->GetTensorData<T>();
+     for (auto value : values) {
+       auto this_dim = value->GetTensorTypeAndShapeInfo().GetShape()[dim];
+       const T *src = value->GetTensorData<T>();
       src += i * this_dim * trailing_size;
 
       std::copy(src, src + this_dim * trailing_size, dst);
--- a/sherpa-onnx/csrc/circular-buffer.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/circular-buffer.cc
查看文件 @a11c859
@@ -20,7 +20,7 @@ CircularBuffer::CircularBuffer(int32_t capacity) {
 }
 
 void CircularBuffer::Resize(int32_t new_capacity) {
-   int32_t capacity = buffer_.size();
+   int32_t capacity = static_cast<int32_t>(buffer_.size());
   if (new_capacity <= capacity) {
     SHERPA_ONNX_LOGE("new_capacity (%d) <= original capacity (%d). Skip it.",
                      new_capacity, capacity);
@@ -86,7 +86,7 @@ void CircularBuffer::Resize(int32_t new_capacity) {
 }
 
 void CircularBuffer::Push(const float *p, int32_t n) {
-   int32_t capacity = buffer_.size();
+   int32_t capacity = static_cast<int32_t>(buffer_.size());
   int32_t size = Size();
   if (n + size > capacity) {
     int32_t new_capacity = std::max(capacity * 2, n + size);
@@ -126,7 +126,7 @@ std::vector<float> CircularBuffer::Get(int32_t start_index, int32_t n) const {
     return {};
   }
 
-   int32_t capacity = buffer_.size();
+   int32_t capacity = static_cast<int32_t>(buffer_.size());
 
   if (start_index - head_ + n > size) {
     SHERPA_ONNX_LOGE("Invalid start_index: %d and n: %d. head_: %d, size: %d",
--- a/sherpa-onnx/csrc/context-graph.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/context-graph.cc
查看文件 @a11c859
@@ -67,8 +67,8 @@ void ContextGraph::Build(const std::vector<std::vector<int32_t>> &token_ids,
 std::tuple<float, const ContextState *, const ContextState *>
 ContextGraph::ForwardOneStep(const ContextState *state, int32_t token,
                              bool strict_mode /*= true*/) const {
-   const ContextState *node;
-   float score;
+   const ContextState *node = nullptr;
+   float score = 0;
   if (1 == state->next.count(token)) {
     node = state->next.at(token).get();
     score = node->token_score;
@@ -84,7 +84,10 @@ ContextGraph::ForwardOneStep(const ContextState *state, int32_t token,
     score = node->node_score - state->node_score;
   }
 
-   SHERPA_ONNX_CHECK(nullptr != node);
+   if (!node) {
+     SHERPA_ONNX_LOGE("Some bad things happened.");
+     exit(-1);
+   }
 
   const ContextState *matched_node =
       node->is_end ? node : (node->output != nullptr ? node->output : nullptr);
--- a/sherpa-onnx/csrc/endpoint.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/endpoint.cc
查看文件 @a11c859
@@ -73,10 +73,15 @@ std::string EndpointConfig::ToString() const {
   return os.str();
 }
 
- bool Endpoint::IsEndpoint(int num_frames_decoded, int trailing_silence_frames,
+ bool Endpoint::IsEndpoint(int32_t num_frames_decoded,
+                           int32_t trailing_silence_frames,
                           float frame_shift_in_seconds) const {
-   float utterance_length = num_frames_decoded * frame_shift_in_seconds;
-   float trailing_silence = trailing_silence_frames * frame_shift_in_seconds;
+   float utterance_length =
+       static_cast<float>(num_frames_decoded) * frame_shift_in_seconds;
+ 
+   float trailing_silence =
+       static_cast<float>(trailing_silence_frames) * frame_shift_in_seconds;
+ 
   if (RuleActivated(config_.rule1, "rule1", trailing_silence,
                     utterance_length) ||
       RuleActivated(config_.rule2, "rule2", trailing_silence,
--- a/sherpa-onnx/csrc/endpoint.h
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/endpoint.h
查看文件 @a11c859
@@ -64,7 +64,7 @@ class Endpoint {
 
   /// This function returns true if this set of endpointing rules thinks we
   /// should terminate decoding.
-   bool IsEndpoint(int num_frames_decoded, int trailing_silence_frames,
+   bool IsEndpoint(int32_t num_frames_decoded, int32_t trailing_silence_frames,
                   float frame_shift_in_seconds) const;
 
  private:
--- a/sherpa-onnx/csrc/jieba-lexicon.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/jieba-lexicon.cc
查看文件 @a11c859
@@ -103,6 +103,7 @@ class JiebaLexicon::Impl {
 
       if (w == "。" || w == "！" || w == "？" || w == "，") {
         ans.push_back(std::move(this_sentence));
+         this_sentence = {};
       }
     }  // for (const auto &w : words)
 
--- a/sherpa-onnx/csrc/keyword-spotter.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/keyword-spotter.cc
查看文件 @a11c859
@@ -4,9 +4,8 @@
 
 #include "sherpa-onnx/csrc/keyword-spotter.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <fstream>
 #include <iomanip>
 #include <memory>
--- a/sherpa-onnx/csrc/lexicon.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/lexicon.cc
查看文件 @a11c859
@@ -82,7 +82,7 @@ std::unordered_map<std::string, int32_t> ReadTokens(std::istream &is) {
   std::string line;
 
   std::string sym;
-   int32_t id;
+   int32_t id = -1;
   while (std::getline(is, line)) {
     std::istringstream iss(line);
     iss >> sym;
@@ -254,6 +254,7 @@ std::vector<std::vector<int64_t>> Lexicon::ConvertTextToTokenIdsChinese(
           this_sentence.push_back(eos);
         }
         ans.push_back(std::move(this_sentence));
+         this_sentence = {};
 
         if (sil != -1) {
           this_sentence.push_back(sil);
@@ -324,6 +325,7 @@ std::vector<std::vector<int64_t>> Lexicon::ConvertTextToTokenIdsNotChinese(
       if (w != ",") {
         this_sentence.push_back(blank);
         ans.push_back(std::move(this_sentence));
+         this_sentence = {};
       }
 
       continue;
--- a/sherpa-onnx/csrc/lexicon.h
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/lexicon.h
查看文件 @a11c859
@@ -62,8 +62,8 @@ class Lexicon : public OfflineTtsFrontend {
   std::unordered_map<std::string, std::vector<int32_t>> word2ids_;
   std::unordered_set<std::string> punctuations_;
   std::unordered_map<std::string, int32_t> token2id_;
-   Language language_;
-   bool debug_;
+   Language language_ = Language::kUnknown;
+   bool debug_ = false;
 };
 
 }  // namespace sherpa_onnx
--- a/sherpa-onnx/csrc/offline-ct-transformer-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/offline-ct-transformer-model.cc
查看文件 @a11c859
@@ -67,7 +67,7 @@ class OfflineCtTransformerModel::Impl {
     std::vector<std::string> tokens;
     SHERPA_ONNX_READ_META_DATA_VEC_STRING_SEP(tokens, "tokens", "|");
 
-     int32_t vocab_size;
+     int32_t vocab_size = 0;
     SHERPA_ONNX_READ_META_DATA(vocab_size, "vocab_size");
     if (static_cast<int32_t>(tokens.size()) != vocab_size) {
       SHERPA_ONNX_LOGE("tokens.size() %d != vocab_size %d",
--- a/sherpa-onnx/csrc/offline-ctc-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/offline-ctc-model.cc
查看文件 @a11c859
@@ -19,7 +19,7 @@
 
 namespace {
 
- enum class ModelType {
+ enum class ModelType : std::uint8_t {
   kEncDecCTCModelBPE,
   kEncDecHybridRNNTCTCBPEModel,
   kTdnn,
--- a/sherpa-onnx/csrc/offline-stream.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/offline-stream.cc
查看文件 @a11c859
@@ -4,11 +4,11 @@
 
 #include "sherpa-onnx/csrc/offline-stream.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <cmath>
 #include <iomanip>
+ #include <utility>
 
 #include "kaldi-native-fbank/csrc/online-feature.h"
 #include "sherpa-onnx/csrc/macros.h"
@@ -56,7 +56,7 @@ class OfflineStream::Impl {
  public:
   explicit Impl(const FeatureExtractorConfig &config,
                 ContextGraphPtr context_graph)
-       : config_(config), context_graph_(context_graph) {
+       : config_(config), context_graph_(std::move(context_graph)) {
     if (config.is_mfcc) {
       mfcc_opts_.frame_opts.dither = config_.dither;
       mfcc_opts_.frame_opts.snip_edges = config_.snip_edges;
@@ -266,7 +266,7 @@ class OfflineStream::Impl {
 
 OfflineStream::OfflineStream(const FeatureExtractorConfig &config /*= {}*/,
                              ContextGraphPtr context_graph /*= nullptr*/)
-     : impl_(std::make_unique<Impl>(config, context_graph)) {}
+     : impl_(std::make_unique<Impl>(config, std::move(context_graph))) {}
 
 OfflineStream::OfflineStream(WhisperTag tag)
     : impl_(std::make_unique<Impl>(tag)) {}
--- a/sherpa-onnx/csrc/offline-transducer-modified-beam-search-decoder.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/offline-transducer-modified-beam-search-decoder.cc
查看文件 @a11c859
@@ -42,7 +42,7 @@ OfflineTransducerModifiedBeamSearchDecoder::Decode(
   std::vector<ContextGraphPtr> context_graphs(batch_size, nullptr);
 
   for (int32_t i = 0; i < batch_size; ++i) {
-     const ContextState *context_state;
+     const ContextState *context_state = nullptr;
     if (ss != nullptr) {
       context_graphs[i] =
           ss[packed_encoder_out.sorted_indexes[i]]->GetContextGraph();
--- a/sherpa-onnx/csrc/offline-tts-character-frontend.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/offline-tts-character-frontend.cc
查看文件 @a11c859
@@ -30,7 +30,7 @@ static std::unordered_map<char32_t, int32_t> ReadTokens(std::istream &is) {
 
   std::string sym;
   std::u32string s;
-   int32_t id;
+   int32_t id = 0;
   while (std::getline(is, line)) {
     std::istringstream iss(line);
     iss >> sym;
@@ -138,6 +138,7 @@ OfflineTtsCharacterFrontend::ConvertTextToTokenIds(
         }
 
         ans.push_back(std::move(this_sentence));
+         this_sentence = {};
 
         // re-initialize this_sentence
         if (use_eos_bos) {
@@ -172,6 +173,7 @@ OfflineTtsCharacterFrontend::ConvertTextToTokenIds(
         }
 
         ans.push_back(std::move(this_sentence));
+         this_sentence = {};
 
         // re-initialize this_sentence
         if (use_eos_bos) {
--- a/sherpa-onnx/csrc/offline-tts.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/offline-tts.cc
查看文件 @a11c859
@@ -5,6 +5,7 @@
 #include "sherpa-onnx/csrc/offline-tts.h"
 
 #include <string>
+ #include <utility>
 
 #include "sherpa-onnx/csrc/file-utils.h"
 #include "sherpa-onnx/csrc/macros.h"
@@ -87,7 +88,7 @@ OfflineTts::~OfflineTts() = default;
 GeneratedAudio OfflineTts::Generate(
     const std::string &text, int64_t sid /*=0*/, float speed /*= 1.0*/,
     GeneratedAudioCallback callback /*= nullptr*/) const {
-   return impl_->Generate(text, sid, speed, callback);
+   return impl_->Generate(text, sid, speed, std::move(callback));
 }
 
 int32_t OfflineTts::SampleRate() const { return impl_->SampleRate(); }
--- a/sherpa-onnx/csrc/offline-whisper-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/offline-whisper-model.cc
查看文件 @a11c859
@@ -22,9 +22,9 @@ class OfflineWhisperModel::Impl {
   explicit Impl(const OfflineModelConfig &config)
       : config_(config),
         env_(ORT_LOGGING_LEVEL_ERROR),
+         debug_(config.debug),
         sess_opts_(GetSessionOptions(config)),
         allocator_{} {
-     debug_ = config_.debug;
     {
       auto buf = ReadFile(config.whisper.encoder);
       InitEncoder(buf.data(), buf.size());
@@ -39,9 +39,9 @@ class OfflineWhisperModel::Impl {
   explicit Impl(const SpokenLanguageIdentificationConfig &config)
       : lid_config_(config),
         env_(ORT_LOGGING_LEVEL_ERROR),
+         debug_(config_.debug),
         sess_opts_(GetSessionOptions(config)),
         allocator_{} {
-     debug_ = config_.debug;
     {
       auto buf = ReadFile(config.whisper.encoder);
       InitEncoder(buf.data(), buf.size());
@@ -148,7 +148,6 @@ class OfflineWhisperModel::Impl {
     cross_v = std::move(std::get<4>(decoder_out));
 
     const float *p_logits = std::get<0>(decoder_out).GetTensorData<float>();
-     int32_t vocab_size = VocabSize();
     const auto &all_language_ids = GetAllLanguageIDs();
 
     int32_t lang_id = all_language_ids[0];
@@ -317,18 +316,18 @@ class OfflineWhisperModel::Impl {
   std::unordered_map<int32_t, std::string> id2lang_;
 
   // model meta data
-   int32_t n_text_layer_;
-   int32_t n_text_ctx_;
-   int32_t n_text_state_;
-   int32_t n_vocab_;
-   int32_t sot_;
-   int32_t eot_;
-   int32_t blank_;
-   int32_t translate_;
-   int32_t transcribe_;
-   int32_t no_timestamps_;
-   int32_t no_speech_;
-   int32_t is_multilingual_;
+   int32_t n_text_layer_ = 0;
+   int32_t n_text_ctx_ = 0;
+   int32_t n_text_state_ = 0;
+   int32_t n_vocab_ = 0;
+   int32_t sot_ = 0;
+   int32_t eot_ = 0;
+   int32_t blank_ = 0;
+   int32_t translate_ = 0;
+   int32_t transcribe_ = 0;
+   int32_t no_timestamps_ = 0;
+   int32_t no_speech_ = 0;
+   int32_t is_multilingual_ = 0;
   std::vector<int64_t> sot_sequence_;
 };
 
--- a/sherpa-onnx/csrc/online-conformer-transducer-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-conformer-transducer-model.cc
查看文件 @a11c859
@@ -4,9 +4,8 @@
 
 #include "sherpa-onnx/csrc/online-conformer-transducer-model.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <memory>
 #include <sstream>
 #include <string>
--- a/sherpa-onnx/csrc/online-ctc-fst-decoder.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-ctc-fst-decoder.cc
查看文件 @a11c859
@@ -52,8 +52,9 @@ static void DecodeOne(const float *log_probs, int32_t num_rows,
     if (ok) {
       std::vector<int32_t> isymbols_out;
       std::vector<int32_t> osymbols_out;
-       ok = fst::GetLinearSymbolSequence(fst_out, &isymbols_out, &osymbols_out,
-                                         nullptr);
+       /*ok =*/fst::GetLinearSymbolSequence(fst_out, &isymbols_out,
+                                            &osymbols_out, nullptr);
+       // TODO(fangjun): handle ok is false
       std::vector<int64_t> tokens;
       tokens.reserve(isymbols_out.size());
 
--- a/sherpa-onnx/csrc/online-lstm-transducer-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-lstm-transducer-model.cc
查看文件 @a11c859
@@ -3,9 +3,8 @@
 // Copyright (c)  2023  Xiaomi Corporation
 #include "sherpa-onnx/csrc/online-lstm-transducer-model.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <memory>
 #include <sstream>
 #include <string>
--- a/sherpa-onnx/csrc/online-nemo-ctc-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-nemo-ctc-model.cc
查看文件 @a11c859
@@ -265,16 +265,16 @@ class OnlineNeMoCtcModel::Impl {
   std::vector<std::string> output_names_;
   std::vector<const char *> output_names_ptr_;
 
-   int32_t window_size_;
-   int32_t chunk_shift_;
-   int32_t subsampling_factor_;
-   int32_t vocab_size_;
-   int32_t cache_last_channel_dim1_;
-   int32_t cache_last_channel_dim2_;
-   int32_t cache_last_channel_dim3_;
-   int32_t cache_last_time_dim1_;
-   int32_t cache_last_time_dim2_;
-   int32_t cache_last_time_dim3_;
+   int32_t window_size_ = 0;
+   int32_t chunk_shift_ = 0;
+   int32_t subsampling_factor_ = 0;
+   int32_t vocab_size_ = 0;
+   int32_t cache_last_channel_dim1_ = 0;
+   int32_t cache_last_channel_dim2_ = 0;
+   int32_t cache_last_channel_dim3_ = 0;
+   int32_t cache_last_time_dim1_ = 0;
+   int32_t cache_last_time_dim2_ = 0;
+   int32_t cache_last_time_dim3_ = 0;
 
   Ort::Value cache_last_channel_{nullptr};
   Ort::Value cache_last_time_{nullptr};
--- a/sherpa-onnx/csrc/online-recognizer.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-recognizer.cc
查看文件 @a11c859
@@ -5,9 +5,8 @@
 
 #include "sherpa-onnx/csrc/online-recognizer.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <iomanip>
 #include <memory>
 #include <sstream>
--- a/sherpa-onnx/csrc/online-stream.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-stream.cc
查看文件 @a11c859
@@ -8,6 +8,7 @@
 #include <vector>
 
 #include "sherpa-onnx/csrc/features.h"
+ #include "sherpa-onnx/csrc/transducer-keyword-decoder.h"
 
 namespace sherpa_onnx {
 
@@ -15,7 +16,7 @@ class OnlineStream::Impl {
  public:
   explicit Impl(const FeatureExtractorConfig &config,
                 ContextGraphPtr context_graph)
-       : feat_extractor_(config), context_graph_(context_graph) {}
+       : feat_extractor_(config), context_graph_(std::move(context_graph)) {}
 
   void AcceptWaveform(int32_t sampling_rate, const float *waveform, int32_t n) {
     feat_extractor_.AcceptWaveform(sampling_rate, waveform, n);
@@ -146,7 +147,7 @@ class OnlineStream::Impl {
 
 OnlineStream::OnlineStream(const FeatureExtractorConfig &config /*= {}*/,
                            ContextGraphPtr context_graph /*= nullptr */)
-     : impl_(std::make_unique<Impl>(config, context_graph)) {}
+     : impl_(std::make_unique<Impl>(config, std::move(context_graph))) {}
 
 OnlineStream::~OnlineStream() = default;
 
--- a/sherpa-onnx/csrc/online-stream.h
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-stream.h
查看文件 @a11c859
@@ -15,7 +15,6 @@
 #include "sherpa-onnx/csrc/online-ctc-decoder.h"
 #include "sherpa-onnx/csrc/online-paraformer-decoder.h"
 #include "sherpa-onnx/csrc/online-transducer-decoder.h"
- #include "sherpa-onnx/csrc/transducer-keyword-decoder.h"
 
 namespace sherpa_onnx {
 
--- a/sherpa-onnx/csrc/online-transducer-decoder.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-transducer-decoder.cc
查看文件 @a11c859
@@ -45,13 +45,13 @@ OnlineTransducerDecoderResult &OnlineTransducerDecoderResult::operator=(
 }
 
 OnlineTransducerDecoderResult::OnlineTransducerDecoderResult(
-     OnlineTransducerDecoderResult &&other)
+     OnlineTransducerDecoderResult &&other) noexcept
     : OnlineTransducerDecoderResult() {
   *this = std::move(other);
 }
 
 OnlineTransducerDecoderResult &OnlineTransducerDecoderResult::operator=(
-     OnlineTransducerDecoderResult &&other) {
+     OnlineTransducerDecoderResult &&other) noexcept {
   if (this == &other) {
     return *this;
   }
--- a/sherpa-onnx/csrc/online-transducer-decoder.h
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-transducer-decoder.h
查看文件 @a11c859
@@ -44,10 +44,10 @@ struct OnlineTransducerDecoderResult {
   OnlineTransducerDecoderResult &operator=(
       const OnlineTransducerDecoderResult &other);
 
-   OnlineTransducerDecoderResult(OnlineTransducerDecoderResult &&other);
+   OnlineTransducerDecoderResult(OnlineTransducerDecoderResult &&other) noexcept;
 
   OnlineTransducerDecoderResult &operator=(
-       OnlineTransducerDecoderResult &&other);
+       OnlineTransducerDecoderResult &&other) noexcept;
 };
 
 class OnlineStream;
--- a/sherpa-onnx/csrc/online-transducer-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-transducer-model.cc
查看文件 @a11c859
@@ -23,7 +23,7 @@
 
 namespace {
 
- enum class ModelType {
+ enum class ModelType : std::uint8_t {
   kConformer,
   kLstm,
   kZipformer,
--- a/sherpa-onnx/csrc/online-transducer-nemo-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-transducer-nemo-model.cc
查看文件 @a11c859
@@ -5,10 +5,9 @@
 
 #include "sherpa-onnx/csrc/online-transducer-nemo-model.h"
 
- #include <assert.h>
- #include <math.h>
- 
 #include <algorithm>
+ #include <cassert>
+ #include <cmath>
 #include <memory>
 #include <numeric>
 #include <sstream>
@@ -429,8 +428,8 @@ class OnlineTransducerNeMoModel::Impl {
   std::vector<std::string> joiner_output_names_;
   std::vector<const char *> joiner_output_names_ptr_;
 
-   int32_t window_size_;
-   int32_t chunk_shift_;
+   int32_t window_size_ = 0;
+   int32_t chunk_shift_ = 0;
   int32_t vocab_size_ = 0;
   int32_t subsampling_factor_ = 8;
   std::string normalize_type_;
@@ -438,12 +437,12 @@ class OnlineTransducerNeMoModel::Impl {
   int32_t pred_hidden_ = -1;
 
   // encoder states
-   int32_t cache_last_channel_dim1_;
-   int32_t cache_last_channel_dim2_;
-   int32_t cache_last_channel_dim3_;
-   int32_t cache_last_time_dim1_;
-   int32_t cache_last_time_dim2_;
-   int32_t cache_last_time_dim3_;
+   int32_t cache_last_channel_dim1_ = 0;
+   int32_t cache_last_channel_dim2_ = 0;
+   int32_t cache_last_channel_dim3_ = 0;
+   int32_t cache_last_time_dim1_ = 0;
+   int32_t cache_last_time_dim2_ = 0;
+   int32_t cache_last_time_dim3_ = 0;
 
   // init encoder states
   Ort::Value cache_last_channel_{nullptr};
--- a/sherpa-onnx/csrc/online-wenet-ctc-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-wenet-ctc-model.cc
查看文件 @a11c859
@@ -192,15 +192,15 @@ class OnlineWenetCtcModel::Impl {
   std::vector<std::string> output_names_;
   std::vector<const char *> output_names_ptr_;
 
-   int32_t head_;
-   int32_t num_blocks_;
-   int32_t output_size_;
-   int32_t cnn_module_kernel_;
-   int32_t right_context_;
-   int32_t subsampling_factor_;
-   int32_t vocab_size_;
- 
-   int32_t required_cache_size_;
+   int32_t head_ = 0;
+   int32_t num_blocks_ = 0;
+   int32_t output_size_ = 0;
+   int32_t cnn_module_kernel_ = 0;
+   int32_t right_context_ = 0;
+   int32_t subsampling_factor_ = 0;
+   int32_t vocab_size_ = 0;
+ 
+   int32_t required_cache_size_ = 0;
 
   Ort::Value attn_cache_{nullptr};
   Ort::Value conv_cache_{nullptr};
--- a/sherpa-onnx/csrc/online-zipformer-transducer-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-zipformer-transducer-model.cc
查看文件 @a11c859
@@ -4,9 +4,8 @@
 
 #include "sherpa-onnx/csrc/online-zipformer-transducer-model.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <memory>
 #include <sstream>
 #include <string>
--- a/sherpa-onnx/csrc/online-zipformer2-ctc-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-zipformer2-ctc-model.cc
查看文件 @a11c859
@@ -4,10 +4,8 @@
 
 #include "sherpa-onnx/csrc/online-zipformer2-ctc-model.h"
 
- #include <assert.h>
- #include <math.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <cmath>
 #include <numeric>
 #include <string>
@@ -90,7 +88,6 @@ class OnlineZipformer2CtcModel::Impl {
   std::vector<Ort::Value> StackStates(
       std::vector<std::vector<Ort::Value>> states) const {
     int32_t batch_size = static_cast<int32_t>(states.size());
-     int32_t num_encoders = static_cast<int32_t>(num_encoder_layers_.size());
 
     std::vector<const Ort::Value *> buf(batch_size);
 
@@ -168,7 +165,6 @@ class OnlineZipformer2CtcModel::Impl {
     assert(states.size() == m * 6 + 2);
 
     int32_t batch_size = states[0].GetTensorTypeAndShapeInfo().GetShape()[1];
-     int32_t num_encoders = num_encoder_layers_.size();
 
     std::vector<std::vector<Ort::Value>> ans;
     ans.resize(batch_size);
--- a/sherpa-onnx/csrc/online-zipformer2-transducer-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/online-zipformer2-transducer-model.cc
查看文件 @a11c859
@@ -4,10 +4,9 @@
 
 #include "sherpa-onnx/csrc/online-zipformer2-transducer-model.h"
 
- #include <assert.h>
- #include <math.h>
- 
 #include <algorithm>
+ #include <cassert>
+ #include <cmath>
 #include <memory>
 #include <numeric>
 #include <sstream>
--- a/sherpa-onnx/csrc/onnx-utils.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/onnx-utils.cc
查看文件 @a11c859
@@ -281,11 +281,12 @@ CopyableOrtValue &CopyableOrtValue::operator=(const CopyableOrtValue &other) {
   return *this;
 }
 
- CopyableOrtValue::CopyableOrtValue(CopyableOrtValue &&other) {
+ CopyableOrtValue::CopyableOrtValue(CopyableOrtValue &&other) noexcept {
   *this = std::move(other);
 }
 
- CopyableOrtValue &CopyableOrtValue::operator=(CopyableOrtValue &&other) {
+ CopyableOrtValue &CopyableOrtValue::operator=(
+     CopyableOrtValue &&other) noexcept {
   if (this == &other) {
     return *this;
   }
--- a/sherpa-onnx/csrc/onnx-utils.h
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/onnx-utils.h
查看文件 @a11c859
@@ -110,9 +110,9 @@ struct CopyableOrtValue {
 
   CopyableOrtValue &operator=(const CopyableOrtValue &other);
 
-   CopyableOrtValue(CopyableOrtValue &&other);
+   CopyableOrtValue(CopyableOrtValue &&other) noexcept;
 
-   CopyableOrtValue &operator=(CopyableOrtValue &&other);
+   CopyableOrtValue &operator=(CopyableOrtValue &&other) noexcept;
 };
 
 std::vector<CopyableOrtValue> Convert(std::vector<Ort::Value> values);
--- a/sherpa-onnx/csrc/packed-sequence.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/packed-sequence.cc
查看文件 @a11c859
@@ -4,9 +4,8 @@
 
 #include "sherpa-onnx/csrc/packed-sequence.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <numeric>
 #include <utility>
 
@@ -57,7 +56,7 @@ PackedSequence PackPaddedSequence(OrtAllocator *allocator,
 
   int64_t max_T = p_length[indexes[0]];
 
-   int32_t sum_T = std::accumulate(p_length, p_length + n, 0);
+   auto sum_T = std::accumulate(p_length, p_length + n, static_cast<int64_t>(0));
 
   std::array<int64_t, 2> data_shape{sum_T, v_shape[2]};
 
--- a/sherpa-onnx/csrc/pad-sequence.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/pad-sequence.cc
查看文件 @a11c859
@@ -4,9 +4,8 @@
 
 #include "sherpa-onnx/csrc/pad-sequence.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <vector>
 
 namespace sherpa_onnx {
--- a/sherpa-onnx/csrc/parse-options.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/parse-options.cc
查看文件 @a11c859
@@ -11,9 +11,8 @@
 
 #include "sherpa-onnx/csrc/parse-options.h"
 
- #include <ctype.h>
- 
 #include <algorithm>
+ #include <array>
 #include <cctype>
 #include <cstring>
 #include <fstream>
@@ -33,7 +32,7 @@ ParseOptions::ParseOptions(const std::string &prefix, ParseOptions *po)
   } else {
     other_parser_ = po;
   }
-   if (po != nullptr && po->prefix_ != "") {
+   if (po != nullptr && !po->prefix_.empty()) {
     prefix_ = po->prefix_ + std::string(".") + prefix;
   } else {
     prefix_ = prefix;
@@ -179,10 +178,10 @@ void ParseOptions::DisableOption(const std::string &name) {
   string_map_.erase(name);
 }
 
- int ParseOptions::NumArgs() const { return positional_args_.size(); }
+ int32_t ParseOptions::NumArgs() const { return positional_args_.size(); }
 
- std::string ParseOptions::GetArg(int i) const {
-   if (i < 1 || i > static_cast<int>(positional_args_.size())) {
+ std::string ParseOptions::GetArg(int32_t i) const {
+   if (i < 1 || i > static_cast<int32_t>(positional_args_.size())) {
     SHERPA_ONNX_LOGE("ParseOptions::GetArg, invalid index %d", i);
     exit(-1);
   }
@@ -191,7 +190,7 @@ std::string ParseOptions::GetArg(int i) const {
 }
 
 // We currently do not support any other options.
- enum ShellType { kBash = 0 };
+ enum ShellType : std::uint8_t { kBash = 0 };
 
 // This can be changed in the code if it ever does need to be changed (as it's
 // unlikely that one compilation of this tool-set would use both shells).
@@ -213,7 +212,7 @@ static bool MustBeQuoted(const std::string &str, ShellType st) {
   if (*c == '\0') {
     return true;  // Must quote empty string
   } else {
-     const char *ok_chars[2];
+     std::array<const char *, 2> ok_chars{};
 
     // These seem not to be interpreted as long as there are no other "bad"
     // characters involved (e.g. "," would be interpreted as part of something
@@ -229,7 +228,7 @@ static bool MustBeQuoted(const std::string &str, ShellType st) {
       // are OK. All others are forbidden (this is easier since the shell
       // interprets most non-alphanumeric characters).
       if (!isalnum(*c)) {
-         const char *d;
+         const char *d = nullptr;
         for (d = ok_chars[st]; *d != '\0'; ++d) {
           if (*c == *d) break;
         }
@@ -269,22 +268,22 @@ static std::string QuoteAndEscape(const std::string &str, ShellType /*st*/) {
     escape_str = "\\\"";  // should never be accessed.
   }
 
-   char buf[2];
+   std::array<char, 2> buf{};
   buf[1] = '\0';
 
   buf[0] = quote_char;
-   std::string ans = buf;
+   std::string ans = buf.data();
   const char *c = str.c_str();
   for (; *c != '\0'; ++c) {
     if (*c == quote_char) {
       ans += escape_str;
     } else {
       buf[0] = *c;
-       ans += buf;
+       ans += buf.data();
     }
   }
   buf[0] = quote_char;
-   ans += buf;
+   ans += buf.data();
   return ans;
 }
 
@@ -293,11 +292,11 @@ std::string ParseOptions::Escape(const std::string &str) {
   return MustBeQuoted(str, kShellType) ? QuoteAndEscape(str, kShellType) : str;
 }
 
- int ParseOptions::Read(int argc, const char *const argv[]) {
+ int32_t ParseOptions::Read(int32_t argc, const char *const *argv) {
   argc_ = argc;
   argv_ = argv;
   std::string key, value;
-   int i;
+   int32_t i = 0;
 
   // first pass: look for config parameter, look for priority
   for (i = 1; i < argc; ++i) {
@@ -306,13 +305,13 @@ int ParseOptions::Read(int argc, const char *const argv[]) {
         // a lone "--" marks the end of named options
         break;
       }
-       bool has_equal_sign;
+       bool has_equal_sign = false;
       SplitLongArg(argv[i], &key, &value, &has_equal_sign);
       NormalizeArgName(&key);
       Trim(&value);
-       if (key.compare("config") == 0) {
+       if (key == "config") {
         ReadConfigFile(value);
-       } else if (key.compare("help") == 0) {
+       } else if (key == "help") {
         PrintUsage();
         exit(0);
       }
@@ -330,7 +329,7 @@ int ParseOptions::Read(int argc, const char *const argv[]) {
         double_dash_seen = true;
         break;
       }
-       bool has_equal_sign;
+       bool has_equal_sign = false;
       SplitLongArg(argv[i], &key, &value, &has_equal_sign);
       NormalizeArgName(&key);
       Trim(&value);
@@ -349,14 +348,14 @@ int ParseOptions::Read(int argc, const char *const argv[]) {
     if ((std::strcmp(argv[i], "--") == 0) && !double_dash_seen) {
       double_dash_seen = true;
     } else {
-       positional_args_.push_back(std::string(argv[i]));
+       positional_args_.emplace_back(argv[i]);
     }
   }
 
   // if the user did not suppress this with --print-args = false....
   if (print_args_) {
     std::ostringstream strm;
-     for (int j = 0; j < argc; ++j) strm << Escape(argv[j]) << " ";
+     for (int32_t j = 0; j < argc; ++j) strm << Escape(argv[j]) << " ";
     strm << '\n';
     SHERPA_ONNX_LOGE("%s", strm.str().c_str());
   }
@@ -368,14 +367,14 @@ void ParseOptions::PrintUsage(bool print_command_line /*=false*/) const {
   os << '\n' << usage_ << '\n';
   // first we print application-specific options
   bool app_specific_header_printed = false;
-   for (auto it = doc_map_.begin(); it != doc_map_.end(); ++it) {
-     if (it->second.is_standard_ == false) {  // application-specific option
+   for (const auto &it : doc_map_) {
+     if (it.second.is_standard_ == false) {  // application-specific option
       if (app_specific_header_printed == false) {  // header was not yet printed
         os << "Options:" << '\n';
         app_specific_header_printed = true;
       }
-       os << "  --" << std::setw(25) << std::left << it->second.name_ << " : "
-          << it->second.use_msg_ << '\n';
+       os << "  --" << std::setw(25) << std::left << it.second.name_ << " : "
+          << it.second.use_msg_ << '\n';
     }
   }
   if (app_specific_header_printed == true) {
@@ -384,17 +383,17 @@ void ParseOptions::PrintUsage(bool print_command_line /*=false*/) const {
 
   // then the standard options
   os << "Standard options:" << '\n';
-   for (auto it = doc_map_.begin(); it != doc_map_.end(); ++it) {
-     if (it->second.is_standard_ == true) {  // we have standard option
-       os << "  --" << std::setw(25) << std::left << it->second.name_ << " : "
-          << it->second.use_msg_ << '\n';
+   for (const auto &it : doc_map_) {
+     if (it.second.is_standard_ == true) {  // we have standard option
+       os << "  --" << std::setw(25) << std::left << it.second.name_ << " : "
+          << it.second.use_msg_ << '\n';
     }
   }
   os << '\n';
   if (print_command_line) {
     std::ostringstream strm;
     strm << "Command line was: ";
-     for (int j = 0; j < argc_; ++j) strm << Escape(argv_[j]) << " ";
+     for (int32_t j = 0; j < argc_; ++j) strm << Escape(argv_[j]) << " ";
     strm << '\n';
     os << strm.str();
   }
@@ -405,9 +404,9 @@ void ParseOptions::PrintUsage(bool print_command_line /*=false*/) const {
 void ParseOptions::PrintConfig(std::ostream &os) const {
   os << '\n' << "[[ Configuration of UI-Registered options ]]" << '\n';
   std::string key;
-   for (auto it = doc_map_.begin(); it != doc_map_.end(); ++it) {
-     key = it->first;
-     os << it->second.name_ << " = ";
+   for (const auto &it : doc_map_) {
+     key = it.first;
+     os << it.second.name_ << " = ";
     if (bool_map_.end() != bool_map_.find(key)) {
       os << (*bool_map_.at(key) ? "true" : "false");
     } else if (int_map_.end() != int_map_.find(key)) {
@@ -442,13 +441,13 @@ void ParseOptions::ReadConfigFile(const std::string &filename) {
   while (std::getline(is, line)) {
     ++line_number;
     // trim out the comments
-     size_t pos;
-     if ((pos = line.find_first_of('#')) != std::string::npos) {
+     size_t pos = line.find_first_of('#');
+     if (pos != std::string::npos) {
       line.erase(pos);
     }
     // skip empty lines
     Trim(&line);
-     if (line.length() == 0) continue;
+     if (line.empty()) continue;
 
     if (line.substr(0, 2) != "--") {
       SHERPA_ONNX_LOGE(
@@ -461,7 +460,7 @@ void ParseOptions::ReadConfigFile(const std::string &filename) {
     }
 
     // parse option
-     bool has_equal_sign;
+     bool has_equal_sign = false;
     SplitLongArg(line, &key, &value, &has_equal_sign);
     NormalizeArgName(&key);
     Trim(&value);
@@ -527,7 +526,7 @@ void ParseOptions::Trim(std::string *str) const {
 bool ParseOptions::SetOption(const std::string &key, const std::string &value,
                              bool has_equal_sign) {
   if (bool_map_.end() != bool_map_.find(key)) {
-     if (has_equal_sign && value == "") {
+     if (has_equal_sign && value.empty()) {
       SHERPA_ONNX_LOGE("Invalid option --%s=", key.c_str());
       exit(-1);
     }
@@ -557,12 +556,10 @@ bool ParseOptions::ToBool(std::string str) const {
   std::transform(str.begin(), str.end(), str.begin(), ::tolower);
 
   // allow "" as a valid option for "true", so that --x is the same as --x=true
-   if ((str.compare("true") == 0) || (str.compare("t") == 0) ||
-       (str.compare("1") == 0) || (str.compare("") == 0)) {
+   if (str == "true" || str == "t" || str == "1" || str.empty()) {
     return true;
   }
-   if ((str.compare("false") == 0) || (str.compare("f") == 0) ||
-       (str.compare("0") == 0)) {
+   if (str == "false" || str == "f" || str == "0") {
     return false;
   }
   // if it is neither true nor false:
@@ -593,7 +590,7 @@ uint32_t ParseOptions::ToUint(const std::string &str) const {
 }
 
 float ParseOptions::ToFloat(const std::string &str) const {
-   float ret;
+   float ret = 0;
   if (!ConvertStringToReal(str, &ret)) {
     SHERPA_ONNX_LOGE("Invalid floating-point option \"%s\"", str.c_str());
     exit(-1);
@@ -602,7 +599,7 @@ float ParseOptions::ToFloat(const std::string &str) const {
 }
 
 double ParseOptions::ToDouble(const std::string &str) const {
-   double ret;
+   double ret = 0;
   if (!ConvertStringToReal(str, &ret)) {
     SHERPA_ONNX_LOGE("Invalid floating-point option \"%s\"", str.c_str());
     exit(-1);
--- a/sherpa-onnx/csrc/piper-phonemize-lexicon.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/piper-phonemize-lexicon.cc
查看文件 @a11c859
@@ -37,7 +37,7 @@ static std::unordered_map<char32_t, int32_t> ReadTokens(std::istream &is) {
 
   std::string sym;
   std::u32string s;
-   int32_t id;
+   int32_t id = 0;
   while (std::getline(is, line)) {
     std::istringstream iss(line);
     iss >> sym;
--- a/sherpa-onnx/csrc/resample.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/resample.cc
查看文件 @a11c859
@@ -24,10 +24,9 @@
 
 #include "sherpa-onnx/csrc/resample.h"
 
- #include <assert.h>
- #include <math.h>
- #include <stdio.h>
- 
+ #include <cassert>
+ #include <cmath>
+ #include <cstdio>
 #include <cstdlib>
 #include <type_traits>
 
@@ -54,8 +53,8 @@ I Gcd(I m, I n) {
   }
   // could use compile-time assertion
   // but involves messing with complex template stuff.
-   static_assert(std::is_integral<I>::value, "");
-   while (1) {
+   static_assert(std::is_integral_v<I>);
+   while (true) {
     m %= n;
     if (m == 0) return (n > 0 ? n : -n);
     n %= m;
@@ -139,10 +138,10 @@ void LinearResample::SetIndexesAndWeights() {
     in the header as h(t) = f(t)g(t), evaluated at t.
 */
 float LinearResample::FilterFunc(float t) const {
-   float window,  // raised-cosine (Hanning) window of width
+   float window = 0,  // raised-cosine (Hanning) window of width
                      // num_zeros_/2*filter_cutoff_
-       filter;    // sinc filter function
-   if (fabs(t) < num_zeros_ / (2.0 * filter_cutoff_))
+       filter = 0;    // sinc filter function
+   if (std::fabs(t) < num_zeros_ / (2.0 * filter_cutoff_))
     window = 0.5 * (1 + cos(M_2PI * filter_cutoff_ / num_zeros_ * t));
   else
     window = 0.0;  // outside support of window function
@@ -172,15 +171,15 @@ void LinearResample::Resample(const float *input, int32_t input_dim, bool flush,
   // of it we are producing here.
   for (int64_t samp_out = output_sample_offset_; samp_out < tot_output_samp;
        samp_out++) {
-     int64_t first_samp_in;
-     int32_t samp_out_wrapped;
+     int64_t first_samp_in = 0;
+     int32_t samp_out_wrapped = 0;
     GetIndexes(samp_out, &first_samp_in, &samp_out_wrapped);
     const std::vector<float> &weights = weights_[samp_out_wrapped];
     // first_input_index is the first index into "input" that we have a weight
     // for.
     int32_t first_input_index =
         static_cast<int32_t>(first_samp_in - input_sample_offset_);
-     float this_output;
+     float this_output = 0;
     if (first_input_index >= 0 &&
         first_input_index + static_cast<int32_t>(weights.size()) <= input_dim) {
       this_output =
@@ -239,7 +238,7 @@ int64_t LinearResample::GetNumOutputSamples(int64_t input_num_samp,
     // largest integer in the interval [ 0, 2 - 0.9 ) are the same (both one).
     // So when we're subtracting the window-width we can ignore the fractional
     // part.
-     int32_t window_width_ticks = floor(window_width * tick_freq);
+     int32_t window_width_ticks = std::floor(window_width * tick_freq);
     // The time-period of the output that we can sample gets reduced
     // by the window-width (which is actually the distance from the
     // center to the edge of the windowing function) if we're not
@@ -287,7 +286,7 @@ void LinearResample::SetRemainder(const float *input, int32_t input_dim) {
   // that are "in the past" relative to the beginning of the latest
   // input... anyway, storing more remainder than needed is not harmful.
   int32_t max_remainder_needed =
-       ceil(samp_rate_in_ * num_zeros_ / filter_cutoff_);
+       std::ceil(samp_rate_in_ * num_zeros_ / filter_cutoff_);
   input_remainder_.resize(max_remainder_needed);
   for (int32_t index = -static_cast<int32_t>(input_remainder_.size());
        index < 0; index++) {
--- a/sherpa-onnx/csrc/resample.h
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/resample.h
查看文件 @a11c859
@@ -130,10 +130,10 @@ class LinearResample {
   // the following variables keep track of where we are in a particular signal,
   // if it is being provided over multiple calls to Resample().
 
-   int64_t input_sample_offset_;   ///< The number of input samples we have
+   int64_t input_sample_offset_ = 0;   ///< The number of input samples we have
                                       ///< already received for this signal
                                       ///< (including anything in remainder_)
-   int64_t output_sample_offset_;  ///< The number of samples we have already
+   int64_t output_sample_offset_ = 0;  ///< The number of samples we have already
                                       ///< output for this signal.
   std::vector<float> input_remainder_;  ///< A small trailing part of the
                                         ///< previously seen input signal.
--- a/sherpa-onnx/csrc/session.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/session.cc
查看文件 @a11c859
@@ -21,13 +21,13 @@
 
 namespace sherpa_onnx {
 
- 
 static void OrtStatusFailure(OrtStatus *status, const char *s) {
   const auto &api = Ort::GetApi();
   const char *msg = api.GetErrorMessage(status);
   SHERPA_ONNX_LOGE(
       "Failed to enable TensorRT : %s."
-       "Available providers: %s. Fallback to cuda", msg, s);
+       "Available providers: %s. Fallback to cuda",
+       msg, s);
   api.ReleaseStatus(status);
 }
 
@@ -65,8 +65,8 @@ static Ort::SessionOptions GetSessionOptionsImpl(int32_t num_threads,
     }
     case Provider::kTRT: {
       struct TrtPairs {
-         const char* op_keys;
-         const char* op_values;
+         const char *op_keys;
+         const char *op_values;
       };
 
       std::vector<TrtPairs> trt_options = {
@@ -79,15 +79,14 @@ static Ort::SessionOptions GetSessionOptionsImpl(int32_t num_threads,
           {"trt_engine_cache_enable", "1"},
           {"trt_engine_cache_path", "."},
           {"trt_timing_cache_enable", "1"},
-         {"trt_timing_cache_path", "."}
-       };
+           {"trt_timing_cache_path", "."}};
       // ToDo : Trt configs
       // "trt_int8_enable"
       // "trt_int8_use_native_calibration_table"
       // "trt_dump_subgraphs"
 
-       std::vector<const char*> option_keys, option_values;
-       for (const TrtPairs& pair : trt_options) {
+       std::vector<const char *> option_keys, option_values;
+       for (const TrtPairs &pair : trt_options) {
         option_keys.emplace_back(pair.op_keys);
         option_values.emplace_back(pair.op_values);
       }
@@ -96,18 +95,22 @@ static Ort::SessionOptions GetSessionOptionsImpl(int32_t num_threads,
           Ort::GetAvailableProviders();
       if (std::find(available_providers.begin(), available_providers.end(),
                     "TensorrtExecutionProvider") != available_providers.end()) {
-         const auto& api = Ort::GetApi();
+         const auto &api = Ort::GetApi();
 
-         OrtTensorRTProviderOptionsV2* tensorrt_options;
-         OrtStatus *statusC = api.CreateTensorRTProviderOptions(
-                                     &tensorrt_options);
+         OrtTensorRTProviderOptionsV2 *tensorrt_options = nullptr;
+         OrtStatus *statusC =
+             api.CreateTensorRTProviderOptions(&tensorrt_options);
         OrtStatus *statusU = api.UpdateTensorRTProviderOptions(
             tensorrt_options, option_keys.data(), option_values.data(),
             option_keys.size());
         sess_opts.AppendExecutionProvider_TensorRT_V2(*tensorrt_options);
 
-         if (statusC) { OrtStatusFailure(statusC, os.str().c_str()); }
-         if (statusU) { OrtStatusFailure(statusU, os.str().c_str()); }
+         if (statusC) {
+           OrtStatusFailure(statusC, os.str().c_str());
+         }
+         if (statusU) {
+           OrtStatusFailure(statusU, os.str().c_str());
+         }
 
         api.ReleaseTensorRTProviderOptions(tensorrt_options);
       }
--- a/sherpa-onnx/csrc/silero-vad-model.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/silero-vad-model.cc
查看文件 @a11c859
@@ -20,11 +20,11 @@ class SileroVadModel::Impl {
       : config_(config),
         env_(ORT_LOGGING_LEVEL_ERROR),
         sess_opts_(GetSessionOptions(config)),
-         allocator_{} {
+         allocator_{},
+         sample_rate_(config.sample_rate) {
     auto buf = ReadFile(config.silero_vad.model);
     Init(buf.data(), buf.size());
 
-     sample_rate_ = config.sample_rate;
     if (sample_rate_ != 16000) {
       SHERPA_ONNX_LOGE("Expected sample rate 16000. Given: %d",
                        config.sample_rate);
--- a/sherpa-onnx/csrc/slice.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/slice.cc
查看文件 @a11c859
@@ -4,9 +4,8 @@
 
 #include "sherpa-onnx/csrc/slice.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <vector>
 
 namespace sherpa_onnx {
--- a/sherpa-onnx/csrc/speaker-embedding-extractor-impl.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/speaker-embedding-extractor-impl.cc
查看文件 @a11c859
@@ -12,7 +12,7 @@ namespace sherpa_onnx {
 
 namespace {
 
- enum class ModelType {
+ enum class ModelType : std::uint8_t {
   kWeSpeaker,
   k3dSpeaker,
   kNeMo,
--- a/sherpa-onnx/csrc/speaker-embedding-manager.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/speaker-embedding-manager.cc
查看文件 @a11c859
@@ -122,7 +122,7 @@ class SpeakerEmbeddingManager::Impl {
 
     Eigen::VectorXf scores = embedding_matrix_ * v;
 
-     Eigen::VectorXf::Index max_index;
+     Eigen::VectorXf::Index max_index = 0;
     float max_score = scores.maxCoeff(&max_index);
     if (max_score < threshold) {
       return {};
@@ -178,11 +178,12 @@ class SpeakerEmbeddingManager::Impl {
 
   std::vector<std::string> GetAllSpeakers() const {
     std::vector<std::string> all_speakers;
+     all_speakers.reserve(name2row_.size());
     for (const auto &p : name2row_) {
       all_speakers.push_back(p.first);
     }
 
-     std::stable_sort(all_speakers.begin(), all_speakers.end());
+     std::sort(all_speakers.begin(), all_speakers.end());
     return all_speakers;
   }
 
--- a/sherpa-onnx/csrc/spoken-language-identification-impl.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/spoken-language-identification-impl.cc
查看文件 @a11c859
@@ -18,7 +18,7 @@ namespace sherpa_onnx {
 
 namespace {
 
- enum class ModelType {
+ enum class ModelType : std::uint8_t {
   kWhisper,
   kUnknown,
 };
--- a/sherpa-onnx/csrc/stack.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/stack.cc
查看文件 @a11c859
@@ -71,8 +71,8 @@ Ort::Value Stack(OrtAllocator *allocator,
   T *dst = ans.GetTensorMutableData<T>();
 
   for (int32_t i = 0; i != leading_size; ++i) {
-     for (int32_t n = 0; n != static_cast<int32_t>(values.size()); ++n) {
-       const T *src = values[n]->GetTensorData<T>();
+     for (auto value : values) {
+       const T *src = value->GetTensorData<T>();
       src += i * trailing_size;
 
       std::copy(src, src + trailing_size, dst);
--- a/sherpa-onnx/csrc/symbol-table.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/symbol-table.cc
查看文件 @a11c859
@@ -36,7 +36,7 @@ SymbolTable::SymbolTable(AAssetManager *mgr, const std::string &filename) {
 
 void SymbolTable::Init(std::istream &is) {
   std::string sym;
-   int32_t id;
+   int32_t id = 0;
   while (is >> sym >> id) {
 #if 0
     // we disable the test here since for some multi-lingual BPE models
--- a/sherpa-onnx/csrc/text-utils.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/text-utils.cc
查看文件 @a11c859
@@ -5,9 +5,8 @@
 
 #include "sherpa-onnx/csrc/text-utils.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <cctype>
 #include <cstdint>
 #include <limits>
--- a/sherpa-onnx/csrc/transducer-keyword-decoder.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/transducer-keyword-decoder.cc
查看文件 @a11c859
@@ -151,7 +151,6 @@ void TransducerKeywordDecoder::Decode(
 
       if (matched) {
         float ys_prob = 0.0;
-         int32_t length = best_hyp.ys_probs.size();
         for (int32_t i = 0; i < matched_state->level; ++i) {
           ys_prob += best_hyp.ys_probs[i];
         }
--- a/sherpa-onnx/csrc/transpose.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/transpose.cc
查看文件 @a11c859
@@ -4,9 +4,8 @@
 
 #include "sherpa-onnx/csrc/transpose.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <vector>
 
 namespace sherpa_onnx {
--- a/sherpa-onnx/csrc/unbind.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/unbind.cc
查看文件 @a11c859
@@ -4,9 +4,8 @@
 
 #include "sherpa-onnx/csrc/unbind.h"
 
- #include <assert.h>
- 
 #include <algorithm>
+ #include <cassert>
 #include <functional>
 #include <numeric>
 #include <utility>
--- a/sherpa-onnx/csrc/utils.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/utils.cc
查看文件 @a11c859
@@ -30,7 +30,6 @@ static bool EncodeBase(const std::vector<std::string> &lines,
   std::vector<float> tmp_thresholds;
   std::vector<std::string> tmp_phrases;
 
-   std::string line;
   std::string word;
   bool has_scores = false;
   bool has_thresholds = false;
@@ -72,6 +71,7 @@ static bool EncodeBase(const std::vector<std::string> &lines,
       }
     }
     ids->push_back(std::move(tmp_ids));
+     tmp_ids = {};
     tmp_scores.push_back(score);
     tmp_phrases.push_back(phrase);
     tmp_thresholds.push_back(threshold);
--- a/sherpa-onnx/csrc/wave-reader.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/wave-reader.cc
查看文件 @a11c859
@@ -100,13 +100,13 @@ struct WaveHeader {
   int32_t subchunk2_id;    // a tag of this chunk
   int32_t subchunk2_size;  // size of subchunk2
 };
- static_assert(sizeof(WaveHeader) == 44, "");
+ static_assert(sizeof(WaveHeader) == 44);
 
 // Read a wave file of mono-channel.
 // Return its samples normalized to the range [-1, 1).
 std::vector<float> ReadWaveImpl(std::istream &is, int32_t *sampling_rate,
                                 bool *is_ok) {
-   WaveHeader header;
+   WaveHeader header{};
   is.read(reinterpret_cast<char *>(&header), sizeof(header));
   if (!is) {
     *is_ok = false;
--- a/sherpa-onnx/csrc/wave-writer.cc
查看文件 @a11c859
+++ b/sherpa-onnx/csrc/wave-writer.cc
查看文件 @a11c859
@@ -37,7 +37,7 @@ struct WaveHeader {
 
 bool WriteWave(const std::string &filename, int32_t sampling_rate,
                const float *samples, int32_t n) {
-   WaveHeader header;
+   WaveHeader header{};
   header.chunk_id = 0x46464952;      // FFIR
   header.format = 0x45564157;        // EVAW
   header.subchunk1_id = 0x20746d66;  // "fmt "