danpovey
diff --git a/.clang-tidy b/.clang-tidy
+13 -2
diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
+14 -3
diff --git a/.github/workflows/style_check.yml b/.github/workflows/style_check.yml
+3 -3
diff --git a/.style.yapf b/.style.yapf
+1
diff --git a/k2/csrc/CMakeLists.txt b/k2/csrc/CMakeLists.txt
+4 -1
diff --git a/k2/csrc/determinize.cc b/k2/csrc/determinize.cc
+8 -6
diff --git a/k2/csrc/determinize.h b/k2/csrc/determinize.h
+14 -14
@@ -52,17 +52,28 @@ Checks: >
   -google-readability-braces-around-statements,
   -google-runtime-references,
   cppcoreguidelines-*,
+  -cppcoreguidelines-avoid-c-arrays,
   -cppcoreguidelines-avoid-magic-numbers,
+  -cppcoreguidelines-macro-usage,
+  -cppcoreguidelines-no-malloc,
   -cppcoreguidelines-non-private-member-variables-in-classes,
   -cppcoreguidelines-owning-memory,
   -cppcoreguidelines-pro-bounds-pointer-arithmetic,
-  -cppcoreguidelines-special-member-functions,
+  -cppcoreguidelines-pro-type-const-cast,
+  -cppcoreguidelines-pro-type-member-init,
+  -cppcoreguidelines-pro-type-reinterpret-cast,
   -cppcoreguidelines-pro-type-vararg,
+  -cppcoreguidelines-special-member-functions,
   modernize-*,
+  -modernize-avoid-c-arrays,
+  -modernize-deprecated-headers,
+  -modernize-use-default-member-init,
   -modernize-use-trailing-return-type,
   readability-*,
-  -readability-magic-numbers,
   -readability-braces-around-statements,
+  -readability-isolate-declaration,
+  -readability-magic-numbers,
+  -readability-static-definition-in-anonymous-namespace,
   -readability-uppercase-literal-suffix,
   performance-*,
 
 
@@ -15,19 +15,30 @@ on:
       - master
 
 env:
-  BUILD_TYPE: Release
+  BUILD_TYPE: Debug
 
 jobs:
   build:
     runs-on: ${{ matrix.os }}
     strategy:
       matrix:
-        os: [ubuntu-latest, macOS-latest, windows-latest]
+        os: [ubuntu-latest, macOS-latest] #, windows-latest]
+        python-version: [3.5, 3.6, 3.7, 3.8]
 
     steps:
       # refer to https://github.com/actions/checkout
       - uses: actions/checkout@v2
 
+      - name: Setup Python ${{ matrix.python-version }}
+        uses: actions/setup-python@v1
+        with:
+          python-version: ${{ matrix.python-version }}
+
+      - name: Install Python dependencies
+        run: |
+          python3 -m pip install --upgrade pip
+          python3 -m pip install torch==1.5.0
+
       - name: Create Build Directory
         run: cmake -E make_directory ${{runner.workspace}}/build
 
@@ -44,4 +55,4 @@ jobs:
       - name: Test
         shell: bash
         working-directory: ${{runner.workspace}}/build
-        run: CTEST_OUTPUT_ON_FAILURE=1 ctest --build-config $BUILD_TYPE
+        run: ctest --verbose --build-config $BUILD_TYPE
@@ -41,8 +41,8 @@ jobs:
         run: |
           # stop the build if there are Python syntax errors or undefined names
           flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics
-          # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide
-          flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics
+          # exit-zero treats all errors as warnings.
+          flake8 . --count --exit-zero --max-complexity=10 --max-line-length=79 --statistics
 
           #      - name: Install cppcheck
           #        run: |
@@ -54,7 +54,7 @@ jobs:
           #          cmake ..
           #          make -j
           #          sudo make install
-          
+
       - name: Create Build Directory
         run: cmake -E make_directory ${{runner.workspace}}/build
 
 
@@ -1,2 +1,3 @@
 [style]
 based_on_style = google
+column_limit = 79
@@ -1,13 +1,15 @@
 # please sort the source files alphabetically
 add_library(fsa
   aux_labels.cc
+  determinize.cc
+  fsa.cc
   fsa_algo.cc
   fsa_equivalent.cc
   fsa_renderer.cc
   fsa_util.cc
   properties.cc
+  util.cc
   weights.cc
-  determinize.cc
 )
 
 target_include_directories(fsa PUBLIC ${CMAKE_SOURCE_DIR})
@@ -40,6 +42,7 @@ set(fsa_tests
   fsa_algo_test
   fsa_equivalent_test
   fsa_renderer_test
+  fsa_test
   fsa_util_test
   properties_test
   weights_test
 
@@ -74,8 +74,9 @@ void TraceBack(std::unordered_set<LogSumTracebackState *> *cur_states,
   for (int32_t i = 0; i < num_steps; i++) {
     for (LogSumTracebackState *state_ptr : *cur_states) {
       double backward_prob = state_ptr->backward_prob;
-      for (auto link : state_ptr->prev_elements) {
-        float arc_log_posterior = link.forward_prob + backward_prob;
+      for (const auto &link : state_ptr->prev_elements) {
+        auto arc_log_posterior =
+            static_cast<float>(link.forward_prob + backward_prob);
         deriv_out->push_back(
             std::pair<int32_t, float>(link.arc_index, expf(arc_log_posterior)));
         LogSumTracebackState *prev_state = link.prev_state.get();
@@ -96,7 +97,7 @@ void TraceBack(std::unordered_set<LogSumTracebackState *> *cur_states,
   // algorithm.
   CHECK_EQ(cur_states->size(), 1);
   double prev_forward_prob = (*(cur_states->begin()))->forward_prob;
-  *weight_out = cur_forward_prob - prev_forward_prob;
+  *weight_out = static_cast<float>(cur_forward_prob - prev_forward_prob);
   // The following is mostly for ease of interpretability of the output;
   // conceptually the order makes no difference.
   // TODO(dpovey): maybe remove this, for efficiency?
@@ -105,20 +106,21 @@ void TraceBack(std::unordered_set<LogSumTracebackState *> *cur_states,
 
 void TraceBack(std::unordered_set<MaxTracebackState *> *cur_states,
                int32_t num_steps,
-               const float *,  // arc_weights_in, unused.
+               const float *unused,  // arc_weights_in, unused.
                float *weight_out, std::vector<int32_t> *deriv_out) {
+  (void)unused;
   CHECK_EQ(cur_states->size(), 1);
   MaxTracebackState *state = *(cur_states->begin());
   double cur_forward_prob = state->forward_prob;
   deriv_out->resize(num_steps);
-  for (int32_t i = num_steps - 1; i >= 0; i--) {
+  for (int32_t i = num_steps - 1; i >= 0; --i) {
     // `deriv_out` is just a list of arc indexes in the input FSA
     // that this output arc depends on (it's their sum).
     (*deriv_out)[i] = state->arc_id;
     state = state->prev_state.get();
   }
   double prev_forward_prob = state->forward_prob;
-  *weight_out = cur_forward_prob - prev_forward_prob;
+  *weight_out = static_cast<float>(cur_forward_prob - prev_forward_prob);
 }
 
 template <>
 
@@ -86,7 +86,7 @@ namespace k2 {
   arcs in the output FSA.
 
 
-   *The problem with differentability
+   *The problem with differentiability
 
    Consider how to differentiate the weights of the output weighted FSA
    w.r.t. those of the input.  The problem with differentiability if we use the
@@ -113,7 +113,7 @@ namespace k2 {
 
     *Different normalization
 
-    Our form of "normalization" of this representation is differen too.  The
+    Our form of "normalization" of this representation is different too.  The
     normalization is to make `symbol_sequence` as short as possible, and advance
     `base_state` to compensate.  For instance, if `symbol_sequence` is `a b c
     d`, but the weighted subset of states we can reach by this symbol sequence
@@ -177,7 +177,7 @@ struct MaxTracebackState {
 
   /**
      @param [in] state_id  State in input FSA that this corresponds to
-     @param [in] src   Previous LogSumTracebackState that we'll point back
+     @param [in] src   Previous MaxTracebackState that we'll point back
                       to, or NULL
      @param [in] incoming_arc_index  Arc-index in input FSA.
                       Its src_state will equal src->state_id,
@@ -213,7 +213,7 @@ class LogSumTracebackState;
 /*
   This struct is used inside LogSumTracebackState; it represents an
   arc that traces back to a previous LogSumTracebackState.
-  A LogSumTracebackState represents a weighted colletion of paths
+  A LogSumTracebackState represents a weighted collection of paths
   terminating in a specific state.
 */
 struct LogSumTracebackLink {
@@ -364,7 +364,7 @@ void TraceBack(std::unordered_set<LogSumTracebackState *> *cur_states,
 // for LogSumTracebackState, above.  This version is simpler.
 void TraceBack(std::unordered_set<MaxTracebackState *> *cur_states,
                int32_t num_steps,
-               const float *,  // arc_weights_in, unused.
+               const float *unused,  // arc_weights_in, unused.
                float *weight_out, std::vector<int32_t> *deriv_out);
 
 template <class TracebackState>
@@ -633,7 +633,7 @@ void DetState<TracebackState>::Normalize(const WfsaWithFbWeights &wfsa_in,
   std::unordered_set<TracebackState *> cur_states;
 
   double fb_prob = -std::numeric_limits<double>::infinity();
-  for (auto p : elements) {
+  for (const auto &p : elements) {
     TracebackState *state = p.second.get();
     fb_prob = LogSumOrMax<TracebackState>(
         fb_prob,
@@ -701,19 +701,19 @@ class DetStateMap {
     if (inserted) {
       a->state_id = cur_output_state_++;
       return true;
-    } else {
-      a->state_id = p.first->second;
-      return false;
     }
+
+    a->state_id = p.first->second;
+    return false;
   }
 
   int32_t size() const { return cur_output_state_; }
 
  private:
   // simple hashing function that just takes the first element of the pair.
   struct PairHasher {
-    size_t operator()(const std::pair<uint64_t, uint64_t> &p) const {
-      return static_cast<size_t>(p.first);
+    std::size_t operator()(const std::pair<uint64_t, uint64_t> &p) const {
+      return static_cast<std::size_t>(p.first);
     }
   };
 
@@ -781,7 +781,7 @@ class DetStateMap {
   }
 
   struct DetStateHasher {
-    size_t operator()(const std::pair<uint64_t, uint64_t> &p) const {
+    std::size_t operator()(const std::pair<uint64_t, uint64_t> &p) const {
       return p.first;
     }
   };
@@ -837,9 +837,9 @@ float DeterminizePrunedTpl(
                arc_derivs_out->begin());
   if (!queue.empty()) {  // We stopped early due to max_step
     return total_prob - queue.top()->forward_backward_prob;
-  } else {
-    return beam;
   }
+
+  return beam;
 }
 }  // namespace k2
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -1,2 +1,3 @@` |
| `1` | `1` | `[style]` |
| `2` | `2` | `based_on_style = google` |
|  | `3` | `+column_limit = 79` |