2 年之前 · 37f75ae61e
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -26,6 +26,7 @@ option(SHERPA_NCNN_ENABLE_PYTHON "Whether to build Python" OFF)
 
				 option(SHERPA_NCNN_ENABLE_PORTAUDIO "Whether to build with portaudio" ON)
			
 
				 option(SHERPA_NCNN_ENABLE_JNI "Whether to build JNI internface" OFF)
			
 
				 option(SHERPA_NCNN_ENABLE_BINARY "Whether to build the binary sherpa-ncnn" ON)
			
 
				+option(SHERPA_NCNN_ENABLE_TEST "Whether to build tests" OFF)
			
 
				 
			
 
				 if(DEFINED ANDROID_ABI)
			
 
				   message(STATUS "Set SHERPA_NCNN_ENABLE_JNI to ON for Android")
			
@@ -34,7 +35,10 @@ endif()
 
				 
			
 
				 message(STATUS "BUILD_SHARED_LIBS ${BUILD_SHARED_LIBS}")
			
 
				 message(STATUS "SHERPA_NCNN_ENABLE_PYTHON ${SHERPA_NCNN_ENABLE_PYTHON}")
			
 
				+message(STATUS "SHERPA_NCNN_ENABLE_PORTAUDIO ${SHERPA_NCNN_ENABLE_PORTAUDIO}")
			
 
				 message(STATUS "SHERPA_NCNN_ENABLE_JNI ${SHERPA_NCNN_ENABLE_JNI}")
			
 
				+message(STATUS "SHERPA_NCNN_ENABLE_BINARY ${SHERPA_NCNN_ENABLE_BINARY}")
			
 
				+message(STATUS "SHERPA_NCNN_ENABLE_TEST ${SHERPA_NCNN_ENABLE_TEST}")
			
 
				 
			
 
				 if(NOT CMAKE_BUILD_TYPE)
			
 
				   message(STATUS "No CMAKE_BUILD_TYPE given, default to Release")
			
@@ -58,5 +62,4 @@ if(SHERPA_NCNN_ENABLE_PYTHON)
 
				   include(pybind11)
			
 
				 endif()
			
 
				 
			
 
				-
			
 
				 add_subdirectory(sherpa-ncnn)
			
--- a/sherpa-ncnn/csrc/CMakeLists.txt
+++ b/sherpa-ncnn/csrc/CMakeLists.txt
@@ -11,6 +11,7 @@ set(sherpa_ncnn_core_srcs
 
				   model.cc
			
 
				   modified-beam-search-decoder.cc
			
 
				   recognizer.cc
			
 
				+  resample.cc
			
 
				   symbol-table.cc
			
 
				   wave-reader.cc
			
 
				 )
			
@@ -57,3 +58,8 @@ if(NOT SHERPA_NCNN_ENABLE_PYTHON)
 
				   add_executable(generate-int8-scale-table generate-int8-scale-table.cc)
			
 
				   target_link_libraries(generate-int8-scale-table sherpa-ncnn-core)
			
 
				 endif()
			
 
				+
			
 
				+if(SHERPA_NCNN_ENABLE_TEST)
			
 
				+  add_executable(test-resample test-resample.cc)
			
 
				+  target_link_libraries(test-resample sherpa-ncnn-core)
			
 
				+endif()
			
--- a/sherpa-ncnn/csrc/resample.cc
+++ b/sherpa-ncnn/csrc/resample.cc
@@ -0,0 +1,309 @@
 
				+/**
			
 
				+ * Copyright     2013  Pegah Ghahremani
			
 
				+ *               2014  IMSL, PKU-HKUST (author: Wei Shi)
			
 
				+ *               2014  Yanqing Sun, Junjie Wang
			
 
				+ *               2014  Johns Hopkins University (author: Daniel Povey)
			
 
				+ * Copyright     2023  Xiaomi Corporation (authors: Fangjun Kuang)
			
 
				+ *
			
 
				+ * See LICENSE for clarification regarding multiple authors
			
 
				+ *
			
 
				+ * Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+ * you may not use this file except in compliance with the License.
			
 
				+ * You may obtain a copy of the License at
			
 
				+ *
			
 
				+ *     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+ *
			
 
				+ * Unless required by applicable law or agreed to in writing, software
			
 
				+ * distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+ * See the License for the specific language governing permissions and
			
 
				+ * limitations under the License.
			
 
				+ */
			
 
				+// this file is copied and modified from
			
 
				+// kaldi/src/feat/resample.cc
			
 
				+
			
 
				+#include "sherpa-ncnn/csrc/resample.h"
			
 
				+
			
 
				+#include <assert.h>
			
 
				+#include <math.h>
			
 
				+#include <stdio.h>
			
 
				+
			
 
				+#include <cstdlib>
			
 
				+#include <type_traits>
			
 
				+
			
 
				+#ifndef M_2PI
			
 
				+#define M_2PI 6.283185307179586476925286766559005
			
 
				+#endif
			
 
				+
			
 
				+#ifndef M_PI
			
 
				+#define M_PI 3.1415926535897932384626433832795
			
 
				+#endif
			
 
				+
			
 
				+namespace sherpa_ncnn {
			
 
				+
			
 
				+template <class I>
			
 
				+I Gcd(I m, I n) {
			
 
				+  // this function is copied from kaldi/src/base/kaldi-math.h
			
 
				+  if (m == 0 || n == 0) {
			
 
				+    if (m == 0 && n == 0) {  // gcd not defined, as all integers are divisors.
			
 
				+      fprintf(stderr, "Undefined GCD since m = 0, n = 0.");
			
 
				+      exit(-1);
			
 
				+    }
			
 
				+    return (m == 0 ? (n > 0 ? n : -n) : (m > 0 ? m : -m));
			
 
				+    // return absolute value of whichever is nonzero
			
 
				+  }
			
 
				+  // could use compile-time assertion
			
 
				+  // but involves messing with complex template stuff.
			
 
				+  static_assert(std::is_integral<I>::value, "");
			
 
				+  while (1) {
			
 
				+    m %= n;
			
 
				+    if (m == 0) return (n > 0 ? n : -n);
			
 
				+    n %= m;
			
 
				+    if (n == 0) return (m > 0 ? m : -m);
			
 
				+  }
			
 
				+}
			
 
				+
			
 
				+/// Returns the least common multiple of two integers.  Will
			
 
				+/// crash unless the inputs are positive.
			
 
				+template <class I>
			
 
				+I Lcm(I m, I n) {
			
 
				+  // This function is copied from kaldi/src/base/kaldi-math.h
			
 
				+  assert(m > 0 && n > 0);
			
 
				+  I gcd = Gcd(m, n);
			
 
				+  return gcd * (m / gcd) * (n / gcd);
			
 
				+}
			
 
				+
			
 
				+static float DotProduct(const float *a, const float *b, int32_t n) {
			
 
				+  float sum = 0;
			
 
				+  for (int32_t i = 0; i != n; ++i) {
			
 
				+    sum += a[i] * b[i];
			
 
				+  }
			
 
				+  return sum;
			
 
				+}
			
 
				+
			
 
				+LinearResample::LinearResample(int32_t samp_rate_in_hz,
			
 
				+                               int32_t samp_rate_out_hz, float filter_cutoff_hz,
			
 
				+                               int32_t num_zeros)
			
 
				+    : samp_rate_in_(samp_rate_in_hz),
			
 
				+      samp_rate_out_(samp_rate_out_hz),
			
 
				+      filter_cutoff_(filter_cutoff_hz),
			
 
				+      num_zeros_(num_zeros) {
			
 
				+  assert(samp_rate_in_hz > 0.0 && samp_rate_out_hz > 0.0 &&
			
 
				+         filter_cutoff_hz > 0.0 && filter_cutoff_hz * 2 <= samp_rate_in_hz &&
			
 
				+         filter_cutoff_hz * 2 <= samp_rate_out_hz && num_zeros > 0);
			
 
				+
			
 
				+  // base_freq is the frequency of the repeating unit, which is the gcd
			
 
				+  // of the input frequencies.
			
 
				+  int32_t base_freq = Gcd(samp_rate_in_, samp_rate_out_);
			
 
				+  input_samples_in_unit_ = samp_rate_in_ / base_freq;
			
 
				+  output_samples_in_unit_ = samp_rate_out_ / base_freq;
			
 
				+
			
 
				+  SetIndexesAndWeights();
			
 
				+  Reset();
			
 
				+}
			
 
				+
			
 
				+void LinearResample::SetIndexesAndWeights() {
			
 
				+  first_index_.resize(output_samples_in_unit_);
			
 
				+  weights_.resize(output_samples_in_unit_);
			
 
				+
			
 
				+  double window_width = num_zeros_ / (2.0 * filter_cutoff_);
			
 
				+
			
 
				+  for (int32_t i = 0; i < output_samples_in_unit_; i++) {
			
 
				+    double output_t = i / static_cast<double>(samp_rate_out_);
			
 
				+    double min_t = output_t - window_width, max_t = output_t + window_width;
			
 
				+    // we do ceil on the min and floor on the max, because if we did it
			
 
				+    // the other way around we would unnecessarily include indexes just
			
 
				+    // outside the window, with zero coefficients.  It's possible
			
 
				+    // if the arguments to the ceil and floor expressions are integers
			
 
				+    // (e.g. if filter_cutoff_ has an exact ratio with the sample rates),
			
 
				+    // that we unnecessarily include something with a zero coefficient,
			
 
				+    // but this is only a slight efficiency issue.
			
 
				+    int32_t min_input_index = ceil(min_t * samp_rate_in_),
			
 
				+            max_input_index = floor(max_t * samp_rate_in_),
			
 
				+            num_indices = max_input_index - min_input_index + 1;
			
 
				+    first_index_[i] = min_input_index;
			
 
				+    weights_[i].resize(num_indices);
			
 
				+    for (int32_t j = 0; j < num_indices; j++) {
			
 
				+      int32_t input_index = min_input_index + j;
			
 
				+      double input_t = input_index / static_cast<double>(samp_rate_in_),
			
 
				+             delta_t = input_t - output_t;
			
 
				+      // sign of delta_t doesn't matter.
			
 
				+      weights_[i][j] = FilterFunc(delta_t) / samp_rate_in_;
			
 
				+    }
			
 
				+  }
			
 
				+}
			
 
				+
			
 
				+/** Here, t is a time in seconds representing an offset from
			
 
				+    the center of the windowed filter function, and FilterFunction(t)
			
 
				+    returns the windowed filter function, described
			
 
				+    in the header as h(t) = f(t)g(t), evaluated at t.
			
 
				+*/
			
 
				+float LinearResample::FilterFunc(float t) const {
			
 
				+  float window,  // raised-cosine (Hanning) window of width
			
 
				+                 // num_zeros_/2*filter_cutoff_
			
 
				+      filter;    // sinc filter function
			
 
				+  if (fabs(t) < num_zeros_ / (2.0 * filter_cutoff_))
			
 
				+    window = 0.5 * (1 + cos(M_2PI * filter_cutoff_ / num_zeros_ * t));
			
 
				+  else
			
 
				+    window = 0.0;  // outside support of window function
			
 
				+  if (t != 0)
			
 
				+    filter = sin(M_2PI * filter_cutoff_ * t) / (M_PI * t);
			
 
				+  else
			
 
				+    filter = 2 * filter_cutoff_;  // limit of the function at t = 0
			
 
				+  return filter * window;
			
 
				+}
			
 
				+
			
 
				+void LinearResample::Reset() {
			
 
				+  input_sample_offset_ = 0;
			
 
				+  output_sample_offset_ = 0;
			
 
				+  input_remainder_.resize(0);
			
 
				+}
			
 
				+
			
 
				+void LinearResample::Resample(const float *input, int32_t input_dim, bool flush,
			
 
				+                              std::vector<float> *output) {
			
 
				+  int64_t tot_input_samp = input_sample_offset_ + input_dim,
			
 
				+          tot_output_samp = GetNumOutputSamples(tot_input_samp, flush);
			
 
				+
			
 
				+  assert(tot_output_samp >= output_sample_offset_);
			
 
				+
			
 
				+  output->resize(tot_output_samp - output_sample_offset_);
			
 
				+
			
 
				+  // samp_out is the index into the total output signal, not just the part
			
 
				+  // of it we are producing here.
			
 
				+  for (int64_t samp_out = output_sample_offset_; samp_out < tot_output_samp;
			
 
				+       samp_out++) {
			
 
				+    int64_t first_samp_in;
			
 
				+    int32_t samp_out_wrapped;
			
 
				+    GetIndexes(samp_out, &first_samp_in, &samp_out_wrapped);
			
 
				+    const std::vector<float> &weights = weights_[samp_out_wrapped];
			
 
				+    // first_input_index is the first index into "input" that we have a weight
			
 
				+    // for.
			
 
				+    int32_t first_input_index =
			
 
				+        static_cast<int32_t>(first_samp_in - input_sample_offset_);
			
 
				+    float this_output;
			
 
				+    if (first_input_index >= 0 &&
			
 
				+        first_input_index + weights.size() <= input_dim) {
			
 
				+      this_output =
			
 
				+          DotProduct(input + first_input_index, weights.data(), weights.size());
			
 
				+    } else {  // Handle edge cases.
			
 
				+      this_output = 0.0;
			
 
				+      for (int32_t i = 0; i < weights.size(); i++) {
			
 
				+        float weight = weights[i];
			
 
				+        int32_t input_index = first_input_index + i;
			
 
				+        if (input_index < 0 &&
			
 
				+            static_cast<int32_t>(input_remainder_.size()) + input_index >= 0) {
			
 
				+          this_output +=
			
 
				+              weight * input_remainder_[input_remainder_.size() + input_index];
			
 
				+        } else if (input_index >= 0 && input_index < input_dim) {
			
 
				+          this_output += weight * input[input_index];
			
 
				+        } else if (input_index >= input_dim) {
			
 
				+          // We're past the end of the input and are adding zero; should only
			
 
				+          // happen if the user specified flush == true, or else we would not
			
 
				+          // be trying to output this sample.
			
 
				+          assert(flush);
			
 
				+        }
			
 
				+      }
			
 
				+    }
			
 
				+    int32_t output_index =
			
 
				+        static_cast<int32_t>(samp_out - output_sample_offset_);
			
 
				+    (*output)[output_index] = this_output;
			
 
				+  }
			
 
				+
			
 
				+  if (flush) {
			
 
				+    Reset();  // Reset the internal state.
			
 
				+  } else {
			
 
				+    SetRemainder(input, input_dim);
			
 
				+    input_sample_offset_ = tot_input_samp;
			
 
				+    output_sample_offset_ = tot_output_samp;
			
 
				+  }
			
 
				+}
			
 
				+
			
 
				+int64_t LinearResample::GetNumOutputSamples(int64_t input_num_samp,
			
 
				+                                            bool flush) const {
			
 
				+  // For exact computation, we measure time in "ticks" of 1.0 / tick_freq,
			
 
				+  // where tick_freq is the least common multiple of samp_rate_in_ and
			
 
				+  // samp_rate_out_.
			
 
				+  int32_t tick_freq = Lcm(samp_rate_in_, samp_rate_out_);
			
 
				+  int32_t ticks_per_input_period = tick_freq / samp_rate_in_;
			
 
				+
			
 
				+  // work out the number of ticks in the time interval
			
 
				+  // [ 0, input_num_samp/samp_rate_in_ ).
			
 
				+  int64_t interval_length_in_ticks = input_num_samp * ticks_per_input_period;
			
 
				+  if (!flush) {
			
 
				+    float window_width = num_zeros_ / (2.0 * filter_cutoff_);
			
 
				+    // To count the window-width in ticks we take the floor.  This
			
 
				+    // is because since we're looking for the largest integer num-out-samp
			
 
				+    // that fits in the interval, which is open on the right, a reduction
			
 
				+    // in interval length of less than a tick will never make a difference.
			
 
				+    // For example, the largest integer in the interval [ 0, 2 ) and the
			
 
				+    // largest integer in the interval [ 0, 2 - 0.9 ) are the same (both one).
			
 
				+    // So when we're subtracting the window-width we can ignore the fractional
			
 
				+    // part.
			
 
				+    int32_t window_width_ticks = floor(window_width * tick_freq);
			
 
				+    // The time-period of the output that we can sample gets reduced
			
 
				+    // by the window-width (which is actually the distance from the
			
 
				+    // center to the edge of the windowing function) if we're not
			
 
				+    // "flushing the output".
			
 
				+    interval_length_in_ticks -= window_width_ticks;
			
 
				+  }
			
 
				+  if (interval_length_in_ticks <= 0) return 0;
			
 
				+
			
 
				+  int32_t ticks_per_output_period = tick_freq / samp_rate_out_;
			
 
				+  // Get the last output-sample in the closed interval, i.e. replacing [ ) with
			
 
				+  // [ ].  Note: integer division rounds down.  See
			
 
				+  // http://en.wikipedia.org/wiki/Interval_(mathematics) for an explanation of
			
 
				+  // the notation.
			
 
				+  int64_t last_output_samp = interval_length_in_ticks / ticks_per_output_period;
			
 
				+  // We need the last output-sample in the open interval, so if it takes us to
			
 
				+  // the end of the interval exactly, subtract one.
			
 
				+  if (last_output_samp * ticks_per_output_period == interval_length_in_ticks)
			
 
				+    last_output_samp--;
			
 
				+
			
 
				+  // First output-sample index is zero, so the number of output samples
			
 
				+  // is the last output-sample plus one.
			
 
				+  int64_t num_output_samp = last_output_samp + 1;
			
 
				+  return num_output_samp;
			
 
				+}
			
 
				+
			
 
				+// inline
			
 
				+void LinearResample::GetIndexes(int64_t samp_out, int64_t *first_samp_in,
			
 
				+                                int32_t *samp_out_wrapped) const {
			
 
				+  // A unit is the smallest nonzero amount of time that is an exact
			
 
				+  // multiple of the input and output sample periods.  The unit index
			
 
				+  // is the answer to "which numbered unit we are in".
			
 
				+  int64_t unit_index = samp_out / output_samples_in_unit_;
			
 
				+  // samp_out_wrapped is equal to samp_out % output_samples_in_unit_
			
 
				+  *samp_out_wrapped =
			
 
				+      static_cast<int32_t>(samp_out - unit_index * output_samples_in_unit_);
			
 
				+  *first_samp_in =
			
 
				+      first_index_[*samp_out_wrapped] + unit_index * input_samples_in_unit_;
			
 
				+}
			
 
				+
			
 
				+void LinearResample::SetRemainder(const float *input, int32_t input_dim) {
			
 
				+  std::vector<float> old_remainder(input_remainder_);
			
 
				+  // max_remainder_needed is the width of the filter from side to side,
			
 
				+  // measured in input samples.  you might think it should be half that,
			
 
				+  // but you have to consider that you might be wanting to output samples
			
 
				+  // that are "in the past" relative to the beginning of the latest
			
 
				+  // input... anyway, storing more remainder than needed is not harmful.
			
 
				+  int32_t max_remainder_needed =
			
 
				+      ceil(samp_rate_in_ * num_zeros_ / filter_cutoff_);
			
 
				+  input_remainder_.resize(max_remainder_needed);
			
 
				+  for (int32_t index = -static_cast<int32_t>(input_remainder_.size());
			
 
				+       index < 0; index++) {
			
 
				+    // we interpret "index" as an offset from the end of "input" and
			
 
				+    // from the end of input_remainder_.
			
 
				+    int32_t input_index = index + input_dim;
			
 
				+    if (input_index >= 0) {
			
 
				+      input_remainder_[index + static_cast<int32_t>(input_remainder_.size())] =
			
 
				+          input[input_index];
			
 
				+    } else if (input_index + static_cast<int32_t>(old_remainder.size()) >= 0) {
			
 
				+      input_remainder_[index + static_cast<int32_t>(input_remainder_.size())] =
			
 
				+          old_remainder[input_index +
			
 
				+                        static_cast<int32_t>(old_remainder.size())];
			
 
				+      // else leave it at zero.
			
 
				+    }
			
 
				+  }
			
 
				+}
			
 
				+
			
 
				+}  // namespace sherpa_ncnn
			
--- a/sherpa-ncnn/csrc/resample.h
+++ b/sherpa-ncnn/csrc/resample.h
@@ -0,0 +1,144 @@
 
				+/**
			
 
				+ * Copyright     2013  Pegah Ghahremani
			
 
				+ *               2014  IMSL, PKU-HKUST (author: Wei Shi)
			
 
				+ *               2014  Yanqing Sun, Junjie Wang
			
 
				+ *               2014  Johns Hopkins University (author: Daniel Povey)
			
 
				+ * Copyright     2023  Xiaomi Corporation (authors: Fangjun Kuang)
			
 
				+ *
			
 
				+ * See LICENSE for clarification regarding multiple authors
			
 
				+ *
			
 
				+ * Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+ * you may not use this file except in compliance with the License.
			
 
				+ * You may obtain a copy of the License at
			
 
				+ *
			
 
				+ *     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+ *
			
 
				+ * Unless required by applicable law or agreed to in writing, software
			
 
				+ * distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+ * See the License for the specific language governing permissions and
			
 
				+ * limitations under the License.
			
 
				+ */
			
 
				+// this file is copied and modified from
			
 
				+// kaldi/src/feat/resample.h
			
 
				+#ifndef SHERPA_NCNN_CSRC_RESAMPLE_H_
			
 
				+#define SHERPA_NCNN_CSRC_RESAMPLE_H_
			
 
				+
			
 
				+#include <cstdint>
			
 
				+#include <vector>
			
 
				+
			
 
				+namespace sherpa_ncnn {
			
 
				+
			
 
				+/*
			
 
				+   We require that the input and output sampling rate be specified as
			
 
				+   integers, as this is an easy way to specify that their ratio be rational.
			
 
				+*/
			
 
				+
			
 
				+class LinearResample {
			
 
				+ public:
			
 
				+  /// Constructor.  We make the input and output sample rates integers, because
			
 
				+  /// we are going to need to find a common divisor.  This should just remind
			
 
				+  /// you that they need to be integers.  The filter cutoff needs to be less
			
 
				+  /// than samp_rate_in_hz/2 and less than samp_rate_out_hz/2.  num_zeros
			
 
				+  /// controls the sharpness of the filter, more == sharper but less efficient.
			
 
				+  /// We suggest around 4 to 10 for normal use.
			
 
				+  LinearResample(int32_t samp_rate_in_hz, int32_t samp_rate_out_hz,
			
 
				+                 float filter_cutoff_hz, int32_t num_zeros);
			
 
				+
			
 
				+  /// Calling the function Reset() resets the state of the object prior to
			
 
				+  /// processing a new signal; it is only necessary if you have called
			
 
				+  /// Resample(x, x_size, false, y) for some signal, leading to a remainder of
			
 
				+  /// the signal being called, but then abandon processing the signal before
			
 
				+  /// calling Resample(x, x_size, true, y) for the last piece.  Call it
			
 
				+  /// unnecessarily between signals will not do any harm.
			
 
				+  void Reset();
			
 
				+
			
 
				+  /// This function does the resampling.  If you call it with flush == true and
			
 
				+  /// you have never called it with flush == false, it just resamples the input
			
 
				+  /// signal (it resizes the output to a suitable number of samples).
			
 
				+  ///
			
 
				+  /// You can also use this function to process a signal a piece at a time.
			
 
				+  /// suppose you break it into piece1, piece2, ... pieceN.  You can call
			
 
				+  /// \code{.cc}
			
 
				+  /// Resample(piece1, piece1_size, false, &output1);
			
 
				+  /// Resample(piece2, piece2_size, false, &output2);
			
 
				+  /// Resample(piece3, piece3_size, true, &output3);
			
 
				+  /// \endcode
			
 
				+  /// If you call it with flush == false, it won't output the last few samples
			
 
				+  /// but will remember them, so that if you later give it a second piece of
			
 
				+  /// the input signal it can process it correctly.
			
 
				+  /// If your most recent call to the object was with flush == false, it will
			
 
				+  /// have internal state; you can remove this by calling Reset().
			
 
				+  /// Empty input is acceptable.
			
 
				+  void Resample(const float *input, int32_t input_dim, bool flush,
			
 
				+                std::vector<float> *output);
			
 
				+
			
 
				+  //// Return the input and output sampling rates (for checks, for example)
			
 
				+  int32_t GetInputSamplingRate() const { return samp_rate_in_; }
			
 
				+  int32_t GetOutputSamplingRate() const { return samp_rate_out_; }
			
 
				+
			
 
				+ private:
			
 
				+  void SetIndexesAndWeights();
			
 
				+
			
 
				+  float FilterFunc(float) const;
			
 
				+
			
 
				+  /// This function outputs the number of output samples we will output
			
 
				+  /// for a signal with "input_num_samp" input samples.  If flush == true,
			
 
				+  /// we return the largest n such that
			
 
				+  /// (n/samp_rate_out_) is in the interval [ 0, input_num_samp/samp_rate_in_ ),
			
 
				+  /// and note that the interval is half-open.  If flush == false,
			
 
				+  /// define window_width as num_zeros / (2.0 * filter_cutoff_);
			
 
				+  /// we return the largest n such that (n/samp_rate_out_) is in the interval
			
 
				+  /// [ 0, input_num_samp/samp_rate_in_ - window_width ).
			
 
				+  int64_t GetNumOutputSamples(int64_t input_num_samp, bool flush) const;
			
 
				+
			
 
				+  /// Given an output-sample index, this function outputs to *first_samp_in the
			
 
				+  /// first input-sample index that we have a weight on (may be negative),
			
 
				+  /// and to *samp_out_wrapped the index into weights_ where we can get the
			
 
				+  /// corresponding weights on the input.
			
 
				+  inline void GetIndexes(int64_t samp_out, int64_t *first_samp_in,
			
 
				+                         int32_t *samp_out_wrapped) const;
			
 
				+
			
 
				+  void SetRemainder(const float *input, int32_t input_dim);
			
 
				+
			
 
				+ private:
			
 
				+  // The following variables are provided by the user.
			
 
				+  int32_t samp_rate_in_;
			
 
				+  int32_t samp_rate_out_;
			
 
				+  float filter_cutoff_;
			
 
				+  int32_t num_zeros_;
			
 
				+
			
 
				+  int32_t input_samples_in_unit_;  ///< The number of input samples in the
			
 
				+                                   ///< smallest repeating unit: num_samp_in_ =
			
 
				+                                   ///< samp_rate_in_hz / Gcd(samp_rate_in_hz,
			
 
				+                                   ///< samp_rate_out_hz)
			
 
				+
			
 
				+  int32_t output_samples_in_unit_;  ///< The number of output samples in the
			
 
				+                                    ///< smallest repeating unit: num_samp_out_
			
 
				+                                    ///< = samp_rate_out_hz /
			
 
				+                                    ///< Gcd(samp_rate_in_hz, samp_rate_out_hz)
			
 
				+
			
 
				+  /// The first input-sample index that we sum over, for this output-sample
			
 
				+  /// index.  May be negative; any truncation at the beginning is handled
			
 
				+  /// separately.  This is just for the first few output samples, but we can
			
 
				+  /// extrapolate the correct input-sample index for arbitrary output samples.
			
 
				+  std::vector<int32_t> first_index_;
			
 
				+
			
 
				+  /// Weights on the input samples, for this output-sample index.
			
 
				+  std::vector<std::vector<float>> weights_;
			
 
				+
			
 
				+  // the following variables keep track of where we are in a particular signal,
			
 
				+  // if it is being provided over multiple calls to Resample().
			
 
				+
			
 
				+  int64_t input_sample_offset_;   ///< The number of input samples we have
			
 
				+                                  ///< already received for this signal
			
 
				+                                  ///< (including anything in remainder_)
			
 
				+  int64_t output_sample_offset_;  ///< The number of samples we have already
			
 
				+                                  ///< output for this signal.
			
 
				+  std::vector<float> input_remainder_;  ///< A small trailing part of the
			
 
				+                                        ///< previously seen input signal.
			
 
				+};
			
 
				+
			
 
				+}  // namespace sherpa_ncnn
			
 
				+
			
 
				+#endif  // SHERPA_NCNN_CSRC_RESAMPLE_H_
			
--- a/sherpa-ncnn/csrc/test-resample.cc
+++ b/sherpa-ncnn/csrc/test-resample.cc
@@ -0,0 +1,120 @@
 
				+/**
			
 
				+ * Copyright (c)  2023  Xiaomi Corporation (authors: Fangjun Kuang)
			
 
				+ *
			
 
				+ * See LICENSE for clarification regarding multiple authors
			
 
				+ *
			
 
				+ * Licensed under the Apache License, Version 2.0 (the "License");
			
 
				+ * you may not use this file except in compliance with the License.
			
 
				+ * You may obtain a copy of the License at
			
 
				+ *
			
 
				+ *     http://www.apache.org/licenses/LICENSE-2.0
			
 
				+ *
			
 
				+ * Unless required by applicable law or agreed to in writing, software
			
 
				+ * distributed under the License is distributed on an "AS IS" BASIS,
			
 
				+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
			
 
				+ * See the License for the specific language governing permissions and
			
 
				+ * limitations under the License.
			
 
				+ */
			
 
				+
			
 
				+#include <stdio.h>
			
 
				+
			
 
				+#include <fstream>
			
 
				+#include <string>
			
 
				+#include <vector>
			
 
				+
			
 
				+#include "sherpa-ncnn/csrc/resample.h"
			
 
				+
			
 
				+int32_t main(int32_t argc, char *argv[]) {
			
 
				+  const char *kUsage = R"(
			
 
				+Usage:
			
 
				+
			
 
				+  ./bin/test-resample in.raw in_sample_rate out.raw out_sample_rate
			
 
				+
			
 
				+where
			
 
				+
			
 
				+ - in.raw, containing input raw PCM samples, mono, 16-bit
			
 
				+ - in_sample_rate, sample rate for in.raw
			
 
				+ - out.raw, containing output raw PCM samples, mono, 16-bit
			
 
				+ - out_sample_rate, sample rate for out.raw
			
 
				+
			
 
				+For instance, if in_sample_rate is 48000 and out_sample_rate is 16000,
			
 
				+you can use
			
 
				+
			
 
				+  sox -t raw -r 48000 -e signed -b 16 -c 1 in.raw in.wav
			
 
				+  sox -t raw -r 16000 -e signed -b 16 -c 1 out.raw out.wav
			
 
				+
			
 
				+  soxi in.wav
			
 
				+  soxi out.wav
			
 
				+
			
 
				+You can compare the number of samples in in.wav and out.wav.
			
 
				+Also, you can play a.wav and b.wav.
			
 
				+
			
 
				+  )";
			
 
				+  if (argc != 5) {
			
 
				+    fprintf(stderr, "%s", kUsage);
			
 
				+    exit(-1);
			
 
				+  }
			
 
				+
			
 
				+  std::string in_raw = argv[1];
			
 
				+  int32_t in_sample_rate = atoi(argv[2]);
			
 
				+
			
 
				+  std::string out_raw = argv[3];
			
 
				+  int32_t out_sample_rate = atoi(argv[4]);
			
 
				+  fprintf(stderr, "in sample rate: %d, out_sample_rate: %d\n", in_sample_rate,
			
 
				+          out_sample_rate);
			
 
				+  fprintf(stderr, "in_raw : %s, out_raw: %s\n", in_raw.c_str(),
			
 
				+          out_raw.c_str());
			
 
				+
			
 
				+  std::ifstream is(in_raw, std::ios::binary);
			
 
				+  std::vector<int8_t> buffer(std::istreambuf_iterator<char>(is), {});
			
 
				+  if (buffer.size() % 2 != 0) {
			
 
				+    fprintf(stderr, "expect int16 samples\n");
			
 
				+    exit(-1);
			
 
				+  }
			
 
				+
			
 
				+  int32_t num_samples = buffer.size() / 2;
			
 
				+  fprintf(stderr, "num_samples: %d\n", num_samples);
			
 
				+  const int16_t *p = reinterpret_cast<int16_t *>(buffer.data());
			
 
				+
			
 
				+  std::vector<float> in_float(buffer.size() / 2);
			
 
				+  for (int32_t i = 0; i != num_samples; ++i) {
			
 
				+    in_float[i] = p[i] / 32768.0f;
			
 
				+  }
			
 
				+
			
 
				+  float min_freq = std::min(in_sample_rate, out_sample_rate);
			
 
				+  float lowpass_cutoff = 0.99 * 0.5 * min_freq;
			
 
				+
			
 
				+  int32_t lowpass_filter_width = 6;
			
 
				+  sherpa_ncnn::LinearResample resampler(in_sample_rate, out_sample_rate,
			
 
				+                                        lowpass_cutoff, lowpass_filter_width);
			
 
				+
			
 
				+  // simulate streaming
			
 
				+  int32_t chunk = 100;
			
 
				+  const float *q = in_float.data();
			
 
				+
			
 
				+  std::vector<float> out_float;
			
 
				+
			
 
				+  int32_t start = 0;
			
 
				+  for (start = 0; start + chunk < num_samples; start += chunk) {
			
 
				+    std::vector<float> tmp;
			
 
				+    resampler.Resample(q, chunk, false, &tmp);
			
 
				+    out_float.insert(out_float.end(), tmp.begin(), tmp.end());
			
 
				+    q += chunk;
			
 
				+  }
			
 
				+
			
 
				+  std::vector<float> tmp;
			
 
				+  resampler.Resample(q, num_samples - start, true, &tmp);
			
 
				+  out_float.insert(out_float.end(), tmp.begin(), tmp.end());
			
 
				+
			
 
				+  std::vector<int16_t> out_short(out_float.size());
			
 
				+  int32_t num_out_samples = out_float.size();
			
 
				+  for (int32_t i = 0; i != num_out_samples; ++i) {
			
 
				+    out_short[i] = std::min(32767, static_cast<int32_t>(out_float[i] * 32767));
			
 
				+  }
			
 
				+
			
 
				+  std::ofstream os(out_raw, std::ios::binary);
			
 
				+  os.write(reinterpret_cast<char *>(out_short.data()),
			
 
				+           out_short.size() * sizeof(int16_t));
			
 
				+
			
 
				+  return 0;
			
 
				+}