2 years ago · 302b501515
--- a/ggml/LJ037-0171_sr16k_test.wav
+++ b/ggml/LJ037-0171_sr16k_test.wav
--- a/ggml/examples/kaldi-native-fbank/python/CMakeLists.txt
+++ b/ggml/examples/kaldi-native-fbank/python/CMakeLists.txt
@@ -1,2 +0,0 @@
 
															-add_subdirectory(csrc)
														
 
															-add_subdirectory(tests)
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/CMakeLists.txt
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/CMakeLists.txt
@@ -1,28 +0,0 @@
 
															-pybind11_add_module(_kaldi_native_fbank
														
 
															-  feature-fbank.cc
														
 
															-  feature-window.cc
														
 
															-  kaldi-native-fbank.cc
														
 
															-  mel-computations.cc
														
 
															-  online-feature.cc
														
 
															-  utils.cc
														
 
															-)
														
 
															-
														
 
															-if(APPLE)
														
 
															-  execute_process(
														
 
															-    COMMAND "${PYTHON_EXECUTABLE}" -c "from distutils.sysconfig import get_python_lib; print(get_python_lib())"
														
 
															-    OUTPUT_STRIP_TRAILING_WHITESPACE
														
 
															-    OUTPUT_VARIABLE PYTHON_SITE_PACKAGE_DIR
														
 
															-  )
														
 
															-  message(STATUS "PYTHON_SITE_PACKAGE_DIR: ${PYTHON_SITE_PACKAGE_DIR}")
														
 
															-  target_link_libraries(_kaldi_native_fbank PRIVATE "-Wl,-rpath,${PYTHON_SITE_PACKAGE_DIR}")
														
 
															-endif()
														
 
															-
														
 
															-if(NOT WIN32)
														
 
															-  target_link_libraries(_kaldi_native_fbank PRIVATE "-Wl,-rpath,${kaldi_native_fbank_rpath_origin}/kaldi_native_fbank/lib")
														
 
															-endif()
														
 
															-
														
 
															-target_link_libraries(_kaldi_native_fbank PRIVATE kaldi-native-fbank-core)
														
 
															-
														
 
															-install(TARGETS _kaldi_native_fbank
														
 
															-  DESTINATION ../
														
 
															-)
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/feature-fbank.cc
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/feature-fbank.cc
@@ -1,57 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/feature-fbank.h"
														
 
															-
														
 
															-#include <memory>
														
 
															-#include <string>
														
 
															-
														
 
															-#include "feature-fbank.h"
														
 
															-#include "kaldi-native-fbank/python/csrc/utils.h"
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-static void PybindFbankOptions(py::module &m) {  // NOLINT
														
 
															-  using PyClass = FbankOptions;
														
 
															-  py::class_<PyClass>(m, "FbankOptions")
														
 
															-      .def(py::init<>())
														
 
															-      .def_readwrite("frame_opts", &PyClass::frame_opts)
														
 
															-      .def_readwrite("mel_opts", &PyClass::mel_opts)
														
 
															-      .def_readwrite("use_energy", &PyClass::use_energy)
														
 
															-      .def_readwrite("energy_floor", &PyClass::energy_floor)
														
 
															-      .def_readwrite("raw_energy", &PyClass::raw_energy)
														
 
															-      .def_readwrite("htk_compat", &PyClass::htk_compat)
														
 
															-      .def_readwrite("use_log_fbank", &PyClass::use_log_fbank)
														
 
															-      .def_readwrite("use_power", &PyClass::use_power)
														
 
															-      .def("__str__",
														
 
															-           [](const PyClass &self) -> std::string { return self.ToString(); })
														
 
															-      .def("as_dict",
														
 
															-           [](const PyClass &self) -> py::dict { return AsDict(self); })
														
 
															-      .def_static(
														
 
															-          "from_dict",
														
 
															-          [](py::dict dict) -> PyClass { return FbankOptionsFromDict(dict); })
														
 
															-      .def(py::pickle(
														
 
															-          [](const PyClass &self) -> py::dict { return AsDict(self); },
														
 
															-          [](py::dict dict) -> PyClass { return FbankOptionsFromDict(dict); }));
														
 
															-}
														
 
															-
														
 
															-void PybindFeatureFbank(py::module &m) {  // NOLINT
														
 
															-  PybindFbankOptions(m);
														
 
															-}
														
 
															-
														
 
															-}  // namespace knf
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/feature-fbank.h
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/feature-fbank.h
@@ -1,30 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#ifndef KALDI_NATIVE_FBANK_PYTHON_CSRC_FEATURE_FBANK_H_
														
 
															-#define KALDI_NATIVE_FBANK_PYTHON_CSRC_FEATURE_FBANK_H_
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/kaldi-native-fbank.h"
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-void PybindFeatureFbank(py::module &m);  // NOLINT
														
 
															-
														
 
															-}  // namespace knf
														
 
															-
														
 
															-#endif  // KALDI_NATIVE_FBANK_PYTHON_CSRC_FEATURE_FBANK_H_
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/feature-window.cc
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/feature-window.cc
@@ -1,66 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/feature-window.h"
														
 
															-
														
 
															-#include <string>
														
 
															-
														
 
															-#include "feature-window.h"
														
 
															-#include "kaldi-native-fbank/python/csrc/utils.h"
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-static void PybindFrameExtractionOptions(py::module &m) {  // NOLINT
														
 
															-  using PyClass = FrameExtractionOptions;
														
 
															-  py::class_<PyClass>(m, "FrameExtractionOptions")
														
 
															-      .def(py::init<>())
														
 
															-      .def_readwrite("samp_freq", &PyClass::samp_freq)
														
 
															-      .def_readwrite("frame_shift_ms", &PyClass::frame_shift_ms)
														
 
															-      .def_readwrite("frame_length_ms", &PyClass::frame_length_ms)
														
 
															-      .def_readwrite("dither", &PyClass::dither)
														
 
															-      .def_readwrite("preemph_coeff", &PyClass::preemph_coeff)
														
 
															-      .def_readwrite("remove_dc_offset", &PyClass::remove_dc_offset)
														
 
															-      .def_readwrite("window_type", &PyClass::window_type)
														
 
															-      .def_readwrite("round_to_power_of_two", &PyClass::round_to_power_of_two)
														
 
															-      .def_readwrite("blackman_coeff", &PyClass::blackman_coeff)
														
 
															-      .def_readwrite("snip_edges", &PyClass::snip_edges)
														
 
															-      .def("as_dict",
														
 
															-           [](const PyClass &self) -> py::dict { return AsDict(self); })
														
 
															-      .def_static("from_dict",
														
 
															-                  [](py::dict dict) -> PyClass {
														
 
															-                    return FrameExtractionOptionsFromDict(dict);
														
 
															-                  })
														
 
															-#if 0
														
 
															-      .def_readwrite("allow_downsample",
														
 
															-                     &PyClass::allow_downsample)
														
 
															-      .def_readwrite("allow_upsample", &PyClass::allow_upsample)
														
 
															-#endif
														
 
															-      .def("__str__",
														
 
															-           [](const PyClass &self) -> std::string { return self.ToString(); })
														
 
															-      .def(py::pickle(
														
 
															-          [](const PyClass &self) -> py::dict { return AsDict(self); },
														
 
															-          [](py::dict dict) -> PyClass {
														
 
															-            return FrameExtractionOptionsFromDict(dict);
														
 
															-          }));
														
 
															-}
														
 
															-
														
 
															-void PybindFeatureWindow(py::module &m) {  // NOLINT
														
 
															-  PybindFrameExtractionOptions(m);
														
 
															-}
														
 
															-
														
 
															-}  // namespace knf
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/feature-window.h
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/feature-window.h
@@ -1,30 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#ifndef KALDI_NATIVE_FBANK_PYTHON_CSRC_FEATURE_WINDOW_H_
														
 
															-#define KALDI_NATIVE_FBANK_PYTHON_CSRC_FEATURE_WINDOW_H_
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/kaldi-native-fbank.h"
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-void PybindFeatureWindow(py::module &m);  // NOLINT
														
 
															-
														
 
															-}  // namespace knf
														
 
															-
														
 
															-#endif  // KALDI_NATIVE_FBANK_PYTHON_CSRC_FEATURE_WINDOW_H_
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/kaldi-native-fbank.cc
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/kaldi-native-fbank.cc
@@ -1,37 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/kaldi-native-fbank.h"
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/feature-fbank.h"
														
 
															-#include "kaldi-native-fbank/python/csrc/feature-window.h"
														
 
															-#include "kaldi-native-fbank/python/csrc/mel-computations.h"
														
 
															-#include "kaldi-native-fbank/python/csrc/online-feature.h"
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-PYBIND11_MODULE(_kaldi_native_fbank, m) {
														
 
															-  m.doc() = "Python wrapper for kaldi native fbank";
														
 
															-  PybindFeatureWindow(m);
														
 
															-  PybindMelComputations(m);
														
 
															-  PybindFeatureFbank(m);
														
 
															-
														
 
															-  PybindOnlineFeature(m);
														
 
															-}
														
 
															-
														
 
															-}  // namespace knf
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/kaldi-native-fbank.h
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/kaldi-native-fbank.h
@@ -1,27 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#ifndef KALDI_NATIVE_FBANK_PYTHON_CSRC_KALDI_NATIVE_FBANK_H_
														
 
															-#define KALDI_NATIVE_FBANK_PYTHON_CSRC_KALDI_NATIVE_FBANK_H_
														
 
															-
														
 
															-#include "pybind11/numpy.h"
														
 
															-#include "pybind11/pybind11.h"
														
 
															-#include "pybind11/stl.h"
														
 
															-namespace py = pybind11;
														
 
															-
														
 
															-#endif  // KALDI_NATIVE_FBANK_PYTHON_CSRC_KALDI_NATIVE_FBANK_H_
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/mel-computations.cc
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/mel-computations.cc
@@ -1,58 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/mel-computations.h"
														
 
															-
														
 
															-#include <string>
														
 
															-
														
 
															-#include "mel-computations.h"
														
 
															-#include "kaldi-native-fbank/python/csrc/utils.h"
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-static void PybindMelBanksOptions(py::module &m) {  // NOLINT
														
 
															-  using PyClass = MelBanksOptions;
														
 
															-  py::class_<PyClass>(m, "MelBanksOptions")
														
 
															-      .def(py::init<>())
														
 
															-      .def_readwrite("num_bins", &PyClass::num_bins)
														
 
															-      .def_readwrite("low_freq", &PyClass::low_freq)
														
 
															-      .def_readwrite("high_freq", &PyClass::high_freq)
														
 
															-      .def_readwrite("vtln_low", &PyClass::vtln_low)
														
 
															-      .def_readwrite("vtln_high", &PyClass::vtln_high)
														
 
															-      .def_readwrite("debug_mel", &PyClass::debug_mel)
														
 
															-      .def_readwrite("htk_mode", &PyClass::htk_mode)
														
 
															-      .def("__str__",
														
 
															-           [](const PyClass &self) -> std::string { return self.ToString(); })
														
 
															-      .def("as_dict",
														
 
															-           [](const PyClass &self) -> py::dict { return AsDict(self); })
														
 
															-      .def_static("from_dict",
														
 
															-                  [](py::dict dict) -> PyClass {
														
 
															-                    return MelBanksOptionsFromDict(dict);
														
 
															-                  })
														
 
															-      .def(py::pickle(
														
 
															-          [](const PyClass &self) -> py::dict { return AsDict(self); },
														
 
															-          [](py::dict dict) -> PyClass {
														
 
															-            return MelBanksOptionsFromDict(dict);
														
 
															-          }));
														
 
															-}
														
 
															-
														
 
															-void PybindMelComputations(py::module &m) {  // NOLINT
														
 
															-  PybindMelBanksOptions(m);
														
 
															-}
														
 
															-
														
 
															-}  // namespace knf
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/mel-computations.h
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/mel-computations.h
@@ -1,30 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#ifndef KALDI_NATIVE_FBANK_PYTHON_CSRC_MEL_COMPUTATIONS_H_
														
 
															-#define KALDI_NATIVE_FBANK_PYTHON_CSRC_MEL_COMPUTATIONS_H_
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/kaldi-native-fbank.h"
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-void PybindMelComputations(py::module &m);  // NOLINT
														
 
															-
														
 
															-}  // namespace knf
														
 
															-
														
 
															-#endif  // KALDI_NATIVE_FBANK_PYTHON_CSRC_MEL_COMPUTATIONS_H_
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/online-feature.cc
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/online-feature.cc
@@ -1,68 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/online-feature.h"
														
 
															-
														
 
															-#include <string>
														
 
															-#include <vector>
														
 
															-
														
 
															-#include "online-feature.h"
														
 
															-namespace knf {
														
 
															-
														
 
															-template <typename C>
														
 
															-void PybindOnlineFeatureTpl(py::module &m,  // NOLINT
														
 
															-                            const std::string &class_name,
														
 
															-                            const std::string &class_help_doc = "") {
														
 
															-  using PyClass = OnlineGenericBaseFeature<C>;
														
 
															-  using Options = typename C::Options;
														
 
															-  py::class_<PyClass>(m, class_name.c_str(), class_help_doc.c_str())
														
 
															-      .def(py::init<const Options &>(), py::arg("opts"))
														
 
															-      .def_property_readonly("dim", &PyClass::Dim)
														
 
															-      .def_property_readonly("frame_shift_in_seconds",
														
 
															-                             &PyClass::FrameShiftInSeconds)
														
 
															-      .def_property_readonly("num_frames_ready", &PyClass::NumFramesReady)
														
 
															-      .def("is_last_frame", &PyClass::IsLastFrame, py::arg("frame"))
														
 
															-      .def(
														
 
															-          "get_frame",
														
 
															-          [](py::object obj, int32_t frame) {
														
 
															-            auto *self = obj.cast<PyClass *>();
														
 
															-            const float *f = self->GetFrame(frame);
														
 
															-            return py::array_t<float>({self->Dim()},    // shape
														
 
															-                                      {sizeof(float)},  // stride in bytes
														
 
															-                                      f,                // ptr
														
 
															-                                      obj);  // it will increase the reference
														
 
															-                                             // count of **this** vector
														
 
															-          },
														
 
															-          py::arg("frame"))
														
 
															-      .def(
														
 
															-          "accept_waveform",
														
 
															-          [](PyClass &self, float sampling_rate,
														
 
															-             const std::vector<float> &waveform) {
														
 
															-            self.AcceptWaveform(sampling_rate, waveform.data(),
														
 
															-                                waveform.size());
														
 
															-          },
														
 
															-          py::arg("sampling_rate"), py::arg("waveform"),
														
 
															-          py::call_guard<py::gil_scoped_release>())
														
 
															-      .def("input_finished", &PyClass::InputFinished);
														
 
															-}
														
 
															-
														
 
															-void PybindOnlineFeature(py::module &m) {  // NOLINT
														
 
															-  PybindOnlineFeatureTpl<FbankComputer>(m, "OnlineFbank");
														
 
															-}
														
 
															-
														
 
															-}  // namespace knf
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/online-feature.h
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/online-feature.h
@@ -1,30 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#ifndef KALDI_NATIVE_FBANK_PYTHON_CSRC_ONLINE_FEATURE_H_
														
 
															-#define KALDI_NATIVE_FBANK_PYTHON_CSRC_ONLINE_FEATURE_H_
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/kaldi-native-fbank.h"
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-void PybindOnlineFeature(py::module &m);  // NOLINT
														
 
															-
														
 
															-}  // namespace knf
														
 
															-
														
 
															-#endif  // KALDI_NATIVE_FBANK_PYTHON_CSRC_ONLINE_FEATURE_H_
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/utils.cc
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/utils.cc
@@ -1,134 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#include "kaldi-native-fbank/python/csrc/utils.h"
														
 
															-
														
 
															-#include <string>
														
 
															-
														
 
															-#include "feature-window.h"
														
 
															-
														
 
															-#define FROM_DICT(type, key)         \
														
 
															-  if (dict.contains(#key)) {         \
														
 
															-    opts.key = py::type(dict[#key]); \
														
 
															-  }
														
 
															-
														
 
															-#define AS_DICT(key) dict[#key] = opts.key
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-FrameExtractionOptions FrameExtractionOptionsFromDict(py::dict dict) {
														
 
															-  FrameExtractionOptions opts;
														
 
															-
														
 
															-  FROM_DICT(float_, samp_freq);
														
 
															-  FROM_DICT(float_, frame_shift_ms);
														
 
															-  FROM_DICT(float_, frame_length_ms);
														
 
															-  FROM_DICT(float_, dither);
														
 
															-  FROM_DICT(float_, preemph_coeff);
														
 
															-  FROM_DICT(bool_, remove_dc_offset);
														
 
															-  FROM_DICT(str, window_type);
														
 
															-  FROM_DICT(bool_, round_to_power_of_two);
														
 
															-  FROM_DICT(float_, blackman_coeff);
														
 
															-  FROM_DICT(bool_, snip_edges);
														
 
															-
														
 
															-  return opts;
														
 
															-}
														
 
															-
														
 
															-py::dict AsDict(const FrameExtractionOptions &opts) {
														
 
															-  py::dict dict;
														
 
															-
														
 
															-  AS_DICT(samp_freq);
														
 
															-  AS_DICT(frame_shift_ms);
														
 
															-  AS_DICT(frame_length_ms);
														
 
															-  AS_DICT(dither);
														
 
															-  AS_DICT(preemph_coeff);
														
 
															-  AS_DICT(remove_dc_offset);
														
 
															-  AS_DICT(window_type);
														
 
															-  AS_DICT(round_to_power_of_two);
														
 
															-  AS_DICT(blackman_coeff);
														
 
															-  AS_DICT(snip_edges);
														
 
															-
														
 
															-  return dict;
														
 
															-}
														
 
															-
														
 
															-MelBanksOptions MelBanksOptionsFromDict(py::dict dict) {
														
 
															-  MelBanksOptions opts;
														
 
															-
														
 
															-  FROM_DICT(int_, num_bins);
														
 
															-  FROM_DICT(float_, low_freq);
														
 
															-  FROM_DICT(float_, high_freq);
														
 
															-  FROM_DICT(float_, vtln_low);
														
 
															-  FROM_DICT(float_, vtln_high);
														
 
															-  FROM_DICT(bool_, debug_mel);
														
 
															-  FROM_DICT(bool_, htk_mode);
														
 
															-
														
 
															-  return opts;
														
 
															-}
														
 
															-py::dict AsDict(const MelBanksOptions &opts) {
														
 
															-  py::dict dict;
														
 
															-
														
 
															-  AS_DICT(num_bins);
														
 
															-  AS_DICT(low_freq);
														
 
															-  AS_DICT(high_freq);
														
 
															-  AS_DICT(vtln_low);
														
 
															-  AS_DICT(vtln_high);
														
 
															-  AS_DICT(debug_mel);
														
 
															-  AS_DICT(htk_mode);
														
 
															-
														
 
															-  return dict;
														
 
															-}
														
 
															-
														
 
															-FbankOptions FbankOptionsFromDict(py::dict dict) {
														
 
															-  FbankOptions opts;
														
 
															-
														
 
															-  if (dict.contains("frame_opts")) {
														
 
															-    opts.frame_opts = FrameExtractionOptionsFromDict(dict["frame_opts"]);
														
 
															-  }
														
 
															-
														
 
															-  if (dict.contains("mel_opts")) {
														
 
															-    opts.mel_opts = MelBanksOptionsFromDict(dict["mel_opts"]);
														
 
															-  }
														
 
															-
														
 
															-  FROM_DICT(bool_, use_energy);
														
 
															-  FROM_DICT(float_, energy_floor);
														
 
															-  FROM_DICT(bool_, raw_energy);
														
 
															-  FROM_DICT(bool_, htk_compat);
														
 
															-  FROM_DICT(bool_, use_log_fbank);
														
 
															-  FROM_DICT(bool_, use_power);
														
 
															-
														
 
															-  return opts;
														
 
															-}
														
 
															-
														
 
															-py::dict AsDict(const FbankOptions &opts) {
														
 
															-  py::dict dict;
														
 
															-
														
 
															-  dict["frame_opts"] = AsDict(opts.frame_opts);
														
 
															-  dict["mel_opts"] = AsDict(opts.mel_opts);
														
 
															-  AS_DICT(use_energy);
														
 
															-  AS_DICT(energy_floor);
														
 
															-  AS_DICT(raw_energy);
														
 
															-  AS_DICT(htk_compat);
														
 
															-  AS_DICT(use_log_fbank);
														
 
															-  AS_DICT(use_power);
														
 
															-
														
 
															-  return dict;
														
 
															-}
														
 
															-
														
 
															-#undef FROM_DICT
														
 
															-#undef AS_DICT
														
 
															-
														
 
															-}  // namespace knf
														
--- a/ggml/examples/kaldi-native-fbank/python/csrc/utils.h
+++ b/ggml/examples/kaldi-native-fbank/python/csrc/utils.h
@@ -1,52 +0,0 @@
 
															-/**
														
 
															- * Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															- *
														
 
															- * See LICENSE for clarification regarding multiple authors
														
 
															- *
														
 
															- * Licensed under the Apache License, Version 2.0 (the "License");
														
 
															- * you may not use this file except in compliance with the License.
														
 
															- * You may obtain a copy of the License at
														
 
															- *
														
 
															- *     http://www.apache.org/licenses/LICENSE-2.0
														
 
															- *
														
 
															- * Unless required by applicable law or agreed to in writing, software
														
 
															- * distributed under the License is distributed on an "AS IS" BASIS,
														
 
															- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															- * See the License for the specific language governing permissions and
														
 
															- * limitations under the License.
														
 
															- */
														
 
															-
														
 
															-#ifndef KALDI_NATIVE_FBANK_PYTHON_CSRC_UTILS_H_
														
 
															-#define KALDI_NATIVE_FBANK_PYTHON_CSRC_UTILS_H_
														
 
															-
														
 
															-#include "feature-fbank.h"
														
 
															-#include "feature-window.h"
														
 
															-#include "mel-computations.h"
														
 
															-#include "kaldi-native-fbank/python/csrc/kaldi-native-fbank.h"
														
 
															-
														
 
															-/*
														
 
															- * This file contains code about `from_dict` and
														
 
															- * `as_dict` for various options in kaldi-native-fbank.
														
 
															- *
														
 
															- * Regarding `from_dict`, users don't need to provide
														
 
															- * all the fields in the options. If some fields
														
 
															- * are not provided, it just uses the default one.
														
 
															- *
														
 
															- * If the provided dict in `from_dict` is empty,
														
 
															- * all fields use their default values.
														
 
															- */
														
 
															-
														
 
															-namespace knf {
														
 
															-
														
 
															-FrameExtractionOptions FrameExtractionOptionsFromDict(py::dict dict);
														
 
															-py::dict AsDict(const FrameExtractionOptions &opts);
														
 
															-
														
 
															-MelBanksOptions MelBanksOptionsFromDict(py::dict dict);
														
 
															-py::dict AsDict(const MelBanksOptions &opts);
														
 
															-
														
 
															-FbankOptions FbankOptionsFromDict(py::dict dict);
														
 
															-py::dict AsDict(const FbankOptions &opts);
														
 
															-
														
 
															-}  // namespace knf
														
 
															-
														
 
															-#endif  // KALDI_NATIVE_FBANK_PYTHON_CSRC_UTILS_H_
														
--- a/ggml/examples/kaldi-native-fbank/python/kaldi_native_fbank/__init__.py
+++ b/ggml/examples/kaldi-native-fbank/python/kaldi_native_fbank/__init__.py
@@ -1,6 +0,0 @@
 
															-from _kaldi_native_fbank import (
														
 
															-    FrameExtractionOptions,
														
 
															-    MelBanksOptions,
														
 
															-    OnlineFbank,
														
 
															-    FbankOptions,
														
 
															-)
														
--- a/ggml/examples/kaldi-native-fbank/python/tests/CMakeLists.txt
+++ b/ggml/examples/kaldi-native-fbank/python/tests/CMakeLists.txt
@@ -1,31 +0,0 @@
 
															-function(kaldi_native_fbank_add_py_test source)
														
 
															-  get_filename_component(name ${source} NAME_WE)
														
 
															-  set(name "${name}_py")
														
 
															-
														
 
															-    message(STATUS "source: ${source}")
														
 
															-
														
 
															-  add_test(NAME ${name}
														
 
															-    COMMAND
														
 
															-      "${PYTHON_EXECUTABLE}"
														
 
															-      "${CMAKE_CURRENT_SOURCE_DIR}/${source}"
														
 
															-  )
														
 
															-
														
 
															-  get_filename_component(kaldi_native_fbank_path ${CMAKE_CURRENT_LIST_DIR} DIRECTORY)
														
 
															-
														
 
															-  set_property(TEST ${name}
														
 
															-    PROPERTY ENVIRONMENT "PYTHONPATH=${kaldi_native_fbank_path}:$<TARGET_FILE_DIR:_kaldi_native_fbank>:$ENV{PYTHONPATH}"
														
 
															-  )
														
 
															-endfunction()
														
 
															-
														
 
															-# please sort the files in alphabetic order
														
 
															-set(py_test_files
														
 
															-  test_frame_extraction_options.py
														
 
															-  test_mel_bank_options.py
														
 
															-  test_fbank_options.py
														
 
															-)
														
 
															-
														
 
															-if(KALDI_NATIVE_FBANK_BUILD_TESTS)
														
 
															-  foreach(source IN LISTS py_test_files)
														
 
															-    kaldi_native_fbank_add_py_test(${source})
														
 
															-  endforeach()
														
 
															-endif()
														
--- a/ggml/examples/kaldi-native-fbank/python/tests/test_fbank_options.py
+++ b/ggml/examples/kaldi-native-fbank/python/tests/test_fbank_options.py
@@ -1,198 +0,0 @@
 
															-#!/usr/bin/env python3
														
 
															-#
														
 
															-# Copyright (c)  2021  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															-
														
 
															-
														
 
															-import pickle
														
 
															-
														
 
															-import kaldi_native_fbank as knf
														
 
															-
														
 
															-
														
 
															-def test_default():
														
 
															-    opts = knf.FbankOptions()
														
 
															-    assert opts.frame_opts.samp_freq == 16000
														
 
															-    assert opts.frame_opts.frame_shift_ms == 10.0
														
 
															-    assert opts.frame_opts.frame_length_ms == 25.0
														
 
															-    assert opts.frame_opts.dither == 1.0
														
 
															-    assert abs(opts.frame_opts.preemph_coeff - 0.97) < 1e-6
														
 
															-    assert opts.frame_opts.remove_dc_offset is True
														
 
															-    assert opts.frame_opts.window_type == "povey"
														
 
															-    assert opts.frame_opts.round_to_power_of_two is True
														
 
															-    assert abs(opts.frame_opts.blackman_coeff - 0.42) < 1e-6
														
 
															-    assert opts.frame_opts.snip_edges is True
														
 
															-
														
 
															-    assert opts.mel_opts.num_bins == 23
														
 
															-    assert opts.mel_opts.low_freq == 20
														
 
															-    assert opts.mel_opts.high_freq == 0
														
 
															-    assert opts.mel_opts.vtln_low == 100
														
 
															-    assert opts.mel_opts.vtln_high == -500
														
 
															-    assert opts.mel_opts.debug_mel is False
														
 
															-    assert opts.mel_opts.htk_mode is False
														
 
															-
														
 
															-    assert opts.use_energy is False
														
 
															-    assert opts.energy_floor == 0.0
														
 
															-    assert opts.raw_energy is True
														
 
															-    assert opts.htk_compat is False
														
 
															-    assert opts.use_log_fbank is True
														
 
															-    assert opts.use_power is True
														
 
															-
														
 
															-
														
 
															-def test_set_get():
														
 
															-    opts = knf.FbankOptions()
														
 
															-    opts.use_energy = True
														
 
															-    assert opts.use_energy is True
														
 
															-
														
 
															-    opts.energy_floor = 1
														
 
															-    assert opts.energy_floor == 1
														
 
															-
														
 
															-    opts.raw_energy = False
														
 
															-    assert opts.raw_energy is False
														
 
															-
														
 
															-    opts.htk_compat = True
														
 
															-    assert opts.htk_compat is True
														
 
															-
														
 
															-    opts.use_log_fbank = False
														
 
															-    assert opts.use_log_fbank is False
														
 
															-
														
 
															-    opts.use_power = False
														
 
															-    assert opts.use_power is False
														
 
															-
														
 
															-
														
 
															-def test_set_get_frame_opts():
														
 
															-    opts = knf.FbankOptions()
														
 
															-
														
 
															-    opts.frame_opts.samp_freq = 44100
														
 
															-    assert opts.frame_opts.samp_freq == 44100
														
 
															-
														
 
															-    opts.frame_opts.frame_shift_ms = 20.5
														
 
															-    assert opts.frame_opts.frame_shift_ms == 20.5
														
 
															-
														
 
															-    opts.frame_opts.frame_length_ms = 1
														
 
															-    assert opts.frame_opts.frame_length_ms == 1
														
 
															-
														
 
															-    opts.frame_opts.dither = 0.5
														
 
															-    assert opts.frame_opts.dither == 0.5
														
 
															-
														
 
															-    opts.frame_opts.preemph_coeff = 0.25
														
 
															-    assert opts.frame_opts.preemph_coeff == 0.25
														
 
															-
														
 
															-    opts.frame_opts.remove_dc_offset = False
														
 
															-    assert opts.frame_opts.remove_dc_offset is False
														
 
															-
														
 
															-    opts.frame_opts.window_type = "hanning"
														
 
															-    assert opts.frame_opts.window_type == "hanning"
														
 
															-
														
 
															-    opts.frame_opts.round_to_power_of_two = False
														
 
															-    assert opts.frame_opts.round_to_power_of_two is False
														
 
															-
														
 
															-    opts.frame_opts.blackman_coeff = 0.25
														
 
															-    assert opts.frame_opts.blackman_coeff == 0.25
														
 
															-
														
 
															-    opts.frame_opts.snip_edges = False
														
 
															-    assert opts.frame_opts.snip_edges is False
														
 
															-
														
 
															-
														
 
															-def test_set_get_mel_opts():
														
 
															-    opts = knf.FbankOptions()
														
 
															-
														
 
															-    opts.mel_opts.num_bins = 100
														
 
															-    assert opts.mel_opts.num_bins == 100
														
 
															-
														
 
															-    opts.mel_opts.low_freq = 22
														
 
															-    assert opts.mel_opts.low_freq == 22
														
 
															-
														
 
															-    opts.mel_opts.high_freq = 1
														
 
															-    assert opts.mel_opts.high_freq == 1
														
 
															-
														
 
															-    opts.mel_opts.vtln_low = 101
														
 
															-    assert opts.mel_opts.vtln_low == 101
														
 
															-
														
 
															-    opts.mel_opts.vtln_high = -100
														
 
															-    assert opts.mel_opts.vtln_high == -100
														
 
															-
														
 
															-    opts.mel_opts.debug_mel = True
														
 
															-    assert opts.mel_opts.debug_mel is True
														
 
															-
														
 
															-    opts.mel_opts.htk_mode = True
														
 
															-    assert opts.mel_opts.htk_mode is True
														
 
															-
														
 
															-
														
 
															-def test_from_empty_dict():
														
 
															-    opts = knf.FbankOptions.from_dict({})
														
 
															-    opts2 = knf.FbankOptions()
														
 
															-
														
 
															-    assert str(opts) == str(opts2)
														
 
															-
														
 
															-
														
 
															-def test_from_dict_partial():
														
 
															-    d = {
														
 
															-        "energy_floor": 10.5,
														
 
															-        "htk_compat": True,
														
 
															-        "mel_opts": {"num_bins": 80, "vtln_low": 1},
														
 
															-        "frame_opts": {"window_type": "hanning"},
														
 
															-    }
														
 
															-    opts = knf.FbankOptions.from_dict(d)
														
 
															-    assert opts.energy_floor == 10.5
														
 
															-    assert opts.htk_compat is True
														
 
															-    assert opts.mel_opts.num_bins == 80
														
 
															-    assert opts.mel_opts.vtln_low == 1
														
 
															-    assert opts.frame_opts.window_type == "hanning"
														
 
															-
														
 
															-    mel_opts = knf.MelBanksOptions.from_dict(d["mel_opts"])
														
 
															-    assert str(opts.mel_opts) == str(mel_opts)
														
 
															-
														
 
															-
														
 
															-def test_from_dict_full_and_as_dict():
														
 
															-    opts = knf.FbankOptions()
														
 
															-    opts.htk_compat = True
														
 
															-    opts.mel_opts.num_bins = 80
														
 
															-    opts.frame_opts.samp_freq = 10
														
 
															-
														
 
															-    d = opts.as_dict()
														
 
															-    assert d["htk_compat"] is True
														
 
															-    assert d["mel_opts"]["num_bins"] == 80
														
 
															-    assert d["frame_opts"]["samp_freq"] == 10
														
 
															-
														
 
															-    mel_opts = knf.MelBanksOptions()
														
 
															-    mel_opts.num_bins = 80
														
 
															-    assert d["mel_opts"] == mel_opts.as_dict()
														
 
															-
														
 
															-    frame_opts = knf.FrameExtractionOptions()
														
 
															-    frame_opts.samp_freq = 10
														
 
															-    assert d["frame_opts"] == frame_opts.as_dict()
														
 
															-
														
 
															-    opts2 = knf.FbankOptions.from_dict(d)
														
 
															-    assert str(opts2) == str(opts)
														
 
															-
														
 
															-    d["htk_compat"] = False
														
 
															-    opts3 = knf.FbankOptions.from_dict(d)
														
 
															-    assert opts3.htk_compat is False
														
 
															-
														
 
															-
														
 
															-def test_pickle():
														
 
															-    opts = knf.FbankOptions()
														
 
															-    opts.use_energy = True
														
 
															-    opts.use_power = False
														
 
															-
														
 
															-    opts.frame_opts.samp_freq = 44100
														
 
															-    opts.mel_opts.num_bins = 100
														
 
															-
														
 
															-    data = pickle.dumps(opts)
														
 
															-
														
 
															-    opts2 = pickle.loads(data)
														
 
															-    assert str(opts) == str(opts2)
														
 
															-
														
 
															-
														
 
															-def main():
														
 
															-    test_default()
														
 
															-    test_set_get()
														
 
															-    test_set_get_frame_opts()
														
 
															-    test_set_get_mel_opts()
														
 
															-    test_from_empty_dict()
														
 
															-    test_from_dict_partial()
														
 
															-    test_from_dict_full_and_as_dict()
														
 
															-    test_pickle()
														
 
															-
														
 
															-
														
 
															-if __name__ == "__main__":
														
 
															-    main()
														
--- a/ggml/examples/kaldi-native-fbank/python/tests/test_frame_extraction_options.py
+++ b/ggml/examples/kaldi-native-fbank/python/tests/test_frame_extraction_options.py
@@ -1,119 +0,0 @@
 
															-#!/usr/bin/env python3
														
 
															-#
														
 
															-# Copyright (c)  2022  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															-
														
 
															-import pickle
														
 
															-
														
 
															-import kaldi_native_fbank as knf
														
 
															-
														
 
															-
														
 
															-def test_default():
														
 
															-    opts = knf.FrameExtractionOptions()
														
 
															-    assert opts.samp_freq == 16000
														
 
															-    assert opts.frame_shift_ms == 10.0
														
 
															-    assert opts.frame_length_ms == 25.0
														
 
															-    assert opts.dither == 1.0
														
 
															-    assert abs(opts.preemph_coeff - 0.97) < 1e-6
														
 
															-    assert opts.remove_dc_offset is True
														
 
															-    assert opts.window_type == "povey"
														
 
															-    assert opts.round_to_power_of_two is True
														
 
															-    assert abs(opts.blackman_coeff - 0.42) < 1e-6
														
 
															-    assert opts.snip_edges is True
														
 
															-
														
 
															-
														
 
															-def test_set_get():
														
 
															-    opts = knf.FrameExtractionOptions()
														
 
															-    opts.samp_freq = 44100
														
 
															-    assert opts.samp_freq == 44100
														
 
															-
														
 
															-    opts.frame_shift_ms = 20.5
														
 
															-    assert opts.frame_shift_ms == 20.5
														
 
															-
														
 
															-    opts.frame_length_ms = 1
														
 
															-    assert opts.frame_length_ms == 1
														
 
															-
														
 
															-    opts.dither = 0.5
														
 
															-    assert opts.dither == 0.5
														
 
															-
														
 
															-    opts.preemph_coeff = 0.25
														
 
															-    assert opts.preemph_coeff == 0.25
														
 
															-
														
 
															-    opts.remove_dc_offset = False
														
 
															-    assert opts.remove_dc_offset is False
														
 
															-
														
 
															-    opts.window_type = "hanning"
														
 
															-    assert opts.window_type == "hanning"
														
 
															-
														
 
															-    opts.round_to_power_of_two = False
														
 
															-    assert opts.round_to_power_of_two is False
														
 
															-
														
 
															-    opts.blackman_coeff = 0.25
														
 
															-    assert opts.blackman_coeff == 0.25
														
 
															-
														
 
															-    opts.snip_edges = False
														
 
															-    assert opts.snip_edges is False
														
 
															-
														
 
															-
														
 
															-def test_from_empty_dict():
														
 
															-    opts = knf.FrameExtractionOptions.from_dict({})
														
 
															-    opts2 = knf.FrameExtractionOptions()
														
 
															-
														
 
															-    assert str(opts) == str(opts2)
														
 
															-
														
 
															-
														
 
															-def test_from_dict_partial():
														
 
															-    d = {"samp_freq": 10, "frame_shift_ms": 2}
														
 
															-
														
 
															-    opts = knf.FrameExtractionOptions.from_dict(d)
														
 
															-
														
 
															-    opts2 = knf.FrameExtractionOptions()
														
 
															-    assert str(opts) != str(opts2)
														
 
															-
														
 
															-    opts2.samp_freq = 10
														
 
															-    assert str(opts) != str(opts2)
														
 
															-
														
 
															-    opts2.frame_shift_ms = 2
														
 
															-    assert str(opts) == str(opts2)
														
 
															-
														
 
															-    opts2.frame_shift_ms = 3
														
 
															-    assert str(opts) != str(opts2)
														
 
															-
														
 
															-
														
 
															-def test_from_dict_full_and_as_dict():
														
 
															-    opts = knf.FrameExtractionOptions()
														
 
															-    opts.samp_freq = 20
														
 
															-    opts.frame_length_ms = 100
														
 
															-
														
 
															-    d = opts.as_dict()
														
 
															-    for key, value in d.items():
														
 
															-        assert value == getattr(opts, key)
														
 
															-
														
 
															-    opts2 = knf.FrameExtractionOptions.from_dict(d)
														
 
															-    assert str(opts2) == str(opts)
														
 
															-
														
 
															-    d["window_type"] = "hanning"
														
 
															-    opts3 = knf.FrameExtractionOptions.from_dict(d)
														
 
															-    assert opts3.window_type == "hanning"
														
 
															-
														
 
															-
														
 
															-def test_pickle():
														
 
															-    opts = knf.FrameExtractionOptions()
														
 
															-    opts.samp_freq = 44100
														
 
															-    opts.dither = 5.5
														
 
															-    data = pickle.dumps(opts)
														
 
															-
														
 
															-    opts2 = pickle.loads(data)
														
 
															-    assert str(opts) == str(opts2)
														
 
															-
														
 
															-
														
 
															-def main():
														
 
															-    test_default()
														
 
															-    test_set_get()
														
 
															-    test_from_empty_dict()
														
 
															-    test_from_dict_partial()
														
 
															-    test_from_dict_full_and_as_dict()
														
 
															-    test_pickle()
														
 
															-
														
 
															-
														
 
															-if __name__ == "__main__":
														
 
															-    main()
														
--- a/ggml/examples/kaldi-native-fbank/python/tests/test_mel_bank_options.py
+++ b/ggml/examples/kaldi-native-fbank/python/tests/test_mel_bank_options.py
@@ -1,107 +0,0 @@
 
															-#!/usr/bin/env python3
														
 
															-#
														
 
															-# Copyright (c)  2021  Xiaomi Corporation (authors: Fangjun Kuang)
														
 
															-
														
 
															-import pickle
														
 
															-
														
 
															-import kaldi_native_fbank as knf
														
 
															-
														
 
															-
														
 
															-def test_default():
														
 
															-    opts = knf.MelBanksOptions()
														
 
															-    assert opts.num_bins == 25
														
 
															-    assert opts.low_freq == 20
														
 
															-    assert opts.high_freq == 0
														
 
															-    assert opts.vtln_low == 100
														
 
															-    assert opts.vtln_high == -500
														
 
															-    assert opts.debug_mel is False
														
 
															-    assert opts.htk_mode is False
														
 
															-
														
 
															-
														
 
															-def test_set_get():
														
 
															-    opts = knf.MelBanksOptions()
														
 
															-    opts.num_bins = 100
														
 
															-    assert opts.num_bins == 100
														
 
															-
														
 
															-    opts.low_freq = 22
														
 
															-    assert opts.low_freq == 22
														
 
															-
														
 
															-    opts.high_freq = 1
														
 
															-    assert opts.high_freq == 1
														
 
															-
														
 
															-    opts.vtln_low = 101
														
 
															-    assert opts.vtln_low == 101
														
 
															-
														
 
															-    opts.vtln_high = -100
														
 
															-    assert opts.vtln_high == -100
														
 
															-
														
 
															-    opts.debug_mel = True
														
 
															-    assert opts.debug_mel is True
														
 
															-
														
 
															-    opts.htk_mode = True
														
 
															-    assert opts.htk_mode is True
														
 
															-
														
 
															-
														
 
															-def test_from_empty_dict():
														
 
															-    opts = knf.MelBanksOptions.from_dict({})
														
 
															-    opts2 = knf.MelBanksOptions()
														
 
															-
														
 
															-    assert str(opts) == str(opts2)
														
 
															-
														
 
															-
														
 
															-def test_from_dict_partial():
														
 
															-    d = {"num_bins": 10, "debug_mel": True}
														
 
															-
														
 
															-    opts = knf.MelBanksOptions.from_dict(d)
														
 
															-
														
 
															-    opts2 = knf.MelBanksOptions()
														
 
															-    assert str(opts) != str(opts2)
														
 
															-
														
 
															-    opts2.num_bins = 10
														
 
															-    assert str(opts) != str(opts2)
														
 
															-
														
 
															-    opts2.debug_mel = True
														
 
															-    assert str(opts) == str(opts2)
														
 
															-
														
 
															-    opts2.debug_mel = False
														
 
															-    assert str(opts) != str(opts2)
														
 
															-
														
 
															-
														
 
															-def test_from_dict_full_and_as_dict():
														
 
															-    opts = knf.MelBanksOptions()
														
 
															-    opts.num_bins = 80
														
 
															-    opts.vtln_high = 2
														
 
															-
														
 
															-    d = opts.as_dict()
														
 
															-    for key, value in d.items():
														
 
															-        assert value == getattr(opts, key)
														
 
															-
														
 
															-    opts2 = knf.MelBanksOptions.from_dict(d)
														
 
															-    assert str(opts2) == str(opts)
														
 
															-
														
 
															-    d["htk_mode"] = True
														
 
															-    opts3 = knf.MelBanksOptions.from_dict(d)
														
 
															-    assert opts3.htk_mode is True
														
 
															-
														
 
															-
														
 
															-def test_pickle():
														
 
															-    opts = knf.MelBanksOptions()
														
 
															-    opts.num_bins = 100
														
 
															-    opts.low_freq = 22
														
 
															-    data = pickle.dumps(opts)
														
 
															-
														
 
															-    opts2 = pickle.loads(data)
														
 
															-    assert str(opts) == str(opts2)
														
 
															-
														
 
															-
														
 
															-def main():
														
 
															-    test_default()
														
 
															-    test_set_get()
														
 
															-    test_from_empty_dict()
														
 
															-    test_from_dict_partial()
														
 
															-    test_from_dict_full_and_as_dict()
														
 
															-    test_pickle()
														
 
															-
														
 
															-
														
 
															-if __name__ == "__main__":
														
 
															-    main()
														
--- a/ggml/examples/kaldi-native-fbank/python/tests/test_online_fbank.py
+++ b/ggml/examples/kaldi-native-fbank/python/tests/test_online_fbank.py
@@ -1,48 +0,0 @@
 
															-#!/usr/bin/env python3
														
 
															-
														
 
															-import sys
														
 
															-
														
 
															-try:
														
 
															-    import kaldifeat
														
 
															-except:
														
 
															-    print("Please install kaldifeat first")
														
 
															-    sys.exit(0)
														
 
															-
														
 
															-import kaldi_native_fbank as knf
														
 
															-import torch
														
 
															-
														
 
															-
														
 
															-def main():
														
 
															-    sampling_rate = 16000
														
 
															-    samples = torch.randn(16000 * 10)
														
 
															-
														
 
															-    opts = kaldifeat.FbankOptions()
														
 
															-    opts.frame_opts.dither = 0
														
 
															-    opts.mel_opts.num_bins = 80
														
 
															-    opts.frame_opts.snip_edges = False
														
 
															-    opts.mel_opts.debug_mel = False
														
 
															-
														
 
															-    online_fbank = kaldifeat.OnlineFbank(opts)
														
 
															-
														
 
															-    online_fbank.accept_waveform(sampling_rate, samples)
														
 
															-
														
 
															-    opts = knf.FbankOptions()
														
 
															-    opts.frame_opts.dither = 0
														
 
															-    opts.mel_opts.num_bins = 80
														
 
															-    opts.frame_opts.snip_edges = False
														
 
															-    opts.mel_opts.debug_mel = False
														
 
															-
														
 
															-    fbank = knf.OnlineFbank(opts)
														
 
															-    fbank.accept_waveform(sampling_rate, samples.tolist())
														
 
															-
														
 
															-    assert online_fbank.num_frames_ready == fbank.num_frames_ready
														
 
															-    for i in range(fbank.num_frames_ready):
														
 
															-        f1 = online_fbank.get_frame(i)
														
 
															-        f2 = torch.from_numpy(fbank.get_frame(i))
														
 
															-        assert torch.allclose(f1, f2, atol=1e-3), (i, (f1 - f2).abs().max())
														
 
															-
														
 
															-
														
 
															-if __name__ == "__main__":
														
 
															-    torch.manual_seed(20220825)
														
 
															-    main()
														
 
															-    print("success")
														
--- a/ggml/test_data/test.wav
+++ b/ggml/test_data/test.wav
--- a/ggml/test_unity_cpp.py
+++ b/ggml/test_unity_cpp.py
@@ -1,20 +1,23 @@
 
															+# Copyright (c) Meta Platforms, Inc. and affiliates
														
 
															+# All rights reserved.
														
 
															+#
														
 
															+# This source code is licensed under the license found in the
														
 
															+# LICENSE file in the root directory of this source tree.
														
 
															+
														
 
															 import ctypes
														
 
															 import functools
														
 
															-import logging
														
 
															-import sys
														
 
															 from ctypes import c_void_p
														
 
															 from pathlib import Path
														
 
															 from typing import Any, Iterator, List, Tuple
														
 
															 import fairseq2.nn
														
 
															 import fairseq2.nn.transformer
														
 
															-from fairseq2.nn.padding import PaddingMask
														
 
															 import numpy as np
														
 
															 import pytest
														
 
															 import torch
														
 
															 import torchaudio
														
 
															 from fairseq2.data.audio import WaveformToFbankConverter
														
 
															-from fairseq2.generation import SequenceGeneratorOptions
														
 
															+from seamless_communication.inference import SequenceGeneratorOptions
														
 
															 from fairseq2.models.wav2vec2.feature_extractor import Wav2Vec2FbankFeatureExtractor
														
 
															 from seamless_communication.inference.translator import Modality, Translator
														
@@ -22,6 +25,7 @@ import ggml
 
															 from ctypes_utils import NULLPTR, Ptr
														
 
															 from ggml import NativeObj
														
 
															 from ggml_convert import convert_model, read_layer_config
														
 
															+import requests
														
 
															 Ctx = ggml.ggml_context_p
														
@@ -32,11 +36,10 @@ FAIRSEQ2_CPP = Path(__file__).parent / "examples/unity/fairseq2.cpp"
 
															 UNITY_FLASH_ATTN = "\n# define UNITY_FLASH_ATTN 0\n" not in FAIRSEQ2_CPP.read_text()
														
 
															 DATA = Path(__file__).parent / "test_data"
														
 
															-DATA_DEV = DATA / "dev"
														
 
															-if not DATA_DEV.exists():
														
 
															-    DATA_DEV = Path(
														
 
															-        "/private/home/dnn/internal_sc/seamless_communication/ggml/examples/unity/dev"
														
 
															-    )
														
 
															+LOCAL_AUDIO_SAMPLE_PATH = DATA / "LJ037-0171_sr16k.wav"
														
 
															+TEST_AUDIO_SAMPLE_URL = (
														
 
															+    "https://dl.fbaipublicfiles.com/seamless/tests/LJ037-0171_sr16k.wav"
														
 
															+)
														
 
															 @pytest.fixture(name="ctx")
														
@@ -74,6 +77,14 @@ def load_pt_model() -> Any:
 
															     return load_translator().model
														
 
															+def download_sample_audio() -> Any:
														
 
															+    response = requests.get(TEST_AUDIO_SAMPLE_URL, stream=True)
														
 
															+    with open(DATA / "LJ037-0171_sr16k.wav", "wb") as file:
														
 
															+        for chunk in response.iter_content(chunk_size=1024):
														
 
															+            if chunk:
														
 
															+                file.write(chunk)
														
 
															+
														
 
															+
														
 
															 def test_convert_linear(tmp_path: Path) -> None:
														
 
															     module = fairseq2.nn.Linear(16, 24, True)
														
@@ -352,9 +363,6 @@ def test_StandardTransformerEncoderLayer_forward(ctx: Ctx, g_model: c_void_p) ->
 
															     gx = ggml.from_numpy(ctx, x)
														
 
															     ggml.ggml_set_name(gx, b"x")
														
 
															-    padding_mask = fairseq2.nn.padding.PaddingMask(torch.tensor([21, 21]), 21)
														
 
															-    gpad = ggml.from_numpy(ctx, padding_mask.materialize())
														
 
															-    ggml.ggml_set_name(gpad, b"padding_mask")
														
 
															     gy = ggml.forward(
														
 
															         "StandardTransformerEncoderLayer",
														
 
															         g_model,
														
@@ -376,17 +384,11 @@ def test_StandardTransformerEncoderLayer_forward(ctx: Ctx, g_model: c_void_p) ->
 
															 def test_StandardConformerEncoderLayer_forward(ctx: Ctx, g_model: c_void_p) -> None:
														
 
															     pt_model = load_pt_model()
														
 
															-    if not DATA_DEV.exists():
														
 
															-        pytest.skip(reason=f"Folder {DATA_DEV} not found !")
														
 
															-
														
 
															-    x = torch.load(DATA_DEV / "seqs_before_conformer_block.pt")
														
 
															-    padding_mask = PaddingMask(torch.ones(1, x.shape[1]), x.shape[1])
														
 
															+    x = torch.rand(1, 137, 1024)
														
 
															     layer = pt_model.speech_encoder.inner.layers[0]
														
 
															     gx = ggml.from_numpy(ctx, x[0])
														
 
															     ggml.ggml_set_name(gx, b"x")
														
 
															-    gpad = ggml.from_numpy(ctx, padding_mask[0])
														
 
															-    ggml.ggml_set_name(gpad, b"padding_mask")
														
 
															     gy = ggml.forward(
														
 
															         "StandardConformerEncoderLayer",
														
 
															         g_model,
														
@@ -399,8 +401,8 @@ def test_StandardConformerEncoderLayer_forward(ctx: Ctx, g_model: c_void_p) -> N
 
															     y = ggml.to_numpy(gy)
														
 
															-    y_exp, _ = layer(x, padding_mask)
														
 
															-    y_exp = y_exp.numpy()
														
 
															+    y_exp, _ = layer(x, padding_mask=None)
														
 
															+    y_exp = y_exp.squeeze(0).numpy()
														
 
															     assert y.shape == y_exp.shape
														
 
															     assert np.allclose(y_exp, y, atol=2e-3)
														
@@ -409,10 +411,8 @@ def test_StandardConformerEncoderAdaptorLayer_forward(
 
															     ctx: Ctx, g_model: c_void_p
														
 
															 ) -> None:
														
 
															     pt_model = load_pt_model()
														
 
															-    if not DATA_DEV.exists():
														
 
															-        pytest.skip(reason=f"Folder {DATA_DEV} not found !")
														
 
															-
														
 
															-    x = torch.load(DATA_DEV / "seqs_before_adaptor.pt")
														
 
															+    torch.random.manual_seed(0)
														
 
															+    x = torch.rand(1, 137, 1024)
														
 
															     layer = pt_model.speech_encoder.adaptor_layers[0]
														
 
															     gx = ggml.from_numpy(ctx, x[0])
														
 
															     ggml.ggml_set_name(gx, b"x")
														
@@ -467,7 +467,9 @@ def test_StandardTransformerEncoder_forward(ctx: Ctx, g_model: c_void_p) -> None
 
															 def test_StandardConformerEncoder_forward(ctx: Ctx, g_model: c_void_p) -> None:
														
 
															     pt_model = load_pt_model()
														
 
															-    wav, _ = torchaudio.load(DATA / "test.wav")
														
 
															+    if not LOCAL_AUDIO_SAMPLE_PATH.exists():
														
 
															+        download_sample_audio()
														
 
															+    wav, _ = torchaudio.load(LOCAL_AUDIO_SAMPLE_PATH)
														
 
															     gx = ggml.from_numpy(ctx, wav * 2**15)  # Apply scale before sending into ggml!
														
 
															     ggml.ggml_set_name(gx, b"x")
														
 
															     gy = ggml.forward(
														
@@ -508,13 +510,10 @@ def test_StandardConformerEncoder_forward(ctx: Ctx, g_model: c_void_p) -> None:
 
															         y_exp = np.load(cache)
														
 
															     assert y.shape == y_exp.shape
														
 
															-    assert np.allclose(
														
 
															-        y_exp, y, atol=1e-2
														
 
															-    )  # There are 10 elements in a 137*1024 tensor with error >1e-2
														
 
															+    assert np.allclose(y_exp, y, atol=1e-2)
														
 
															 def test_WaveformToFbank_forward(ctx: Ctx, g_model: c_void_p) -> None:
														
 
															-    pt_model = load_pt_model()
														
 
															     converter = WaveformToFbankConverter(
														
 
															         num_mel_bins=80,
														
 
															         waveform_scale=2**15,
														
@@ -522,7 +521,9 @@ def test_WaveformToFbank_forward(ctx: Ctx, g_model: c_void_p) -> None:
 
															         standardize=True,
														
 
															     )
														
 
															     extractor = Wav2Vec2FbankFeatureExtractor(80, stride=2, sample_every_k=1)
														
 
															-    wav, _ = torchaudio.load(DATA / "LJ037-0171_sr16k_test.wav")
														
 
															+    if not LOCAL_AUDIO_SAMPLE_PATH.exists():
														
 
															+        download_sample_audio()
														
 
															+    wav, _ = torchaudio.load(LOCAL_AUDIO_SAMPLE_PATH)
														
 
															     gx = ggml.from_numpy(ctx, wav * 2**15)  # Apply scale before sending into ggml!
														
 
															     ggml.ggml_set_name(gx, b"x")
														
@@ -642,117 +643,13 @@ def test_StandardTransformerDecoder_forward(ctx: Ctx, g_model: c_void_p) -> None
 
															     assert np.allclose(y_exp, y, atol=1e-4 if UNITY_FLASH_ATTN else 1e-3)
														
 
															-def test_tokenizer(ctx: Ctx) -> None:
														
 
															-    tokenizer = unity.load_unity_text_tokenizer("seamlessM4T_medium")
														
 
															-    enc = tokenizer.create_encoder(task="translation", lang="eng", mode="source")
														
 
															-
														
 
															-    spm_path = DATA / "seamlessM4T_medium.spm.ggml"
														
 
															-    # if not spm_path.exists():
														
 
															-    if True:
														
 
															-        vocab = ggml_convert.read_vocab(tokenizer)
														
 
															-        ggml_convert.write_ggml_file(spm_path, {"spm_vocab_only": True}, {}, vocab, {})
														
 
															-
														
 
															-    g_model = ggml.load_fairseq2_ggml_file(spm_path)
														
 
															-    ggml.lib.fairseq2_model_set_inference_ctx(g_model.ptr, ctx)
														
 
															-
														
 
															-    expected = enc("We are all in a yellow submarine.").tolist()[1:]
														
 
															-    tokens = ggml.ggml_new_tensor_1d(ctx, ggml.GGML_TYPE_I32, 256)
														
 
															-    ggml.fairseq2_spm_tokenize(
														
 
															-        g_model.ptr, b"We are all in a yellow submarine.", tokens
														
 
															-    )
														
 
															-    res = ggml.to_numpy(tokens).tolist()
														
 
															-    assert expected == res
														
 
															-
														
 
															-    out = ctypes.create_string_buffer(144)
														
 
															-    ggml.fairseq2_spm_detokenize(g_model.ptr, tokens, out)
														
 
															-    assert ctypes.string_at(out) == b"We are all in a yellow submarine."
														
 
															-
														
 
															-
														
 
															-def test_t2tt(ctx: Ctx, g_model: c_void_p) -> None:
														
 
															-    src_lang = "eng"
														
 
															-    src_text = "We are all in a yellow submarine."
														
 
															-    tgt_lang = "fra"
														
 
															-    sample_file = DATA / "sample_input.npz"
														
 
															-    beam_size = 2
														
 
															-
														
 
															-    if not sample_file.exists():
														
 
															-        translator = load_translator()
														
 
															-        device = translator.device
														
 
															-        token_encoder = translator.text_tokenizer.create_encoder(
														
 
															-            task="translation", lang=src_lang, mode="source", device=device
														
 
															-        )
														
 
															-        src = translator.collate(token_encoder(src_text))
														
 
															-
														
 
															-        text_out, _ = translator.get_prediction(
														
 
															-            translator.model,
														
 
															-            translator.text_tokenizer,
														
 
															-            translator.unit_tokenizer,
														
 
															-            src["seqs"],
														
 
															-            None,
														
 
															-            input_modality=Modality.TEXT,
														
 
															-            output_modality=Modality.TEXT,
														
 
															-            tgt_lang=tgt_lang,
														
 
															-            text_generation_opts=SequenceGeneratorOptions(beam_size=beam_size),
														
 
															-            unit_generation_opts=None,
														
 
															-        )
														
 
															-
														
 
															-        tgt_text = str(text_out.sentences[0])
														
 
															-        assert tgt_text == "Nous sommes tous dans un sous-marin jaune."
														
 
															-        hypotheses = [
														
 
															-            {
														
 
															-                "seq": h.seq.tolist(),
														
 
															-                "score": h.score.item(),
														
 
															-                "step_scores": h.step_scores.numpy(),
														
 
															-            }
														
 
															-            for h in text_out.generator_output.results[0]
														
 
															-        ]
														
 
															-        np.savez(
														
 
															-            sample_file,
														
 
															-            encoder_output=text_out.encoder_output.numpy(),
														
 
															-            hypotheses=hypotheses,
														
 
															-        )
														
 
															-
														
 
															-    # allow_pickle to load the hyp dicts
														
 
															-    text_out = np.load(sample_file, allow_pickle=True)
														
 
															-    encoder_out = ggml.from_numpy(ctx, text_out["encoder_output"])
														
 
															-    prefix_seq = np.array(text_out["hypotheses"][0]["seq"][:2]).astype(np.int32)
														
 
															-    max_seq_len = max(len(h["seq"]) for h in text_out["hypotheses"])
														
 
															-
														
 
															-    opts = ggml.SequenceGeneratorOptions(
														
 
															-        beam_size=beam_size,
														
 
															-        min_seq_len=1,
														
 
															-        soft_max_seq_len_a=1,
														
 
															-        soft_max_seq_len_b=200,
														
 
															-        hard_max_seq_len=int(max_seq_len * 1.5),
														
 
															-        len_penalty=1.0,
														
 
															-        unk_penalty=0.0,
														
 
															-        normalize_scores=True,
														
 
															-    )
														
 
															-    job = ggml.SequenceGeneratorJob(
														
 
															-        opts=opts,
														
 
															-        prefix_seq=ggml.from_numpy(ctx, prefix_seq),
														
 
															-        pad_idx=0,
														
 
															-        unk_idx=1,
														
 
															-        bos_idx=2,
														
 
															-        eos_idx=3,
														
 
															-        num_threads=16,
														
 
															-    )
														
 
															-
														
 
															-    result_ptr = ggml.generate_sequence(g_model, job, encoder_out, NULLPTR, ctx)
														
 
															-    results = [result_ptr[i] for i in range(beam_size) if result_ptr[i].seq != None]
														
 
															-
														
 
															-    # The step score error is big, this may negatively impact the beam search.
														
 
															-    assert_hypotheses(
														
 
															-        text_out["hypotheses"], results, score_rtol=1e-2, step_scores_rtol=0.1
														
 
															-    )
														
 
															-
														
 
															-
														
 
															 def test_s2tt(ctx: Ctx, g_model: c_void_p):
														
 
															-    src_audio_wav, _ = torchaudio.load(DATA / "test.wav")
														
 
															-    sample_file = DATA / "test.wav.npz"
														
 
															+    if not LOCAL_AUDIO_SAMPLE_PATH.exists():
														
 
															+        download_sample_audio()
														
 
															+    src_audio_wav, _ = torchaudio.load(LOCAL_AUDIO_SAMPLE_PATH)
														
 
															+    sample_file = DATA / "LJ037-0171_sr16k.wav.trans"
														
 
															+    translator = load_translator()
														
 
															     if not sample_file.exists():
														
 
															-        translator = load_translator()
														
 
															-        token_encoder = translator.text_tokenizer.create_encoder(task="translation")
														
 
															         decoded_audio = {
														
 
															             "waveform": src_audio_wav.t(),
														
 
															             "sample_rate": 16000.0,
														
@@ -773,27 +670,13 @@ def test_s2tt(ctx: Ctx, g_model: c_void_p):
 
															             unit_generation_opts=None,
														
 
															         )
														
 
															-        tgt_text = str(text_out.sentences[0])
														
 
															-        assert tgt_text == "大家好 , 世界无主题。"
														
 
															-        hypotheses = [
														
 
															-            {
														
 
															-                "seq": h.seq.tolist(),
														
 
															-                "score": h.score.item(),
														
 
															-                "step_scores": h.step_scores.numpy(),
														
 
															-            }
														
 
															-            for h in text_out.generator_output.results[0]
														
 
															-        ]
														
 
															-        np.savez(
														
 
															-            sample_file,
														
 
															-            encoder_output=text_out.encoder_output.numpy(),
														
 
															-            hypotheses=hypotheses,
														
 
															-        )
														
 
															+        tgt_text = str(text_out[0])
														
 
															+        assert tgt_text == "专家的检查和证据使该委员会得出了结论,可能有五次枪击."
														
 
															+        with open(sample_file, "w") as f:
														
 
															+            f.write(tgt_text)
														
 
															-    exp = np.load(sample_file, allow_pickle=True)
														
 
															-    encoder_out = ggml.from_numpy(ctx, exp["encoder_output"])
														
 
															-    tgt_tokens = exp["hypotheses"][0]["seq"]
														
 
															-    max_seq_len = max(len(h["seq"]) for h in exp["hypotheses"])
														
 
															-    max_seq_len = int(max_seq_len * 1.5)
														
 
															+    with open(sample_file, "r") as exp:
														
 
															+        exp_tgt_text = exp.readlines()[0].strip()
														
 
															     # Apply scale before sending into ggml!
														
 
															     gx = ggml.from_numpy(ctx, src_audio_wav * 2**15)
														
@@ -813,7 +696,7 @@ def test_s2tt(ctx: Ctx, g_model: c_void_p):
 
															         beam_size=beam_size,
														
 
															         soft_max_seq_len_a=1,
														
 
															         soft_max_seq_len_b=200,
														
 
															-        hard_max_seq_len=max_seq_len,
														
 
															+        hard_max_seq_len=500,
														
 
															     )
														
 
															     job = ggml.SequenceGeneratorJob(
														
 
															         opts=opts,
														
@@ -825,20 +708,9 @@ def test_s2tt(ctx: Ctx, g_model: c_void_p):
 
															     )
														
 
															     result_ptr = ggml.generate_sequence(g_model, Ptr(job), encoder_out, NULLPTR, ctx)
														
 
															     results = [result_ptr[i] for i in range(beam_size) if result_ptr[i].seq != None]
														
 
															-    assert_hypotheses(exp["hypotheses"], results, score_rtol=1e-2, step_scores_rtol=0.1)
														
 
															-
														
 
															-
														
 
															-def assert_hypotheses(
														
 
															-    expected: List[Any],
														
 
															-    results: List[Any],
														
 
															-    *,
														
 
															-    score_rtol: float,
														
 
															-    step_scores_rtol: float,
														
 
															-) -> None:
														
 
															-    assert len(results) == len(expected)
														
 
															-    for g_hyp, exp in zip(results, expected):
														
 
															-        g_tokens = list(ggml.to_numpy(g_hyp.seq))
														
 
															-        g_step_scores = ggml.to_numpy(g_hyp.step_scores)
														
 
															-        assert g_tokens == exp["seq"]
														
 
															-        assert g_hyp.score == pytest.approx(exp["score"], rel=score_rtol)
														
 
															-        assert np.allclose(g_step_scores, exp["step_scores"], rtol=step_scores_rtol)
														
 
															+    tokens = [
														
 
															+        translator.text_tokenizer.model.index_to_token(id)
														
 
															+        for id in ggml.to_numpy(results[0].seq).tolist()
														
 
															+    ][2:-1]
														
 
															+    tokens = "".join(tokens).replace("▁", " ")[1:]
														
 
															+    assert tokens == exp_tgt_text
	`@@ -1,2 +0,0 @@`
	`-add_subdirectory(csrc)`
	`-add_subdirectory(tests)`