mirror of
https://github.com/HumanAIGC/lite-avatar.git
synced 2026-02-05 18:09:20 +08:00
add files
This commit is contained in:
115
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/CMakeLists.txt
vendored
Normal file
115
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/CMakeLists.txt
vendored
Normal file
@@ -0,0 +1,115 @@
|
||||
if("x${CMAKE_SOURCE_DIR}" STREQUAL "x${CMAKE_BINARY_DIR}")
|
||||
message(FATAL_ERROR "\
|
||||
In-source build is not a good practice.
|
||||
Please use:
|
||||
mkdir build
|
||||
cd build
|
||||
cmake ..
|
||||
to build this project"
|
||||
)
|
||||
endif()
|
||||
|
||||
if(CMAKE_TOOLCHAIN_FILE)
|
||||
set(_BUILD_PYTHON OFF)
|
||||
set(_BUILD_TESTS OFF)
|
||||
else()
|
||||
set(_BUILD_PYTHON ON)
|
||||
set(_BUILD_TESTS ON)
|
||||
endif()
|
||||
|
||||
if(POLICY CMP0057)
|
||||
cmake_policy(SET CMP0057 NEW)
|
||||
endif()
|
||||
|
||||
cmake_minimum_required(VERSION 3.3 FATAL_ERROR)
|
||||
|
||||
project(kaldi-native-fbank CXX C)
|
||||
|
||||
set(KALDI_NATIVE_FBANK_VERSION "1.13")
|
||||
|
||||
if(NOT CMAKE_BUILD_TYPE)
|
||||
set(CMAKE_BUILD_TYPE Release)
|
||||
endif()
|
||||
|
||||
message(STATUS "CMAKE_BUILD_TYPE: ${CMAKE_BUILD_TYPE}")
|
||||
|
||||
set(CMAKE_ARCHIVE_OUTPUT_DIRECTORY "${CMAKE_BINARY_DIR}/lib")
|
||||
set(CMAKE_LIBRARY_OUTPUT_DIRECTORY "${CMAKE_BINARY_DIR}/lib")
|
||||
set(CMAKE_RUNTIME_OUTPUT_DIRECTORY "${CMAKE_BINARY_DIR}/bin")
|
||||
|
||||
set(CMAKE_SKIP_BUILD_RPATH FALSE)
|
||||
set(BUILD_RPATH_USE_ORIGIN TRUE)
|
||||
set(CMAKE_INSTALL_RPATH_USE_LINK_PATH TRUE)
|
||||
|
||||
if(NOT APPLE)
|
||||
set(kaldi_native_fbank_rpath_origin "$ORIGIN")
|
||||
else()
|
||||
set(kaldi_native_fbank_rpath_origin "@loader_path")
|
||||
endif()
|
||||
|
||||
set(CMAKE_INSTALL_RPATH ${kaldi_native_fbank_rpath_origin})
|
||||
set(CMAKE_BUILD_RPATH ${kaldi_native_fbank_rpath_origin})
|
||||
|
||||
set(CMAKE_CXX_STANDARD 14 CACHE STRING "The C++ version to be used.")
|
||||
|
||||
if(NOT DEFINED BUILD_SHARED_LIBS)
|
||||
set(BUILD_SHARED_LIBS ON)
|
||||
endif()
|
||||
message(STATUS "BUILD_SHARED_LIBS: ${BUILD_SHARED_LIBS}")
|
||||
|
||||
option(KALDI_NATIVE_FBANK_BUILD_TESTS "Whether to build tests or not" ${_BUILD_TESTS})
|
||||
option(KALDI_NATIVE_FBANK_BUILD_PYTHON "Whether to build Python extension" ${_BUILD_PYTHON})
|
||||
option(KALDI_NATIVE_FBANK_ENABLE_CHECK "Whether to build with log" OFF)
|
||||
|
||||
message(STATUS "KALDI_NATIVE_FBANK_BUILD_TESTS: ${KALDI_NATIVE_FBANK_BUILD_TESTS}")
|
||||
message(STATUS "KALDI_NATIVE_FBANK_BUILD_PYTHON: ${KALDI_NATIVE_FBANK_BUILD_PYTHON}")
|
||||
message(STATUS "KALDI_NATIVE_FBANK_ENABLE_CHECK: ${KALDI_NATIVE_FBANK_ENABLE_CHECK}")
|
||||
|
||||
list(APPEND CMAKE_MODULE_PATH ${CMAKE_SOURCE_DIR}/cmake/Modules)
|
||||
list(APPEND CMAKE_MODULE_PATH ${CMAKE_SOURCE_DIR}/cmake)
|
||||
|
||||
message(STATUS "KALDI_NATIVE_FBANK_ENABLE_CHECK: ${KALDI_NATIVE_FBANK_ENABLE_CHECK}")
|
||||
|
||||
if(WIN32)
|
||||
add_definitions(-DNOMINMAX) # Otherwise, std::max() and std::min() won't work
|
||||
endif()
|
||||
|
||||
if(KALDI_NATIVE_FBANK_BUILD_PYTHON)
|
||||
include(pybind11)
|
||||
endif()
|
||||
|
||||
if(KALDI_NATIVE_FBANK_BUILD_TESTS)
|
||||
enable_testing()
|
||||
include(googletest)
|
||||
endif()
|
||||
|
||||
if(NOT CMAKE_INSTALL_PREFIX)
|
||||
set(CMAKE_INSTALL_PREFIX "${CMAKE_BINARY_DIR}/install")
|
||||
endif()
|
||||
|
||||
message(STATUS "CMAKE_CXX_FLAGS: ${CMAKE_CXX_FLAGS}")
|
||||
message(STATUS "CMAKE_INSTALL_PREFIX: ${CMAKE_INSTALL_PREFIX}")
|
||||
|
||||
include(CheckIncludeFileCXX)
|
||||
check_include_file_cxx(cxxabi.h KNF_HAVE_CXXABI_H)
|
||||
check_include_file_cxx(execinfo.h KNF_HAVE_EXECINFO_H)
|
||||
|
||||
include_directories(${CMAKE_SOURCE_DIR})
|
||||
|
||||
if(WIN32 AND MSVC)
|
||||
# disable various warnings for MSVC
|
||||
# 4244: '=': conversion from 'double' to 'float', possible loss of data
|
||||
# 4267: 'return': conversion from 'size_t' to 'int32_t', possible loss of data
|
||||
# 4624: destructor was implicitly defined as deleted because a base class destructor is inaccessible or deleted
|
||||
set(disabled_warnings
|
||||
/wd4244
|
||||
/wd4267
|
||||
/wd4624
|
||||
)
|
||||
message(STATUS "Disabled warnings: ${disabled_warnings}")
|
||||
foreach(w IN LISTS disabled_warnings)
|
||||
string(APPEND CMAKE_CXX_FLAGS " ${w} ")
|
||||
endforeach()
|
||||
endif()
|
||||
|
||||
add_subdirectory(kaldi-native-fbank)
|
||||
916
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/Modules/FetchContent.cmake
vendored
Normal file
916
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/Modules/FetchContent.cmake
vendored
Normal file
@@ -0,0 +1,916 @@
|
||||
# Distributed under the OSI-approved BSD 3-Clause License. See accompanying
|
||||
# file Copyright.txt or https://cmake.org/licensing for details.
|
||||
|
||||
#[=======================================================================[.rst:
|
||||
FetchContent
|
||||
------------------
|
||||
|
||||
.. only:: html
|
||||
|
||||
.. contents::
|
||||
|
||||
Overview
|
||||
^^^^^^^^
|
||||
|
||||
This module enables populating content at configure time via any method
|
||||
supported by the :module:`ExternalProject` module. Whereas
|
||||
:command:`ExternalProject_Add` downloads at build time, the
|
||||
``FetchContent`` module makes content available immediately, allowing the
|
||||
configure step to use the content in commands like :command:`add_subdirectory`,
|
||||
:command:`include` or :command:`file` operations.
|
||||
|
||||
Content population details would normally be defined separately from the
|
||||
command that performs the actual population. Projects should also
|
||||
check whether the content has already been populated somewhere else in the
|
||||
project hierarchy. Typical usage would look something like this:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
FetchContent_Declare(
|
||||
googletest
|
||||
GIT_REPOSITORY https://github.com/google/googletest.git
|
||||
GIT_TAG release-1.8.0
|
||||
)
|
||||
|
||||
FetchContent_GetProperties(googletest)
|
||||
if(NOT googletest_POPULATED)
|
||||
FetchContent_Populate(googletest)
|
||||
add_subdirectory(${googletest_SOURCE_DIR} ${googletest_BINARY_DIR})
|
||||
endif()
|
||||
|
||||
When using the above pattern with a hierarchical project arrangement,
|
||||
projects at higher levels in the hierarchy are able to define or override
|
||||
the population details of content specified anywhere lower in the project
|
||||
hierarchy. The ability to detect whether content has already been
|
||||
populated ensures that even if multiple child projects want certain content
|
||||
to be available, the first one to populate it wins. The other child project
|
||||
can simply make use of the already available content instead of repeating
|
||||
the population for itself. See the
|
||||
:ref:`Examples <fetch-content-examples>` section which demonstrates
|
||||
this scenario.
|
||||
|
||||
The ``FetchContent`` module also supports defining and populating
|
||||
content in a single call, with no check for whether the content has been
|
||||
populated elsewhere in the project already. This is a more low level
|
||||
operation and would not normally be the way the module is used, but it is
|
||||
sometimes useful as part of implementing some higher level feature or to
|
||||
populate some content in CMake's script mode.
|
||||
|
||||
|
||||
Declaring Content Details
|
||||
^^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
||||
.. command:: FetchContent_Declare
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
FetchContent_Declare(<name> <contentOptions>...)
|
||||
|
||||
The ``FetchContent_Declare()`` function records the options that describe
|
||||
how to populate the specified content, but if such details have already
|
||||
been recorded earlier in this project (regardless of where in the project
|
||||
hierarchy), this and all later calls for the same content ``<name>`` are
|
||||
ignored. This "first to record, wins" approach is what allows hierarchical
|
||||
projects to have parent projects override content details of child projects.
|
||||
|
||||
The content ``<name>`` can be any string without spaces, but good practice
|
||||
would be to use only letters, numbers and underscores. The name will be
|
||||
treated case-insensitively and it should be obvious for the content it
|
||||
represents, often being the name of the child project or the value given
|
||||
to its top level :command:`project` command (if it is a CMake project).
|
||||
For well-known public projects, the name should generally be the official
|
||||
name of the project. Choosing an unusual name makes it unlikely that other
|
||||
projects needing that same content will use the same name, leading to
|
||||
the content being populated multiple times.
|
||||
|
||||
The ``<contentOptions>`` can be any of the download or update/patch options
|
||||
that the :command:`ExternalProject_Add` command understands. The configure,
|
||||
build, install and test steps are explicitly disabled and therefore options
|
||||
related to them will be ignored. In most cases, ``<contentOptions>`` will
|
||||
just be a couple of options defining the download method and method-specific
|
||||
details like a commit tag or archive hash. For example:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
FetchContent_Declare(
|
||||
googletest
|
||||
GIT_REPOSITORY https://github.com/google/googletest.git
|
||||
GIT_TAG release-1.8.0
|
||||
)
|
||||
|
||||
FetchContent_Declare(
|
||||
myCompanyIcons
|
||||
URL https://intranet.mycompany.com/assets/iconset_1.12.tar.gz
|
||||
URL_HASH 5588a7b18261c20068beabfb4f530b87
|
||||
)
|
||||
|
||||
FetchContent_Declare(
|
||||
myCompanyCertificates
|
||||
SVN_REPOSITORY svn+ssh://svn.mycompany.com/srv/svn/trunk/certs
|
||||
SVN_REVISION -r12345
|
||||
)
|
||||
|
||||
Populating The Content
|
||||
^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
||||
.. command:: FetchContent_Populate
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
FetchContent_Populate( <name> )
|
||||
|
||||
In most cases, the only argument given to ``FetchContent_Populate()`` is the
|
||||
``<name>``. When used this way, the command assumes the content details have
|
||||
been recorded by an earlier call to :command:`FetchContent_Declare`. The
|
||||
details are stored in a global property, so they are unaffected by things
|
||||
like variable or directory scope. Therefore, it doesn't matter where in the
|
||||
project the details were previously declared, as long as they have been
|
||||
declared before the call to ``FetchContent_Populate()``. Those saved details
|
||||
are then used to construct a call to :command:`ExternalProject_Add` in a
|
||||
private sub-build to perform the content population immediately. The
|
||||
implementation of ``ExternalProject_Add()`` ensures that if the content has
|
||||
already been populated in a previous CMake run, that content will be reused
|
||||
rather than repopulating them again. For the common case where population
|
||||
involves downloading content, the cost of the download is only paid once.
|
||||
|
||||
An internal global property records when a particular content population
|
||||
request has been processed. If ``FetchContent_Populate()`` is called more
|
||||
than once for the same content name within a configure run, the second call
|
||||
will halt with an error. Projects can and should check whether content
|
||||
population has already been processed with the
|
||||
:command:`FetchContent_GetProperties` command before calling
|
||||
``FetchContent_Populate()``.
|
||||
|
||||
``FetchContent_Populate()`` will set three variables in the scope of the
|
||||
caller; ``<lcName>_POPULATED``, ``<lcName>_SOURCE_DIR`` and
|
||||
``<lcName>_BINARY_DIR``, where ``<lcName>`` is the lowercased ``<name>``.
|
||||
``<lcName>_POPULATED`` will always be set to ``True`` by the call.
|
||||
``<lcName>_SOURCE_DIR`` is the location where the
|
||||
content can be found upon return (it will have already been populated), while
|
||||
``<lcName>_BINARY_DIR`` is a directory intended for use as a corresponding
|
||||
build directory. The main use case for the two directory variables is to
|
||||
call :command:`add_subdirectory` immediately after population, i.e.:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
FetchContent_Populate(FooBar ...)
|
||||
add_subdirectory(${foobar_SOURCE_DIR} ${foobar_BINARY_DIR})
|
||||
|
||||
The values of the three variables can also be retrieved from anywhere in the
|
||||
project hierarchy using the :command:`FetchContent_GetProperties` command.
|
||||
|
||||
A number of cache variables influence the behavior of all content population
|
||||
performed using details saved from a :command:`FetchContent_Declare` call:
|
||||
|
||||
``FETCHCONTENT_BASE_DIR``
|
||||
In most cases, the saved details do not specify any options relating to the
|
||||
directories to use for the internal sub-build, final source and build areas.
|
||||
It is generally best to leave these decisions up to the ``FetchContent``
|
||||
module to handle on the project's behalf. The ``FETCHCONTENT_BASE_DIR``
|
||||
cache variable controls the point under which all content population
|
||||
directories are collected, but in most cases developers would not need to
|
||||
change this. The default location is ``${CMAKE_BINARY_DIR}/_deps``, but if
|
||||
developers change this value, they should aim to keep the path short and
|
||||
just below the top level of the build tree to avoid running into path
|
||||
length problems on Windows.
|
||||
|
||||
``FETCHCONTENT_QUIET``
|
||||
The logging output during population can be quite verbose, making the
|
||||
configure stage quite noisy. This cache option (``ON`` by default) hides
|
||||
all population output unless an error is encountered. If experiencing
|
||||
problems with hung downloads, temporarily switching this option off may
|
||||
help diagnose which content population is causing the issue.
|
||||
|
||||
``FETCHCONTENT_FULLY_DISCONNECTED``
|
||||
When this option is enabled, no attempt is made to download or update
|
||||
any content. It is assumed that all content has already been populated in
|
||||
a previous run or the source directories have been pointed at existing
|
||||
contents the developer has provided manually (using options described
|
||||
further below). When the developer knows that no changes have been made to
|
||||
any content details, turning this option ``ON`` can significantly speed up
|
||||
the configure stage. It is ``OFF`` by default.
|
||||
|
||||
``FETCHCONTENT_UPDATES_DISCONNECTED``
|
||||
This is a less severe download/update control compared to
|
||||
``FETCHCONTENT_FULLY_DISCONNECTED``. Instead of bypassing all download and
|
||||
update logic, the ``FETCHCONTENT_UPDATES_DISCONNECTED`` only disables the
|
||||
update stage. Therefore, if content has not been downloaded previously,
|
||||
it will still be downloaded when this option is enabled. This can speed up
|
||||
the configure stage, but not as much as
|
||||
``FETCHCONTENT_FULLY_DISCONNECTED``. It is ``OFF`` by default.
|
||||
|
||||
In addition to the above cache variables, the following cache variables are
|
||||
also defined for each content name (``<ucName>`` is the uppercased value of
|
||||
``<name>``):
|
||||
|
||||
``FETCHCONTENT_SOURCE_DIR_<ucName>``
|
||||
If this is set, no download or update steps are performed for the specified
|
||||
content and the ``<lcName>_SOURCE_DIR`` variable returned to the caller is
|
||||
pointed at this location. This gives developers a way to have a separate
|
||||
checkout of the content that they can modify freely without interference
|
||||
from the build. The build simply uses that existing source, but it still
|
||||
defines ``<lcName>_BINARY_DIR`` to point inside its own build area.
|
||||
Developers are strongly encouraged to use this mechanism rather than
|
||||
editing the sources populated in the default location, as changes to
|
||||
sources in the default location can be lost when content population details
|
||||
are changed by the project.
|
||||
|
||||
``FETCHCONTENT_UPDATES_DISCONNECTED_<ucName>``
|
||||
This is the per-content equivalent of
|
||||
``FETCHCONTENT_UPDATES_DISCONNECTED``. If the global option or this option
|
||||
is ``ON``, then updates will be disabled for the named content.
|
||||
Disabling updates for individual content can be useful for content whose
|
||||
details rarely change, while still leaving other frequently changing
|
||||
content with updates enabled.
|
||||
|
||||
|
||||
The ``FetchContent_Populate()`` command also supports a syntax allowing the
|
||||
content details to be specified directly rather than using any saved
|
||||
details. This is more low-level and use of this form is generally to be
|
||||
avoided in favour of using saved content details as outlined above.
|
||||
Nevertheless, in certain situations it can be useful to invoke the content
|
||||
population as an isolated operation (typically as part of implementing some
|
||||
other higher level feature or when using CMake in script mode):
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
FetchContent_Populate( <name>
|
||||
[QUIET]
|
||||
[SUBBUILD_DIR <subBuildDir>]
|
||||
[SOURCE_DIR <srcDir>]
|
||||
[BINARY_DIR <binDir>]
|
||||
...
|
||||
)
|
||||
|
||||
This form has a number of key differences to that where only ``<name>`` is
|
||||
provided:
|
||||
|
||||
- All required population details are assumed to have been provided directly
|
||||
in the call to ``FetchContent_Populate()``. Any saved details for
|
||||
``<name>`` are ignored.
|
||||
- No check is made for whether content for ``<name>`` has already been
|
||||
populated.
|
||||
- No global property is set to record that the population has occurred.
|
||||
- No global properties record the source or binary directories used for the
|
||||
populated content.
|
||||
- The ``FETCHCONTENT_FULLY_DISCONNECTED`` and
|
||||
``FETCHCONTENT_UPDATES_DISCONNECTED`` cache variables are ignored.
|
||||
|
||||
The ``<lcName>_SOURCE_DIR`` and ``<lcName>_BINARY_DIR`` variables are still
|
||||
returned to the caller, but since these locations are not stored as global
|
||||
properties when this form is used, they are only available to the calling
|
||||
scope and below rather than the entire project hierarchy. No
|
||||
``<lcName>_POPULATED`` variable is set in the caller's scope with this form.
|
||||
|
||||
The supported options for ``FetchContent_Populate()`` are the same as those
|
||||
for :command:`FetchContent_Declare()`. Those few options shown just
|
||||
above are either specific to ``FetchContent_Populate()`` or their behavior is
|
||||
slightly modified from how :command:`ExternalProject_Add` treats them.
|
||||
|
||||
``QUIET``
|
||||
The ``QUIET`` option can be given to hide the output associated with
|
||||
populating the specified content. If the population fails, the output will
|
||||
be shown regardless of whether this option was given or not so that the
|
||||
cause of the failure can be diagnosed. The global ``FETCHCONTENT_QUIET``
|
||||
cache variable has no effect on ``FetchContent_Populate()`` calls where the
|
||||
content details are provided directly.
|
||||
|
||||
``SUBBUILD_DIR``
|
||||
The ``SUBBUILD_DIR`` argument can be provided to change the location of the
|
||||
sub-build created to perform the population. The default value is
|
||||
``${CMAKE_CURRENT_BINARY_DIR}/<lcName>-subbuild`` and it would be unusual
|
||||
to need to override this default. If a relative path is specified, it will
|
||||
be interpreted as relative to :variable:`CMAKE_CURRENT_BINARY_DIR`.
|
||||
|
||||
``SOURCE_DIR``, ``BINARY_DIR``
|
||||
The ``SOURCE_DIR`` and ``BINARY_DIR`` arguments are supported by
|
||||
:command:`ExternalProject_Add`, but different default values are used by
|
||||
``FetchContent_Populate()``. ``SOURCE_DIR`` defaults to
|
||||
``${CMAKE_CURRENT_BINARY_DIR}/<lcName>-src`` and ``BINARY_DIR`` defaults to
|
||||
``${CMAKE_CURRENT_BINARY_DIR}/<lcName>-build``. If a relative path is
|
||||
specified, it will be interpreted as relative to
|
||||
:variable:`CMAKE_CURRENT_BINARY_DIR`.
|
||||
|
||||
In addition to the above explicit options, any other unrecognized options are
|
||||
passed through unmodified to :command:`ExternalProject_Add` to perform the
|
||||
download, patch and update steps. The following options are explicitly
|
||||
prohibited (they are disabled by the ``FetchContent_Populate()`` command):
|
||||
|
||||
- ``CONFIGURE_COMMAND``
|
||||
- ``BUILD_COMMAND``
|
||||
- ``INSTALL_COMMAND``
|
||||
- ``TEST_COMMAND``
|
||||
|
||||
If using ``FetchContent_Populate()`` within CMake's script mode, be aware
|
||||
that the implementation sets up a sub-build which therefore requires a CMake
|
||||
generator and build tool to be available. If these cannot be found by
|
||||
default, then the :variable:`CMAKE_GENERATOR` and/or
|
||||
:variable:`CMAKE_MAKE_PROGRAM` variables will need to be set appropriately
|
||||
on the command line invoking the script.
|
||||
|
||||
|
||||
Retrieve Population Properties
|
||||
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
||||
.. command:: FetchContent_GetProperties
|
||||
|
||||
When using saved content details, a call to :command:`FetchContent_Populate`
|
||||
records information in global properties which can be queried at any time.
|
||||
This information includes the source and binary directories associated with
|
||||
the content and also whether or not the content population has been processed
|
||||
during the current configure run.
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
FetchContent_GetProperties( <name>
|
||||
[SOURCE_DIR <srcDirVar>]
|
||||
[BINARY_DIR <binDirVar>]
|
||||
[POPULATED <doneVar>]
|
||||
)
|
||||
|
||||
The ``SOURCE_DIR``, ``BINARY_DIR`` and ``POPULATED`` options can be used to
|
||||
specify which properties should be retrieved. Each option accepts a value
|
||||
which is the name of the variable in which to store that property. Most of
|
||||
the time though, only ``<name>`` is given, in which case the call will then
|
||||
set the same variables as a call to
|
||||
:command:`FetchContent_Populate(name) <FetchContent_Populate>`. This allows
|
||||
the following canonical pattern to be used, which ensures that the relevant
|
||||
variables will always be defined regardless of whether or not the population
|
||||
has been performed elsewhere in the project already:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
FetchContent_GetProperties(foobar)
|
||||
if(NOT foobar_POPULATED)
|
||||
FetchContent_Populate(foobar)
|
||||
|
||||
# Set any custom variables, etc. here, then
|
||||
# populate the content as part of this build
|
||||
|
||||
add_subdirectory(${foobar_SOURCE_DIR} ${foobar_BINARY_DIR})
|
||||
endif()
|
||||
|
||||
The above pattern allows other parts of the overall project hierarchy to
|
||||
re-use the same content and ensure that it is only populated once.
|
||||
|
||||
|
||||
.. _`fetch-content-examples`:
|
||||
|
||||
Examples
|
||||
^^^^^^^^
|
||||
|
||||
Consider a project hierarchy where ``projA`` is the top level project and it
|
||||
depends on projects ``projB`` and ``projC``. Both ``projB`` and ``projC``
|
||||
can be built standalone and they also both depend on another project
|
||||
``projD``. For simplicity, this example will assume that all four projects
|
||||
are available on a company git server. The ``CMakeLists.txt`` of each project
|
||||
might have sections like the following:
|
||||
|
||||
*projA*:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
include(FetchContent)
|
||||
FetchContent_Declare(
|
||||
projB
|
||||
GIT_REPOSITORY git@mycompany.com/git/projB.git
|
||||
GIT_TAG 4a89dc7e24ff212a7b5167bef7ab079d
|
||||
)
|
||||
FetchContent_Declare(
|
||||
projC
|
||||
GIT_REPOSITORY git@mycompany.com/git/projC.git
|
||||
GIT_TAG 4ad4016bd1d8d5412d135cf8ceea1bb9
|
||||
)
|
||||
FetchContent_Declare(
|
||||
projD
|
||||
GIT_REPOSITORY git@mycompany.com/git/projD.git
|
||||
GIT_TAG origin/integrationBranch
|
||||
)
|
||||
|
||||
FetchContent_GetProperties(projB)
|
||||
if(NOT projb_POPULATED)
|
||||
FetchContent_Populate(projB)
|
||||
add_subdirectory(${projb_SOURCE_DIR} ${projb_BINARY_DIR})
|
||||
endif()
|
||||
|
||||
FetchContent_GetProperties(projC)
|
||||
if(NOT projc_POPULATED)
|
||||
FetchContent_Populate(projC)
|
||||
add_subdirectory(${projc_SOURCE_DIR} ${projc_BINARY_DIR})
|
||||
endif()
|
||||
|
||||
*projB*:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
include(FetchContent)
|
||||
FetchContent_Declare(
|
||||
projD
|
||||
GIT_REPOSITORY git@mycompany.com/git/projD.git
|
||||
GIT_TAG 20b415f9034bbd2a2e8216e9a5c9e632
|
||||
)
|
||||
|
||||
FetchContent_GetProperties(projD)
|
||||
if(NOT projd_POPULATED)
|
||||
FetchContent_Populate(projD)
|
||||
add_subdirectory(${projd_SOURCE_DIR} ${projd_BINARY_DIR})
|
||||
endif()
|
||||
|
||||
|
||||
*projC*:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
include(FetchContent)
|
||||
FetchContent_Declare(
|
||||
projD
|
||||
GIT_REPOSITORY git@mycompany.com/git/projD.git
|
||||
GIT_TAG 7d9a17ad2c962aa13e2fbb8043fb6b8a
|
||||
)
|
||||
|
||||
FetchContent_GetProperties(projD)
|
||||
if(NOT projd_POPULATED)
|
||||
FetchContent_Populate(projD)
|
||||
add_subdirectory(${projd_SOURCE_DIR} ${projd_BINARY_DIR})
|
||||
endif()
|
||||
|
||||
A few key points should be noted in the above:
|
||||
|
||||
- ``projB`` and ``projC`` define different content details for ``projD``,
|
||||
but ``projA`` also defines a set of content details for ``projD`` and
|
||||
because ``projA`` will define them first, the details from ``projB`` and
|
||||
``projC`` will not be used. The override details defined by ``projA``
|
||||
are not required to match either of those from ``projB`` or ``projC``, but
|
||||
it is up to the higher level project to ensure that the details it does
|
||||
define still make sense for the child projects.
|
||||
- While ``projA`` defined content details for ``projD``, it did not need
|
||||
to explicitly call ``FetchContent_Populate(projD)`` itself. Instead, it
|
||||
leaves that to a child project to do (in this case it will be ``projB``
|
||||
since it is added to the build ahead of ``projC``). If ``projA`` needed to
|
||||
customize how the ``projD`` content was brought into the build as well
|
||||
(e.g. define some CMake variables before calling
|
||||
:command:`add_subdirectory` after populating), it would do the call to
|
||||
``FetchContent_Populate()``, etc. just as it did for the ``projB`` and
|
||||
``projC`` content. For higher level projects, it is usually enough to
|
||||
just define the override content details and leave the actual population
|
||||
to the child projects. This saves repeating the same thing at each level
|
||||
of the project hierarchy unnecessarily.
|
||||
- Even though ``projA`` is the top level project in this example, it still
|
||||
checks whether ``projB`` and ``projC`` have already been populated before
|
||||
going ahead to do those populations. This makes ``projA`` able to be more
|
||||
easily incorporated as a child of some other higher level project in the
|
||||
future if required. Always protect a call to
|
||||
:command:`FetchContent_Populate` with a check to
|
||||
:command:`FetchContent_GetProperties`, even in what may be considered a top
|
||||
level project at the time.
|
||||
|
||||
|
||||
The following example demonstrates how one might download and unpack a
|
||||
firmware tarball using CMake's :manual:`script mode <cmake(1)>`. The call to
|
||||
:command:`FetchContent_Populate` specifies all the content details and the
|
||||
unpacked firmware will be placed in a ``firmware`` directory below the
|
||||
current working directory.
|
||||
|
||||
*getFirmware.cmake*:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
# NOTE: Intended to be run in script mode with cmake -P
|
||||
include(FetchContent)
|
||||
FetchContent_Populate(
|
||||
firmware
|
||||
URL https://mycompany.com/assets/firmware-1.23-arm.tar.gz
|
||||
URL_HASH MD5=68247684da89b608d466253762b0ff11
|
||||
SOURCE_DIR firmware
|
||||
)
|
||||
|
||||
#]=======================================================================]
|
||||
|
||||
|
||||
set(__FetchContent_privateDir "${CMAKE_CURRENT_LIST_DIR}/FetchContent")
|
||||
|
||||
#=======================================================================
|
||||
# Recording and retrieving content details for later population
|
||||
#=======================================================================
|
||||
|
||||
# Internal use, projects must not call this directly. It is
|
||||
# intended for use by FetchContent_Declare() only.
|
||||
#
|
||||
# Sets a content-specific global property (not meant for use
|
||||
# outside of functions defined here in this file) which can later
|
||||
# be retrieved using __FetchContent_getSavedDetails() with just the
|
||||
# same content name. If there is already a value stored in the
|
||||
# property, it is left unchanged and this call has no effect.
|
||||
# This allows parent projects to define the content details,
|
||||
# overriding anything a child project may try to set (properties
|
||||
# are not cached between runs, so the first thing to set it in a
|
||||
# build will be in control).
|
||||
function(__FetchContent_declareDetails contentName)
|
||||
|
||||
string(TOLOWER ${contentName} contentNameLower)
|
||||
set(propertyName "_FetchContent_${contentNameLower}_savedDetails")
|
||||
get_property(alreadyDefined GLOBAL PROPERTY ${propertyName} DEFINED)
|
||||
if(NOT alreadyDefined)
|
||||
define_property(GLOBAL PROPERTY ${propertyName}
|
||||
BRIEF_DOCS "Internal implementation detail of FetchContent_Populate()"
|
||||
FULL_DOCS "Details used by FetchContent_Populate() for ${contentName}"
|
||||
)
|
||||
set_property(GLOBAL PROPERTY ${propertyName} ${ARGN})
|
||||
endif()
|
||||
|
||||
endfunction()
|
||||
|
||||
|
||||
# Internal use, projects must not call this directly. It is
|
||||
# intended for use by the FetchContent_Declare() function.
|
||||
#
|
||||
# Retrieves details saved for the specified content in an
|
||||
# earlier call to __FetchContent_declareDetails().
|
||||
function(__FetchContent_getSavedDetails contentName outVar)
|
||||
|
||||
string(TOLOWER ${contentName} contentNameLower)
|
||||
set(propertyName "_FetchContent_${contentNameLower}_savedDetails")
|
||||
get_property(alreadyDefined GLOBAL PROPERTY ${propertyName} DEFINED)
|
||||
if(NOT alreadyDefined)
|
||||
message(FATAL_ERROR "No content details recorded for ${contentName}")
|
||||
endif()
|
||||
get_property(propertyValue GLOBAL PROPERTY ${propertyName})
|
||||
set(${outVar} "${propertyValue}" PARENT_SCOPE)
|
||||
|
||||
endfunction()
|
||||
|
||||
|
||||
# Saves population details of the content, sets defaults for the
|
||||
# SOURCE_DIR and BUILD_DIR.
|
||||
function(FetchContent_Declare contentName)
|
||||
|
||||
set(options "")
|
||||
set(oneValueArgs SVN_REPOSITORY)
|
||||
set(multiValueArgs "")
|
||||
|
||||
cmake_parse_arguments(ARG "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})
|
||||
|
||||
unset(srcDirSuffix)
|
||||
unset(svnRepoArgs)
|
||||
if(ARG_SVN_REPOSITORY)
|
||||
# Add a hash of the svn repository URL to the source dir. This works
|
||||
# around the problem where if the URL changes, the download would
|
||||
# fail because it tries to checkout/update rather than switch the
|
||||
# old URL to the new one. We limit the hash to the first 7 characters
|
||||
# so that the source path doesn't get overly long (which can be a
|
||||
# problem on windows due to path length limits).
|
||||
string(SHA1 urlSHA ${ARG_SVN_REPOSITORY})
|
||||
string(SUBSTRING ${urlSHA} 0 7 urlSHA)
|
||||
set(srcDirSuffix "-${urlSHA}")
|
||||
set(svnRepoArgs SVN_REPOSITORY ${ARG_SVN_REPOSITORY})
|
||||
endif()
|
||||
|
||||
string(TOLOWER ${contentName} contentNameLower)
|
||||
__FetchContent_declareDetails(
|
||||
${contentNameLower}
|
||||
SOURCE_DIR "${FETCHCONTENT_BASE_DIR}/${contentNameLower}-src${srcDirSuffix}"
|
||||
BINARY_DIR "${FETCHCONTENT_BASE_DIR}/${contentNameLower}-build"
|
||||
${svnRepoArgs}
|
||||
# List these last so they can override things we set above
|
||||
${ARG_UNPARSED_ARGUMENTS}
|
||||
)
|
||||
|
||||
endfunction()
|
||||
|
||||
|
||||
#=======================================================================
|
||||
# Set/get whether the specified content has been populated yet.
|
||||
# The setter also records the source and binary dirs used.
|
||||
#=======================================================================
|
||||
|
||||
# Internal use, projects must not call this directly. It is
|
||||
# intended for use by the FetchContent_Populate() function to
|
||||
# record when FetchContent_Populate() is called for a particular
|
||||
# content name.
|
||||
function(__FetchContent_setPopulated contentName sourceDir binaryDir)
|
||||
|
||||
string(TOLOWER ${contentName} contentNameLower)
|
||||
set(prefix "_FetchContent_${contentNameLower}")
|
||||
|
||||
set(propertyName "${prefix}_sourceDir")
|
||||
define_property(GLOBAL PROPERTY ${propertyName}
|
||||
BRIEF_DOCS "Internal implementation detail of FetchContent_Populate()"
|
||||
FULL_DOCS "Details used by FetchContent_Populate() for ${contentName}"
|
||||
)
|
||||
set_property(GLOBAL PROPERTY ${propertyName} ${sourceDir})
|
||||
|
||||
set(propertyName "${prefix}_binaryDir")
|
||||
define_property(GLOBAL PROPERTY ${propertyName}
|
||||
BRIEF_DOCS "Internal implementation detail of FetchContent_Populate()"
|
||||
FULL_DOCS "Details used by FetchContent_Populate() for ${contentName}"
|
||||
)
|
||||
set_property(GLOBAL PROPERTY ${propertyName} ${binaryDir})
|
||||
|
||||
set(propertyName "${prefix}_populated")
|
||||
define_property(GLOBAL PROPERTY ${propertyName}
|
||||
BRIEF_DOCS "Internal implementation detail of FetchContent_Populate()"
|
||||
FULL_DOCS "Details used by FetchContent_Populate() for ${contentName}"
|
||||
)
|
||||
set_property(GLOBAL PROPERTY ${propertyName} True)
|
||||
|
||||
endfunction()
|
||||
|
||||
|
||||
# Set variables in the calling scope for any of the retrievable
|
||||
# properties. If no specific properties are requested, variables
|
||||
# will be set for all retrievable properties.
|
||||
#
|
||||
# This function is intended to also be used by projects as the canonical
|
||||
# way to detect whether they should call FetchContent_Populate()
|
||||
# and pull the populated source into the build with add_subdirectory(),
|
||||
# if they are using the populated content in that way.
|
||||
function(FetchContent_GetProperties contentName)
|
||||
|
||||
string(TOLOWER ${contentName} contentNameLower)
|
||||
|
||||
set(options "")
|
||||
set(oneValueArgs SOURCE_DIR BINARY_DIR POPULATED)
|
||||
set(multiValueArgs "")
|
||||
|
||||
cmake_parse_arguments(ARG "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})
|
||||
|
||||
if(NOT ARG_SOURCE_DIR AND
|
||||
NOT ARG_BINARY_DIR AND
|
||||
NOT ARG_POPULATED)
|
||||
# No specific properties requested, provide them all
|
||||
set(ARG_SOURCE_DIR ${contentNameLower}_SOURCE_DIR)
|
||||
set(ARG_BINARY_DIR ${contentNameLower}_BINARY_DIR)
|
||||
set(ARG_POPULATED ${contentNameLower}_POPULATED)
|
||||
endif()
|
||||
|
||||
set(prefix "_FetchContent_${contentNameLower}")
|
||||
|
||||
if(ARG_SOURCE_DIR)
|
||||
set(propertyName "${prefix}_sourceDir")
|
||||
get_property(value GLOBAL PROPERTY ${propertyName})
|
||||
if(value)
|
||||
set(${ARG_SOURCE_DIR} ${value} PARENT_SCOPE)
|
||||
endif()
|
||||
endif()
|
||||
|
||||
if(ARG_BINARY_DIR)
|
||||
set(propertyName "${prefix}_binaryDir")
|
||||
get_property(value GLOBAL PROPERTY ${propertyName})
|
||||
if(value)
|
||||
set(${ARG_BINARY_DIR} ${value} PARENT_SCOPE)
|
||||
endif()
|
||||
endif()
|
||||
|
||||
if(ARG_POPULATED)
|
||||
set(propertyName "${prefix}_populated")
|
||||
get_property(value GLOBAL PROPERTY ${propertyName} DEFINED)
|
||||
set(${ARG_POPULATED} ${value} PARENT_SCOPE)
|
||||
endif()
|
||||
|
||||
endfunction()
|
||||
|
||||
|
||||
#=======================================================================
|
||||
# Performing the population
|
||||
#=======================================================================
|
||||
|
||||
# The value of contentName will always have been lowercased by the caller.
|
||||
# All other arguments are assumed to be options that are understood by
|
||||
# ExternalProject_Add(), except for QUIET and SUBBUILD_DIR.
|
||||
function(__FetchContent_directPopulate contentName)
|
||||
|
||||
set(options
|
||||
QUIET
|
||||
)
|
||||
set(oneValueArgs
|
||||
SUBBUILD_DIR
|
||||
SOURCE_DIR
|
||||
BINARY_DIR
|
||||
# Prevent the following from being passed through
|
||||
CONFIGURE_COMMAND
|
||||
BUILD_COMMAND
|
||||
INSTALL_COMMAND
|
||||
TEST_COMMAND
|
||||
)
|
||||
set(multiValueArgs "")
|
||||
|
||||
cmake_parse_arguments(ARG "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})
|
||||
|
||||
if(NOT ARG_SUBBUILD_DIR)
|
||||
message(FATAL_ERROR "Internal error: SUBBUILD_DIR not set")
|
||||
elseif(NOT IS_ABSOLUTE "${ARG_SUBBUILD_DIR}")
|
||||
set(ARG_SUBBUILD_DIR "${CMAKE_CURRENT_BINARY_DIR}/${ARG_SUBBUILD_DIR}")
|
||||
endif()
|
||||
|
||||
if(NOT ARG_SOURCE_DIR)
|
||||
message(FATAL_ERROR "Internal error: SOURCE_DIR not set")
|
||||
elseif(NOT IS_ABSOLUTE "${ARG_SOURCE_DIR}")
|
||||
set(ARG_SOURCE_DIR "${CMAKE_CURRENT_BINARY_DIR}/${ARG_SOURCE_DIR}")
|
||||
endif()
|
||||
|
||||
if(NOT ARG_BINARY_DIR)
|
||||
message(FATAL_ERROR "Internal error: BINARY_DIR not set")
|
||||
elseif(NOT IS_ABSOLUTE "${ARG_BINARY_DIR}")
|
||||
set(ARG_BINARY_DIR "${CMAKE_CURRENT_BINARY_DIR}/${ARG_BINARY_DIR}")
|
||||
endif()
|
||||
|
||||
# Ensure the caller can know where to find the source and build directories
|
||||
# with some convenient variables. Doing this here ensures the caller sees
|
||||
# the correct result in the case where the default values are overridden by
|
||||
# the content details set by the project.
|
||||
set(${contentName}_SOURCE_DIR "${ARG_SOURCE_DIR}" PARENT_SCOPE)
|
||||
set(${contentName}_BINARY_DIR "${ARG_BINARY_DIR}" PARENT_SCOPE)
|
||||
|
||||
# The unparsed arguments may contain spaces, so build up ARG_EXTRA
|
||||
# in such a way that it correctly substitutes into the generated
|
||||
# CMakeLists.txt file with each argument quoted.
|
||||
unset(ARG_EXTRA)
|
||||
foreach(arg IN LISTS ARG_UNPARSED_ARGUMENTS)
|
||||
set(ARG_EXTRA "${ARG_EXTRA} \"${arg}\"")
|
||||
endforeach()
|
||||
|
||||
# Hide output if requested, but save it to a variable in case there's an
|
||||
# error so we can show the output upon failure. When not quiet, don't
|
||||
# capture the output to a variable because the user may want to see the
|
||||
# output as it happens (e.g. progress during long downloads). Combine both
|
||||
# stdout and stderr in the one capture variable so the output stays in order.
|
||||
if (ARG_QUIET)
|
||||
set(outputOptions
|
||||
OUTPUT_VARIABLE capturedOutput
|
||||
ERROR_VARIABLE capturedOutput
|
||||
)
|
||||
else()
|
||||
set(capturedOutput)
|
||||
set(outputOptions)
|
||||
message(STATUS "Populating ${contentName}")
|
||||
endif()
|
||||
|
||||
if(CMAKE_GENERATOR)
|
||||
set(generatorOpts "-G${CMAKE_GENERATOR}")
|
||||
if(CMAKE_GENERATOR_PLATFORM)
|
||||
list(APPEND generatorOpts "-A${CMAKE_GENERATOR_PLATFORM}")
|
||||
endif()
|
||||
if(CMAKE_GENERATOR_TOOLSET)
|
||||
list(APPEND generatorOpts "-T${CMAKE_GENERATOR_TOOLSET}")
|
||||
endif()
|
||||
|
||||
if(CMAKE_MAKE_PROGRAM)
|
||||
list(APPEND generatorOpts "-DCMAKE_MAKE_PROGRAM:FILEPATH=${CMAKE_MAKE_PROGRAM}")
|
||||
endif()
|
||||
|
||||
else()
|
||||
# Likely we've been invoked via CMake's script mode where no
|
||||
# generator is set (and hence CMAKE_MAKE_PROGRAM could not be
|
||||
# trusted even if provided). We will have to rely on being
|
||||
# able to find the default generator and build tool.
|
||||
unset(generatorOpts)
|
||||
endif()
|
||||
|
||||
# Create and build a separate CMake project to carry out the population.
|
||||
# If we've already previously done these steps, they will not cause
|
||||
# anything to be updated, so extra rebuilds of the project won't occur.
|
||||
# Make sure to pass through CMAKE_MAKE_PROGRAM in case the main project
|
||||
# has this set to something not findable on the PATH.
|
||||
configure_file("${__FetchContent_privateDir}/CMakeLists.cmake.in"
|
||||
"${ARG_SUBBUILD_DIR}/CMakeLists.txt")
|
||||
execute_process(
|
||||
COMMAND ${CMAKE_COMMAND} ${generatorOpts} .
|
||||
RESULT_VARIABLE result
|
||||
${outputOptions}
|
||||
WORKING_DIRECTORY "${ARG_SUBBUILD_DIR}"
|
||||
)
|
||||
if(result)
|
||||
if(capturedOutput)
|
||||
message("${capturedOutput}")
|
||||
endif()
|
||||
message(FATAL_ERROR "CMake step for ${contentName} failed: ${result}")
|
||||
endif()
|
||||
execute_process(
|
||||
COMMAND ${CMAKE_COMMAND} --build .
|
||||
RESULT_VARIABLE result
|
||||
${outputOptions}
|
||||
WORKING_DIRECTORY "${ARG_SUBBUILD_DIR}"
|
||||
)
|
||||
if(result)
|
||||
if(capturedOutput)
|
||||
message("${capturedOutput}")
|
||||
endif()
|
||||
message(FATAL_ERROR "Build step for ${contentName} failed: ${result}")
|
||||
endif()
|
||||
|
||||
endfunction()
|
||||
|
||||
|
||||
option(FETCHCONTENT_FULLY_DISCONNECTED "Disables all attempts to download or update content and assumes source dirs already exist")
|
||||
option(FETCHCONTENT_UPDATES_DISCONNECTED "Enables UPDATE_DISCONNECTED behavior for all content population")
|
||||
option(FETCHCONTENT_QUIET "Enables QUIET option for all content population" ON)
|
||||
set(FETCHCONTENT_BASE_DIR "${CMAKE_BINARY_DIR}/_deps" CACHE PATH "Directory under which to collect all populated content")
|
||||
|
||||
# Populate the specified content using details stored from
|
||||
# an earlier call to FetchContent_Declare().
|
||||
function(FetchContent_Populate contentName)
|
||||
|
||||
if(NOT contentName)
|
||||
message(FATAL_ERROR "Empty contentName not allowed for FetchContent_Populate()")
|
||||
endif()
|
||||
|
||||
string(TOLOWER ${contentName} contentNameLower)
|
||||
|
||||
if(ARGN)
|
||||
# This is the direct population form with details fully specified
|
||||
# as part of the call, so we already have everything we need
|
||||
__FetchContent_directPopulate(
|
||||
${contentNameLower}
|
||||
SUBBUILD_DIR "${CMAKE_CURRENT_BINARY_DIR}/${contentNameLower}-subbuild"
|
||||
SOURCE_DIR "${CMAKE_CURRENT_BINARY_DIR}/${contentNameLower}-src"
|
||||
BINARY_DIR "${CMAKE_CURRENT_BINARY_DIR}/${contentNameLower}-build"
|
||||
${ARGN} # Could override any of the above ..._DIR variables
|
||||
)
|
||||
|
||||
# Pass source and binary dir variables back to the caller
|
||||
set(${contentNameLower}_SOURCE_DIR "${${contentNameLower}_SOURCE_DIR}" PARENT_SCOPE)
|
||||
set(${contentNameLower}_BINARY_DIR "${${contentNameLower}_BINARY_DIR}" PARENT_SCOPE)
|
||||
|
||||
# Don't set global properties, or record that we did this population, since
|
||||
# this was a direct call outside of the normal declared details form.
|
||||
# We only want to save values in the global properties for content that
|
||||
# honours the hierarchical details mechanism so that projects are not
|
||||
# robbed of the ability to override details set in nested projects.
|
||||
return()
|
||||
endif()
|
||||
|
||||
# No details provided, so assume they were saved from an earlier call
|
||||
# to FetchContent_Declare(). Do a check that we haven't already
|
||||
# populated this content before in case the caller forgot to check.
|
||||
FetchContent_GetProperties(${contentName})
|
||||
if(${contentNameLower}_POPULATED)
|
||||
message(FATAL_ERROR "Content ${contentName} already populated in ${${contentNameLower}_SOURCE_DIR}")
|
||||
endif()
|
||||
|
||||
string(TOUPPER ${contentName} contentNameUpper)
|
||||
set(FETCHCONTENT_SOURCE_DIR_${contentNameUpper}
|
||||
"${FETCHCONTENT_SOURCE_DIR_${contentNameUpper}}"
|
||||
CACHE PATH "When not empty, overrides where to find pre-populated content for ${contentName}")
|
||||
|
||||
if(FETCHCONTENT_SOURCE_DIR_${contentNameUpper})
|
||||
# The source directory has been explicitly provided in the cache,
|
||||
# so no population is required
|
||||
set(${contentNameLower}_SOURCE_DIR "${FETCHCONTENT_SOURCE_DIR_${contentNameUpper}}")
|
||||
set(${contentNameLower}_BINARY_DIR "${FETCHCONTENT_BASE_DIR}/${contentNameLower}-build")
|
||||
|
||||
elseif(FETCHCONTENT_FULLY_DISCONNECTED)
|
||||
# Bypass population and assume source is already there from a previous run
|
||||
set(${contentNameLower}_SOURCE_DIR "${FETCHCONTENT_BASE_DIR}/${contentNameLower}-src")
|
||||
set(${contentNameLower}_BINARY_DIR "${FETCHCONTENT_BASE_DIR}/${contentNameLower}-build")
|
||||
|
||||
else()
|
||||
# Support both a global "disconnect all updates" and a per-content
|
||||
# update test (either one being set disables updates for this content).
|
||||
option(FETCHCONTENT_UPDATES_DISCONNECTED_${contentNameUpper}
|
||||
"Enables UPDATE_DISCONNECTED behavior just for population of ${contentName}")
|
||||
if(FETCHCONTENT_UPDATES_DISCONNECTED OR
|
||||
FETCHCONTENT_UPDATES_DISCONNECTED_${contentNameUpper})
|
||||
set(disconnectUpdates True)
|
||||
else()
|
||||
set(disconnectUpdates False)
|
||||
endif()
|
||||
|
||||
if(FETCHCONTENT_QUIET)
|
||||
set(quietFlag QUIET)
|
||||
else()
|
||||
unset(quietFlag)
|
||||
endif()
|
||||
|
||||
__FetchContent_getSavedDetails(${contentName} contentDetails)
|
||||
if("${contentDetails}" STREQUAL "")
|
||||
message(FATAL_ERROR "No details have been set for content: ${contentName}")
|
||||
endif()
|
||||
|
||||
__FetchContent_directPopulate(
|
||||
${contentNameLower}
|
||||
${quietFlag}
|
||||
UPDATE_DISCONNECTED ${disconnectUpdates}
|
||||
SUBBUILD_DIR "${FETCHCONTENT_BASE_DIR}/${contentNameLower}-subbuild"
|
||||
SOURCE_DIR "${FETCHCONTENT_BASE_DIR}/${contentNameLower}-src"
|
||||
BINARY_DIR "${FETCHCONTENT_BASE_DIR}/${contentNameLower}-build"
|
||||
# Put the saved details last so they can override any of the
|
||||
# the options we set above (this can include SOURCE_DIR or
|
||||
# BUILD_DIR)
|
||||
${contentDetails}
|
||||
)
|
||||
endif()
|
||||
|
||||
__FetchContent_setPopulated(
|
||||
${contentName}
|
||||
${${contentNameLower}_SOURCE_DIR}
|
||||
${${contentNameLower}_BINARY_DIR}
|
||||
)
|
||||
|
||||
# Pass variables back to the caller. The variables passed back here
|
||||
# must match what FetchContent_GetProperties() sets when it is called
|
||||
# with just the content name.
|
||||
set(${contentNameLower}_SOURCE_DIR "${${contentNameLower}_SOURCE_DIR}" PARENT_SCOPE)
|
||||
set(${contentNameLower}_BINARY_DIR "${${contentNameLower}_BINARY_DIR}" PARENT_SCOPE)
|
||||
set(${contentNameLower}_POPULATED True PARENT_SCOPE)
|
||||
|
||||
endfunction()
|
||||
@@ -0,0 +1,21 @@
|
||||
# Distributed under the OSI-approved BSD 3-Clause License. See accompanying
|
||||
# file Copyright.txt or https://cmake.org/licensing for details.
|
||||
|
||||
cmake_minimum_required(VERSION ${CMAKE_VERSION})
|
||||
|
||||
# We name the project and the target for the ExternalProject_Add() call
|
||||
# to something that will highlight to the user what we are working on if
|
||||
# something goes wrong and an error message is produced.
|
||||
|
||||
project(${contentName}-populate NONE)
|
||||
|
||||
include(ExternalProject)
|
||||
ExternalProject_Add(${contentName}-populate
|
||||
${ARG_EXTRA}
|
||||
SOURCE_DIR "${ARG_SOURCE_DIR}"
|
||||
BINARY_DIR "${ARG_BINARY_DIR}"
|
||||
CONFIGURE_COMMAND ""
|
||||
BUILD_COMMAND ""
|
||||
INSTALL_COMMAND ""
|
||||
TEST_COMMAND ""
|
||||
)
|
||||
5
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/Modules/README.md
vendored
Normal file
5
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/Modules/README.md
vendored
Normal file
@@ -0,0 +1,5 @@
|
||||
|
||||
## FetchContent
|
||||
|
||||
`FetchContent.cmake` and `FetchContent/CMakeLists.cmake.in`
|
||||
are copied from `cmake/3.11.0/share/cmake-3.11/Modules`.
|
||||
120
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/cmake_extension.py
vendored
Normal file
120
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/cmake_extension.py
vendored
Normal file
@@ -0,0 +1,120 @@
|
||||
# Copyright (c) 2021 Xiaomi Corporation (author: Fangjun Kuang)
|
||||
|
||||
import glob
|
||||
import os
|
||||
import platform
|
||||
import shutil
|
||||
import sys
|
||||
from pathlib import Path
|
||||
|
||||
import setuptools
|
||||
from setuptools.command.build_ext import build_ext
|
||||
|
||||
|
||||
def is_for_pypi():
|
||||
ans = os.environ.get("KALDI_NATIVE_FBANK_IS_FOR_PYPI", None)
|
||||
return ans is not None
|
||||
|
||||
|
||||
def is_macos():
|
||||
return platform.system() == "Darwin"
|
||||
|
||||
|
||||
def is_windows():
|
||||
return platform.system() == "Windows"
|
||||
|
||||
|
||||
try:
|
||||
from wheel.bdist_wheel import bdist_wheel as _bdist_wheel
|
||||
|
||||
class bdist_wheel(_bdist_wheel):
|
||||
def finalize_options(self):
|
||||
_bdist_wheel.finalize_options(self)
|
||||
# In this case, the generated wheel has a name in the form
|
||||
# kaldifeat-xxx-pyxx-none-any.whl
|
||||
if is_for_pypi() and not is_macos():
|
||||
self.root_is_pure = True
|
||||
else:
|
||||
# The generated wheel has a name ending with
|
||||
# -linux_x86_64.whl
|
||||
self.root_is_pure = False
|
||||
|
||||
|
||||
except ImportError:
|
||||
bdist_wheel = None
|
||||
|
||||
|
||||
def cmake_extension(name, *args, **kwargs) -> setuptools.Extension:
|
||||
kwargs["language"] = "c++"
|
||||
sources = []
|
||||
return setuptools.Extension(name, sources, *args, **kwargs)
|
||||
|
||||
|
||||
class BuildExtension(build_ext):
|
||||
def build_extension(self, ext: setuptools.extension.Extension):
|
||||
# build/temp.linux-x86_64-3.8
|
||||
os.makedirs(self.build_temp, exist_ok=True)
|
||||
|
||||
# build/lib.linux-x86_64-3.8
|
||||
os.makedirs(self.build_lib, exist_ok=True)
|
||||
|
||||
install_dir = Path(self.build_lib).resolve() / "kaldi_native_fbank"
|
||||
|
||||
kaldi_native_fbank_dir = Path(__file__).parent.parent.resolve()
|
||||
|
||||
cmake_args = os.environ.get("KALDI_NATIVE_FBANK_CMAKE_ARGS", "")
|
||||
make_args = os.environ.get("KALDI_NATIVE_FBANK_MAKE_ARGS", "")
|
||||
system_make_args = os.environ.get("MAKEFLAGS", "")
|
||||
|
||||
if cmake_args == "":
|
||||
cmake_args = "-DCMAKE_BUILD_TYPE=Release"
|
||||
|
||||
extra_cmake_args = f" -DCMAKE_INSTALL_PREFIX={install_dir} "
|
||||
extra_cmake_args += " -DKALDI_NATIVE_FBANK_BUILD_TESTS=OFF "
|
||||
|
||||
if "PYTHON_EXECUTABLE" not in cmake_args:
|
||||
print(f"Setting PYTHON_EXECUTABLE to {sys.executable}")
|
||||
cmake_args += f" -DPYTHON_EXECUTABLE={sys.executable}"
|
||||
|
||||
cmake_args += extra_cmake_args
|
||||
|
||||
if is_windows():
|
||||
build_cmd = f"""
|
||||
cmake {cmake_args} -B {self.build_temp} -S {kaldi_native_fbank_dir}
|
||||
cmake --build {self.build_temp} --target install --config Release -- -m
|
||||
"""
|
||||
print(f"build command is:\n{build_cmd}")
|
||||
ret = os.system(
|
||||
f"cmake {cmake_args} -B {self.build_temp} -S {kaldi_native_fbank_dir}"
|
||||
)
|
||||
if ret != 0:
|
||||
raise Exception("Failed to configure kaldi_native_fbank")
|
||||
|
||||
ret = os.system(
|
||||
f"cmake --build {self.build_temp} --target install --config Release -- -m"
|
||||
)
|
||||
if ret != 0:
|
||||
raise Exception("Failed to install kaldi_native_fbank")
|
||||
else:
|
||||
if make_args == "" and system_make_args == "":
|
||||
print("For fast compilation, run:")
|
||||
print(
|
||||
'export KALDI_NATIVE_FBANK_MAKE_ARGS="-j"; python setup.py install'
|
||||
)
|
||||
|
||||
build_cmd = f"""
|
||||
cd {self.build_temp}
|
||||
|
||||
cmake {cmake_args} {kaldi_native_fbank_dir}
|
||||
|
||||
make {make_args} install
|
||||
"""
|
||||
print(f"build command is:\n{build_cmd}")
|
||||
|
||||
ret = os.system(build_cmd)
|
||||
if ret != 0:
|
||||
raise Exception(
|
||||
"\nBuild kaldi-native-fbank failed. Please check the error message.\n"
|
||||
"You can ask for help by creating an issue on GitHub.\n"
|
||||
"\nClick:\n\thttps://github.com/csukuangfj/kaldi-native-fbank/issues/new\n" # noqa
|
||||
)
|
||||
57
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/googletest.cmake
vendored
Normal file
57
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/googletest.cmake
vendored
Normal file
@@ -0,0 +1,57 @@
|
||||
function(download_googltest)
|
||||
if(CMAKE_VERSION VERSION_LESS 3.11)
|
||||
list(APPEND CMAKE_MODULE_PATH ${CMAKE_SOURCE_DIR}/cmake/Modules)
|
||||
endif()
|
||||
|
||||
include(FetchContent)
|
||||
|
||||
set(googletest_URL "https://github.com/google/googletest/archive/release-1.10.0.tar.gz")
|
||||
set(googletest_HASH "SHA256=9dc9157a9a1551ec7a7e43daea9a694a0bb5fb8bec81235d8a1e6ef64c716dcb")
|
||||
|
||||
set(BUILD_GMOCK ON CACHE BOOL "" FORCE)
|
||||
set(INSTALL_GTEST OFF CACHE BOOL "" FORCE)
|
||||
set(gtest_disable_pthreads ON CACHE BOOL "" FORCE)
|
||||
set(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
|
||||
|
||||
FetchContent_Declare(googletest
|
||||
URL ${googletest_URL}
|
||||
URL_HASH ${googletest_HASH}
|
||||
)
|
||||
|
||||
FetchContent_GetProperties(googletest)
|
||||
if(NOT googletest_POPULATED)
|
||||
message(STATUS "Downloading googletest from ${googletest_URL}")
|
||||
FetchContent_Populate(googletest)
|
||||
endif()
|
||||
message(STATUS "googletest is downloaded to ${googletest_SOURCE_DIR}")
|
||||
message(STATUS "googletest's binary dir is ${googletest_BINARY_DIR}")
|
||||
|
||||
if(APPLE)
|
||||
set(CMAKE_MACOSX_RPATH ON) # to solve the following warning on macOS
|
||||
endif()
|
||||
#[==[
|
||||
-- Generating done
|
||||
Policy CMP0042 is not set: MACOSX_RPATH is enabled by default. Run "cmake
|
||||
--help-policy CMP0042" for policy details. Use the cmake_policy command to
|
||||
set the policy and suppress this warning.
|
||||
|
||||
MACOSX_RPATH is not specified for the following targets:
|
||||
|
||||
gmock
|
||||
gmock_main
|
||||
gtest
|
||||
gtest_main
|
||||
|
||||
This warning is for project developers. Use -Wno-dev to suppress it.
|
||||
]==]
|
||||
|
||||
add_subdirectory(${googletest_SOURCE_DIR} ${googletest_BINARY_DIR} EXCLUDE_FROM_ALL)
|
||||
|
||||
target_include_directories(gtest
|
||||
INTERFACE
|
||||
${googletest_SOURCE_DIR}/googletest/include
|
||||
${googletest_SOURCE_DIR}/googlemock/include
|
||||
)
|
||||
endfunction()
|
||||
|
||||
download_googltest()
|
||||
35
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/pybind11.cmake
vendored
Normal file
35
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/cmake/pybind11.cmake
vendored
Normal file
@@ -0,0 +1,35 @@
|
||||
function(download_pybind11)
|
||||
if(CMAKE_VERSION VERSION_LESS 3.11)
|
||||
list(APPEND CMAKE_MODULE_PATH ${CMAKE_SOURCE_DIR}/cmake/Modules)
|
||||
endif()
|
||||
|
||||
include(FetchContent)
|
||||
|
||||
set(pybind11_URL "https://github.com/pybind/pybind11/archive/refs/tags/v2.9.2.tar.gz")
|
||||
set(pybind11_HASH "SHA256=6bd528c4dbe2276635dc787b6b1f2e5316cf6b49ee3e150264e455a0d68d19c1")
|
||||
|
||||
# If you don't have access to the Internet, please download it to your
|
||||
# local drive and modify the following line according to your needs.
|
||||
if(EXISTS "/star-fj/fangjun/download/github/pybind11-2.9.2.tar.gz")
|
||||
set(pybind11_URL "file:///star-fj/fangjun/download/github/pybind11-2.9.2.tar.gz")
|
||||
elseif(EXISTS "/Users/fangjun/Downloads/pybind11-2.9.2.tar.gz")
|
||||
set(pybind11_URL "file:///Users/fangjun/Downloads/pybind11-2.9.2.tar.gz")
|
||||
elseif(EXISTS "/tmp/pybind11-2.9.2.tar.gz")
|
||||
set(pybind11_URL "file:///tmp/pybind11-2.9.2.tar.gz")
|
||||
endif()
|
||||
|
||||
FetchContent_Declare(pybind11
|
||||
URL ${pybind11_URL}
|
||||
URL_HASH ${pybind11_HASH}
|
||||
)
|
||||
|
||||
FetchContent_GetProperties(pybind11)
|
||||
if(NOT pybind11_POPULATED)
|
||||
message(STATUS "Downloading pybind11 from ${pybind11_URL}")
|
||||
FetchContent_Populate(pybind11)
|
||||
endif()
|
||||
message(STATUS "pybind11 is downloaded to ${pybind11_SOURCE_DIR}")
|
||||
add_subdirectory(${pybind11_SOURCE_DIR} ${pybind11_BINARY_DIR} EXCLUDE_FROM_ALL)
|
||||
endfunction()
|
||||
|
||||
download_pybind11()
|
||||
@@ -0,0 +1,8 @@
|
||||
add_subdirectory(csrc)
|
||||
|
||||
if(KALDI_NATIVE_FBANK_BUILD_PYTHON)
|
||||
message(STATUS "Building Python")
|
||||
add_subdirectory(python)
|
||||
else()
|
||||
message(STATUS "Disable building Python")
|
||||
endif()
|
||||
@@ -0,0 +1,8 @@
|
||||
add_library(csrc STATIC
|
||||
feature-fbank.cc
|
||||
feature-functions.cc
|
||||
feature-window.cc
|
||||
fftsg.c
|
||||
mel-computations.cc
|
||||
online-feature.cc
|
||||
rfft.cc)
|
||||
@@ -0,0 +1,93 @@
|
||||
|
||||
include_directories(${PROJECT_SOURCE_DIR})
|
||||
set(sources
|
||||
feature-fbank.cc
|
||||
feature-functions.cc
|
||||
feature-window.cc
|
||||
fftsg.c
|
||||
mel-computations.cc
|
||||
online-feature.cc
|
||||
rfft.cc
|
||||
)
|
||||
|
||||
if(KALDI_NATIVE_FBANK_ENABLE_CHECK)
|
||||
list(APPEND sources log.cc)
|
||||
endif()
|
||||
|
||||
add_library(kaldi-native-fbank-core ${sources})
|
||||
if(KALDI_NATIVE_FBANK_ENABLE_CHECK)
|
||||
target_compile_definitions(kaldi-native-fbank-core PUBLIC KNF_ENABLE_CHECK=1)
|
||||
|
||||
if(KNF_HAVE_EXECINFO_H)
|
||||
target_compile_definitions(kaldi-native-fbank-core PRIVATE KNF_HAVE_EXECINFO_H=1)
|
||||
endif()
|
||||
|
||||
if(KNF_HAVE_CXXABI_H)
|
||||
target_compile_definitions(kaldi-native-fbank-core PRIVATE KNF_HAVE_CXXABI_H=1)
|
||||
endif()
|
||||
endif()
|
||||
|
||||
# We are using std::call_once() in log.h,which requires us to link with -pthread
|
||||
if(NOT WIN32 AND KALDI_NATIVE_FBANK_ENABLE_CHECK)
|
||||
target_link_libraries(kaldi-native-fbank-core -pthread)
|
||||
endif()
|
||||
|
||||
if(KALDI_NATIVE_FBANK_BUILD_TESTS)
|
||||
add_executable(test-online-fbank test-online-fbank.cc)
|
||||
target_link_libraries(test-online-fbank kaldi-native-fbank-core)
|
||||
endif()
|
||||
|
||||
function(kaldi_native_fbank_add_test source)
|
||||
get_filename_component(name ${source} NAME_WE)
|
||||
add_executable(${name} "${source}")
|
||||
target_link_libraries(${name}
|
||||
PRIVATE
|
||||
kaldi-native-fbank-core
|
||||
gtest
|
||||
gtest_main
|
||||
)
|
||||
|
||||
add_test(NAME "Test.${name}"
|
||||
COMMAND
|
||||
$<TARGET_FILE:${name}>
|
||||
)
|
||||
endfunction()
|
||||
|
||||
# please sort the source files alphabetically
|
||||
set(test_srcs
|
||||
# test-online-feature.cc
|
||||
test-log.cc
|
||||
test-rfft.cc
|
||||
)
|
||||
|
||||
if(KALDI_NATIVE_FBANK_BUILD_TESTS)
|
||||
foreach(source IN LISTS test_srcs)
|
||||
kaldi_native_fbank_add_test(${source})
|
||||
endforeach()
|
||||
endif()
|
||||
|
||||
install(TARGETS kaldi-native-fbank-core
|
||||
DESTINATION lib
|
||||
)
|
||||
|
||||
if(KALDI_NATIVE_FBANK_BUILD_TESTS)
|
||||
install(TARGETS test-online-fbank
|
||||
DESTINATION bin
|
||||
)
|
||||
endif()
|
||||
|
||||
file(MAKE_DIRECTORY
|
||||
DESTINATION
|
||||
${PROJECT_BINARY_DIR}/include/kaldi-native-fbank/csrc
|
||||
)
|
||||
file(GLOB_RECURSE all_headers *.h)
|
||||
|
||||
file(COPY
|
||||
${all_headers}
|
||||
DESTINATION
|
||||
${PROJECT_BINARY_DIR}/include/kaldi-native-fbank/csrc
|
||||
)
|
||||
|
||||
install(FILES ${all_headers}
|
||||
DESTINATION include/kaldi-native-fbank/csrc
|
||||
)
|
||||
@@ -0,0 +1,120 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// This file is copied/modified from kaldi/src/feat/feature-fbank.cc
|
||||
//
|
||||
#include "kaldi-native-fbank/csrc/feature-fbank.h"
|
||||
|
||||
#include <algorithm>
|
||||
#include <cmath>
|
||||
#include <limits>
|
||||
#include <vector>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/feature-functions.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
static void Sqrt(float *in_out, int32_t n) {
|
||||
for (int32_t i = 0; i != n; ++i) {
|
||||
in_out[i] = std::sqrt(in_out[i]);
|
||||
}
|
||||
}
|
||||
|
||||
std::ostream &operator<<(std::ostream &os, const FbankOptions &opts) {
|
||||
os << opts.ToString();
|
||||
return os;
|
||||
}
|
||||
|
||||
FbankComputer::FbankComputer(const FbankOptions &opts)
|
||||
: opts_(opts), rfft_(opts.frame_opts.PaddedWindowSize()) {
|
||||
if (opts.energy_floor > 0.0f) {
|
||||
log_energy_floor_ = logf(opts.energy_floor);
|
||||
}
|
||||
|
||||
// We'll definitely need the filterbanks info for VTLN warping factor 1.0.
|
||||
// [note: this call caches it.]
|
||||
GetMelBanks(1.0f);
|
||||
}
|
||||
|
||||
FbankComputer::~FbankComputer() {
|
||||
for (auto iter = mel_banks_.begin(); iter != mel_banks_.end(); ++iter)
|
||||
delete iter->second;
|
||||
}
|
||||
|
||||
const MelBanks *FbankComputer::GetMelBanks(float vtln_warp) {
|
||||
MelBanks *this_mel_banks = nullptr;
|
||||
|
||||
// std::map<float, MelBanks *>::iterator iter = mel_banks_.find(vtln_warp);
|
||||
auto iter = mel_banks_.find(vtln_warp);
|
||||
if (iter == mel_banks_.end()) {
|
||||
this_mel_banks = new MelBanks(opts_.mel_opts, opts_.frame_opts, vtln_warp);
|
||||
mel_banks_[vtln_warp] = this_mel_banks;
|
||||
} else {
|
||||
this_mel_banks = iter->second;
|
||||
}
|
||||
return this_mel_banks;
|
||||
}
|
||||
|
||||
void FbankComputer::Compute(float signal_raw_log_energy, float vtln_warp,
|
||||
std::vector<float> *signal_frame, float *feature) {
|
||||
const MelBanks &mel_banks = *(GetMelBanks(vtln_warp));
|
||||
|
||||
KNF_CHECK_EQ(signal_frame->size(), opts_.frame_opts.PaddedWindowSize());
|
||||
|
||||
// Compute energy after window function (not the raw one).
|
||||
if (opts_.use_energy && !opts_.raw_energy) {
|
||||
signal_raw_log_energy = std::log(
|
||||
std::max<float>(InnerProduct(signal_frame->data(), signal_frame->data(),
|
||||
signal_frame->size()),
|
||||
std::numeric_limits<float>::epsilon()));
|
||||
}
|
||||
rfft_.Compute(signal_frame->data()); // signal_frame is modified in-place
|
||||
ComputePowerSpectrum(signal_frame);
|
||||
|
||||
// Use magnitude instead of power if requested.
|
||||
if (!opts_.use_power) {
|
||||
Sqrt(signal_frame->data(), signal_frame->size() / 2 + 1);
|
||||
}
|
||||
|
||||
int32_t mel_offset = ((opts_.use_energy && !opts_.htk_compat) ? 1 : 0);
|
||||
|
||||
// Its length is opts_.mel_opts.num_bins
|
||||
float *mel_energies = feature + mel_offset;
|
||||
|
||||
// Sum with mel filter banks over the power spectrum
|
||||
mel_banks.Compute(signal_frame->data(), mel_energies);
|
||||
|
||||
if (opts_.use_log_fbank) {
|
||||
// Avoid log of zero (which should be prevented anyway by dithering).
|
||||
for (int32_t i = 0; i != opts_.mel_opts.num_bins; ++i) {
|
||||
auto t = std::max(mel_energies[i], std::numeric_limits<float>::epsilon());
|
||||
mel_energies[i] = std::log(t);
|
||||
}
|
||||
}
|
||||
|
||||
// Copy energy as first value (or the last, if htk_compat == true).
|
||||
if (opts_.use_energy) {
|
||||
if (opts_.energy_floor > 0.0 && signal_raw_log_energy < log_energy_floor_) {
|
||||
signal_raw_log_energy = log_energy_floor_;
|
||||
}
|
||||
int32_t energy_index = opts_.htk_compat ? opts_.mel_opts.num_bins : 0;
|
||||
feature[energy_index] = signal_raw_log_energy;
|
||||
}
|
||||
}
|
||||
|
||||
} // namespace knf
|
||||
@@ -0,0 +1,134 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// This file is copied/modified from kaldi/src/feat/feature-fbank.h
|
||||
|
||||
#ifndef KALDI_NATIVE_FBANK_CSRC_FEATURE_FBANK_H_
|
||||
#define KALDI_NATIVE_FBANK_CSRC_FEATURE_FBANK_H_
|
||||
|
||||
#include <map>
|
||||
#include <string>
|
||||
#include <vector>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/feature-window.h"
|
||||
#include "kaldi-native-fbank/csrc/mel-computations.h"
|
||||
#include "kaldi-native-fbank/csrc/rfft.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
struct FbankOptions {
|
||||
FrameExtractionOptions frame_opts;
|
||||
MelBanksOptions mel_opts;
|
||||
// append an extra dimension with energy to the filter banks
|
||||
bool use_energy = false;
|
||||
float energy_floor = 0.0f; // active iff use_energy==true
|
||||
|
||||
// If true, compute log_energy before preemphasis and windowing
|
||||
// If false, compute log_energy after preemphasis ans windowing
|
||||
bool raw_energy = true; // active iff use_energy==true
|
||||
|
||||
// If true, put energy last (if using energy)
|
||||
// If false, put energy first
|
||||
bool htk_compat = false; // active iff use_energy==true
|
||||
|
||||
// if true (default), produce log-filterbank, else linear
|
||||
bool use_log_fbank = true;
|
||||
|
||||
// if true (default), use power in filterbank
|
||||
// analysis, else magnitude.
|
||||
bool use_power = true;
|
||||
|
||||
FbankOptions() { mel_opts.num_bins = 23; }
|
||||
|
||||
std::string ToString() const {
|
||||
std::ostringstream os;
|
||||
os << "frame_opts: \n";
|
||||
os << frame_opts << "\n";
|
||||
os << "\n";
|
||||
|
||||
os << "mel_opts: \n";
|
||||
os << mel_opts << "\n";
|
||||
|
||||
os << "use_energy: " << use_energy << "\n";
|
||||
os << "energy_floor: " << energy_floor << "\n";
|
||||
os << "raw_energy: " << raw_energy << "\n";
|
||||
os << "htk_compat: " << htk_compat << "\n";
|
||||
os << "use_log_fbank: " << use_log_fbank << "\n";
|
||||
os << "use_power: " << use_power << "\n";
|
||||
return os.str();
|
||||
}
|
||||
};
|
||||
|
||||
std::ostream &operator<<(std::ostream &os, const FbankOptions &opts);
|
||||
|
||||
class FbankComputer {
|
||||
public:
|
||||
using Options = FbankOptions;
|
||||
|
||||
explicit FbankComputer(const FbankOptions &opts);
|
||||
~FbankComputer();
|
||||
|
||||
int32_t Dim() const {
|
||||
return opts_.mel_opts.num_bins + (opts_.use_energy ? 1 : 0);
|
||||
}
|
||||
|
||||
// if true, compute log_energy_pre_window but after dithering and dc removal
|
||||
bool NeedRawLogEnergy() const { return opts_.use_energy && opts_.raw_energy; }
|
||||
|
||||
const FrameExtractionOptions &GetFrameOptions() const {
|
||||
return opts_.frame_opts;
|
||||
}
|
||||
|
||||
const FbankOptions &GetOptions() const { return opts_; }
|
||||
|
||||
/**
|
||||
Function that computes one frame of features from
|
||||
one frame of signal.
|
||||
|
||||
@param [in] signal_raw_log_energy The log-energy of the frame of the signal
|
||||
prior to windowing and pre-emphasis, or
|
||||
log(numeric_limits<float>::min()), whichever is greater. Must be
|
||||
ignored by this function if this class returns false from
|
||||
this->NeedsRawLogEnergy().
|
||||
@param [in] vtln_warp The VTLN warping factor that the user wants
|
||||
to be applied when computing features for this utterance. Will
|
||||
normally be 1.0, meaning no warping is to be done. The value will
|
||||
be ignored for feature types that don't support VLTN, such as
|
||||
spectrogram features.
|
||||
@param [in] signal_frame One frame of the signal,
|
||||
as extracted using the function ExtractWindow() using the options
|
||||
returned by this->GetFrameOptions(). The function will use the
|
||||
vector as a workspace, which is why it's a non-const pointer.
|
||||
@param [out] feature Pointer to a vector of size this->Dim(), to which
|
||||
the computed feature will be written. It should be pre-allocated.
|
||||
*/
|
||||
void Compute(float signal_raw_log_energy, float vtln_warp,
|
||||
std::vector<float> *signal_frame, float *feature);
|
||||
|
||||
private:
|
||||
const MelBanks *GetMelBanks(float vtln_warp);
|
||||
|
||||
FbankOptions opts_;
|
||||
float log_energy_floor_;
|
||||
std::map<float, MelBanks *> mel_banks_; // float is VTLN coefficient.
|
||||
Rfft rfft_;
|
||||
};
|
||||
|
||||
} // namespace knf
|
||||
|
||||
#endif // KALDI_NATIVE_FBANK_CSRC_FEATURE_FBANK_H_
|
||||
@@ -0,0 +1,49 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// This file is copied/modified from kaldi/src/feat/feature-functions.cc
|
||||
|
||||
#include "kaldi-native-fbank/csrc/feature-functions.h"
|
||||
|
||||
#include <cstdint>
|
||||
#include <vector>
|
||||
|
||||
namespace knf {
|
||||
|
||||
void ComputePowerSpectrum(std::vector<float> *complex_fft) {
|
||||
int32_t dim = complex_fft->size();
|
||||
|
||||
// now we have in complex_fft, first half of complex spectrum
|
||||
// it's stored as [real0, realN/2, real1, im1, real2, im2, ...]
|
||||
|
||||
float *p = complex_fft->data();
|
||||
int32_t half_dim = dim / 2;
|
||||
float first_energy = p[0] * p[0];
|
||||
float last_energy = p[1] * p[1]; // handle this special case
|
||||
|
||||
for (int32_t i = 1; i < half_dim; ++i) {
|
||||
float real = p[i * 2];
|
||||
float im = p[i * 2 + 1];
|
||||
p[i] = real * real + im * im;
|
||||
}
|
||||
p[0] = first_energy;
|
||||
p[half_dim] = last_energy; // Will actually never be used, and anyway
|
||||
// if the signal has been bandlimited sensibly this should be zero.
|
||||
}
|
||||
|
||||
} // namespace knf
|
||||
@@ -0,0 +1,38 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// This file is copied/modified from kaldi/src/feat/feature-functions.h
|
||||
#ifndef KALDI_NATIVE_FBANK_CSRC_FEATURE_FUNCTIONS_H_
|
||||
#define KALDI_NATIVE_FBANK_CSRC_FEATURE_FUNCTIONS_H_
|
||||
|
||||
#include <vector>
|
||||
namespace knf {
|
||||
|
||||
// ComputePowerSpectrum converts a complex FFT (as produced by the FFT
|
||||
// functions in csrc/rfft.h), and converts it into
|
||||
// a power spectrum. If the complex FFT is a vector of size n (representing
|
||||
// half of the complex FFT of a real signal of size n, as described there),
|
||||
// this function computes in the first (n/2) + 1 elements of it, the
|
||||
// energies of the fft bins from zero to the Nyquist frequency. Contents of the
|
||||
// remaining (n/2) - 1 elements are undefined at output.
|
||||
|
||||
void ComputePowerSpectrum(std::vector<float> *complex_fft);
|
||||
|
||||
} // namespace knf
|
||||
|
||||
#endif // KALDI_NATIVE_FBANK_CSRC_FEATURE_FUNCTIONS_H_
|
||||
@@ -0,0 +1,247 @@
|
||||
// kaldi-native-fbank/csrc/feature-window.cc
|
||||
//
|
||||
// Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
|
||||
// This file is copied/modified from kaldi/src/feat/feature-window.cc
|
||||
|
||||
#include "kaldi-native-fbank/csrc/feature-window.h"
|
||||
|
||||
#include <algorithm>
|
||||
#include <cmath>
|
||||
#include <limits>
|
||||
#include <vector>
|
||||
|
||||
#ifndef M_2PI
|
||||
#define M_2PI 6.283185307179586476925286766559005
|
||||
#endif
|
||||
|
||||
namespace knf {
|
||||
|
||||
std::ostream &operator<<(std::ostream &os, const FrameExtractionOptions &opts) {
|
||||
os << opts.ToString();
|
||||
return os;
|
||||
}
|
||||
|
||||
FeatureWindowFunction::FeatureWindowFunction(const FrameExtractionOptions &opts)
|
||||
: window_(opts.WindowSize()) {
|
||||
int32_t frame_length = opts.WindowSize();
|
||||
KNF_CHECK_GT(frame_length, 0);
|
||||
|
||||
float *window_data = window_.data();
|
||||
|
||||
double a = M_2PI / (frame_length - 1);
|
||||
for (int32_t i = 0; i < frame_length; i++) {
|
||||
double i_fl = static_cast<double>(i);
|
||||
if (opts.window_type == "hanning") {
|
||||
window_data[i] = 0.5 - 0.5 * cos(a * i_fl);
|
||||
} else if (opts.window_type == "sine") {
|
||||
// when you are checking ws wikipedia, please
|
||||
// note that 0.5 * a = M_PI/(frame_length-1)
|
||||
window_data[i] = sin(0.5 * a * i_fl);
|
||||
} else if (opts.window_type == "hamming") {
|
||||
window_data[i] = 0.54 - 0.46 * cos(a * i_fl);
|
||||
} else if (opts.window_type ==
|
||||
"povey") { // like hamming but goes to zero at edges.
|
||||
window_data[i] = pow(0.5 - 0.5 * cos(a * i_fl), 0.85);
|
||||
} else if (opts.window_type == "rectangular") {
|
||||
window_data[i] = 1.0;
|
||||
} else if (opts.window_type == "blackman") {
|
||||
window_data[i] = opts.blackman_coeff - 0.5 * cos(a * i_fl) +
|
||||
(0.5 - opts.blackman_coeff) * cos(2 * a * i_fl);
|
||||
} else {
|
||||
KNF_LOG(FATAL) << "Invalid window type " << opts.window_type;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
void FeatureWindowFunction::Apply(float *wave) const {
|
||||
int32_t window_size = window_.size();
|
||||
const float *p = window_.data();
|
||||
for (int32_t k = 0; k != window_size; ++k) {
|
||||
wave[k] *= p[k];
|
||||
}
|
||||
}
|
||||
|
||||
int64_t FirstSampleOfFrame(int32_t frame, const FrameExtractionOptions &opts) {
|
||||
int64_t frame_shift = opts.WindowShift();
|
||||
if (opts.snip_edges) {
|
||||
return frame * frame_shift;
|
||||
} else {
|
||||
int64_t midpoint_of_frame = frame_shift * frame + frame_shift / 2,
|
||||
beginning_of_frame = midpoint_of_frame - opts.WindowSize() / 2;
|
||||
return beginning_of_frame;
|
||||
}
|
||||
}
|
||||
|
||||
int32_t NumFrames(int64_t num_samples, const FrameExtractionOptions &opts,
|
||||
bool flush /*= true*/) {
|
||||
int64_t frame_shift = opts.WindowShift();
|
||||
int64_t frame_length = opts.WindowSize();
|
||||
if (opts.snip_edges) {
|
||||
// with --snip-edges=true (the default), we use a HTK-like approach to
|
||||
// determining the number of frames-- all frames have to fit completely into
|
||||
// the waveform, and the first frame begins at sample zero.
|
||||
if (num_samples < frame_length)
|
||||
return 0;
|
||||
else
|
||||
return (1 + ((num_samples - frame_length) / frame_shift));
|
||||
// You can understand the expression above as follows: 'num_samples -
|
||||
// frame_length' is how much room we have to shift the frame within the
|
||||
// waveform; 'frame_shift' is how much we shift it each time; and the ratio
|
||||
// is how many times we can shift it (integer arithmetic rounds down).
|
||||
} else {
|
||||
// if --snip-edges=false, the number of frames is determined by rounding the
|
||||
// (file-length / frame-shift) to the nearest integer. The point of this
|
||||
// formula is to make the number of frames an obvious and predictable
|
||||
// function of the frame shift and signal length, which makes many
|
||||
// segmentation-related questions simpler.
|
||||
//
|
||||
// Because integer division in C++ rounds toward zero, we add (half the
|
||||
// frame-shift minus epsilon) before dividing, to have the effect of
|
||||
// rounding towards the closest integer.
|
||||
int32_t num_frames = (num_samples + (frame_shift / 2)) / frame_shift;
|
||||
|
||||
if (flush) return num_frames;
|
||||
|
||||
// note: 'end' always means the last plus one, i.e. one past the last.
|
||||
int64_t end_sample_of_last_frame =
|
||||
FirstSampleOfFrame(num_frames - 1, opts) + frame_length;
|
||||
|
||||
// the following code is optimized more for clarity than efficiency.
|
||||
// If flush == false, we can't output frames that extend past the end
|
||||
// of the signal.
|
||||
while (num_frames > 0 && end_sample_of_last_frame > num_samples) {
|
||||
num_frames--;
|
||||
end_sample_of_last_frame -= frame_shift;
|
||||
}
|
||||
return num_frames;
|
||||
}
|
||||
}
|
||||
|
||||
void ExtractWindow(int64_t sample_offset, const std::vector<float> &wave,
|
||||
int32_t f, const FrameExtractionOptions &opts,
|
||||
const FeatureWindowFunction &window_function,
|
||||
std::vector<float> *window,
|
||||
float *log_energy_pre_window /*= nullptr*/) {
|
||||
KNF_CHECK(sample_offset >= 0 && wave.size() != 0);
|
||||
|
||||
int32_t frame_length = opts.WindowSize();
|
||||
int32_t frame_length_padded = opts.PaddedWindowSize();
|
||||
|
||||
int64_t num_samples = sample_offset + wave.size();
|
||||
int64_t start_sample = FirstSampleOfFrame(f, opts);
|
||||
int64_t end_sample = start_sample + frame_length;
|
||||
|
||||
if (opts.snip_edges) {
|
||||
KNF_CHECK(start_sample >= sample_offset && end_sample <= num_samples);
|
||||
} else {
|
||||
KNF_CHECK(sample_offset == 0 || start_sample >= sample_offset);
|
||||
}
|
||||
|
||||
if (window->size() != frame_length_padded) {
|
||||
window->resize(frame_length_padded);
|
||||
}
|
||||
|
||||
// wave_start and wave_end are start and end indexes into 'wave', for the
|
||||
// piece of wave that we're trying to extract.
|
||||
int32_t wave_start = int32_t(start_sample - sample_offset);
|
||||
int32_t wave_end = wave_start + frame_length;
|
||||
|
||||
if (wave_start >= 0 && wave_end <= wave.size()) {
|
||||
// the normal case-- no edge effects to consider.
|
||||
std::copy(wave.begin() + wave_start,
|
||||
wave.begin() + wave_start + frame_length, window->data());
|
||||
} else {
|
||||
// Deal with any end effects by reflection, if needed. This code will only
|
||||
// be reached for about two frames per utterance, so we don't concern
|
||||
// ourselves excessively with efficiency.
|
||||
int32_t wave_dim = wave.size();
|
||||
for (int32_t s = 0; s < frame_length; ++s) {
|
||||
int32_t s_in_wave = s + wave_start;
|
||||
while (s_in_wave < 0 || s_in_wave >= wave_dim) {
|
||||
// reflect around the beginning or end of the wave.
|
||||
// e.g. -1 -> 0, -2 -> 1.
|
||||
// dim -> dim - 1, dim + 1 -> dim - 2.
|
||||
// the code supports repeated reflections, although this
|
||||
// would only be needed in pathological cases.
|
||||
if (s_in_wave < 0)
|
||||
s_in_wave = -s_in_wave - 1;
|
||||
else
|
||||
s_in_wave = 2 * wave_dim - 1 - s_in_wave;
|
||||
}
|
||||
(*window)[s] = wave[s_in_wave];
|
||||
}
|
||||
}
|
||||
|
||||
ProcessWindow(opts, window_function, window->data(), log_energy_pre_window);
|
||||
}
|
||||
|
||||
static void RemoveDcOffset(float *d, int32_t n) {
|
||||
float sum = 0;
|
||||
for (int32_t i = 0; i != n; ++i) {
|
||||
sum += d[i];
|
||||
}
|
||||
|
||||
float mean = sum / n;
|
||||
|
||||
for (int32_t i = 0; i != n; ++i) {
|
||||
d[i] -= mean;
|
||||
}
|
||||
}
|
||||
|
||||
float InnerProduct(const float *a, const float *b, int32_t n) {
|
||||
float sum = 0;
|
||||
for (int32_t i = 0; i != n; ++i) {
|
||||
sum += a[i] * b[i];
|
||||
}
|
||||
return sum;
|
||||
}
|
||||
|
||||
static void Preemphasize(float *d, int32_t n, float preemph_coeff) {
|
||||
if (preemph_coeff == 0.0) {
|
||||
return;
|
||||
}
|
||||
|
||||
KNF_CHECK(preemph_coeff >= 0.0 && preemph_coeff <= 1.0);
|
||||
|
||||
for (int32_t i = n - 1; i > 0; --i) {
|
||||
d[i] -= preemph_coeff * d[i - 1];
|
||||
}
|
||||
d[0] -= preemph_coeff * d[0];
|
||||
}
|
||||
|
||||
void ProcessWindow(const FrameExtractionOptions &opts,
|
||||
const FeatureWindowFunction &window_function, float *window,
|
||||
float *log_energy_pre_window /*= nullptr*/) {
|
||||
int32_t frame_length = opts.WindowSize();
|
||||
|
||||
// // TODO(fangjun): Remove dither
|
||||
// KNF_CHECK_EQ(opts.dither, 0);
|
||||
|
||||
// Add dither function
|
||||
// https://github.com/kaldi-asr/kaldi/blob/master/src/feat/feature-window.cc
|
||||
if (opts.dither!=0) {
|
||||
// kaldi::RandomState rstate;
|
||||
// rstate.seed=0;
|
||||
// for (int32 i = 0; i < frame_length; i++)
|
||||
// window[i] += RandGauss(&rstate) * opts.dither;
|
||||
}
|
||||
|
||||
if (opts.remove_dc_offset) {
|
||||
RemoveDcOffset(window, frame_length);
|
||||
}
|
||||
|
||||
if (log_energy_pre_window != NULL) {
|
||||
float energy = std::max<float>(InnerProduct(window, window, frame_length),
|
||||
std::numeric_limits<float>::epsilon());
|
||||
*log_energy_pre_window = std::log(energy);
|
||||
}
|
||||
|
||||
if (opts.preemph_coeff != 0.0) {
|
||||
Preemphasize(window, frame_length, opts.preemph_coeff);
|
||||
}
|
||||
|
||||
window_function.Apply(window);
|
||||
}
|
||||
|
||||
} // namespace knf
|
||||
@@ -0,0 +1,178 @@
|
||||
// kaldi-native-fbank/csrc/feature-window.h
|
||||
//
|
||||
// Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
|
||||
// This file is copied/modified from kaldi/src/feat/feature-window.h
|
||||
|
||||
#ifndef KALDI_NATIVE_FBANK_CSRC_FEATURE_WINDOW_H_
|
||||
#define KALDI_NATIVE_FBANK_CSRC_FEATURE_WINDOW_H_
|
||||
|
||||
#include <sstream>
|
||||
#include <string>
|
||||
#include <vector>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/log.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
inline int32_t RoundUpToNearestPowerOfTwo(int32_t n) {
|
||||
// copied from kaldi/src/base/kaldi-math.cc
|
||||
KNF_CHECK_GT(n, 0);
|
||||
n--;
|
||||
n |= n >> 1;
|
||||
n |= n >> 2;
|
||||
n |= n >> 4;
|
||||
n |= n >> 8;
|
||||
n |= n >> 16;
|
||||
return n + 1;
|
||||
}
|
||||
|
||||
struct FrameExtractionOptions {
|
||||
float samp_freq = 16000;
|
||||
float frame_shift_ms = 10.0f; // in milliseconds.
|
||||
float frame_length_ms = 25.0f; // in milliseconds.
|
||||
float dither = 1.0f; // Amount of dithering, 0.0 means no dither.
|
||||
float preemph_coeff = 0.97f; // Preemphasis coefficient.
|
||||
bool remove_dc_offset = true; // Subtract mean of wave before FFT.
|
||||
std::string window_type = "povey"; // e.g. Hamming window
|
||||
// May be "hamming", "rectangular", "povey", "hanning", "sine", "blackman"
|
||||
// "povey" is a window I made to be similar to Hamming but to go to zero at
|
||||
// the edges, it's pow((0.5 - 0.5*cos(n/N*2*pi)), 0.85) I just don't think the
|
||||
// Hamming window makes sense as a windowing function.
|
||||
bool round_to_power_of_two = true;
|
||||
float blackman_coeff = 0.42f;
|
||||
bool snip_edges = true;
|
||||
// bool allow_downsample = false;
|
||||
// bool allow_upsample = false;
|
||||
|
||||
// Used for streaming feature extraction. It indicates the number
|
||||
// of feature frames to keep in the recycling vector. -1 means to
|
||||
// keep all feature frames.
|
||||
int32_t max_feature_vectors = -1;
|
||||
|
||||
int32_t WindowShift() const {
|
||||
return static_cast<int32_t>(samp_freq * 0.001f * frame_shift_ms);
|
||||
}
|
||||
int32_t WindowSize() const {
|
||||
return static_cast<int32_t>(samp_freq * 0.001f * frame_length_ms);
|
||||
}
|
||||
int32_t PaddedWindowSize() const {
|
||||
return (round_to_power_of_two ? RoundUpToNearestPowerOfTwo(WindowSize())
|
||||
: WindowSize());
|
||||
}
|
||||
std::string ToString() const {
|
||||
std::ostringstream os;
|
||||
#define KNF_PRINT(x) os << #x << ": " << x << "\n"
|
||||
KNF_PRINT(samp_freq);
|
||||
KNF_PRINT(frame_shift_ms);
|
||||
KNF_PRINT(frame_length_ms);
|
||||
KNF_PRINT(dither);
|
||||
KNF_PRINT(preemph_coeff);
|
||||
KNF_PRINT(remove_dc_offset);
|
||||
KNF_PRINT(window_type);
|
||||
KNF_PRINT(round_to_power_of_two);
|
||||
KNF_PRINT(blackman_coeff);
|
||||
KNF_PRINT(snip_edges);
|
||||
// KNF_PRINT(allow_downsample);
|
||||
// KNF_PRINT(allow_upsample);
|
||||
KNF_PRINT(max_feature_vectors);
|
||||
#undef KNF_PRINT
|
||||
return os.str();
|
||||
}
|
||||
};
|
||||
|
||||
std::ostream &operator<<(std::ostream &os, const FrameExtractionOptions &opts);
|
||||
|
||||
class FeatureWindowFunction {
|
||||
public:
|
||||
FeatureWindowFunction() = default;
|
||||
explicit FeatureWindowFunction(const FrameExtractionOptions &opts);
|
||||
/**
|
||||
* @param wave Pointer to a 1-D array of shape [window_size].
|
||||
* It is modified in-place: wave[i] = wave[i] * window_[i].
|
||||
* @param
|
||||
*/
|
||||
void Apply(float *wave) const;
|
||||
|
||||
private:
|
||||
std::vector<float> window_; // of size opts.WindowSize()
|
||||
};
|
||||
|
||||
int64_t FirstSampleOfFrame(int32_t frame, const FrameExtractionOptions &opts);
|
||||
|
||||
/**
|
||||
This function returns the number of frames that we can extract from a wave
|
||||
file with the given number of samples in it (assumed to have the same
|
||||
sampling rate as specified in 'opts').
|
||||
|
||||
@param [in] num_samples The number of samples in the wave file.
|
||||
@param [in] opts The frame-extraction options class
|
||||
|
||||
@param [in] flush True if we are asserting that this number of samples
|
||||
is 'all there is', false if we expecting more data to possibly come in. This
|
||||
only makes a difference to the answer
|
||||
if opts.snips_edges== false. For offline feature extraction you always want
|
||||
flush == true. In an online-decoding context, once you know (or decide) that
|
||||
no more data is coming in, you'd call it with flush == true at the end to
|
||||
flush out any remaining data.
|
||||
*/
|
||||
int32_t NumFrames(int64_t num_samples, const FrameExtractionOptions &opts,
|
||||
bool flush = true);
|
||||
|
||||
/*
|
||||
ExtractWindow() extracts a windowed frame of waveform (possibly with a
|
||||
power-of-two, padded size, depending on the config), including all the
|
||||
processing done by ProcessWindow().
|
||||
|
||||
@param [in] sample_offset If 'wave' is not the entire waveform, but
|
||||
part of it to the left has been discarded, then the
|
||||
number of samples prior to 'wave' that we have
|
||||
already discarded. Set this to zero if you are
|
||||
processing the entire waveform in one piece, or
|
||||
if you get 'no matching function' compilation
|
||||
errors when updating the code.
|
||||
@param [in] wave The waveform
|
||||
@param [in] f The frame index to be extracted, with
|
||||
0 <= f < NumFrames(sample_offset + wave.Dim(), opts, true)
|
||||
@param [in] opts The options class to be used
|
||||
@param [in] window_function The windowing function, as derived from the
|
||||
options class.
|
||||
@param [out] window The windowed, possibly-padded waveform to be
|
||||
extracted. Will be resized as needed.
|
||||
@param [out] log_energy_pre_window If non-NULL, the log-energy of
|
||||
the signal prior to pre-emphasis and multiplying by
|
||||
the windowing function will be written to here.
|
||||
*/
|
||||
void ExtractWindow(int64_t sample_offset, const std::vector<float> &wave,
|
||||
int32_t f, const FrameExtractionOptions &opts,
|
||||
const FeatureWindowFunction &window_function,
|
||||
std::vector<float> *window,
|
||||
float *log_energy_pre_window = nullptr);
|
||||
|
||||
/**
|
||||
This function does all the windowing steps after actually
|
||||
extracting the windowed signal: depending on the
|
||||
configuration, it does dithering, dc offset removal,
|
||||
preemphasis, and multiplication by the windowing function.
|
||||
@param [in] opts The options class to be used
|
||||
@param [in] window_function The windowing function-- should have
|
||||
been initialized using 'opts'.
|
||||
@param [in,out] window A vector of size opts.WindowSize(). Note:
|
||||
it will typically be a sub-vector of a larger vector of size
|
||||
opts.PaddedWindowSize(), with the remaining samples zero,
|
||||
as the FFT code is more efficient if it operates on data with
|
||||
power-of-two size.
|
||||
@param [out] log_energy_pre_window If non-NULL, then after dithering and
|
||||
DC offset removal, this function will write to this pointer the log of
|
||||
the total energy (i.e. sum-squared) of the frame.
|
||||
*/
|
||||
void ProcessWindow(const FrameExtractionOptions &opts,
|
||||
const FeatureWindowFunction &window_function, float *window,
|
||||
float *log_energy_pre_window = nullptr);
|
||||
|
||||
// Compute the inner product of two vectors
|
||||
float InnerProduct(const float *a, const float *b, int32_t n);
|
||||
|
||||
} // namespace knf
|
||||
|
||||
#endif // KALDI_NATIVE_FBANK_CSRC_FEATURE_WINDOW_H_
|
||||
2968
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/fftsg.c
vendored
Normal file
2968
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/fftsg.c
vendored
Normal file
File diff suppressed because it is too large
Load Diff
142
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/log.cc
vendored
Normal file
142
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/log.cc
vendored
Normal file
@@ -0,0 +1,142 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
/*
|
||||
* Stack trace related stuff is from kaldi.
|
||||
* Refer to
|
||||
* https://github.com/kaldi-asr/kaldi/blob/master/src/base/kaldi-error.cc
|
||||
*/
|
||||
|
||||
#include "kaldi-native-fbank/csrc/log.h"
|
||||
|
||||
#ifdef KNF_HAVE_EXECINFO_H
|
||||
#include <execinfo.h> // To get stack trace in error messages.
|
||||
#ifdef KNF_HAVE_CXXABI_H
|
||||
#include <cxxabi.h> // For name demangling.
|
||||
// Useful to decode the stack trace, but only used if we have execinfo.h
|
||||
#endif // KNF_HAVE_CXXABI_H
|
||||
#endif // KNF_HAVE_EXECINFO_H
|
||||
|
||||
#include <stdlib.h>
|
||||
|
||||
#include <ctime>
|
||||
#include <iomanip>
|
||||
#include <string>
|
||||
|
||||
namespace knf {
|
||||
|
||||
std::string GetDateTimeStr() {
|
||||
std::ostringstream os;
|
||||
std::time_t t = std::time(nullptr);
|
||||
std::tm tm = *std::localtime(&t);
|
||||
os << std::put_time(&tm, "%F %T"); // yyyy-mm-dd hh:mm:ss
|
||||
return os.str();
|
||||
}
|
||||
|
||||
static bool LocateSymbolRange(const std::string &trace_name, std::size_t *begin,
|
||||
std::size_t *end) {
|
||||
// Find the first '_' with leading ' ' or '('.
|
||||
*begin = std::string::npos;
|
||||
for (std::size_t i = 1; i < trace_name.size(); ++i) {
|
||||
if (trace_name[i] != '_') {
|
||||
continue;
|
||||
}
|
||||
if (trace_name[i - 1] == ' ' || trace_name[i - 1] == '(') {
|
||||
*begin = i;
|
||||
break;
|
||||
}
|
||||
}
|
||||
if (*begin == std::string::npos) {
|
||||
return false;
|
||||
}
|
||||
*end = trace_name.find_first_of(" +", *begin);
|
||||
return *end != std::string::npos;
|
||||
}
|
||||
|
||||
#ifdef KNF_HAVE_EXECINFO_H
|
||||
static std::string Demangle(const std::string &trace_name) {
|
||||
#ifndef KNF_HAVE_CXXABI_H
|
||||
return trace_name;
|
||||
#else // KNF_HAVE_CXXABI_H
|
||||
// Try demangle the symbol. We are trying to support the following formats
|
||||
// produced by different platforms:
|
||||
//
|
||||
// Linux:
|
||||
// ./kaldi-error-test(_ZN5kaldi13UnitTestErrorEv+0xb) [0x804965d]
|
||||
//
|
||||
// Mac:
|
||||
// 0 server 0x000000010f67614d _ZNK5kaldi13MessageLogger10LogMessageEv + 813
|
||||
//
|
||||
// We want to extract the name e.g., '_ZN5kaldi13UnitTestErrorEv' and
|
||||
// demangle it info a readable name like kaldi::UnitTextError.
|
||||
std::size_t begin, end;
|
||||
if (!LocateSymbolRange(trace_name, &begin, &end)) {
|
||||
return trace_name;
|
||||
}
|
||||
std::string symbol = trace_name.substr(begin, end - begin);
|
||||
int status;
|
||||
char *demangled_name = abi::__cxa_demangle(symbol.c_str(), 0, 0, &status);
|
||||
if (status == 0 && demangled_name != nullptr) {
|
||||
symbol = demangled_name;
|
||||
free(demangled_name);
|
||||
}
|
||||
return trace_name.substr(0, begin) + symbol +
|
||||
trace_name.substr(end, std::string::npos);
|
||||
#endif // KNF_HAVE_CXXABI_H
|
||||
}
|
||||
#endif // KNF_HAVE_EXECINFO_H
|
||||
|
||||
std::string GetStackTrace() {
|
||||
std::string ans;
|
||||
#ifdef KNF_HAVE_EXECINFO_H
|
||||
constexpr const std::size_t kMaxTraceSize = 50;
|
||||
constexpr const std::size_t kMaxTracePrint = 50; // Must be even.
|
||||
// Buffer for the trace.
|
||||
void *trace[kMaxTraceSize];
|
||||
// Get the trace.
|
||||
std::size_t size = backtrace(trace, kMaxTraceSize);
|
||||
// Get the trace symbols.
|
||||
char **trace_symbol = backtrace_symbols(trace, size);
|
||||
if (trace_symbol == nullptr) return ans;
|
||||
|
||||
// Compose a human-readable backtrace string.
|
||||
ans += "[ Stack-Trace: ]\n";
|
||||
if (size <= kMaxTracePrint) {
|
||||
for (std::size_t i = 0; i < size; ++i) {
|
||||
ans += Demangle(trace_symbol[i]) + "\n";
|
||||
}
|
||||
} else { // Print out first+last (e.g.) 5.
|
||||
for (std::size_t i = 0; i < kMaxTracePrint / 2; ++i) {
|
||||
ans += Demangle(trace_symbol[i]) + "\n";
|
||||
}
|
||||
ans += ".\n.\n.\n";
|
||||
for (std::size_t i = size - kMaxTracePrint / 2; i < size; ++i) {
|
||||
ans += Demangle(trace_symbol[i]) + "\n";
|
||||
}
|
||||
if (size == kMaxTraceSize)
|
||||
ans += ".\n.\n.\n"; // Stack was too long, probably a bug.
|
||||
}
|
||||
|
||||
// We must free the array of pointers allocated by backtrace_symbols(),
|
||||
// but not the strings themselves.
|
||||
free(trace_symbol);
|
||||
#endif // KNF_HAVE_EXECINFO_H
|
||||
return ans;
|
||||
}
|
||||
|
||||
} // namespace knf
|
||||
383
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/log.h
vendored
Normal file
383
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/log.h
vendored
Normal file
@@ -0,0 +1,383 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// The content in this file is copied/modified from
|
||||
// https://github.com/k2-fsa/k2/blob/master/k2/csrc/log.h
|
||||
#ifndef KALDI_NATIVE_FBANK_CSRC_LOG_H_
|
||||
#define KALDI_NATIVE_FBANK_CSRC_LOG_H_
|
||||
|
||||
#include <stdio.h>
|
||||
|
||||
#include <mutex> // NOLINT
|
||||
#include <sstream>
|
||||
#include <string>
|
||||
|
||||
namespace knf {
|
||||
|
||||
#if KNF_ENABLE_CHECK
|
||||
|
||||
#if defined(NDEBUG)
|
||||
constexpr bool kDisableDebug = true;
|
||||
#else
|
||||
constexpr bool kDisableDebug = false;
|
||||
#endif
|
||||
|
||||
enum class LogLevel {
|
||||
kTrace = 0,
|
||||
kDebug = 1,
|
||||
kInfo = 2,
|
||||
kWarning = 3,
|
||||
kError = 4,
|
||||
kFatal = 5, // print message and abort the program
|
||||
};
|
||||
|
||||
// They are used in KNF_LOG(xxx), so their names
|
||||
// do not follow the google c++ code style
|
||||
//
|
||||
// You can use them in the following way:
|
||||
//
|
||||
// KNF_LOG(TRACE) << "some message";
|
||||
// KNF_LOG(DEBUG) << "some message";
|
||||
#ifndef _MSC_VER
|
||||
constexpr LogLevel TRACE = LogLevel::kTrace;
|
||||
constexpr LogLevel DEBUG = LogLevel::kDebug;
|
||||
constexpr LogLevel INFO = LogLevel::kInfo;
|
||||
constexpr LogLevel WARNING = LogLevel::kWarning;
|
||||
constexpr LogLevel ERROR = LogLevel::kError;
|
||||
constexpr LogLevel FATAL = LogLevel::kFatal;
|
||||
#else
|
||||
#define TRACE LogLevel::kTrace
|
||||
#define DEBUG LogLevel::kDebug
|
||||
#define INFO LogLevel::kInfo
|
||||
#define WARNING LogLevel::kWarning
|
||||
#define ERROR LogLevel::kError
|
||||
#define FATAL LogLevel::kFatal
|
||||
#endif
|
||||
|
||||
std::string GetStackTrace();
|
||||
|
||||
/* Return the current log level.
|
||||
|
||||
|
||||
If the current log level is TRACE, then all logged messages are printed out.
|
||||
|
||||
If the current log level is DEBUG, log messages with "TRACE" level are not
|
||||
shown and all other levels are printed out.
|
||||
|
||||
Similarly, if the current log level is INFO, log message with "TRACE" and
|
||||
"DEBUG" are not shown and all other levels are printed out.
|
||||
|
||||
If it is FATAL, then only FATAL messages are shown.
|
||||
*/
|
||||
inline LogLevel GetCurrentLogLevel() {
|
||||
static LogLevel log_level = INFO;
|
||||
static std::once_flag init_flag;
|
||||
std::call_once(init_flag, []() {
|
||||
const char *env_log_level = std::getenv("KNF_LOG_LEVEL");
|
||||
if (env_log_level == nullptr) return;
|
||||
|
||||
std::string s = env_log_level;
|
||||
if (s == "TRACE")
|
||||
log_level = TRACE;
|
||||
else if (s == "DEBUG")
|
||||
log_level = DEBUG;
|
||||
else if (s == "INFO")
|
||||
log_level = INFO;
|
||||
else if (s == "WARNING")
|
||||
log_level = WARNING;
|
||||
else if (s == "ERROR")
|
||||
log_level = ERROR;
|
||||
else if (s == "FATAL")
|
||||
log_level = FATAL;
|
||||
else
|
||||
fprintf(stderr,
|
||||
"Unknown KNF_LOG_LEVEL: %s"
|
||||
"\nSupported values are: "
|
||||
"TRACE, DEBUG, INFO, WARNING, ERROR, FATAL",
|
||||
s.c_str());
|
||||
});
|
||||
return log_level;
|
||||
}
|
||||
|
||||
inline bool EnableAbort() {
|
||||
static std::once_flag init_flag;
|
||||
static bool enable_abort = false;
|
||||
std::call_once(init_flag, []() {
|
||||
enable_abort = (std::getenv("KNF_ABORT") != nullptr);
|
||||
});
|
||||
return enable_abort;
|
||||
}
|
||||
|
||||
class Logger {
|
||||
public:
|
||||
Logger(const char *filename, const char *func_name, uint32_t line_num,
|
||||
LogLevel level)
|
||||
: filename_(filename),
|
||||
func_name_(func_name),
|
||||
line_num_(line_num),
|
||||
level_(level) {
|
||||
cur_level_ = GetCurrentLogLevel();
|
||||
fprintf(stderr, "here\n");
|
||||
switch (level) {
|
||||
case TRACE:
|
||||
if (cur_level_ <= TRACE) fprintf(stderr, "[T] ");
|
||||
break;
|
||||
case DEBUG:
|
||||
if (cur_level_ <= DEBUG) fprintf(stderr, "[D] ");
|
||||
break;
|
||||
case INFO:
|
||||
if (cur_level_ <= INFO) fprintf(stderr, "[I] ");
|
||||
break;
|
||||
case WARNING:
|
||||
if (cur_level_ <= WARNING) fprintf(stderr, "[W] ");
|
||||
break;
|
||||
case ERROR:
|
||||
if (cur_level_ <= ERROR) fprintf(stderr, "[E] ");
|
||||
break;
|
||||
case FATAL:
|
||||
if (cur_level_ <= FATAL) fprintf(stderr, "[F] ");
|
||||
break;
|
||||
}
|
||||
|
||||
if (cur_level_ <= level_) {
|
||||
fprintf(stderr, "%s:%u:%s ", filename, line_num, func_name);
|
||||
}
|
||||
}
|
||||
|
||||
~Logger() noexcept(false) {
|
||||
static constexpr const char *kErrMsg = R"(
|
||||
Some bad things happened. Please read the above error messages and stack
|
||||
trace. If you are using Python, the following command may be helpful:
|
||||
|
||||
gdb --args python /path/to/your/code.py
|
||||
|
||||
(You can use `gdb` to debug the code. Please consider compiling
|
||||
a debug version of KNF.).
|
||||
|
||||
If you are unable to fix it, please open an issue at:
|
||||
|
||||
https://github.com/csukuangfj/kaldi-native-fbank/issues/new
|
||||
)";
|
||||
fprintf(stderr, "\n");
|
||||
if (level_ == FATAL) {
|
||||
std::string stack_trace = GetStackTrace();
|
||||
if (!stack_trace.empty()) {
|
||||
fprintf(stderr, "\n\n%s\n", stack_trace.c_str());
|
||||
}
|
||||
|
||||
fflush(nullptr);
|
||||
|
||||
#ifndef __ANDROID_API__
|
||||
if (EnableAbort()) {
|
||||
// NOTE: abort() will terminate the program immediately without
|
||||
// printing the Python stack backtrace.
|
||||
abort();
|
||||
}
|
||||
|
||||
throw std::runtime_error(kErrMsg);
|
||||
#else
|
||||
abort();
|
||||
#endif
|
||||
}
|
||||
}
|
||||
|
||||
const Logger &operator<<(bool b) const {
|
||||
if (cur_level_ <= level_) {
|
||||
fprintf(stderr, b ? "true" : "false");
|
||||
}
|
||||
return *this;
|
||||
}
|
||||
|
||||
const Logger &operator<<(int8_t i) const {
|
||||
if (cur_level_ <= level_) fprintf(stderr, "%d", i);
|
||||
return *this;
|
||||
}
|
||||
|
||||
const Logger &operator<<(const char *s) const {
|
||||
if (cur_level_ <= level_) fprintf(stderr, "%s", s);
|
||||
return *this;
|
||||
}
|
||||
|
||||
const Logger &operator<<(int32_t i) const {
|
||||
if (cur_level_ <= level_) fprintf(stderr, "%d", i);
|
||||
return *this;
|
||||
}
|
||||
|
||||
const Logger &operator<<(uint32_t i) const {
|
||||
if (cur_level_ <= level_) fprintf(stderr, "%u", i);
|
||||
return *this;
|
||||
}
|
||||
|
||||
const Logger &operator<<(uint64_t i) const {
|
||||
if (cur_level_ <= level_)
|
||||
fprintf(stderr, "%llu", (long long unsigned int)i); // NOLINT
|
||||
return *this;
|
||||
}
|
||||
|
||||
const Logger &operator<<(int64_t i) const {
|
||||
if (cur_level_ <= level_)
|
||||
fprintf(stderr, "%lli", (long long int)i); // NOLINT
|
||||
return *this;
|
||||
}
|
||||
|
||||
const Logger &operator<<(float f) const {
|
||||
if (cur_level_ <= level_) fprintf(stderr, "%f", f);
|
||||
return *this;
|
||||
}
|
||||
|
||||
const Logger &operator<<(double d) const {
|
||||
if (cur_level_ <= level_) fprintf(stderr, "%f", d);
|
||||
return *this;
|
||||
}
|
||||
|
||||
template <typename T>
|
||||
const Logger &operator<<(const T &t) const {
|
||||
// require T overloads operator<<
|
||||
std::ostringstream os;
|
||||
os << t;
|
||||
return *this << os.str().c_str();
|
||||
}
|
||||
|
||||
// specialization to fix compile error: `stringstream << nullptr` is ambiguous
|
||||
const Logger &operator<<(const std::nullptr_t &null) const {
|
||||
if (cur_level_ <= level_) *this << "(null)";
|
||||
return *this;
|
||||
}
|
||||
|
||||
private:
|
||||
const char *filename_;
|
||||
const char *func_name_;
|
||||
uint32_t line_num_;
|
||||
LogLevel level_;
|
||||
LogLevel cur_level_;
|
||||
};
|
||||
#endif // KNF_ENABLE_CHECK
|
||||
|
||||
class Voidifier {
|
||||
public:
|
||||
#if KNF_ENABLE_CHECK
|
||||
void operator&(const Logger &) const {}
|
||||
#endif
|
||||
};
|
||||
#if !defined(KNF_ENABLE_CHECK)
|
||||
template <typename T>
|
||||
const Voidifier &operator<<(const Voidifier &v, T &&) {
|
||||
return v;
|
||||
}
|
||||
#endif
|
||||
|
||||
} // namespace knf
|
||||
|
||||
#define KNF_STATIC_ASSERT(x) static_assert(x, "")
|
||||
|
||||
#ifdef KNF_ENABLE_CHECK
|
||||
|
||||
#if defined(__clang__) || defined(__GNUC__) || defined(__GNUG__) || \
|
||||
defined(__PRETTY_FUNCTION__)
|
||||
// for clang and GCC
|
||||
#define KNF_FUNC __PRETTY_FUNCTION__
|
||||
#else
|
||||
// for other compilers
|
||||
#define KNF_FUNC __func__
|
||||
#endif
|
||||
|
||||
#define KNF_CHECK(x) \
|
||||
(x) ? (void)0 \
|
||||
: ::knf::Voidifier() & \
|
||||
::knf::Logger(__FILE__, KNF_FUNC, __LINE__, ::knf::FATAL) \
|
||||
<< "Check failed: " << #x << " "
|
||||
|
||||
// WARNING: x and y may be evaluated multiple times, but this happens only
|
||||
// when the check fails. Since the program aborts if it fails, we don't think
|
||||
// the extra evaluation of x and y matters.
|
||||
//
|
||||
// CAUTION: we recommend the following use case:
|
||||
//
|
||||
// auto x = Foo();
|
||||
// auto y = Bar();
|
||||
// KNF_CHECK_EQ(x, y) << "Some message";
|
||||
//
|
||||
// And please avoid
|
||||
//
|
||||
// KNF_CHECK_EQ(Foo(), Bar());
|
||||
//
|
||||
// if `Foo()` or `Bar()` causes some side effects, e.g., changing some
|
||||
// local static variables or global variables.
|
||||
#define _KNF_CHECK_OP(x, y, op) \
|
||||
((x)op(y)) ? (void)0 \
|
||||
: ::knf::Voidifier() & \
|
||||
::knf::Logger(__FILE__, KNF_FUNC, __LINE__, ::knf::FATAL) \
|
||||
<< "Check failed: " << #x << " " << #op << " " << #y \
|
||||
<< " (" << (x) << " vs. " << (y) << ") "
|
||||
|
||||
#define KNF_CHECK_EQ(x, y) _KNF_CHECK_OP(x, y, ==)
|
||||
#define KNF_CHECK_NE(x, y) _KNF_CHECK_OP(x, y, !=)
|
||||
#define KNF_CHECK_LT(x, y) _KNF_CHECK_OP(x, y, <)
|
||||
#define KNF_CHECK_LE(x, y) _KNF_CHECK_OP(x, y, <=)
|
||||
#define KNF_CHECK_GT(x, y) _KNF_CHECK_OP(x, y, >)
|
||||
#define KNF_CHECK_GE(x, y) _KNF_CHECK_OP(x, y, >=)
|
||||
|
||||
#define KNF_LOG(x) ::knf::Logger(__FILE__, KNF_FUNC, __LINE__, ::knf::x)
|
||||
|
||||
// ------------------------------------------------------------
|
||||
// For debug check
|
||||
// ------------------------------------------------------------
|
||||
// If you define the macro "-D NDEBUG" while compiling kaldi-native-fbank,
|
||||
// the following macros are in fact empty and does nothing.
|
||||
|
||||
#define KNF_DCHECK(x) ::knf::kDisableDebug ? (void)0 : KNF_CHECK(x)
|
||||
|
||||
#define KNF_DCHECK_EQ(x, y) ::knf::kDisableDebug ? (void)0 : KNF_CHECK_EQ(x, y)
|
||||
|
||||
#define KNF_DCHECK_NE(x, y) ::knf::kDisableDebug ? (void)0 : KNF_CHECK_NE(x, y)
|
||||
|
||||
#define KNF_DCHECK_LT(x, y) ::knf::kDisableDebug ? (void)0 : KNF_CHECK_LT(x, y)
|
||||
|
||||
#define KNF_DCHECK_LE(x, y) ::knf::kDisableDebug ? (void)0 : KNF_CHECK_LE(x, y)
|
||||
|
||||
#define KNF_DCHECK_GT(x, y) ::knf::kDisableDebug ? (void)0 : KNF_CHECK_GT(x, y)
|
||||
|
||||
#define KNF_DCHECK_GE(x, y) ::knf::kDisableDebug ? (void)0 : KNF_CHECK_GE(x, y)
|
||||
|
||||
#define KNF_DLOG(x) \
|
||||
::knf::kDisableDebug ? (void)0 : ::knf::Voidifier() & KNF_LOG(x)
|
||||
|
||||
#else
|
||||
|
||||
#define KNF_CHECK(x) ::knf::Voidifier()
|
||||
#define KNF_LOG(x) ::knf::Voidifier()
|
||||
|
||||
#define KNF_CHECK_EQ(x, y) ::knf::Voidifier()
|
||||
#define KNF_CHECK_NE(x, y) ::knf::Voidifier()
|
||||
#define KNF_CHECK_LT(x, y) ::knf::Voidifier()
|
||||
#define KNF_CHECK_LE(x, y) ::knf::Voidifier()
|
||||
#define KNF_CHECK_GT(x, y) ::knf::Voidifier()
|
||||
#define KNF_CHECK_GE(x, y) ::knf::Voidifier()
|
||||
|
||||
#define KNF_DCHECK(x) ::knf::Voidifier()
|
||||
#define KNF_DLOG(x) ::knf::Voidifier()
|
||||
#define KNF_DCHECK_EQ(x, y) ::knf::Voidifier()
|
||||
#define KNF_DCHECK_NE(x, y) ::knf::Voidifier()
|
||||
#define KNF_DCHECK_LT(x, y) ::knf::Voidifier()
|
||||
#define KNF_DCHECK_LE(x, y) ::knf::Voidifier()
|
||||
#define KNF_DCHECK_GT(x, y) ::knf::Voidifier()
|
||||
#define KNF_DCHECK_GE(x, y) ::knf::Voidifier()
|
||||
|
||||
#endif // KNF_CHECK_NE
|
||||
|
||||
#endif // KALDI_NATIVE_FBANK_CSRC_LOG_H_
|
||||
@@ -0,0 +1,257 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// This file is copied/modified from kaldi/src/feat/mel-computations.cc
|
||||
|
||||
#include "kaldi-native-fbank/csrc/mel-computations.h"
|
||||
|
||||
#include <algorithm>
|
||||
#include <sstream>
|
||||
#include <vector>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/feature-window.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
std::ostream &operator<<(std::ostream &os, const MelBanksOptions &opts) {
|
||||
os << opts.ToString();
|
||||
return os;
|
||||
}
|
||||
|
||||
float MelBanks::VtlnWarpFreq(
|
||||
float vtln_low_cutoff, // upper+lower frequency cutoffs for VTLN.
|
||||
float vtln_high_cutoff,
|
||||
float low_freq, // upper+lower frequency cutoffs in mel computation
|
||||
float high_freq, float vtln_warp_factor, float freq) {
|
||||
/// This computes a VTLN warping function that is not the same as HTK's one,
|
||||
/// but has similar inputs (this function has the advantage of never producing
|
||||
/// empty bins).
|
||||
|
||||
/// This function computes a warp function F(freq), defined between low_freq
|
||||
/// and high_freq inclusive, with the following properties:
|
||||
/// F(low_freq) == low_freq
|
||||
/// F(high_freq) == high_freq
|
||||
/// The function is continuous and piecewise linear with two inflection
|
||||
/// points.
|
||||
/// The lower inflection point (measured in terms of the unwarped
|
||||
/// frequency) is at frequency l, determined as described below.
|
||||
/// The higher inflection point is at a frequency h, determined as
|
||||
/// described below.
|
||||
/// If l <= f <= h, then F(f) = f/vtln_warp_factor.
|
||||
/// If the higher inflection point (measured in terms of the unwarped
|
||||
/// frequency) is at h, then max(h, F(h)) == vtln_high_cutoff.
|
||||
/// Since (by the last point) F(h) == h/vtln_warp_factor, then
|
||||
/// max(h, h/vtln_warp_factor) == vtln_high_cutoff, so
|
||||
/// h = vtln_high_cutoff / max(1, 1/vtln_warp_factor).
|
||||
/// = vtln_high_cutoff * min(1, vtln_warp_factor).
|
||||
/// If the lower inflection point (measured in terms of the unwarped
|
||||
/// frequency) is at l, then min(l, F(l)) == vtln_low_cutoff
|
||||
/// This implies that l = vtln_low_cutoff / min(1, 1/vtln_warp_factor)
|
||||
/// = vtln_low_cutoff * max(1, vtln_warp_factor)
|
||||
|
||||
if (freq < low_freq || freq > high_freq)
|
||||
return freq; // in case this gets called
|
||||
// for out-of-range frequencies, just return the freq.
|
||||
|
||||
KNF_CHECK_GT(vtln_low_cutoff, low_freq);
|
||||
KNF_CHECK_LT(vtln_high_cutoff, high_freq);
|
||||
|
||||
float one = 1.0f;
|
||||
float l = vtln_low_cutoff * std::max(one, vtln_warp_factor);
|
||||
float h = vtln_high_cutoff * std::min(one, vtln_warp_factor);
|
||||
float scale = 1.0f / vtln_warp_factor;
|
||||
float Fl = scale * l; // F(l);
|
||||
float Fh = scale * h; // F(h);
|
||||
KNF_CHECK(l > low_freq && h < high_freq);
|
||||
// slope of left part of the 3-piece linear function
|
||||
float scale_left = (Fl - low_freq) / (l - low_freq);
|
||||
// [slope of center part is just "scale"]
|
||||
|
||||
// slope of right part of the 3-piece linear function
|
||||
float scale_right = (high_freq - Fh) / (high_freq - h);
|
||||
|
||||
if (freq < l) {
|
||||
return low_freq + scale_left * (freq - low_freq);
|
||||
} else if (freq < h) {
|
||||
return scale * freq;
|
||||
} else { // freq >= h
|
||||
return high_freq + scale_right * (freq - high_freq);
|
||||
}
|
||||
}
|
||||
|
||||
float MelBanks::VtlnWarpMelFreq(
|
||||
float vtln_low_cutoff, // upper+lower frequency cutoffs for VTLN.
|
||||
float vtln_high_cutoff,
|
||||
float low_freq, // upper+lower frequency cutoffs in mel computation
|
||||
float high_freq, float vtln_warp_factor, float mel_freq) {
|
||||
return MelScale(VtlnWarpFreq(vtln_low_cutoff, vtln_high_cutoff, low_freq,
|
||||
high_freq, vtln_warp_factor,
|
||||
InverseMelScale(mel_freq)));
|
||||
}
|
||||
|
||||
MelBanks::MelBanks(const MelBanksOptions &opts,
|
||||
const FrameExtractionOptions &frame_opts,
|
||||
float vtln_warp_factor)
|
||||
: htk_mode_(opts.htk_mode) {
|
||||
int32_t num_bins = opts.num_bins;
|
||||
if (num_bins < 3) KNF_LOG(FATAL) << "Must have at least 3 mel bins";
|
||||
|
||||
float sample_freq = frame_opts.samp_freq;
|
||||
int32_t window_length_padded = frame_opts.PaddedWindowSize();
|
||||
KNF_CHECK_EQ(window_length_padded % 2, 0);
|
||||
|
||||
int32_t num_fft_bins = window_length_padded / 2;
|
||||
float nyquist = 0.5f * sample_freq;
|
||||
|
||||
float low_freq = opts.low_freq, high_freq;
|
||||
if (opts.high_freq > 0.0f)
|
||||
high_freq = opts.high_freq;
|
||||
else
|
||||
high_freq = nyquist + opts.high_freq;
|
||||
|
||||
if (low_freq < 0.0f || low_freq >= nyquist || high_freq <= 0.0f ||
|
||||
high_freq > nyquist || high_freq <= low_freq) {
|
||||
KNF_LOG(FATAL) << "Bad values in options: low-freq " << low_freq
|
||||
<< " and high-freq " << high_freq << " vs. nyquist "
|
||||
<< nyquist;
|
||||
}
|
||||
|
||||
float fft_bin_width = sample_freq / window_length_padded;
|
||||
// fft-bin width [think of it as Nyquist-freq / half-window-length]
|
||||
|
||||
float mel_low_freq = MelScale(low_freq);
|
||||
float mel_high_freq = MelScale(high_freq);
|
||||
|
||||
debug_ = opts.debug_mel;
|
||||
|
||||
// divide by num_bins+1 in next line because of end-effects where the bins
|
||||
// spread out to the sides.
|
||||
float mel_freq_delta = (mel_high_freq - mel_low_freq) / (num_bins + 1);
|
||||
|
||||
float vtln_low = opts.vtln_low, vtln_high = opts.vtln_high;
|
||||
if (vtln_high < 0.0f) {
|
||||
vtln_high += nyquist;
|
||||
}
|
||||
|
||||
if (vtln_warp_factor != 1.0f &&
|
||||
(vtln_low < 0.0f || vtln_low <= low_freq || vtln_low >= high_freq ||
|
||||
vtln_high <= 0.0f || vtln_high >= high_freq || vtln_high <= vtln_low)) {
|
||||
KNF_LOG(FATAL) << "Bad values in options: vtln-low " << vtln_low
|
||||
<< " and vtln-high " << vtln_high << ", versus "
|
||||
<< "low-freq " << low_freq << " and high-freq " << high_freq;
|
||||
}
|
||||
|
||||
bins_.resize(num_bins);
|
||||
center_freqs_.resize(num_bins);
|
||||
|
||||
for (int32_t bin = 0; bin < num_bins; ++bin) {
|
||||
float left_mel = mel_low_freq + bin * mel_freq_delta,
|
||||
center_mel = mel_low_freq + (bin + 1) * mel_freq_delta,
|
||||
right_mel = mel_low_freq + (bin + 2) * mel_freq_delta;
|
||||
|
||||
if (vtln_warp_factor != 1.0f) {
|
||||
left_mel = VtlnWarpMelFreq(vtln_low, vtln_high, low_freq, high_freq,
|
||||
vtln_warp_factor, left_mel);
|
||||
center_mel = VtlnWarpMelFreq(vtln_low, vtln_high, low_freq, high_freq,
|
||||
vtln_warp_factor, center_mel);
|
||||
right_mel = VtlnWarpMelFreq(vtln_low, vtln_high, low_freq, high_freq,
|
||||
vtln_warp_factor, right_mel);
|
||||
}
|
||||
center_freqs_[bin] = InverseMelScale(center_mel);
|
||||
|
||||
// this_bin will be a vector of coefficients that is only
|
||||
// nonzero where this mel bin is active.
|
||||
std::vector<float> this_bin(num_fft_bins);
|
||||
|
||||
int32_t first_index = -1, last_index = -1;
|
||||
for (int32_t i = 0; i < num_fft_bins; ++i) {
|
||||
float freq = (fft_bin_width * i); // Center frequency of this fft
|
||||
// bin.
|
||||
float mel = MelScale(freq);
|
||||
if (mel > left_mel && mel < right_mel) {
|
||||
float weight;
|
||||
if (mel <= center_mel)
|
||||
weight = (mel - left_mel) / (center_mel - left_mel);
|
||||
else
|
||||
weight = (right_mel - mel) / (right_mel - center_mel);
|
||||
this_bin[i] = weight;
|
||||
if (first_index == -1) first_index = i;
|
||||
last_index = i;
|
||||
}
|
||||
}
|
||||
KNF_CHECK(first_index != -1 && last_index >= first_index &&
|
||||
"You may have set num_mel_bins too large.");
|
||||
|
||||
bins_[bin].first = first_index;
|
||||
int32_t size = last_index + 1 - first_index;
|
||||
bins_[bin].second.insert(bins_[bin].second.end(),
|
||||
this_bin.begin() + first_index,
|
||||
this_bin.begin() + first_index + size);
|
||||
|
||||
// Replicate a bug in HTK, for testing purposes.
|
||||
if (opts.htk_mode && bin == 0 && mel_low_freq != 0.0f) {
|
||||
bins_[bin].second[0] = 0.0;
|
||||
}
|
||||
} // for (int32_t bin = 0; bin < num_bins; ++bin) {
|
||||
|
||||
if (debug_) {
|
||||
std::ostringstream os;
|
||||
for (size_t i = 0; i < bins_.size(); i++) {
|
||||
os << "bin " << i << ", offset = " << bins_[i].first << ", vec = ";
|
||||
for (auto k : bins_[i].second) os << k << ", ";
|
||||
os << "\n";
|
||||
}
|
||||
KNF_LOG(INFO) << os.str();
|
||||
}
|
||||
}
|
||||
|
||||
// "power_spectrum" contains fft energies.
|
||||
void MelBanks::Compute(const float *power_spectrum,
|
||||
float *mel_energies_out) const {
|
||||
int32_t num_bins = bins_.size();
|
||||
|
||||
for (int32_t i = 0; i < num_bins; i++) {
|
||||
int32_t offset = bins_[i].first;
|
||||
const auto &v = bins_[i].second;
|
||||
float energy = 0;
|
||||
for (int32_t k = 0; k != v.size(); ++k) {
|
||||
energy += v[k] * power_spectrum[k + offset];
|
||||
}
|
||||
|
||||
// HTK-like flooring- for testing purposes (we prefer dither)
|
||||
if (htk_mode_ && energy < 1.0) {
|
||||
energy = 1.0;
|
||||
}
|
||||
|
||||
mel_energies_out[i] = energy;
|
||||
|
||||
// The following assert was added due to a problem with OpenBlas that
|
||||
// we had at one point (it was a bug in that library). Just to detect
|
||||
// it early.
|
||||
KNF_CHECK_EQ(energy, energy); // check that energy is not nan
|
||||
}
|
||||
|
||||
if (debug_) {
|
||||
fprintf(stderr, "MEL BANKS:\n");
|
||||
for (int32_t i = 0; i < num_bins; i++)
|
||||
fprintf(stderr, " %f", mel_energies_out[i]);
|
||||
fprintf(stderr, "\n");
|
||||
}
|
||||
}
|
||||
|
||||
} // namespace knf
|
||||
@@ -0,0 +1,117 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
// This file is copied/modified from kaldi/src/feat/mel-computations.h
|
||||
#ifndef KALDI_NATIVE_FBANK_CSRC_MEL_COMPUTATIONS_H_
|
||||
#define KALDI_NATIVE_FBANK_CSRC_MEL_COMPUTATIONS_H_
|
||||
|
||||
#include <cmath>
|
||||
#include <string>
|
||||
#include <utility>
|
||||
#include <vector>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/feature-window.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
struct MelBanksOptions {
|
||||
int32_t num_bins = 25; // e.g. 25; number of triangular bins
|
||||
float low_freq = 20; // e.g. 20; lower frequency cutoff
|
||||
|
||||
// an upper frequency cutoff; 0 -> no cutoff, negative
|
||||
// ->added to the Nyquist frequency to get the cutoff.
|
||||
float high_freq = 0;
|
||||
|
||||
float vtln_low = 100; // vtln lower cutoff of warping function.
|
||||
|
||||
// vtln upper cutoff of warping function: if negative, added
|
||||
// to the Nyquist frequency to get the cutoff.
|
||||
float vtln_high = -500;
|
||||
|
||||
bool debug_mel = false;
|
||||
// htk_mode is a "hidden" config, it does not show up on command line.
|
||||
// Enables more exact compatibility with HTK, for testing purposes. Affects
|
||||
// mel-energy flooring and reproduces a bug in HTK.
|
||||
bool htk_mode = false;
|
||||
|
||||
std::string ToString() const {
|
||||
std::ostringstream os;
|
||||
os << "num_bins: " << num_bins << "\n";
|
||||
os << "low_freq: " << low_freq << "\n";
|
||||
os << "high_freq: " << high_freq << "\n";
|
||||
os << "vtln_low: " << vtln_low << "\n";
|
||||
os << "vtln_high: " << vtln_high << "\n";
|
||||
os << "debug_mel: " << debug_mel << "\n";
|
||||
os << "htk_mode: " << htk_mode << "\n";
|
||||
return os.str();
|
||||
}
|
||||
};
|
||||
|
||||
std::ostream &operator<<(std::ostream &os, const MelBanksOptions &opts);
|
||||
|
||||
class MelBanks {
|
||||
public:
|
||||
static inline float InverseMelScale(float mel_freq) {
|
||||
return 700.0f * (expf(mel_freq / 1127.0f) - 1.0f);
|
||||
}
|
||||
|
||||
static inline float MelScale(float freq) {
|
||||
return 1127.0f * logf(1.0f + freq / 700.0f);
|
||||
}
|
||||
|
||||
static float VtlnWarpFreq(
|
||||
float vtln_low_cutoff,
|
||||
float vtln_high_cutoff, // discontinuities in warp func
|
||||
float low_freq,
|
||||
float high_freq, // upper+lower frequency cutoffs in
|
||||
// the mel computation
|
||||
float vtln_warp_factor, float freq);
|
||||
|
||||
static float VtlnWarpMelFreq(float vtln_low_cutoff, float vtln_high_cutoff,
|
||||
float low_freq, float high_freq,
|
||||
float vtln_warp_factor, float mel_freq);
|
||||
|
||||
// TODO(fangjun): Remove vtln_warp_factor
|
||||
MelBanks(const MelBanksOptions &opts,
|
||||
const FrameExtractionOptions &frame_opts, float vtln_warp_factor);
|
||||
|
||||
/// Compute Mel energies (note: not log energies).
|
||||
/// At input, "fft_energies" contains the FFT energies (not log).
|
||||
///
|
||||
/// @param fft_energies 1-D array of size num_fft_bins/2+1
|
||||
/// @param mel_energies_out 1-D array of size num_mel_bins
|
||||
void Compute(const float *fft_energies, float *mel_energies_out) const;
|
||||
|
||||
int32_t NumBins() const { return bins_.size(); }
|
||||
|
||||
private:
|
||||
// center frequencies of bins, numbered from 0 ... num_bins-1.
|
||||
// Needed by GetCenterFreqs().
|
||||
std::vector<float> center_freqs_;
|
||||
|
||||
// the "bins_" vector is a vector, one for each bin, of a pair:
|
||||
// (the first nonzero fft-bin), (the vector of weights).
|
||||
std::vector<std::pair<int32_t, std::vector<float>>> bins_;
|
||||
|
||||
// TODO(fangjun): Remove debug_ and htk_mode_
|
||||
bool debug_;
|
||||
bool htk_mode_;
|
||||
};
|
||||
|
||||
} // namespace knf
|
||||
|
||||
#endif // KALDI_NATIVE_FBANK_CSRC_MEL_COMPUTATIONS_H_
|
||||
@@ -0,0 +1,165 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// The content in this file is copied/modified from
|
||||
// This file is copied/modified from kaldi/src/feat/online-feature.cc
|
||||
|
||||
#include "kaldi-native-fbank/csrc/online-feature.h"
|
||||
|
||||
#include <algorithm>
|
||||
#include <utility>
|
||||
#include <vector>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/feature-window.h"
|
||||
#include "kaldi-native-fbank/csrc/log.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
RecyclingVector::RecyclingVector(int32_t items_to_hold)
|
||||
: items_to_hold_(items_to_hold == 0 ? -1 : items_to_hold),
|
||||
first_available_index_(0) {}
|
||||
|
||||
const float *RecyclingVector::At(int32_t index) const {
|
||||
if (index < first_available_index_) {
|
||||
KNF_LOG(FATAL) << "Attempted to retrieve feature vector that was "
|
||||
"already removed by the RecyclingVector (index = "
|
||||
<< index << "; "
|
||||
<< "first_available_index = " << first_available_index_
|
||||
<< "; "
|
||||
<< "size = " << Size() << ")";
|
||||
}
|
||||
// 'at' does size checking.
|
||||
return items_.at(index - first_available_index_).data();
|
||||
}
|
||||
|
||||
void RecyclingVector::PushBack(std::vector<float> item) {
|
||||
// Note: -1 is a larger number when treated as unsigned
|
||||
if (items_.size() == static_cast<size_t>(items_to_hold_)) {
|
||||
items_.pop_front();
|
||||
++first_available_index_;
|
||||
}
|
||||
items_.push_back(std::move(item));
|
||||
}
|
||||
|
||||
int32_t RecyclingVector::Size() const {
|
||||
return first_available_index_ + static_cast<int32_t>(items_.size());
|
||||
}
|
||||
|
||||
template <class C>
|
||||
OnlineGenericBaseFeature<C>::OnlineGenericBaseFeature(
|
||||
const typename C::Options &opts)
|
||||
: computer_(opts),
|
||||
window_function_(computer_.GetFrameOptions()),
|
||||
features_(opts.frame_opts.max_feature_vectors),
|
||||
input_finished_(false),
|
||||
waveform_offset_(0) {
|
||||
// RE the following assert: search for ONLINE_IVECTOR_LIMIT in
|
||||
// online-ivector-feature.cc.
|
||||
// Casting to uint32, an unsigned type, means that -1 would be treated
|
||||
// as `very large`.
|
||||
KNF_CHECK(static_cast<uint32_t>(opts.frame_opts.max_feature_vectors) > 200);
|
||||
}
|
||||
|
||||
template <class C>
|
||||
void OnlineGenericBaseFeature<C>::AcceptWaveform(float sampling_rate,
|
||||
const float *waveform,
|
||||
int32_t n) {
|
||||
if (n == 0) {
|
||||
return; // Nothing to do.
|
||||
}
|
||||
|
||||
if (input_finished_) {
|
||||
KNF_LOG(FATAL) << "AcceptWaveform called after InputFinished() was called.";
|
||||
}
|
||||
|
||||
KNF_CHECK_EQ(sampling_rate, computer_.GetFrameOptions().samp_freq);
|
||||
|
||||
waveform_remainder_.insert(waveform_remainder_.end(), waveform, waveform + n);
|
||||
|
||||
ComputeFeatures();
|
||||
}
|
||||
|
||||
template <class C>
|
||||
void OnlineGenericBaseFeature<C>::InputFinished() {
|
||||
input_finished_ = true;
|
||||
ComputeFeatures();
|
||||
}
|
||||
|
||||
template <class C>
|
||||
void OnlineGenericBaseFeature<C>::ComputeFeatures() {
|
||||
const FrameExtractionOptions &frame_opts = computer_.GetFrameOptions();
|
||||
|
||||
int64_t num_samples_total = waveform_offset_ + waveform_remainder_.size();
|
||||
|
||||
int32_t num_frames_old = features_.Size();
|
||||
|
||||
int32_t num_frames_new =
|
||||
NumFrames(num_samples_total, frame_opts, input_finished_);
|
||||
|
||||
KNF_CHECK_GE(num_frames_new, num_frames_old);
|
||||
|
||||
// note: this online feature-extraction code does not support VTLN.
|
||||
float vtln_warp = 1.0;
|
||||
|
||||
std::vector<float> window;
|
||||
bool need_raw_log_energy = computer_.NeedRawLogEnergy();
|
||||
|
||||
for (int32_t frame = num_frames_old; frame < num_frames_new; ++frame) {
|
||||
std::fill(window.begin(), window.end(), 0);
|
||||
float raw_log_energy = 0.0;
|
||||
ExtractWindow(waveform_offset_, waveform_remainder_, frame, frame_opts,
|
||||
window_function_, &window,
|
||||
need_raw_log_energy ? &raw_log_energy : nullptr);
|
||||
|
||||
std::vector<float> this_feature(computer_.Dim());
|
||||
|
||||
computer_.Compute(raw_log_energy, vtln_warp, &window, this_feature.data());
|
||||
features_.PushBack(std::move(this_feature));
|
||||
}
|
||||
|
||||
// OK, we will now discard any portion of the signal that will not be
|
||||
// necessary to compute frames in the future.
|
||||
int64_t first_sample_of_next_frame =
|
||||
FirstSampleOfFrame(num_frames_new, frame_opts);
|
||||
|
||||
int32_t samples_to_discard = first_sample_of_next_frame - waveform_offset_;
|
||||
|
||||
if (samples_to_discard > 0) {
|
||||
// discard the leftmost part of the waveform that we no longer need.
|
||||
int32_t new_num_samples =
|
||||
static_cast<int32_t>(waveform_remainder_.size()) - samples_to_discard;
|
||||
|
||||
if (new_num_samples <= 0) {
|
||||
// odd, but we'll try to handle it.
|
||||
waveform_offset_ += waveform_remainder_.size();
|
||||
waveform_remainder_.resize(0);
|
||||
} else {
|
||||
std::vector<float> new_remainder(new_num_samples);
|
||||
|
||||
std::copy(waveform_remainder_.begin() + samples_to_discard,
|
||||
waveform_remainder_.end(), new_remainder.begin());
|
||||
waveform_offset_ += samples_to_discard;
|
||||
|
||||
waveform_remainder_.swap(new_remainder);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
template class OnlineGenericBaseFeature<FbankComputer>;
|
||||
|
||||
} // namespace knf
|
||||
@@ -0,0 +1,142 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// The content in this file is copied/modified from
|
||||
// This file is copied/modified from kaldi/src/feat/online-feature.h
|
||||
#ifndef KALDI_NATIVE_FBANK_CSRC_ONLINE_FEATURE_H_
|
||||
#define KALDI_NATIVE_FBANK_CSRC_ONLINE_FEATURE_H_
|
||||
|
||||
#include <cstdint>
|
||||
#include <deque>
|
||||
#include <vector>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/feature-fbank.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
/// This class serves as a storage for feature vectors with an option to limit
|
||||
/// the memory usage by removing old elements. The deleted frames indices are
|
||||
/// "remembered" so that regardless of the MAX_ITEMS setting, the user always
|
||||
/// provides the indices as if no deletion was being performed.
|
||||
/// This is useful when processing very long recordings which would otherwise
|
||||
/// cause the memory to eventually blow up when the features are not being
|
||||
/// removed.
|
||||
class RecyclingVector {
|
||||
public:
|
||||
/// By default it does not remove any elements.
|
||||
explicit RecyclingVector(int32_t items_to_hold = -1);
|
||||
|
||||
~RecyclingVector() = default;
|
||||
RecyclingVector(const RecyclingVector &) = delete;
|
||||
RecyclingVector &operator=(const RecyclingVector &) = delete;
|
||||
|
||||
// The pointer is owned by RecyclingVector
|
||||
// Users should not free it
|
||||
const float *At(int32_t index) const;
|
||||
|
||||
void PushBack(std::vector<float> item);
|
||||
|
||||
/// This method returns the size as if no "recycling" had happened,
|
||||
/// i.e. equivalent to the number of times the PushBack method has been
|
||||
/// called.
|
||||
int32_t Size() const;
|
||||
|
||||
private:
|
||||
std::deque<std::vector<float>> items_;
|
||||
int32_t items_to_hold_;
|
||||
int32_t first_available_index_;
|
||||
};
|
||||
|
||||
/// This is a templated class for online feature extraction;
|
||||
/// it's templated on a class like MfccComputer or PlpComputer
|
||||
/// that does the basic feature extraction.
|
||||
template <class C>
|
||||
class OnlineGenericBaseFeature {
|
||||
public:
|
||||
// Constructor from options class
|
||||
explicit OnlineGenericBaseFeature(const typename C::Options &opts);
|
||||
|
||||
int32_t Dim() const { return computer_.Dim(); }
|
||||
|
||||
float FrameShiftInSeconds() const {
|
||||
return computer_.GetFrameOptions().frame_shift_ms / 1000.0f;
|
||||
}
|
||||
|
||||
int32_t NumFramesReady() const { return features_.Size(); }
|
||||
|
||||
// Note: IsLastFrame() will only ever return true if you have called
|
||||
// InputFinished() (and this frame is the last frame).
|
||||
bool IsLastFrame(int32_t frame) const {
|
||||
return input_finished_ && frame == NumFramesReady() - 1;
|
||||
}
|
||||
|
||||
const float *GetFrame(int32_t frame) const { return features_.At(frame); }
|
||||
|
||||
// This would be called from the application, when you get
|
||||
// more wave data. Note: the sampling_rate is only provided so
|
||||
// the code can assert that it matches the sampling rate
|
||||
// expected in the options.
|
||||
//
|
||||
// @param sampling_rate The sampling_rate of the input waveform
|
||||
// @param waveform Pointer to a 1-D array of size n
|
||||
// @param n Number of entries in waveform
|
||||
void AcceptWaveform(float sampling_rate, const float *waveform, int32_t n);
|
||||
|
||||
// InputFinished() tells the class you won't be providing any
|
||||
// more waveform. This will help flush out the last frame or two
|
||||
// of features, in the case where snip-edges == false; it also
|
||||
// affects the return value of IsLastFrame().
|
||||
void InputFinished();
|
||||
|
||||
private:
|
||||
// This function computes any additional feature frames that it is possible to
|
||||
// compute from 'waveform_remainder_', which at this point may contain more
|
||||
// than just a remainder-sized quantity (because AcceptWaveform() appends to
|
||||
// waveform_remainder_ before calling this function). It adds these feature
|
||||
// frames to features_, and shifts off any now-unneeded samples of input from
|
||||
// waveform_remainder_ while incrementing waveform_offset_ by the same amount.
|
||||
void ComputeFeatures();
|
||||
|
||||
C computer_; // class that does the MFCC or PLP or filterbank computation
|
||||
|
||||
FeatureWindowFunction window_function_;
|
||||
|
||||
// features_ is the Mfcc or Plp or Fbank features that we have already
|
||||
// computed.
|
||||
|
||||
RecyclingVector features_;
|
||||
|
||||
// True if the user has called "InputFinished()"
|
||||
bool input_finished_;
|
||||
|
||||
// waveform_offset_ is the number of samples of waveform that we have
|
||||
// already discarded, i.e. that were prior to 'waveform_remainder_'.
|
||||
int64_t waveform_offset_;
|
||||
|
||||
// waveform_remainder_ is a short piece of waveform that we may need to keep
|
||||
// after extracting all the whole frames we can (whatever length of feature
|
||||
// will be required for the next phase of computation).
|
||||
// It is a 1-D tensor
|
||||
std::vector<float> waveform_remainder_;
|
||||
};
|
||||
|
||||
using OnlineFbank = OnlineGenericBaseFeature<FbankComputer>;
|
||||
|
||||
} // namespace knf
|
||||
|
||||
#endif // KALDI_NATIVE_FBANK_CSRC_ONLINE_FEATURE_H_
|
||||
67
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/rfft.cc
vendored
Normal file
67
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/rfft.cc
vendored
Normal file
@@ -0,0 +1,67 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include "kaldi-native-fbank/csrc/rfft.h"
|
||||
|
||||
#include <algorithm>
|
||||
#include <cmath>
|
||||
#include <vector>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/log.h"
|
||||
|
||||
// see fftsg.c
|
||||
#ifdef __cplusplus
|
||||
extern "C" void rdft(int n, int isgn, double *a, int *ip, double *w);
|
||||
#else
|
||||
void rdft(int n, int isgn, double *a, int *ip, double *w);
|
||||
#endif
|
||||
|
||||
namespace knf {
|
||||
class Rfft::RfftImpl {
|
||||
public:
|
||||
explicit RfftImpl(int32_t n) : n_(n), ip_(2 + std::sqrt(n / 2)), w_(n / 2) {
|
||||
KNF_CHECK_EQ(n & (n - 1), 0);
|
||||
}
|
||||
|
||||
void Compute(float *in_out) {
|
||||
std::vector<double> d(in_out, in_out + n_);
|
||||
|
||||
Compute(d.data());
|
||||
|
||||
std::copy(d.begin(), d.end(), in_out);
|
||||
}
|
||||
|
||||
void Compute(double *in_out) {
|
||||
// 1 means forward fft
|
||||
rdft(n_, 1, in_out, ip_.data(), w_.data());
|
||||
}
|
||||
|
||||
private:
|
||||
int32_t n_;
|
||||
std::vector<int32_t> ip_;
|
||||
std::vector<double> w_;
|
||||
};
|
||||
|
||||
Rfft::Rfft(int32_t n) : impl_(std::make_unique<RfftImpl>(n)) {}
|
||||
|
||||
Rfft::~Rfft() = default;
|
||||
|
||||
void Rfft::Compute(float *in_out) { impl_->Compute(in_out); }
|
||||
void Rfft::Compute(double *in_out) { impl_->Compute(in_out); }
|
||||
|
||||
} // namespace knf
|
||||
56
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/rfft.h
vendored
Normal file
56
funasr_local/runtime/onnxruntime/third_party/kaldi-native-fbank/kaldi-native-fbank/csrc/rfft.h
vendored
Normal file
@@ -0,0 +1,56 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#ifndef KALDI_NATIVE_FBANK_CSRC_RFFT_H_
|
||||
#define KALDI_NATIVE_FBANK_CSRC_RFFT_H_
|
||||
|
||||
#include <memory>
|
||||
|
||||
namespace knf {
|
||||
|
||||
// n-point Real discrete Fourier transform
|
||||
// where n is a power of 2. n >= 2
|
||||
//
|
||||
// R[k] = sum_j=0^n-1 in[j]*cos(2*pi*j*k/n), 0<=k<=n/2
|
||||
// I[k] = sum_j=0^n-1 in[j]*sin(2*pi*j*k/n), 0<k<n/2
|
||||
class Rfft {
|
||||
public:
|
||||
// @param n Number of fft bins. it should be a power of 2.
|
||||
explicit Rfft(int32_t n);
|
||||
~Rfft();
|
||||
|
||||
/** @param in_out A 1-D array of size n.
|
||||
* On return:
|
||||
* in_out[0] = R[0]
|
||||
* in_out[1] = R[n/2]
|
||||
* for 1 < k < n/2,
|
||||
* in_out[2*k] = R[k]
|
||||
* in_out[2*k+1] = I[k]
|
||||
*
|
||||
*/
|
||||
void Compute(float *in_out);
|
||||
void Compute(double *in_out);
|
||||
|
||||
private:
|
||||
class RfftImpl;
|
||||
std::unique_ptr<RfftImpl> impl_;
|
||||
};
|
||||
|
||||
} // namespace knf
|
||||
|
||||
#endif // KALDI_NATIVE_FBANK_CSRC_RFFT_H_
|
||||
@@ -0,0 +1,73 @@
|
||||
/**
|
||||
* Copyright 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include "gtest/gtest.h"
|
||||
#include "kaldi-native-fbank/csrc/log.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
#if KNF_ENABLE_CHECK
|
||||
|
||||
TEST(Log, TestLog) {
|
||||
KNF_LOG(TRACE) << "this is a trace message";
|
||||
KNF_LOG(DEBUG) << "this is a debug message";
|
||||
KNF_LOG(INFO) << "this is an info message";
|
||||
KNF_LOG(WARNING) << "this is a warning message";
|
||||
KNF_LOG(ERROR) << "this is an error message";
|
||||
|
||||
ASSERT_THROW(KNF_LOG(FATAL) << "This will crash the program",
|
||||
std::runtime_error);
|
||||
|
||||
// For debug build
|
||||
|
||||
KNF_DLOG(TRACE) << "this is a trace message for debug build";
|
||||
KNF_DLOG(DEBUG) << "this is a trace message for debug build";
|
||||
KNF_DLOG(INFO) << "this is a trace message for debug build";
|
||||
KNF_DLOG(ERROR) << "this is an error message for debug build";
|
||||
KNF_DLOG(WARNING) << "this is a trace message for debug build";
|
||||
|
||||
#if !defined(NDEBUG)
|
||||
ASSERT_THROW(KNF_DLOG(FATAL) << "this is a trace message for debug build",
|
||||
std::runtime_error);
|
||||
#endif
|
||||
}
|
||||
|
||||
TEST(Log, TestCheck) {
|
||||
KNF_CHECK_EQ(1, 1) << "ok";
|
||||
KNF_CHECK_LE(1, 3) << "ok";
|
||||
KNF_CHECK_LT(1, 2) << "ok";
|
||||
KNF_CHECK_GT(2, 1) << "ok";
|
||||
KNF_CHECK_GE(2, 1) << "ok";
|
||||
|
||||
ASSERT_THROW(KNF_CHECK_EQ(2, 1) << "bad things happened", std::runtime_error);
|
||||
|
||||
// for debug build
|
||||
KNF_DCHECK_EQ(1, 1) << "ok";
|
||||
KNF_DCHECK_LE(1, 3) << "ok";
|
||||
KNF_DCHECK_LT(1, 2) << "ok";
|
||||
KNF_DCHECK_GT(2, 1) << "ok";
|
||||
KNF_DCHECK_GE(2, 1) << "ok";
|
||||
|
||||
#if !defined(NDEBUG)
|
||||
ASSERT_THROW(KNF_CHECK_EQ(2, 1) << "bad things happened", std::runtime_error);
|
||||
#endif
|
||||
}
|
||||
|
||||
#endif
|
||||
|
||||
} // namespace knf
|
||||
@@ -0,0 +1,48 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include <iostream>
|
||||
|
||||
#include "kaldi-native-fbank/csrc/online-feature.h"
|
||||
|
||||
int main() {
|
||||
knf::FbankOptions opts;
|
||||
opts.frame_opts.dither = 0;
|
||||
opts.mel_opts.num_bins = 10;
|
||||
|
||||
knf::OnlineFbank fbank(opts);
|
||||
for (int32_t i = 0; i < 1600; ++i) {
|
||||
float s = (i * i - i / 2) / 32767.;
|
||||
fbank.AcceptWaveform(16000, &s, 1);
|
||||
}
|
||||
|
||||
std::ostringstream os;
|
||||
|
||||
int32_t n = fbank.NumFramesReady();
|
||||
for (int32_t i = 0; i != n; ++i) {
|
||||
const float *frame = fbank.GetFrame(i);
|
||||
for (int32_t k = 0; k != opts.mel_opts.num_bins; ++k) {
|
||||
os << frame[k] << ", ";
|
||||
}
|
||||
os << "\n";
|
||||
}
|
||||
|
||||
std::cout << os.str() << "\n";
|
||||
|
||||
return 0;
|
||||
}
|
||||
@@ -0,0 +1,59 @@
|
||||
/**
|
||||
* Copyright (c) 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include "gtest/gtest.h"
|
||||
#include "kaldi-native-fbank/csrc/online-feature.h"
|
||||
namespace knf {
|
||||
|
||||
TEST(RecyclingVector, TestUnlimited) {
|
||||
RecyclingVector v(-1);
|
||||
constexpr int32_t N = 100;
|
||||
for (int32_t i = 0; i != N; ++i) {
|
||||
std::unique_ptr<float[]> p(new float[3]{i, i + 1, i + 2});
|
||||
v.PushBack(std::move(p));
|
||||
}
|
||||
ASSERT_EQ(v.Size(), N);
|
||||
|
||||
for (int32_t i = 0; i != N; ++i) {
|
||||
const float *t = v.At(i);
|
||||
for (int32_t k = 0; k != 3; ++k) {
|
||||
EXPECT_EQ(t[k], (i + k));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
TEST(RecyclingVector, Testlimited) {
|
||||
constexpr int32_t K = 3;
|
||||
constexpr int32_t N = 10;
|
||||
RecyclingVector v(K);
|
||||
for (int32_t i = 0; i != N; ++i) {
|
||||
std::unique_ptr<float[]> p(new float[3]{i, i + 1, i + 2});
|
||||
v.PushBack(std::move(p));
|
||||
}
|
||||
|
||||
ASSERT_EQ(v.Size(), N);
|
||||
|
||||
for (int32_t i = N - K; i != N; ++i) {
|
||||
const float *t = v.At(i);
|
||||
|
||||
for (int32_t k = 0; k != 3; ++k) {
|
||||
EXPECT_EQ(t[k], (i + k));
|
||||
}
|
||||
}
|
||||
}
|
||||
} // namespace knf
|
||||
@@ -0,0 +1,52 @@
|
||||
/**
|
||||
* Copyright 2022 Xiaomi Corporation (authors: Fangjun Kuang)
|
||||
*
|
||||
* See LICENSE for clarification regarding multiple authors
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
#include "gtest/gtest.h"
|
||||
#include "kaldi-native-fbank/csrc/rfft.h"
|
||||
|
||||
namespace knf {
|
||||
|
||||
#if 0
|
||||
>>> import torch
|
||||
>>> a = torch.tensor([1., -1, 3, 8, 20, 6, 0, 2])
|
||||
>>> torch.fft.rfft(a)
|
||||
tensor([ 39.0000+0.0000j, -28.1924-2.2929j, 18.0000+5.0000j, -9.8076+3.7071j,
|
||||
9.0000+0.0000j])
|
||||
#endif
|
||||
|
||||
TEST(Rfft, TestRfft) {
|
||||
knf::Rfft fft(8);
|
||||
for (int32_t i = 0; i != 10; ++i) {
|
||||
std::vector<float> d = {1, -1, 3, 8, 20, 6, 0, 2};
|
||||
fft.Compute(d.data());
|
||||
|
||||
EXPECT_EQ(d[0], 39);
|
||||
EXPECT_EQ(d[1], 9);
|
||||
|
||||
EXPECT_NEAR(d[2], -28.1924, 1e-3);
|
||||
EXPECT_NEAR(-d[3], -2.2929, 1e-3);
|
||||
|
||||
EXPECT_NEAR(d[4], 18, 1e-3);
|
||||
EXPECT_NEAR(-d[5], 5, 1e-3);
|
||||
|
||||
EXPECT_NEAR(d[6], -9.8076, 1e-3);
|
||||
EXPECT_NEAR(-d[7], 3.7071, 1e-3);
|
||||
}
|
||||
}
|
||||
|
||||
} // namespace knf
|
||||
Reference in New Issue
Block a user