diff --git a/AutoCoverTool/readme.txt b/AutoCoverTool/readme.txt
new file mode 100644
index 0000000..6ce7935
--- /dev/null
+++ b/AutoCoverTool/readme.txt
@@ -0,0 +1,224 @@
+Auto Cover Tool
+1. Train a voice (timbre) model
+2. Given an audio file, convert it into the chosen voice
+
+    ----data                // all data lives here
+    ----ref                 // dependency code lives here
+        ----music_remover   // vocal/accompaniment separation tool
+        ----so-vits-svc     // voice training and conversion tool
+    ----script              // scripts live here
+
+
+3. Layout of data:
+    ---train_users              // datasets used for training
+        ---zjl                  // one folder per voice
+            ---src              // source data (folder)
+            ---vocals           // data after vocal separation (folder)
+                ---speaker0     // sliced data (folder)
+            ---slice_resample   // resampled, normalized data (folder)
+                ---speaker0     // resampled, normalized data (folder)
+            ---filelists        // file lists required for training
+                ---train.txt
+                ---val.txt
+                ---test.txt
+            ---config           // configuration
+                ---config.json  // configuration file
+    ---inf_users                // data used at inference time
+        ---song1                // one folder per input song
+            ---src              // source data (file)
+            ---vocals           // separated vocal file
+            ---acc              // separated accompaniment file
+        ---song2
+        ...
+    ---out_data                 // inference output
+        ---song1                // one folder per song
+            ---song1_zjl_vocals // resulting vocals for song + voice
+        ---song2
+        ....
+    ---final_data               // final results
+        ---song1                // one folder per song
+            ---song1_zjl_mix    // mixdown of the song + voice vocals
+
+---------------------------------------------------------------------->>>>
+Quick start, training:
+    Put your data under data/train_users/xxx/src as .ogg files.
+    Then run script/train.sh xxx; the trained models are written to data/train_users/xxx/logs/32k.
+---------------------------------------------------------------------->>>>
+
+Training setup:
+Environment variables:
+export LD_LIBRARY_PATH=/data/gpu_env_common/env/anaconda3/envs/so_vits_svc/lib:$LD_LIBRARY_PATH
+export PATH=$PATH:/data/gpu_env_common/env/bin/ffmpeg/bin
+export PYTHONPATH=$PWD:$PWD/ref/music_remover/demucs
+
+# Training pipeline
+1. Collect the data into data/train_users/zjl/src
+2. Extract vocals, slice, and keep the top 80 slices by loudness
+/data/gpu_env_common/env/anaconda3/envs/demucs/bin/python script/get_vocals_for_train.py zjl
+3. Resample
+/data/gpu_env_common/env/anaconda3/envs/so_vits_svc/bin/python ref/so-vits-svc/resample.py --in_dir=/data/rsync/jianli.yang/AutoCoverTool/data/train_users/zjl --out_dir2=/data/rsync/jianli.yang/AutoCoverTool/data/train_users/zjl/slice_resample
+4. Generate the configuration file
+/data/gpu_env_common/env/anaconda3/envs/so_vits_svc/bin/python ref/so-vits-svc/preprocess_flist_config.py --source_dir=/data/rsync/jianli.yang/AutoCoverTool/data/train_users/zjl/slice_resample --train_list=/data/rsync/jianli.yang/AutoCoverTool/data/train_users/zjl/filelists/train.txt --val_list=/data/rsync/jianli.yang/AutoCoverTool/data/train_users/zjl/filelists/val.txt --test_list=/data/rsync/jianli.yang/AutoCoverTool/data/train_users/zjl/filelists/test.txt --config_path=/data/rsync/jianli.yang/AutoCoverTool/data/train_users/zjl/config/config.json
+5. Preprocess: extract hubert and f0 features
+/data/gpu_env_common/env/anaconda3/envs/so_vits_svc/bin/python ref/so-vits-svc/preprocess_hubert_f0.py --in_dir=/data/rsync/jianli.yang/AutoCoverTool/data/train_users/zjl/slice_resample
+6. Copy the pretrained checkpoints into the logs folder
+mkdir -p data/train_users/zjl/logs/32k
+cp -r data/models/G_0.pth data/train_users/zjl/logs/32k
+cp -r data/models/D_0.pth data/train_users/zjl/logs/32k
+7. Train
+/data/gpu_env_common/env/anaconda3/envs/so_vits_svc/bin/python ref/so-vits-svc/train.py -c data/train_users/zjl/config/config.json -m 32k -l data/train_users/zjl/logs
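+
+For reference, steps 2-7 can be driven from one Python script. This is a minimal, untested
+sketch that reuses the interpreter paths documented above; the helper name
+run_training_pipeline and its user argument are illustrative, not part of the existing scripts:
+
+    import subprocess
+
+    DEMUCS_PY = "/data/gpu_env_common/env/anaconda3/envs/demucs/bin/python"
+    SVC_PY = "/data/gpu_env_common/env/anaconda3/envs/so_vits_svc/bin/python"
+    ROOT = "/data/rsync/jianli.yang/AutoCoverTool"
+
+    def run_training_pipeline(user):
+        base = f"{ROOT}/data/train_users/{user}"
+        # 2. vocal extraction + slicing (keeps the top-80 slices by loudness)
+        subprocess.run([DEMUCS_PY, "script/get_vocals_for_train.py", user], check=True)
+        # 3. resample the slices
+        subprocess.run([SVC_PY, "ref/so-vits-svc/resample.py",
+                        f"--in_dir={base}", f"--out_dir2={base}/slice_resample"], check=True)
+        # 4. generate train/val/test lists and config.json
+        subprocess.run([SVC_PY, "ref/so-vits-svc/preprocess_flist_config.py",
+                        f"--source_dir={base}/slice_resample",
+                        f"--train_list={base}/filelists/train.txt",
+                        f"--val_list={base}/filelists/val.txt",
+                        f"--test_list={base}/filelists/test.txt",
+                        f"--config_path={base}/config/config.json"], check=True)
+        # 5. extract hubert / f0 features
+        subprocess.run([SVC_PY, "ref/so-vits-svc/preprocess_hubert_f0.py",
+                        f"--in_dir={base}/slice_resample"], check=True)
+        # 6. seed training with the pretrained G/D checkpoints
+        subprocess.run(["mkdir", "-p", f"{base}/logs/32k"], check=True)
+        subprocess.run(["cp", "-r", "data/models/G_0.pth", f"{base}/logs/32k"], check=True)
+        subprocess.run(["cp", "-r", "data/models/D_0.pth", f"{base}/logs/32k"], check=True)
+        # 7. train
+        subprocess.run([SVC_PY, "ref/so-vits-svc/train.py",
+                        "-c", f"{base}/config/config.json",
+                        "-m", "32k", "-l", f"{base}/logs"], check=True)
+
+    run_training_pipeline("zjl")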
+# Inference pipeline
+1. Put the input at data/inf_users/pfdyt/src.mp3
+2. Extract vocals and accompaniment
+/data/gpu_env_common/env/anaconda3/envs/demucs/bin/python script/get_vocals_for_inference.py data/inf_users/test_2/src.mp3 data/inf_users/test_2
+3. Run the voice conversion
+/data/gpu_env_common/env/anaconda3/envs/so_vits_svc/bin/python ref/so-vits-svc/inference_main.py data/train_users/zjl/logs/32k/G_2000.pth data/train_users/zjl/config/config.json data/inf_users/pfdyt/vocal_32.wav data/out_data/pfdyt/pfdyt_zjl.wav
+4. Collect the ratio statistics and discard audio whose ratio is too high
+/data/gpu_env_common/env/anaconda3/envs/th1_9_3_9/bin/python script/process_one.py
+5. Denoise and volume-stretch the audio that passes the check
+/opt/soft/bin/denoise_exe in_wav out_wav
+/opt/soft/bin/draw_volume in_wav ref_wav out_wav
+
+6. Manual step: use the accentize/Chameleon plugin to copy the reverb of the original wav and adjust the loudness
+7. Replace again using the manually produced data
+/data/gpu_env_common/env/anaconda3/envs/th1_9_3_9/bin/python script/process_one.py
+8. Mix the replaced result with the accompaniment to get the final track
+/opt/soft/bin/simple_mixer in_wav acc_path mix_path
+
+
+9. Resample the dry vocals
+ffmpeg -i data/out_data/pfdyt/pfdyt_zjl.wav -ar 44100 -ac 2 data/out_data/pfdyt/pfdyt_zjl_44_2.wav
+10. Final mixdown
+/data/rsync/jianli.yang/AutoCoverTool/data/bin/mixer data/models/impluse_im_plus_wet2.wav data/out_data/pfdyt/pfdyt_zjl_44_2.wav data/inf_users/pfdyt/acc.wav data/final_data/pfdyt_zjl_44_2_mix.wav
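+
+Likewise, the automatic parts of the inference chain (steps 1-3 and 9-10; the ratio check,
+denoising, and the manual reverb step are left out) can be chained from Python. A minimal,
+untested sketch; run_inference_pipeline and its arguments are illustrative names:
+
+    import subprocess
+
+    DEMUCS_PY = "/data/gpu_env_common/env/anaconda3/envs/demucs/bin/python"
+    SVC_PY = "/data/gpu_env_common/env/anaconda3/envs/so_vits_svc/bin/python"
+    MIXER = "/data/rsync/jianli.yang/AutoCoverTool/data/bin/mixer"
+    IMPULSE = "data/models/impluse_im_plus_wet2.wav"
+
+    def run_inference_pipeline(song, user, checkpoint):
+        inf = f"data/inf_users/{song}"
+        out = f"data/out_data/{song}/{song}_{user}.wav"
+        out44 = out.replace(".wav", "_44_2.wav")
+        # 2. split the source song into vocals and accompaniment
+        subprocess.run([DEMUCS_PY, "script/get_vocals_for_inference.py",
+                        f"{inf}/src.mp3", inf], check=True)
+        # 3. convert the separated vocals into the target voice
+        subprocess.run([SVC_PY, "ref/so-vits-svc/inference_main.py",
+                        checkpoint, f"data/train_users/{user}/config/config.json",
+                        f"{inf}/vocal_32.wav", out], check=True)
+        # 9. resample the converted dry vocals to 44.1 kHz stereo
+        subprocess.run(["ffmpeg", "-i", out, "-ar", "44100", "-ac", "2", out44], check=True)
+        # 10. final mixdown: impulse response + vocals + accompaniment
+        subprocess.run([MIXER, IMPULSE, out44, f"{inf}/acc.wav",
+                        f"data/final_data/{song}_{user}_44_2_mix.wav"], check=True)
+
+    run_inference_pipeline("pfdyt", "zjl", "data/train_users/zjl/logs/32k/G_2000.pth")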
+
+
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step1/0.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step1/1.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step1/2.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step1/3.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step1/4.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step1/5.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step1/6.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step1/7.zip
+
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step2/0.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step2/1.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step3/2.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step4/3.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step5/4.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step6/5.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step7/6.zip
+https://av-audit-sync-bj-1256122840.cos.ap-beijing.myqcloud.com/tmp/fanchang/step8/7.zip
+
+
+// Fetch the original-song data from the editing library:
+select task_url,starmaker_songid from starmaker_musicbook.silence where starmaker_songid in
+
+611752105026189342
+611752105030433779
+611752105029689090
+611752105021285282
+611752105030419624
+611752105030419633
+611752105030104548
+611752105029990849
+611752105029993297
+611752105030047424
+611752105030419688
+611752105023434557
+611752105024429936
+611752105027557408
+611752105024250202
+611752105027302268
+611752105026707760
+611752105022345104
+611752105024678976
+611752105024679221
+611752105020378620
+611752105022667231
+611752105023811083
+611752105023623965
+611752105022745595
+611752105020290695
+611752105028683824
+611752105020411654
+611752105020286501
+611752105020387015
+611752105020382559
+611752105030077711
+611752105019423720
+611752105020256284
+611752105020357112
+611752105024628047
+611752105020282612
+611752105020351134
+611752105020336950
+611752105022736204
+611752105020290639
+611752105021442406
+611752105020286443
+611752105024953316
+611752105020282613
+611752105024714646
+611752105022647082
+611752105027188746
+611752105022770952
+611752105020417488
+611752105025104181
+611752105022735101
+611752105023532439
+611752105022842477
+611752105028650636
+611752105022842004
+611752105029954168
+611752105020417688
+611752105020336946
+611752105020394297
+611752105026946178
+611752105020343687
+611752105024676794
+611752105020390950
+611752105020286433
+611752105026771723
+611752105022446809
+611752105020350988
+611752105025510149
+611752105020394121
+611752105021442417
+611752105020256227
+611752105025231610
+611752105021453011
+611752105020325137
+611752105027047993
+611752105021330812
+611752105021375100
+611752105021273980
+611752105024786030
+611752105027189453
+611752105020548211
+611752105020286446
+611752105020376320
+611752105020563523
+611752105027588072
+611752105022389596
+611752105020315368
+611752105020343699
+611752105029954089
+611752105026523547
+611752105029955214
+611752105020315328
+611752105020350990
+611752105021332759
diff --git a/AutoCoverTool/ref/music_remover/demucs/CODE_OF_CONDUCT.md b/AutoCoverTool/ref/music_remover/demucs/CODE_OF_CONDUCT.md
new file mode 100644
index 0000000..f049d4c
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/CODE_OF_CONDUCT.md
@@ -0,0 +1,76 @@
+# Code of Conduct
+
+## Our Pledge
+
+In the interest of fostering an open and welcoming environment, we as
+contributors and maintainers pledge to make participation in our project and
+our community a harassment-free experience for everyone, regardless of age, body
+size, disability, ethnicity, sex characteristics, gender identity and expression,
+level of experience, education, socio-economic status, nationality, personal
+appearance, race, religion, or sexual identity and orientation.
+
+## Our Standards
+
+Examples of behavior that contributes to creating a positive environment
+include:
+
+* Using welcoming and inclusive language
+* Being respectful of differing viewpoints and experiences
+* Gracefully accepting constructive criticism
+* Focusing on what is best for the community
+* Showing empathy towards other community members
+
+Examples of unacceptable behavior by participants include:
+
+* The use of sexualized language or imagery and unwelcome sexual attention or
+  advances
+* Trolling, insulting/derogatory comments, and personal or political attacks
+* Public or private harassment
+* Publishing others' private information, such as a physical or electronic
+  address, without explicit permission
+* Other conduct which could reasonably be considered inappropriate in a
+  professional setting
+
+## Our Responsibilities
+
+Project maintainers are responsible for clarifying the standards of acceptable
+behavior and are expected to take appropriate and fair corrective action in
+response to any instances of unacceptable behavior.
+
+Project maintainers have the right and responsibility to remove, edit, or
+reject comments, commits, code, wiki edits, issues, and other contributions
+that are not aligned to this Code of Conduct, or to ban temporarily or
+permanently any contributor for other behaviors that they deem inappropriate,
+threatening, offensive, or harmful.
+
+## Scope
+
+This Code of Conduct applies within all project spaces, and it also applies when
+an individual is representing the project or its community in public spaces.
+Examples of representing a project or community include using an official
+project e-mail address, posting via an official social media account, or acting
+as an appointed representative at an online or offline event. Representation of
+a project may be further defined and clarified by project maintainers.
+
+## Enforcement
+
+Instances of abusive, harassing, or otherwise unacceptable behavior may be
+reported by contacting the project team at <opensource-conduct@fb.com>. All
+complaints will be reviewed and investigated and will result in a response that
+is deemed necessary and appropriate to the circumstances. The project team is
+obligated to maintain confidentiality with regard to the reporter of an incident.
+Further details of specific enforcement policies may be posted separately.
+
+Project maintainers who do not follow or enforce the Code of Conduct in good
+faith may face temporary or permanent repercussions as determined by other
+members of the project's leadership.
+
+## Attribution
+
+This Code of Conduct is adapted from the [Contributor Covenant][homepage], version 1.4,
+available at https://www.contributor-covenant.org/version/1/4/code-of-conduct.html
+
+[homepage]: https://www.contributor-covenant.org
+
+For answers to common questions about this code of conduct, see
+https://www.contributor-covenant.org/faq
diff --git a/AutoCoverTool/ref/music_remover/demucs/CONTRIBUTING.md b/AutoCoverTool/ref/music_remover/demucs/CONTRIBUTING.md
new file mode 100644
index 0000000..f14f4af
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/CONTRIBUTING.md
@@ -0,0 +1,23 @@
+# Contributing to Demucs
+
+## Pull Requests
+
+In order to accept your pull request, we need you to submit a CLA. You only need
+to do this once to work on any of Facebook's open source projects.
+
+Complete your CLA here: <https://code.facebook.com/cla>
+
+Demucs is the implementation of a research paper.
+Therefore, we do not plan on accepting many pull requests for new features.
+We certainly welcome them for bug fixes.
+
+
+## Issues
+
+We use GitHub issues to track public bugs. Please ensure your description is
+clear and has sufficient instructions to be able to reproduce the issue.
+
+
+## License
+By contributing to this repository, you agree that your contributions will be licensed
+under the LICENSE file in the root directory of this source tree.
diff --git a/AutoCoverTool/ref/music_remover/demucs/Demucs.ipynb b/AutoCoverTool/ref/music_remover/demucs/Demucs.ipynb
new file mode 100644
index 0000000..9ebcfd5
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/Demucs.ipynb
@@ -0,0 +1,153 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "colab_type": "text",
+    "id": "Be9yoh-ILfRr"
+   },
+   "source": [
+    "# Hybrid Demucs\n",
+    "\n",
+    "Feel free to use the Colab version:\n",
+    "https://colab.research.google.com/drive/1dC9nVxk3V_VPjUADsnFu8EiT-xnU1tGH?usp=sharing"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "colab": {
+     "base_uri": "https://localhost:8080/",
+     "height": 139
+    },
+    "colab_type": "code",
+    "executionInfo": {
+     "elapsed": 12277,
+     "status": "ok",
+     "timestamp": 1583778134659,
+     "user": {
+      "displayName": "Marllus Lustosa",
+      "photoUrl": "https://lh3.googleusercontent.com/a-/AOh14GgLl2RbW64ZyWz3Y8IBku0zhHCMnt7fz7fEl0LTdA=s64",
+      "userId": "14811735256675200480"
+     },
+     "user_tz": 180
+    },
+    "id": "kOjIPLlzhPfn",
+    "outputId": "c75f17ec-b576-4105-bc5b-c2ac9c1018a3"
+   },
+   "outputs": [],
+   "source": [
+    "!pip install -U demucs\n",
+    "# or for local development, if you have a clone of Demucs\n",
+    "# pip install -e ."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "colab": {},
+    "colab_type": "code",
+    "id": "5lYOzKKCKAbJ"
+   },
+   "outputs": [],
+   "source": [
+    "# You can use the `demucs` command line to separate tracks\n",
+    "!demucs test.mp3"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# You can also directly load the pretrained models,\n",
+    "# for instance the MDX 2021 winning model of Track A:\n",
+    "from demucs import pretrained\n",
+    "model = pretrained.get_model('mdx')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Because `model` is a bag of 4 models, you cannot directly call it on your data,\n",
+    "# but `apply_model` will know what to do with it.\n",
+    "import torch\n",
+    "from demucs.apply import apply_model\n",
+    "x = torch.randn(1, 2, 44100 * 10)  # ten seconds of white noise for the demo\n",
+    "out = apply_model(model, x)[0]  # shape is [S, C, T] with S the number of sources\n",
+    "\n",
+    "# So let's see where all the white noise content is going.\n",
+    "for name, source in zip(model.sources, out):\n",
+    "    print(name, source.std() / x.std())\n",
+    "# The outputs are quite weird, to be fair; not what I would have expected."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Now let's take a single model from the bag, and test it on a pure cosine.\n",
+    "freq = 440  # in Hz\n",
+    "sr = model.samplerate\n",
+    "t = torch.arange(10 * sr).float() / sr\n",
+    "x = torch.cos(2 * 3.1416 * freq * t).expand(1, 2, -1)\n",
+    "sub_model = model.models[3]\n",
+    "out = sub_model(x)[0]\n",
+    "\n",
+    "# Same question: where does it go?\n",
+    "for name, source in zip(model.sources, out):\n",
+    "    print(name, source.std() / x.std())\n",
+    "    \n",
+    "# Well, now it makes much more sense: all the energy is going\n",
+    "# into the `other` source.\n",
+    "# Feel free to try a lower pitch (try 80 Hz) to see what happens!"
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# For training or more fun, refer to the Demucs README on our repo\n", + "# https://github.com/facebookresearch/demucs/tree/main/demucs" + ] + } + ], + "metadata": { + "accelerator": "GPU", + "colab": { + "authorship_tag": "ABX9TyM9xpVr1M86NRcjtQ7g9tCx", + "collapsed_sections": [], + "name": "Demucs.ipynb", + "provenance": [] + }, + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.8" + } + }, + "nbformat": 4, + "nbformat_minor": 1 +} diff --git a/AutoCoverTool/ref/music_remover/demucs/LICENSE b/AutoCoverTool/ref/music_remover/demucs/LICENSE new file mode 100644 index 0000000..5797855 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/LICENSE @@ -0,0 +1,21 @@ +MIT License + +Copyright (c) Meta, Inc. and its affiliates. + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. 
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/demucs/MANIFEST.in b/AutoCoverTool/ref/music_remover/demucs/MANIFEST.in
new file mode 100644
index 0000000..96e5f54
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/MANIFEST.in
@@ -0,0 +1,13 @@
+recursive-exclude env *
+recursive-include conf *.yaml
+include Makefile
+include LICENSE
+include demucs.png
+include outputs.tar.gz
+include test.mp3
+include requirements.txt
+include requirements_minimal.txt
+include mypy.ini
+include demucs/py.typed
+include demucs/remote/*.txt
+include demucs/remote/*.yaml
diff --git a/AutoCoverTool/ref/music_remover/demucs/Makefile b/AutoCoverTool/ref/music_remover/demucs/Makefile
new file mode 100644
index 0000000..344786c
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/Makefile
@@ -0,0 +1,32 @@
+all: linter tests
+
+linter:
+	flake8 demucs
+	mypy demucs
+
+tests: test_train test_eval
+
+test_train: tests/musdb
+	_DORA_TEST_PATH=/tmp/demucs python3 -m dora run --clear \
+	  dset.musdb=./tests/musdb dset.segment=4 dset.shift=2 epochs=2 model=demucs \
+	  demucs.depth=2 demucs.channels=4 test.sdr=false misc.num_workers=0 test.workers=0 \
+	  test.shifts=0
+
+test_eval:
+	python3 -m demucs -n demucs_unittest test.mp3
+	python3 -m demucs -n demucs_unittest --two-stems=vocals test.mp3
+	python3 -m demucs -n demucs_unittest --mp3 test.mp3
+	python3 -m demucs -n demucs_unittest --int24 --clip-mode clamp test.mp3
+
+tests/musdb:
+	test -e tests || mkdir tests
+	python3 -c 'import musdb; musdb.DB("tests/tmp", download=True)'
+	musdbconvert tests/tmp tests/musdb
+
+dist:
+	python3 setup.py sdist
+
+clean:
+	rm -r dist build *.egg-info
+
+.PHONY: linter dist test_train test_eval
diff --git a/AutoCoverTool/ref/music_remover/demucs/README.md b/AutoCoverTool/ref/music_remover/demucs/README.md
new file mode 100644
index 0000000..365c03e
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/README.md
@@ -0,0 +1,290 @@
+# Demucs Music Source Separation
+
+[![Support Ukraine](https://img.shields.io/badge/Support-Ukraine-FFD500?style=flat&labelColor=005BBB)](https://opensource.fb.com/support-ukraine)
+![tests badge](https://github.com/facebookresearch/demucs/workflows/tests/badge.svg)
+![linter badge](https://github.com/facebookresearch/demucs/workflows/linter/badge.svg)
+
+
+This is the 4th release of Demucs (v4), featuring Hybrid Transformer based source separation.
+**For the classic Hybrid Demucs (v3):** [go to this commit][demucs_v3].
+If you are experiencing issues and want the old Demucs back, please file an issue, and then you can get back to v3 with
+`git checkout v3`. You can also go back to [Demucs v2][demucs_v2].
+
+
+Demucs is a state-of-the-art music source separation model, currently capable of separating
+drums, bass, and vocals from the rest of the accompaniment.
+Demucs is based on a U-Net convolutional architecture inspired by [Wave-U-Net][waveunet].
+The v4 version features [Hybrid Transformer Demucs][htdemucs], a hybrid spectrogram/waveform separation model using Transformers.
+It is based on [Hybrid Demucs][hybrid_paper] (also provided in this repo), with the innermost layers
+replaced by a cross-domain Transformer Encoder. This Transformer uses self-attention within each domain,
+and cross-attention across domains.
+The model achieves an SDR of 9.00 dB on the MUSDB HQ test set. Moreover, when using sparse attention
+kernels to extend its receptive field and per-source fine-tuning, we achieve a state-of-the-art 9.20 dB of SDR.
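+
+As a reminder, SDR is the signal-to-distortion ratio between a reference source `s` and its
+estimate `s_hat`, in dB; at its core it is
+
+```latex
+\mathrm{SDR}(s, \hat{s}) = 10 \log_{10} \frac{\lVert s \rVert^2}{\lVert s - \hat{s} \rVert^2}
+```
+
+so higher is better; see the papers cited below for the exact evaluation protocol.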
+
+Samples are available [on our sample page](https://ai.honu.io/papers/htdemucs/index.html).
+Check out [our paper][htdemucs] for more information.
+It has been trained on the [MUSDB HQ][musdb] dataset + an extra training dataset of 800 songs.
+This model separates drums, bass, vocals, and other stems for any song.
+
+
+As Hybrid Transformer Demucs is brand new, it is not activated by default; you can activate it in the usual
+commands described hereafter with `-n htdemucs_ft`.
+The single, non fine-tuned model is provided as `-n htdemucs`, and the retrained baseline
+as `-n hdemucs_mmi`. The Sparse Hybrid Transformer model described in our paper is not provided, as it
+requires custom CUDA code that is not ready for release yet.
+
+
+<p align="center">
+<img src="./demucs.png" alt="Schema representing the structure of Hybrid Transformer Demucs,
+    with a dual U-Net structure, one branch for the temporal domain,
+    and one branch for the spectral domain. There is a cross-domain Transformer between the Encoders and Decoders."></p>
+
+
+
+## Important news if you are already using Demucs
+
+See the [release notes](./docs/release.md) for more details.
+
+- 16/11/2022: Added the new Hybrid Transformer Demucs models,
+  along with support for the [torchaudio implementation of HDemucs](https://pytorch.org/audio/stable/tutorials/hybrid_demucs_tutorial.html).
+- 30/08/2022: added reproducibility and ablation grids, along with an updated version of the paper.
+- 17/08/2022: Releasing v3.0.5: Set split segment length to reduce memory. Compatible with PyTorch 1.12.
+- 24/02/2022: Releasing v3.0.4: split into two stems (i.e. karaoke mode).
+  Export as float32 or int24.
+- 17/12/2021: Releasing v3.0.3: bug fixes (thanks @keunwoochoi), memory drastically
+  reduced on GPU (thanks @famzah) and new multi-core evaluation on CPU (`-j` flag).
+- 12/11/2021: Releasing **Demucs v3** with hybrid domain separation. Strong improvements
+  on all sources. This is the model that won the Sony MDX challenge.
+- 11/05/2021: Adding support for MusDB-HQ and arbitrary wav sets, for the MDX challenge. For more information
+on joining the challenge with Demucs, see [the Demucs MDX instructions](docs/mdx.md).
+- 28/04/2021: **Demucs v2**, with extra augmentation and DiffQ based quantization.
+  **EVERYTHING WILL BREAK**, please restart from scratch following the instructions hereafter.
+  This version also adds overlap between prediction frames, with linear transition from one to the next,
+  which should prevent sudden changes at frame boundaries. Also, Demucs is now on PyPI, so for separation
+  only, installation is as easy as `pip install demucs` :)
+- 13/04/2020: **Demucs released under MIT**: We are happy to release Demucs under the MIT licence.
+  We hope that this will broaden the impact of this research to new applications.
+
+
+## Comparison with other models
+
+We provide hereafter a summary of the different metrics presented in the paper.
+You can also compare Hybrid Demucs (v3), [KUIELAB-MDX-Net][kuielab], [Spleeter][spleeter], Open-Unmix, Demucs (v1), and Conv-Tasnet on one of my favorite
+songs on my [soundcloud playlist][soundcloud].
+
+### Comparison of accuracy
+
+`Overall SDR` is the mean of the SDR for each of the 4 sources, `MOS Quality` is a rating from 1 to 5
+of the naturalness and absence of artifacts given by human listeners (5 = no artifacts), `MOS Contamination`
+is a rating from 1 to 5 with 5 being zero contamination by other sources. We refer the reader to our [paper][hybrid_paper]
+for more details.
+
+| Model | Domain | Extra data? | Overall SDR | MOS Quality | MOS Contamination |
+|------------------------------|-------------|-------------|-------------|-------------|-------------------|
+| [Wave-U-Net][waveunet] | waveform | no | 3.2 | - | - |
+| [Open-Unmix][openunmix] | spectrogram | no | 5.3 | - | - |
+| [D3Net][d3net] | spectrogram | no | 6.0 | - | - |
+| [Conv-Tasnet][demucs_v2] | waveform | no | 5.7 | - | - |
+| [Demucs (v2)][demucs_v2] | waveform | no | 6.3 | 2.37 | 2.36 |
+| [ResUNetDecouple+][decouple] | spectrogram | no | 6.7 | - | - |
+| [KUIELAB-MDX-Net][kuielab] | hybrid | no | 7.5 | **2.86** | 2.55 |
+| [Band-Split RNN][bandsplit] | spectrogram | no | **8.2** | - | - |
+| **Hybrid Demucs (v3)** | hybrid | no | 7.7 | **2.83** | **3.04** |
+| [MMDenseLSTM][mmdenselstm] | spectrogram | 804 songs | 6.0 | - | - |
+| [D3Net][d3net] | spectrogram | 1.5k songs | 6.7 | - | - |
+| [Spleeter][spleeter] | spectrogram | 25k songs | 5.9 | - | - |
+| [Band-Split RNN][bandsplit] | spectrogram | 1.7k (mixes only) | **9.0** | - | - |
+| **HT Demucs f.t. (v4)** | hybrid | 800 songs | **9.0** | - | - |
+
+
+
+## Requirements
+
+You will need at least Python 3.7. See `requirements_minimal.txt` for requirements for separation only,
+and `environment-[cpu|cuda].yml` (or `requirements.txt`) if you want to train a new model.
+
+### For Windows users
+
+Every time you see `python3`, replace it with `python.exe`. You should always run commands from the
+Anaconda console.
+
+### For musicians
+
+If you just want to use Demucs to separate tracks, you can install it with
+
+```bash
+python3 -m pip install -U demucs
+```
+
+For bleeding edge versions, you can install directly from this repo using
+```bash
+python3 -m pip install -U git+https://github.com/facebookresearch/demucs#egg=demucs
+```
+
+**For Hybrid Transformer Demucs,** you must install the bleeding edge version and use either
+`-n htdemucs` or `-n htdemucs_ft`.
+
+Advanced OS support is provided on the following pages; **you must read the page for your OS before posting an issue**:
+- **If you are using Windows:** [Windows support](docs/windows.md).
+- **If you are using MAC OS X:** [Mac OS X support](docs/mac.md).
+- **If you are using Linux:** [Linux support](docs/linux.md).
+
+### For machine learning scientists
+
+If you have Anaconda installed, you can run from the root of this repository:
+
+```bash
+conda env update -f environment-cpu.yml  # if you don't have GPUs
+conda env update -f environment-cuda.yml # if you have GPUs
+conda activate demucs
+pip install -e .
+```
+
+This will create a `demucs` environment with all the dependencies installed.
+
+You will also need to install [soundstretch/soundtouch](https://www.surina.net/soundtouch/soundstretch.html): on Mac OSX you can do `brew install sound-touch`,
+and on Ubuntu `sudo apt-get install soundstretch`. This is used for the
+pitch/tempo augmentation.
+
+
+### Running in Docker
+
+Thanks to @xserrat, there is now a Docker image definition ready for using Demucs. This can ensure all libraries are correctly installed without interfering with the host OS. See his repo [Docker Facebook Demucs](https://github.com/xserrat/docker-facebook-demucs) for more information.
+
+
+### Running from Colab
+
+I made a Colab to easily separate tracks with Demucs. Note that
+transfer speeds with Colab are a bit slow for large media files,
+but it will allow you to use Demucs without installing anything.
+
+[Demucs on Google Colab](https://colab.research.google.com/drive/1dC9nVxk3V_VPjUADsnFu8EiT-xnU1tGH?usp=sharing)
+
+### Web Demo
+
+Integrated to [Huggingface Spaces](https://huggingface.co/spaces) with [Gradio](https://github.com/gradio-app/gradio). See demo: [![Hugging Face Spaces](https://img.shields.io/badge/%F0%9F%A4%97%20Hugging%20Face-Spaces-blue)](https://huggingface.co/spaces/akhaliq/demucs)
+
+### Graphical Interface
+
+@CarlGao4 has released a GUI for Demucs: [CarlGao4/Demucs-Gui](https://github.com/CarlGao4/Demucs-Gui). Downloads for Windows and macOS are available [here](https://github.com/CarlGao4/Demucs-Gui/releases). Use the [FossHub mirror](https://fosshub.com/Demucs-GUI.html) to speed up your download.
+
+@Anjok07 is providing a self-contained GUI in [UVR (Ultimate Vocal Remover)](https://github.com/facebookresearch/demucs/issues/334) that supports Demucs.
+
+### Other providers
+
+Audiostrip provides free online separation with Demucs on their website [https://audiostrip.co.uk/](https://audiostrip.co.uk/).
+[MVSep](https://mvsep.com/) also provides free online separation; select `Demucs3 model B` for the best quality.
+
+Spleeter.io provides free online separation with Demucs on their website [https://www.spleeter.io/demucs](https://www.spleeter.io/demucs).
+
+
+## Separating tracks
+
+In order to try Demucs, you can just run from any folder (as long as you properly installed it)
+
+```bash
+demucs PATH_TO_AUDIO_FILE_1 [PATH_TO_AUDIO_FILE_2 ...] # for Demucs
+# If you used `pip install --user` you might need to replace demucs with python3 -m demucs
+python3 -m demucs --mp3 --mp3-bitrate BITRATE PATH_TO_AUDIO_FILE_1 # output files saved as MP3
+# If your filename contains spaces, don't forget to quote it!
+demucs "my music/my favorite track.mp3"
+# You can select different models with `-n`. mdx_q is the quantized model: smaller, but maybe a bit less accurate.
+demucs -n mdx_q myfile.mp3
+# If you only want to separate vocals out of an audio file, use `--two-stems=vocals` (you can also set it to drums or bass)
+demucs --two-stems=vocals myfile.mp3
+```
+
+
+If you have a GPU but run out of memory, please use `--segment SEGMENT` to reduce the length of each split. `SEGMENT` should be an integer; not less than 10 is recommended (the bigger the number, the more memory is required, but quality may increase). Creating an environment variable `PYTORCH_NO_CUDA_MEMORY_CACHING=1` is also helpful. If this still does not help, please add `-d cpu` to the command line. See the section hereafter for more details on the memory requirements for GPU acceleration.
+
+Separated tracks are stored in the `separated/MODEL_NAME/TRACK_NAME` folder. There you will find four stereo wav files sampled at 44.1 kHz: `drums.wav`, `bass.wav`,
+`other.wav`, `vocals.wav` (or `.mp3` if you used the `--mp3` option).
+
+All audio formats supported by `torchaudio` can be processed (e.g. wav, mp3, flac, ogg/vorbis on Linux/Mac OS X, etc.). On Windows, `torchaudio` has limited support, so we rely on `ffmpeg`, which should support pretty much anything.
+Audio is resampled on the fly if necessary.
+The output will be a wave file encoded as int16.
+You can save as float32 wav files with `--float32`, or 24-bit integer wav with `--int24`.
+You can pass `--mp3` to save as mp3 instead, and set the bitrate with `--mp3-bitrate` (default is 320 kbps).
+
+It can happen that the output needs clipping, in particular due to some separation artifacts.
+Demucs will automatically rescale each output stem so as to avoid clipping. This can however break
+the relative volume between stems. If instead you prefer hard clipping, pass `--clip-mode clamp`.
+You can also try to reduce the volume of the input mixture before feeding it to Demucs.
+
+
+Other pre-trained models can be selected with the `-n` flag.
+The list of pre-trained models is:
+- `htdemucs`: first version of Hybrid Transformer Demucs. Trained on MusDB + 800 songs.
+- `htdemucs_ft`: fine-tuned version of `htdemucs`; separation will take 4 times longer
+  but might be a bit better. Same training set as `htdemucs`.
+- `hdemucs_mmi`: Hybrid Demucs v3, retrained on MusDB + 800 songs.
+- `mdx`: trained only on MusDB HQ, winning model on track A at the [MDX][mdx] challenge.
+- `mdx_extra`: trained with extra training data (including the MusDB test set), ranked 2nd on track B
+  of the [MDX][mdx] challenge.
+- `mdx_q`, `mdx_extra_q`: quantized versions of the previous models. Smaller download and storage
+  but quality can be slightly worse. `mdx_extra_q` is the default model used.
+- `SIG`: where `SIG` is a single model from the [model zoo](docs/training.md#model-zoo).
+
+The `--two-stems=vocals` option allows separating vocals from the rest (e.g. karaoke mode).
+`vocals` can be changed into any source in the selected model.
+This will mix the files after separating the mix fully, so this won't be faster or use less memory.
+
+The `--shifts=SHIFTS` option performs multiple predictions with random shifts of the input (a.k.a. the *shift trick*) and averages them. This makes prediction `SHIFTS` times
+slower. Don't use it unless you have a GPU.
+
+The `--overlap` option controls the amount of overlap between prediction windows. The default is 0.25 (i.e. 25%), which is probably fine.
+It can probably be reduced to 0.1 to improve speed a bit.
+
+
+The `-j` flag allows specifying a number of parallel jobs (e.g. `demucs -j 2 myfile.mp3`).
+This will multiply the RAM used by the same amount, so be careful!
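+
+Everything above can also be driven from Python. The bundled `Demucs.ipynb` notebook does this
+with `demucs.pretrained` and `demucs.apply.apply_model`; a condensed sketch (the random tensor
+is a stand-in for ten seconds of real stereo audio at 44.1 kHz):
+
+```python
+import torch
+from demucs import pretrained
+from demucs.apply import apply_model
+
+model = pretrained.get_model('htdemucs')  # any name from the list above
+x = torch.randn(1, 2, 44100 * 10)         # [batch, channels, samples]
+out = apply_model(model, x)[0]            # [S, C, T], one entry per source
+for name, source in zip(model.sources, out):
+    print(name, source.shape)
+```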
+
+### Memory requirements for GPU acceleration
+
+If you want to use GPU acceleration, you will need at least 3GB of RAM on your GPU for `demucs`. However, about 7GB of RAM will be required if you use the default arguments. Add `--segment SEGMENT` to change the size of each split. If you only have 3GB of memory, set `SEGMENT` to 8 (though quality may be worse if this argument is too small). Creating an environment variable `PYTORCH_NO_CUDA_MEMORY_CACHING=1` can help users with even less RAM, such as 2GB (I separated a 4-minute track using only 1.5GB), but this will make the separation slower.
+
+If you do not have enough memory on your GPU, simply add `-d cpu` to the command line to use the CPU. With Demucs, processing time should be roughly equal to 1.5 times the duration of the track.
+
+
+## Training Demucs
+
+If you want to train (Hybrid) Demucs, please follow the [training doc](docs/training.md).
+
+## MDX Challenge reproduction
+
+In order to reproduce the results from the Track A and Track B submissions, check out the [MDX Hybrid Demucs submission repo][mdx_submission].
+
+
+
+## How to cite
+
+```
+@inproceedings{defossez2021hybrid,
+  title={Hybrid Spectrogram and Waveform Source Separation},
+  author={D{\'e}fossez, Alexandre},
+  booktitle={Proceedings of the ISMIR 2021 Workshop on Music Source Separation},
+  year={2021}
+}
+```
+
+## License
+
+Demucs is released under the MIT license as found in the [LICENSE](LICENSE) file.
+ +[hybrid_paper]: https://arxiv.org/abs/2111.03600 +[waveunet]: https://github.com/f90/Wave-U-Net +[musdb]: https://sigsep.github.io/datasets/musdb.html +[openunmix]: https://github.com/sigsep/open-unmix-pytorch +[mmdenselstm]: https://arxiv.org/abs/1805.02410 +[demucs_v2]: https://github.com/facebookresearch/demucs/tree/v2 +[demucs_v3]: https://github.com/facebookresearch/demucs/tree/v3 +[spleeter]: https://github.com/deezer/spleeter +[soundcloud]: https://soundcloud.com/honualx/sets/source-separation-in-the-waveform-domain +[d3net]: https://arxiv.org/abs/2010.01733 +[mdx]: https://www.aicrowd.com/challenges/music-demixing-challenge-ismir-2021 +[kuielab]: https://github.com/kuielab/mdx-net-submission +[decouple]: https://arxiv.org/abs/2109.05418 +[mdx_submission]: https://github.com/adefossez/mdx21_demucs +[bandsplit]: https://arxiv.org/abs/2209.15174 +[htdemucs]: https://arxiv.org/abs/2211.08553 diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/config.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/config.yaml new file mode 100644 index 0000000..0ea477e --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/conf/config.yaml @@ -0,0 +1,302 @@ +defaults: + - _self_ + - dset: musdb44 + - svd: default + - variant: default + - override hydra/hydra_logging: colorlog + - override hydra/job_logging: colorlog + +dummy: +dset: + musdb: /checkpoint/defossez/datasets/musdbhq + musdb_samplerate: 44100 + wav: # path to custom wav dataset + wav2: # second custom wav dataset + segment: 11 + shift: 1 + train_valid: false + full_cv: true + samplerate: 44100 + channels: 2 + normalize: true + metadata: ./metadata + sources: ['drums', 'bass', 'other', 'vocals'] + valid_samples: # valid dataset size + +test: + save: False + best: True + workers: 2 + every: 20 + split: true + shifts: 1 + overlap: 0.25 + sdr: true + metric: 'loss' # metric used for best model selection on the valid set, can also be nsdr + nonhq: # path to non hq MusDB for evaluation + +epochs: 360 +batch_size: 64 +max_batches: # limit the number of batches per epoch, useful for debugging + # or if your dataset is gigantic. +optim: + lr: 3e-4 + momentum: 0.9 + beta2: 0.999 + loss: l1 # l1 or mse + optim: adam + weight_decay: 0 + clip_grad: 0 + +seed: 42 +debug: false +valid_apply: true +flag: +save_every: +weights: [1., 1., 1., 1.] # weights over each source for the training/valid loss. + +augment: + shift_same: false + repitch: + proba: 0.2 + max_tempo: 12 + remix: + proba: 1 + group_size: 4 + scale: + proba: 1 + min: 0.25 + max: 1.25 + flip: true + +continue_from: # continue from other XP, give the XP Dora signature. +continue_pretrained: # signature of a pretrained XP, this cannot be a bag of models. +pretrained_repo: # repo for pretrained model (default is official AWS) +continue_best: true +continue_opt: false + +misc: + num_workers: 10 + num_prints: 4 + show: false + verbose: false + +# List of decay for EMA at batch or epoch level, e.g. 0.999. +# Batch level EMA are kept on GPU for speed. +ema: + epoch: [] + batch: [] + +use_train_segment: true # to remove +model_segment: # override the segment parameter for the model, usually 4 times the training segment. +model: demucs # see demucs/train.py for the possibilities, and config for each model hereafter. 
+demucs: # see demucs/demucs.py for a detailed description + # Channels + channels: 64 + growth: 2 + # Main structure + depth: 6 + rewrite: true + lstm_layers: 0 + # Convolutions + kernel_size: 8 + stride: 4 + context: 1 + # Activations + gelu: true + glu: true + # Normalization + norm_groups: 4 + norm_starts: 4 + # DConv residual branch + dconv_depth: 2 + dconv_mode: 1 # 1 = branch in encoder, 2 = in decoder, 3 = in both. + dconv_comp: 4 + dconv_attn: 4 + dconv_lstm: 4 + dconv_init: 1e-4 + # Pre/post treatment + resample: true + normalize: false + # Weight init + rescale: 0.1 + +hdemucs: # see demucs/hdemucs.py for a detailed description + # Channels + channels: 48 + channels_time: + growth: 2 + # STFT + nfft: 4096 + wiener_iters: 0 + end_iters: 0 + wiener_residual: false + cac: true + # Main structure + depth: 6 + rewrite: true + hybrid: true + hybrid_old: false + # Frequency Branch + multi_freqs: [] + multi_freqs_depth: 3 + freq_emb: 0.2 + emb_scale: 10 + emb_smooth: true + # Convolutions + kernel_size: 8 + stride: 4 + time_stride: 2 + context: 1 + context_enc: 0 + # normalization + norm_starts: 4 + norm_groups: 4 + # DConv residual branch + dconv_mode: 1 + dconv_depth: 2 + dconv_comp: 4 + dconv_attn: 4 + dconv_lstm: 4 + dconv_init: 1e-3 + # Weight init + rescale: 0.1 + +# Torchaudio implementation of HDemucs +torch_hdemucs: +# Channels + channels: 48 + growth: 2 + # STFT + nfft: 4096 + # Main structure + depth: 6 + freq_emb: 0.2 + emb_scale: 10 + emb_smooth: true + # Convolutions + kernel_size: 8 + stride: 4 + time_stride: 2 + context: 1 + context_enc: 0 + # normalization + norm_starts: 4 + norm_groups: 4 + # DConv residual branch + dconv_depth: 2 + dconv_comp: 4 + dconv_attn: 4 + dconv_lstm: 4 + dconv_init: 1e-3 + +htdemucs: # see demucs/htdemucs.py for a detailed description + # Channels + channels: 48 + channels_time: + growth: 2 + # STFT + nfft: 4096 + wiener_iters: 0 + end_iters: 0 + wiener_residual: false + cac: true + # Main structure + depth: 4 + rewrite: true + # Frequency Branch + multi_freqs: [] + multi_freqs_depth: 3 + freq_emb: 0.2 + emb_scale: 10 + emb_smooth: true + # Convolutions + kernel_size: 8 + stride: 4 + time_stride: 2 + context: 1 + context_enc: 0 + # normalization + norm_starts: 4 + norm_groups: 4 + # DConv residual branch + dconv_mode: 1 + dconv_depth: 2 + dconv_comp: 8 + dconv_init: 1e-3 + # Before the Transformer + bottom_channels: 0 + # CrossTransformer + # ------ Common to all + # Regular parameters + t_layers: 5 + t_hidden_scale: 4.0 + t_heads: 8 + t_dropout: 0.0 + t_layer_scale: True + t_gelu: True + # ------------- Positional Embedding + t_emb: sin + t_max_positions: 10000 # for the scaled embedding + t_max_period: 10000.0 + t_weight_pos_embed: 1.0 + t_cape_mean_normalize: True + t_cape_augment: True + t_cape_glob_loc_scale: [5000.0, 1.0, 1.4] + t_sin_random_shift: 0 + # ------------- norm before a transformer encoder + t_norm_in: True + t_norm_in_group: False + # ------------- norm inside the encoder + t_group_norm: False + t_norm_first: True + t_norm_out: True + # ------------- optim + t_weight_decay: 0.0 + t_lr: + # ------------- sparsity + t_sparse_self_attn: False + t_sparse_cross_attn: False + t_mask_type: diag + t_mask_random_seed: 42 + t_sparse_attn_window: 400 + t_global_window: 100 + t_sparsity: 0.95 + t_auto_sparsity: False + # Cross Encoder First (False) + t_cross_first: False + # Weight init + rescale: 0.1 + +svd: # see svd.py for documentation + penalty: 0 + min_size: 0.1 + dim: 1 + niters: 2 + powm: false + proba: 1 + conv_only: false + 
convtr: false + bs: 1 + +quant: # quantization hyper params + diffq: # diffq penalty, typically 1e-4 or 3e-4 + qat: # use QAT with a fixed number of bits (not as good as diffq) + min_size: 0.2 + group_size: 8 + +dora: + dir: outputs + exclude: ["misc.*", "slurm.*", 'test.reval', 'flag'] + +slurm: + time: 4320 + constraint: volta32gb + setup: ['module load cudnn/v8.4.1.50-cuda.11.6 NCCL/2.11.4-6-cuda.11.6 cuda/11.6'] + +# Hydra config +hydra: + job_logging: + formatters: + colorlog: + datefmt: "%m-%d %H:%M:%S" diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/dset/aetl.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/dset/aetl.yaml new file mode 100644 index 0000000..7c98316 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/conf/dset/aetl.yaml @@ -0,0 +1,19 @@ +# @package _global_ + +# automix dataset with Musdb, extra training data and the test set of Musdb. +# This used even more remixes than auto_extra_test. +dset: + wav: /checkpoint/defossez/datasets/aetl + samplerate: 44100 + channels: 2 +epochs: 320 +max_batches: 500 + +augment: + shift_same: true + scale: + proba: 0. + remix: + proba: 0 + repitch: + proba: 0 diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/dset/auto_extra_test.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/dset/auto_extra_test.yaml new file mode 100644 index 0000000..056183a --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/conf/dset/auto_extra_test.yaml @@ -0,0 +1,18 @@ +# @package _global_ + +# automix dataset with Musdb, extra training data and the test set of Musdb. +dset: + wav: /checkpoint/defossez/datasets/automix_extra_test2 + samplerate: 44100 + channels: 2 +epochs: 320 +max_batches: 500 + +augment: + shift_same: true + scale: + proba: 0. + remix: + proba: 0 + repitch: + proba: 0 diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/dset/auto_mus.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/dset/auto_mus.yaml new file mode 100644 index 0000000..9a2d9df --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/conf/dset/auto_mus.yaml @@ -0,0 +1,20 @@ +# @package _global_ + +# Automix dataset based on musdb train set. 
+dset:
+  wav: /checkpoint/defossez/datasets/automix_musdb
+  samplerate: 44100
+  channels: 2
+epochs: 360
+max_batches: 300
+test:
+  every: 4
+
+augment:
+  shift_same: true
+  scale:
+    proba: 0.5
+  remix:
+    proba: 0
+  repitch:
+    proba: 0
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra44.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra44.yaml
new file mode 100644
index 0000000..f0adc46
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra44.yaml
@@ -0,0 +1,8 @@
+# @package _global_
+
+# Musdb + extra tracks
+dset:
+  wav: /checkpoint/defossez/datasets/allstems_44/
+  samplerate: 44100
+  channels: 2
+epochs: 320
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra_mmi_goodclean.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra_mmi_goodclean.yaml
new file mode 100644
index 0000000..fe47bcf
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra_mmi_goodclean.yaml
@@ -0,0 +1,12 @@
+# @package _global_
+
+# Musdb + extra tracks
+dset:
+  wav: /checkpoint/defossez/datasets/allstems_44/
+  wav2: /checkpoint/defossez/datasets/mmi44_goodclean
+  samplerate: 44100
+  channels: 2
+  wav2_weight: null
+  wav2_valid: false
+  valid_samples: 100
+epochs: 1200
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra_test.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra_test.yaml
new file mode 100644
index 0000000..1e7d05a
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/dset/extra_test.yaml
@@ -0,0 +1,12 @@
+# @package _global_
+
+# Musdb + extra tracks + test set from musdb.
+dset:
+  wav: /checkpoint/defossez/datasets/allstems_test_44/
+  samplerate: 44100
+  channels: 2
+epochs: 320
+max_batches: 700
+test:
+  sdr: false
+  every: 500
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/dset/musdb44.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/dset/musdb44.yaml
new file mode 100644
index 0000000..c562346
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/dset/musdb44.yaml
@@ -0,0 +1,5 @@
+# @package _global_
+
+dset:
+  samplerate: 44100
+  channels: 2
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/svd/base.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/svd/base.yaml
new file mode 100644
index 0000000..e4de868
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/svd/base.yaml
@@ -0,0 +1,14 @@
+# @package _global_
+
+svd:
+  penalty: 0
+  min_size: 1
+  dim: 50
+  niters: 4
+  powm: false
+  proba: 1
+  conv_only: false
+  convtr: false # ideally this should be true, but some models were trained with this set to false.
+
+optim:
+  beta2: 0.9998
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/svd/base2.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/svd/base2.yaml
new file mode 100644
index 0000000..b88a751
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/svd/base2.yaml
@@ -0,0 +1,14 @@
+# @package _global_
+
+svd:
+  penalty: 0
+  min_size: 1
+  dim: 100
+  niters: 4
+  powm: false
+  proba: 1
+  conv_only: false
+  convtr: true
+
+optim:
+  beta2: 0.9998
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/svd/default.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/svd/default.yaml
new file mode 100644
index 0000000..03bfe3d
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/svd/default.yaml
@@ -0,0 +1 @@
+# @package _global_
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/variant/default.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/variant/default.yaml
new file mode 100644
index 0000000..03bfe3d
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/variant/default.yaml
@@ -0,0 +1 @@
+# @package _global_
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/variant/example.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/variant/example.yaml
new file mode 100644
index 0000000..9b38aec
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/variant/example.yaml
@@ -0,0 +1,5 @@
+# @package _global_
+
+model: hdemucs
+hdemucs:
+  channels: 32
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/demucs/conf/variant/finetune.yaml b/AutoCoverTool/ref/music_remover/demucs/conf/variant/finetune.yaml
new file mode 100644
index 0000000..c3ea21e
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/conf/variant/finetune.yaml
@@ -0,0 +1,19 @@
+# @package _global_
+
+epochs: 4
+batch_size: 16
+optim:
+  lr: 0.0006
+test:
+  every: 1
+  sdr: false
+dset:
+  segment: 28
+  shift: 2
+
+augment:
+  scale:
+    proba: 0
+  shift_same: true
+  remix:
+    proba: 0
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/PKG-INFO b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/PKG-INFO
new file mode 100644
index 0000000..2e97a2d
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/PKG-INFO
@@ -0,0 +1,307 @@
+Metadata-Version: 2.1
+Name: demucs
+Version: 4.0.0a1
+Summary: Music source separation in the waveform domain.
+Home-page: https://github.com/facebookresearch/demucs
+Author: Alexandre Défossez
+Author-email: defossez@fb.com
+License: MIT License
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Topic :: Multimedia :: Sound/Audio
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Requires-Python: >=3.7.0
+Description-Content-Type: text/markdown
+Provides-Extra: dev
+License-File: LICENSE
+
+
+# Demucs Music Source Separation
+
+[![Support Ukraine](https://img.shields.io/badge/Support-Ukraine-FFD500?style=flat&labelColor=005BBB)](https://opensource.fb.com/support-ukraine)
+![tests badge](https://github.com/facebookresearch/demucs/workflows/tests/badge.svg)
+![linter badge](https://github.com/facebookresearch/demucs/workflows/linter/badge.svg)
+
+
+This is the 4th release of Demucs (v4), featuring Hybrid Transformer based source separation.
+**For the classic Hybrid Demucs (v3):** [go to this commit][demucs_v3].
+If you are experiencing issues and want the old Demucs back, please file an issue, and then you can get back to v3 with
+`git checkout v3`. You can also go back to [Demucs v2][demucs_v2].
+
+
+Demucs is a state-of-the-art music source separation model, currently capable of separating
+drums, bass, and vocals from the rest of the accompaniment.
+Demucs is based on a U-Net convolutional architecture inspired by [Wave-U-Net][waveunet].
+The v4 version features [Hybrid Transformer Demucs][htdemucs], a hybrid spectrogram/waveform separation model using Transformers.
+It is based on [Hybrid Demucs][hybrid_paper] (also provided in this repo), with the innermost layers
+replaced by a cross-domain Transformer Encoder. This Transformer uses self-attention within each domain,
+and cross-attention across domains.
+The model achieves an SDR of 9.00 dB on the MUSDB HQ test set. Moreover, when using sparse attention
+kernels to extend its receptive field and per-source fine-tuning, we achieve a state-of-the-art 9.20 dB of SDR.
+
+Samples are available [on our sample page](https://ai.honu.io/papers/htdemucs/index.html).
+Check out [our paper][htdemucs] for more information.
+It has been trained on the [MUSDB HQ][musdb] dataset + an extra training dataset of 800 songs.
+This model separates drums, bass, vocals, and other stems for any song.
+
+
+As Hybrid Transformer Demucs is brand new, it is not activated by default; you can activate it in the usual
+commands described hereafter with `-n htdemucs_ft`.
+The single, non fine-tuned model is provided as `-n htdemucs`, and the retrained baseline
+as `-n hdemucs_mmi`. The Sparse Hybrid Transformer model described in our paper is not provided, as it
+requires custom CUDA code that is not ready for release yet.
+
+
+<p align="center">
+<img src="./demucs.png" alt="Schema representing the structure of Hybrid Transformer Demucs,
+    with a dual U-Net structure, one branch for the temporal domain,
+    and one branch for the spectral domain. There is a cross-domain Transformer between the Encoders and Decoders."></p>
+
+
+
+## Important news if you are already using Demucs
+
+See the [release notes](./docs/release.md) for more details.
+
+- 16/11/2022: Added the new Hybrid Transformer Demucs models,
+  along with support for the [torchaudio implementation of HDemucs](https://pytorch.org/audio/stable/tutorials/hybrid_demucs_tutorial.html).
+- 30/08/2022: added reproducibility and ablation grids, along with an updated version of the paper.
+- 17/08/2022: Releasing v3.0.5: Set split segment length to reduce memory. Compatible with PyTorch 1.12.
+- 24/02/2022: Releasing v3.0.4: split into two stems (i.e. karaoke mode).
+  Export as float32 or int24.
+- 17/12/2021: Releasing v3.0.3: bug fixes (thanks @keunwoochoi), memory drastically
+  reduced on GPU (thanks @famzah) and new multi-core evaluation on CPU (`-j` flag).
+- 12/11/2021: Releasing **Demucs v3** with hybrid domain separation. Strong improvements
+  on all sources. This is the model that won the Sony MDX challenge.
+- 11/05/2021: Adding support for MusDB-HQ and arbitrary wav sets, for the MDX challenge. For more information
+on joining the challenge with Demucs, see [the Demucs MDX instructions](docs/mdx.md).
+- 28/04/2021: **Demucs v2**, with extra augmentation and DiffQ based quantization.
+  **EVERYTHING WILL BREAK**, please restart from scratch following the instructions hereafter.
+  This version also adds overlap between prediction frames, with linear transition from one to the next,
+  which should prevent sudden changes at frame boundaries. Also, Demucs is now on PyPI, so for separation
+  only, installation is as easy as `pip install demucs` :)
+- 13/04/2020: **Demucs released under MIT**: We are happy to release Demucs under the MIT licence.
+  We hope that this will broaden the impact of this research to new applications.
+
+
+## Comparison with other models
+
+We provide hereafter a summary of the different metrics presented in the paper.
+You can also compare Hybrid Demucs (v3), [KUIELAB-MDX-Net][kuielab], [Spleeter][spleeter], Open-Unmix, Demucs (v1), and Conv-Tasnet on one of my favorite
+songs on my [soundcloud playlist][soundcloud].
+
+### Comparison of accuracy
+
+`Overall SDR` is the mean of the SDR for each of the 4 sources, `MOS Quality` is a rating from 1 to 5
+of the naturalness and absence of artifacts given by human listeners (5 = no artifacts), `MOS Contamination`
+is a rating from 1 to 5 with 5 being zero contamination by other sources. We refer the reader to our [paper][hybrid_paper]
+for more details.
+
+| Model | Domain | Extra data? | Overall SDR | MOS Quality | MOS Contamination |
+|------------------------------|-------------|-------------|-------------|-------------|-------------------|
+| [Wave-U-Net][waveunet] | waveform | no | 3.2 | - | - |
+| [Open-Unmix][openunmix] | spectrogram | no | 5.3 | - | - |
+| [D3Net][d3net] | spectrogram | no | 6.0 | - | - |
+| [Conv-Tasnet][demucs_v2] | waveform | no | 5.7 | - | - |
+| [Demucs (v2)][demucs_v2] | waveform | no | 6.3 | 2.37 | 2.36 |
+| [ResUNetDecouple+][decouple] | spectrogram | no | 6.7 | - | - |
+| [KUIELAB-MDX-Net][kuielab] | hybrid | no | 7.5 | **2.86** | 2.55 |
+| [Band-Split RNN][bandsplit] | spectrogram | no | **8.2** | - | - |
+| **Hybrid Demucs (v3)** | hybrid | no | 7.7 | **2.83** | **3.04** |
+| [MMDenseLSTM][mmdenselstm] | spectrogram | 804 songs | 6.0 | - | - |
+| [D3Net][d3net] | spectrogram | 1.5k songs | 6.7 | - | - |
+| [Spleeter][spleeter] | spectrogram | 25k songs | 5.9 | - | - |
+| [Band-Split RNN][bandsplit] | spectrogram | 1.7k (mixes only) | **9.0** | - | - |
+| **HT Demucs f.t. (v4)** | hybrid | 800 songs | **9.0** | - | - |
+
+
+
+## Requirements
+
+You will need at least Python 3.7. See `requirements_minimal.txt` for requirements for separation only,
+and `environment-[cpu|cuda].yml` (or `requirements.txt`) if you want to train a new model.
+
+### For Windows users
+
+Every time you see `python3`, replace it with `python.exe`. You should always run commands from the
+Anaconda console.
+
+### For musicians
+
+If you just want to use Demucs to separate tracks, you can install it with
+
+```bash
+python3 -m pip install -U demucs
+```
+
+For bleeding edge versions, you can install directly from this repo using
+```bash
+python3 -m pip install -U git+https://github.com/facebookresearch/demucs#egg=demucs
+```
+
+**For Hybrid Transformer Demucs,** you must install the bleeding edge version and use either
+`-n htdemucs` or `-n htdemucs_ft`.
+
+Advanced OS support is provided on the following pages; **you must read the page for your OS before posting an issue**:
+- **If you are using Windows:** [Windows support](docs/windows.md).
+- **If you are using MAC OS X:** [Mac OS X support](docs/mac.md).
+- **If you are using Linux:** [Linux support](docs/linux.md).
+
+### For machine learning scientists
+
+If you have Anaconda installed, you can run from the root of this repository:
+
+```bash
+conda env update -f environment-cpu.yml  # if you don't have GPUs
+conda env update -f environment-cuda.yml # if you have GPUs
+conda activate demucs
+pip install -e .
+```
+
+This will create a `demucs` environment with all the dependencies installed.
+
+You will also need to install [soundstretch/soundtouch](https://www.surina.net/soundtouch/soundstretch.html): on Mac OSX you can do `brew install sound-touch`,
+and on Ubuntu `sudo apt-get install soundstretch`. This is used for the
+pitch/tempo augmentation.
+
+
+### Running in Docker
+
+Thanks to @xserrat, there is now a Docker image definition ready for using Demucs. This can ensure all libraries are correctly installed without interfering with the host OS. See his repo [Docker Facebook Demucs](https://github.com/xserrat/docker-facebook-demucs) for more information.
+
+
+### Running from Colab
+
+I made a Colab to easily separate tracks with Demucs. Note that
+transfer speeds with Colab are a bit slow for large media files,
+but it will allow you to use Demucs without installing anything.
+
+The `--two-stems=vocals` option allows separating the vocals from the rest (e.g. karaoke mode).
+`vocals` can be changed to any source in the selected model.
+This will mix the files after fully separating the mix, so this won't be faster or use less memory.
+
+The `--shifts=SHIFTS` option performs multiple predictions with random shifts (a.k.a. the *shift trick*) of the input and averages them. This makes prediction `SHIFTS` times
+slower. Don't use it unless you have a GPU.
+
+The `--overlap` option controls the amount of overlap between prediction windows. The default is 0.25 (i.e. 25%), which is probably fine.
+It can probably be reduced to 0.1 to speed things up a bit.
+
+
+The `-j` flag allows specifying a number of parallel jobs (e.g. `demucs -j 2 myfile.mp3`).
+This will multiply RAM usage by the same amount, so be careful!
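+
+Putting these options together, a hedged example (the values are illustrative, not tuned recommendations):
+
+```bash
+# Average 2 randomly shifted predictions (2x slower), reduce window overlap
+# to 10%, and use 2 parallel workers (roughly 2x the RAM).
+demucs --shifts=2 --overlap=0.1 -j 2 myfile.mp3
+```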
+
+### Memory requirements for GPU acceleration
+
+If you want to use GPU acceleration, you will need at least 3 GB of RAM on your GPU for `demucs`. However, about 7 GB of RAM will be required if you use the default arguments. Add `--segment SEGMENT` to change the size of each split. If you only have 3 GB of memory, set `SEGMENT` to 8 (though quality may be worse if this argument is too small). Setting the environment variable `PYTORCH_NO_CUDA_MEMORY_CACHING=1` can help users with even less memory, such as 2 GB (I separated a 4-minute track using only 1.5 GB), but this will make the separation slower.
+
+If you do not have enough memory on your GPU, simply add `-d cpu` to the command line to use the CPU. With Demucs, processing time should be roughly equal to 1.5 times the duration of the track.
+
+
+## Training Demucs
+
+If you want to train (Hybrid) Demucs, please follow the [training doc](docs/training.md).
+
+## MDX Challenge reproduction
+
+In order to reproduce the results from the Track A and Track B submissions, check out the [MDX Hybrid Demucs submission repo][mdx_submission].
+
+
+
+## How to cite
+
+```
+@inproceedings{defossez2021hybrid,
+  title={Hybrid Spectrogram and Waveform Source Separation},
+  author={D{\'e}fossez, Alexandre},
+  booktitle={Proceedings of the ISMIR 2021 Workshop on Music Source Separation},
+  year={2021}
+}
+```
+
+## License
+
+Demucs is released under the MIT license as found in the [LICENSE](LICENSE) file.
+ +[hybrid_paper]: https://arxiv.org/abs/2111.03600 +[waveunet]: https://github.com/f90/Wave-U-Net +[musdb]: https://sigsep.github.io/datasets/musdb.html +[openunmix]: https://github.com/sigsep/open-unmix-pytorch +[mmdenselstm]: https://arxiv.org/abs/1805.02410 +[demucs_v2]: https://github.com/facebookresearch/demucs/tree/v2 +[demucs_v3]: https://github.com/facebookresearch/demucs/tree/v3 +[spleeter]: https://github.com/deezer/spleeter +[soundcloud]: https://soundcloud.com/honualx/sets/source-separation-in-the-waveform-domain +[d3net]: https://arxiv.org/abs/2010.01733 +[mdx]: https://www.aicrowd.com/challenges/music-demixing-challenge-ismir-2021 +[kuielab]: https://github.com/kuielab/mdx-net-submission +[decouple]: https://arxiv.org/abs/2109.05418 +[mdx_submission]: https://github.com/adefossez/mdx21_demucs +[bandsplit]: https://arxiv.org/abs/2209.15174 +[htdemucs]: https://arxiv.org/abs/2211.08553 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/SOURCES.txt b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/SOURCES.txt new file mode 100644 index 0000000..e6ad754 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/SOURCES.txt @@ -0,0 +1,68 @@ +LICENSE +MANIFEST.in +Makefile +README.md +demucs.png +mypy.ini +outputs.tar.gz +requirements.txt +requirements_minimal.txt +setup.cfg +setup.py +test.mp3 +conf/config.yaml +conf/dset/aetl.yaml +conf/dset/auto_extra_test.yaml +conf/dset/auto_mus.yaml +conf/dset/extra44.yaml +conf/dset/extra_mmi_goodclean.yaml +conf/dset/extra_test.yaml +conf/dset/musdb44.yaml +conf/svd/base.yaml +conf/svd/base2.yaml +conf/svd/default.yaml +conf/variant/default.yaml +conf/variant/example.yaml +conf/variant/finetune.yaml +demucs/__init__.py +demucs/__main__.py +demucs/apply.py +demucs/audio.py +demucs/augment.py +demucs/demucs.py +demucs/distrib.py +demucs/ema.py +demucs/evaluate.py +demucs/hdemucs.py +demucs/htdemucs.py +demucs/pretrained.py +demucs/py.typed +demucs/repitch.py +demucs/repo.py +demucs/separate.py +demucs/solver.py +demucs/spec.py +demucs/states.py +demucs/svd.py +demucs/train.py +demucs/transformer.py +demucs/utils.py +demucs/wav.py +demucs/wdemucs.py +demucs.egg-info/PKG-INFO +demucs.egg-info/SOURCES.txt +demucs.egg-info/dependency_links.txt +demucs.egg-info/entry_points.txt +demucs.egg-info/requires.txt +demucs.egg-info/top_level.txt +demucs/remote/files.txt +demucs/remote/hdemucs_mmi.yaml +demucs/remote/htdemucs.yaml +demucs/remote/htdemucs_ft.yaml +demucs/remote/mdx.yaml +demucs/remote/mdx_extra.yaml +demucs/remote/mdx_extra_q.yaml +demucs/remote/mdx_q.yaml +demucs/remote/repro_mdx_a.yaml +demucs/remote/repro_mdx_a_hybrid_only.yaml +demucs/remote/repro_mdx_a_time_only.yaml \ No newline at end of file diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/dependency_links.txt b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/dependency_links.txt new file mode 100644 index 0000000..8b13789 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/dependency_links.txt @@ -0,0 +1 @@ + diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/entry_points.txt b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/entry_points.txt new file mode 100644 index 0000000..3def845 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/entry_points.txt @@ -0,0 +1,2 @@ +[console_scripts] +demucs = demucs.separate:main diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/requires.txt 
b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/requires.txt
new file mode 100644
index 0000000..012c2cb
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/requires.txt
@@ -0,0 +1,32 @@
+dora-search
+diffq>=0.2.1
+einops
+julius>=0.2.3
+lameenc>=1.2
+openunmix
+pyyaml
+torch>=1.8.1
+torchaudio>=0.8
+tqdm
+
+[dev]
+dora-search
+diffq>=0.2.1
+einops
+flake8
+hydra-colorlog>=1.1
+hydra-core>=1.1
+julius>=0.2.3
+lameenc>=1.2
+museval
+mypy
+openunmix
+pyyaml
+submitit
+torch>=1.8.1
+torchaudio>=0.8
+tqdm
+treetable
+
+[dev:sys_platform == "win32"]
+soundfile>=0.10.3
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/top_level.txt b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/top_level.txt
new file mode 100644
index 0000000..b35ba4c
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs.egg-info/top_level.txt
@@ -0,0 +1 @@
+demucs
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs.png b/AutoCoverTool/ref/music_remover/demucs/demucs.png
new file mode 100644
index 0000000..d043f64
Binary files /dev/null and b/AutoCoverTool/ref/music_remover/demucs/demucs.png differ
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/__init__.py b/AutoCoverTool/ref/music_remover/demucs/demucs/__init__.py
new file mode 100644
index 0000000..5578946
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/__init__.py
@@ -0,0 +1,7 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+
+__version__ = "4.0.0a1"
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/__main__.py b/AutoCoverTool/ref/music_remover/demucs/demucs/__main__.py
new file mode 100644
index 0000000..2171e17
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/__main__.py
@@ -0,0 +1,10 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+
+from .separate import main
+
+if __name__ == '__main__':
+    main()
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/apply.py b/AutoCoverTool/ref/music_remover/demucs/demucs/apply.py
new file mode 100644
index 0000000..def1729
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/apply.py
@@ -0,0 +1,245 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+"""
+Code to apply a model to a mix. It will handle chunking with overlaps and
+interpolation between chunks, as well as the "shift trick".
+"""
+from concurrent.futures import ThreadPoolExecutor
+import random
+import typing as tp
+
+import torch as th
+from torch import nn
+from torch.nn import functional as F
+import tqdm
+
+from .demucs import Demucs
+from .hdemucs import HDemucs
+from .utils import center_trim, DummyPoolExecutor
+
+Model = tp.Union[Demucs, HDemucs]
+
+
+class BagOfModels(nn.Module):
+    def __init__(self, models: tp.List[Model],
+                 weights: tp.Optional[tp.List[tp.List[float]]] = None,
+                 segment: tp.Optional[float] = None):
+        """
+        Represents a bag of models with specific weights.
+        You should call `apply_model` rather than calling the forward directly, for
+        optimal performance.
+
+        Args:
+            models (list[nn.Module]): list of Demucs/HDemucs models.
+            weights (list[list[float]]): list of weights. If None, assumed to
+                be all ones, otherwise it should be a list of N lists (N number of models),
+                each containing S floats (S number of sources).
+            segment (None or float): overrides the `segment` attribute of each model
+                (this is performed inplace, be careful if you reuse the models passed).
+        """
+        super().__init__()
+        assert len(models) > 0
+        first = models[0]
+        for other in models:
+            assert other.sources == first.sources
+            assert other.samplerate == first.samplerate
+            assert other.audio_channels == first.audio_channels
+            if segment is not None:
+                other.segment = segment
+
+        self.audio_channels = first.audio_channels
+        self.samplerate = first.samplerate
+        self.sources = first.sources
+        self.models = nn.ModuleList(models)
+
+        if weights is None:
+            weights = [[1. for _ in first.sources] for _ in models]
+        else:
+            assert len(weights) == len(models)
+            for weight in weights:
+                assert len(weight) == len(first.sources)
+        self.weights = weights
+
+    def forward(self, x):
+        raise NotImplementedError("Call `apply_model` on this.")
+
+
+class TensorChunk:
+    def __init__(self, tensor, offset=0, length=None):
+        total_length = tensor.shape[-1]
+        assert offset >= 0
+        assert offset < total_length
+
+        if length is None:
+            length = total_length - offset
+        else:
+            length = min(total_length - offset, length)
+
+        if isinstance(tensor, TensorChunk):
+            self.tensor = tensor.tensor
+            self.offset = offset + tensor.offset
+        else:
+            self.tensor = tensor
+            self.offset = offset
+        self.length = length
+        self.device = tensor.device
+
+    @property
+    def shape(self):
+        shape = list(self.tensor.shape)
+        shape[-1] = self.length
+        return shape
+
+    def padded(self, target_length):
+        delta = target_length - self.length
+        total_length = self.tensor.shape[-1]
+        assert delta >= 0
+
+        start = self.offset - delta // 2
+        end = start + target_length
+
+        correct_start = max(0, start)
+        correct_end = min(total_length, end)
+
+        pad_left = correct_start - start
+        pad_right = end - correct_end
+
+        out = F.pad(self.tensor[..., correct_start:correct_end], (pad_left, pad_right))
+        assert out.shape[-1] == target_length
+        return out
+
+
+def tensor_chunk(tensor_or_chunk):
+    if isinstance(tensor_or_chunk, TensorChunk):
+        return tensor_or_chunk
+    else:
+        assert isinstance(tensor_or_chunk, th.Tensor)
+        return TensorChunk(tensor_or_chunk)
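+
+# Usage sketch for `apply_model` below (an illustration, not upstream docs):
+# assuming a pretrained (bag of) model(s), e.g. loaded via `demucs.pretrained.get_model`,
+# and `mix` a (batch, channels, time) tensor sampled at `model.samplerate`:
+#
+#     from demucs.pretrained import get_model
+#     model = get_model('htdemucs')
+#     out = apply_model(model, mix, shifts=1, split=True, overlap=0.25, device='cuda')
+#     # `out` has shape (batch, len(model.sources), channels, time).
+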
+def apply_model(model, mix, shifts=1, split=True,
+                overlap=0.25, transition_power=1., progress=False, device=None,
+                num_workers=0, pool=None):
+    """
+    Apply model to a given mixture.
+
+    Args:
+        shifts (int): if > 0, will shift `mix` in time by a random amount between 0 and 0.5 sec
+            and apply the opposite shift to the output. This is repeated `shifts` times and
+            all predictions are averaged. This effectively makes the model time equivariant
+            and improves SDR by up to 0.2 points.
+        split (bool): if True, the input will be broken down into 8-second chunks
+            and predictions will be performed individually on each and concatenated.
+            Useful for models with a large memory footprint like Tasnet.
+        progress (bool): if True, show a progress bar (requires split=True)
+        device (torch.device, str, or None): if provided, device on which to
+            execute the computation, otherwise `mix.device` is assumed.
+            When `device` is different from `mix.device`, only local computations will
+            be on `device`, while the entire tracks will be stored on `mix.device`.
+    """
+    if device is None:
+        device = mix.device
+    else:
+        device = th.device(device)
+    if pool is None:
+        if num_workers > 0 and device.type == 'cpu':
+            pool = ThreadPoolExecutor(num_workers)
+        else:
+            pool = DummyPoolExecutor()
+    kwargs = {
+        'shifts': shifts,
+        'split': split,
+        'overlap': overlap,
+        'transition_power': transition_power,
+        'progress': progress,
+        'device': device,
+        'pool': pool,
+    }
+    if isinstance(model, BagOfModels):
+        # Special treatment for a bag of models.
+        # We explicitly apply `apply_model` multiple times so that the random shifts
+        # are different for each model.
+        estimates = 0
+        totals = [0] * len(model.sources)
+        for sub_model, weight in zip(model.models, model.weights):
+            original_model_device = next(iter(sub_model.parameters())).device
+            sub_model.to(device)
+
+            out = apply_model(sub_model, mix, **kwargs)
+            sub_model.to(original_model_device)
+            for k, inst_weight in enumerate(weight):
+                out[:, k, :, :] *= inst_weight
+                totals[k] += inst_weight
+            estimates += out
+            del out
+
+        for k in range(estimates.shape[1]):
+            estimates[:, k, :, :] /= totals[k]
+        return estimates
+
+    model.to(device)
+    model.eval()
+    assert transition_power >= 1, "transition_power < 1 leads to weird behavior."
+    batch, channels, length = mix.shape
+    if shifts:
+        kwargs['shifts'] = 0
+        max_shift = int(0.5 * model.samplerate)
+        mix = tensor_chunk(mix)
+        padded_mix = mix.padded(length + 2 * max_shift)
+        out = 0
+        for _ in range(shifts):
+            # TODO: a random offset is used here, so repeated runs give different outputs.
+            # When verifying the code you can hard-code it first, e.g.
+            # offset = 2312
+            offset = random.randint(0, max_shift)
+            shifted = TensorChunk(padded_mix, offset, length + max_shift - offset)
+            shifted_out = apply_model(model, shifted, **kwargs)
+            out += shifted_out[..., max_shift - offset:]
+        out /= shifts
+        return out
+    elif split:
+        kwargs['split'] = False
+        out = th.zeros(batch, len(model.sources), channels, length, device=mix.device)
+        sum_weight = th.zeros(length, device=mix.device)
+        segment = int(model.samplerate * model.segment)
+        stride = int((1 - overlap) * segment)
+        offsets = range(0, length, stride)
+        scale = float(format(stride / model.samplerate, ".2f"))
+        # We start from a triangle shaped weight, with maximal weight in the middle
+        # of the segment. Then we normalize and take to the power `transition_power`.
+        # Large values of transition power will lead to sharper transitions.
+        weight = th.cat([th.arange(1, segment // 2 + 1, device=device),
+                         th.arange(segment - segment // 2, 0, -1, device=device)])
+        assert len(weight) == segment
+        # If the overlap < 50%, this will translate to a linear transition when
+        # transition_power is 1.
+ weight = (weight / weight.max())**transition_power + futures = [] + for offset in offsets: + chunk = TensorChunk(mix, offset, segment) + future = pool.submit(apply_model, model, chunk, **kwargs) + futures.append((future, offset)) + offset += segment + if progress: + futures = tqdm.tqdm(futures, unit_scale=scale, ncols=120, unit='seconds') + for future, offset in futures: + chunk_out = future.result() + chunk_length = chunk_out.shape[-1] + out[..., offset:offset + segment] += (weight[:chunk_length] * chunk_out).to(mix.device) + sum_weight[offset:offset + segment] += weight[:chunk_length].to(mix.device) + assert sum_weight.min() > 0 + out /= sum_weight + return out + else: + if hasattr(model, 'valid_length'): + valid_length = model.valid_length(length) + else: + valid_length = length + mix = tensor_chunk(mix) + padded_mix = mix.padded(valid_length).to(device) + with th.no_grad(): + out = model(padded_mix) + return center_trim(out, length) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/audio.py b/AutoCoverTool/ref/music_remover/demucs/demucs/audio.py new file mode 100644 index 0000000..ae3bfb7 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/audio.py @@ -0,0 +1,257 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +import json +import subprocess as sp +from pathlib import Path + +import lameenc +import julius +import numpy as np +import torch +import torchaudio as ta + +from .utils import temp_filenames + + +def _read_info(path): + stdout_data = sp.check_output([ + 'ffprobe', "-loglevel", "panic", + str(path), '-print_format', 'json', '-show_format', '-show_streams' + ]) + return json.loads(stdout_data.decode('utf-8')) + + +class AudioFile: + """ + Allows to read audio from any format supported by ffmpeg, as well as resampling or + converting to mono on the fly. See :method:`read` for more details. + """ + def __init__(self, path: Path): + self.path = Path(path) + self._info = None + + def __repr__(self): + features = [("path", self.path)] + features.append(("samplerate", self.samplerate())) + features.append(("channels", self.channels())) + features.append(("streams", len(self))) + features_str = ", ".join(f"{name}={value}" for name, value in features) + return f"AudioFile({features_str})" + + @property + def info(self): + if self._info is None: + self._info = _read_info(self.path) + return self._info + + @property + def duration(self): + return float(self.info['format']['duration']) + + @property + def _audio_streams(self): + return [ + index for index, stream in enumerate(self.info["streams"]) + if stream["codec_type"] == "audio" + ] + + def __len__(self): + return len(self._audio_streams) + + def channels(self, stream=0): + return int(self.info['streams'][self._audio_streams[stream]]['channels']) + + def samplerate(self, stream=0): + return int(self.info['streams'][self._audio_streams[stream]]['sample_rate']) + + def read(self, + seek_time=None, + duration=None, + streams=slice(None), + samplerate=None, + channels=None, + temp_folder=None): + """ + Slightly more efficient implementation than stempeg, + in particular, this will extract all stems at once + rather than having to loop over one file multiple times + for each stream. + + Args: + seek_time (float): seek time in seconds or None if no seeking is needed. + duration (float): duration in seconds to extract or None to extract until the end. 
+        streams (slice, int or list): streams to extract, can be a single int, a list or
+            a slice. If it is a slice or list, the output will be of size [S, C, T]
+            with S the number of streams, C the number of channels and T the number of samples.
+            If it is an int, the output will be [C, T].
+        samplerate (int): if provided, will resample on the fly. If None, no resampling will
+            be done. The original sampling rate can be obtained with :method:`samplerate`.
+        channels (int): if 1, will convert to mono. We do not rely on ffmpeg for that
+            as ffmpeg automatically scales by +3dB to conserve volume when playing on speakers.
+            See https://sound.stackexchange.com/a/42710.
+            Our definition of mono is simply the average of the two channels. Any other
+            value will be ignored.
+        temp_folder (str or Path or None): temporary folder to use for decoding.
+
+
+        """
+        streams = np.array(range(len(self)))[streams]
+        single = not isinstance(streams, np.ndarray)
+        if single:
+            streams = [streams]
+
+        if duration is None:
+            target_size = None
+            query_duration = None
+        else:
+            target_size = int((samplerate or self.samplerate()) * duration)
+            query_duration = float((target_size + 1) / (samplerate or self.samplerate()))
+
+        with temp_filenames(len(streams)) as filenames:
+            command = ['ffmpeg', '-y']
+            command += ['-loglevel', 'panic']
+            if seek_time:
+                command += ['-ss', str(seek_time)]
+            command += ['-i', str(self.path)]
+            for stream, filename in zip(streams, filenames):
+                command += ['-map', f'0:{self._audio_streams[stream]}']
+                if query_duration is not None:
+                    command += ['-t', str(query_duration)]
+                command += ['-threads', '1']
+                command += ['-f', 'f32le']
+                if samplerate is not None:
+                    command += ['-ar', str(samplerate)]
+                command += [filename]
+
+            sp.run(command, check=True)
+            wavs = []
+            for filename in filenames:
+                wav = np.fromfile(filename, dtype=np.float32)
+                wav = torch.from_numpy(wav)
+                wav = wav.view(-1, self.channels()).t()
+                if channels is not None:
+                    wav = convert_audio_channels(wav, channels)
+                if target_size is not None:
+                    wav = wav[..., :target_size]
+                wavs.append(wav)
+        wav = torch.stack(wavs, dim=0)
+        if single:
+            wav = wav[0]
+        return wav
+
+
+def convert_audio_channels(wav, channels=2):
+    """Convert audio to the given number of channels."""
+    *shape, src_channels, length = wav.shape
+    if src_channels == channels:
+        pass
+    elif channels == 1:
+        # Case 1:
+        # The caller asked for 1-channel audio, but the stream has multiple
+        # channels, downmix all channels.
+        wav = wav.mean(dim=-2, keepdim=True)
+    elif src_channels == 1:
+        # Case 2:
+        # The caller asked for multiple channels, but the input file has
+        # a single channel, replicate the audio over all channels.
+        wav = wav.expand(*shape, channels, length)
+    elif src_channels >= channels:
+        # Case 3:
+        # The caller asked for multiple channels, and the input file has
+        # more channels than requested. In that case return the first channels.
+        wav = wav[..., :channels, :]
+    else:
+        # Case 4: What is a reasonable choice here?
+ raise ValueError('The audio file has less channels than requested but is not mono.') + return wav + + +def convert_audio(wav, from_samplerate, to_samplerate, channels): + """Convert audio from a given samplerate to a target one and target number of channels.""" + wav = convert_audio_channels(wav, channels) + return julius.resample_frac(wav, from_samplerate, to_samplerate) + + +def i16_pcm(wav): + """Convert audio to 16 bits integer PCM format.""" + if wav.dtype.is_floating_point: + return (wav.clamp_(-1, 1) * (2**15 - 1)).short() + else: + return wav + + +def f32_pcm(wav): + """Convert audio to float 32 bits PCM format.""" + if wav.dtype.is_floating_point: + return wav + else: + return wav.float() / (2**15 - 1) + + +def as_dtype_pcm(wav, dtype): + """Convert audio to either f32 pcm or i16 pcm depending on the given dtype.""" + if wav.dtype.is_floating_point: + return f32_pcm(wav) + else: + return i16_pcm(wav) + + +def encode_mp3(wav, path, samplerate=44100, bitrate=320, verbose=False): + """Save given audio as mp3. This should work on all OSes.""" + C, T = wav.shape + wav = i16_pcm(wav) + encoder = lameenc.Encoder() + encoder.set_bit_rate(bitrate) + encoder.set_in_sample_rate(samplerate) + encoder.set_channels(C) + encoder.set_quality(2) # 2-highest, 7-fastest + if not verbose: + encoder.silence() + wav = wav.data.cpu() + wav = wav.transpose(0, 1).numpy() + mp3_data = encoder.encode(wav.tobytes()) + mp3_data += encoder.flush() + with open(path, "wb") as f: + f.write(mp3_data) + + +def prevent_clip(wav, mode='rescale'): + """ + different strategies for avoiding raw clipping. + """ + assert wav.dtype.is_floating_point, "too late for clipping" + if mode == 'rescale': + wav = wav / max(1.01 * wav.abs().max(), 1) + elif mode == 'clamp': + wav = wav.clamp(-0.99, 0.99) + elif mode == 'tanh': + wav = torch.tanh(wav) + else: + raise ValueError(f"Invalid mode {mode}") + return wav + + +def save_audio(wav, path, samplerate, bitrate=320, clip='rescale', + bits_per_sample=16, as_float=False): + """Save audio file, automatically preventing clipping if necessary + based on the given `clip` strategy. If the path ends in `.mp3`, this + will save as mp3 with the given `bitrate`. + """ + wav = prevent_clip(wav, mode=clip) + path = Path(path) + suffix = path.suffix.lower() + if suffix == ".mp3": + encode_mp3(wav, path, samplerate, bitrate) + elif suffix == ".wav": + if as_float: + bits_per_sample = 32 + encoding = 'PCM_F' + else: + encoding = 'PCM_S' + ta.save(str(path), wav, sample_rate=samplerate, + encoding=encoding, bits_per_sample=bits_per_sample) + else: + raise ValueError(f"Invalid suffix for path: {suffix}") diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/augment.py b/AutoCoverTool/ref/music_remover/demucs/demucs/augment.py new file mode 100644 index 0000000..2e4df78 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/augment.py @@ -0,0 +1,111 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +"""Data augmentations. +""" + +import random +import torch as th +from torch import nn + + +class Shift(nn.Module): + """ + Randomly shift audio in time by up to `shift` samples. 
+    """
+    def __init__(self, shift=8192, same=False):
+        super().__init__()
+        self.shift = shift
+        self.same = same
+
+    def forward(self, wav):
+        batch, sources, channels, time = wav.size()
+        length = time - self.shift
+        if self.shift > 0:
+            if not self.training:
+                wav = wav[..., :length]
+            else:
+                srcs = 1 if self.same else sources
+                offsets = th.randint(self.shift, [batch, srcs, 1, 1], device=wav.device)
+                offsets = offsets.expand(-1, sources, channels, -1)
+                indexes = th.arange(length, device=wav.device)
+                wav = wav.gather(3, indexes + offsets)
+        return wav
+
+
+class FlipChannels(nn.Module):
+    """
+    Flip left-right channels.
+    """
+    def forward(self, wav):
+        batch, sources, channels, time = wav.size()
+        if self.training and wav.size(2) == 2:
+            left = th.randint(2, (batch, sources, 1, 1), device=wav.device)
+            left = left.expand(-1, -1, -1, time)
+            right = 1 - left
+            wav = th.cat([wav.gather(2, left), wav.gather(2, right)], dim=2)
+        return wav
+
+
+class FlipSign(nn.Module):
+    """
+    Random sign flip.
+    """
+    def forward(self, wav):
+        batch, sources, channels, time = wav.size()
+        if self.training:
+            signs = th.randint(2, (batch, sources, 1, 1), device=wav.device, dtype=th.float32)
+            wav = wav * (2 * signs - 1)
+        return wav
+
+
+class Remix(nn.Module):
+    """
+    Shuffle sources to make new mixes.
+    """
+    def __init__(self, proba=1, group_size=4):
+        """
+        Shuffle sources within one batch.
+        Each batch is divided into groups of size `group_size`, and shuffling is done within
+        each group separately. This allows keeping the same probability distribution no matter
+        the number of GPUs. Without this grouping, using more GPUs would lead to a higher
+        probability of keeping two sources from the same track together, which can impact
+        performance.
+        """
+        super().__init__()
+        self.proba = proba
+        self.group_size = group_size
+
+    def forward(self, wav):
+        batch, streams, channels, time = wav.size()
+        device = wav.device
+
+        if self.training and random.random() < self.proba:
+            group_size = self.group_size or batch
+            if batch % group_size != 0:
+                raise ValueError(f"Batch size {batch} must be divisible by group size {group_size}")
+            groups = batch // group_size
+            wav = wav.view(groups, group_size, streams, channels, time)
+            permutations = th.argsort(th.rand(groups, group_size, streams, 1, 1, device=device),
+                                      dim=1)
+            wav = wav.gather(1, permutations.expand(-1, -1, -1, channels, time))
+            wav = wav.view(batch, streams, channels, time)
+        return wav
+
+
+class Scale(nn.Module):
+    def __init__(self, proba=1., min=0.25, max=1.25):
+        super().__init__()
+        self.proba = proba
+        self.min = min
+        self.max = max
+
+    def forward(self, wav):
+        batch, streams, channels, time = wav.size()
+        device = wav.device
+        if self.training and random.random() < self.proba:
+            scales = th.empty(batch, streams, 1, 1, device=device).uniform_(self.min, self.max)
+            wav *= scales
+        return wav
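+
+# Usage sketch (an illustration, not upstream docs): during training these modules
+# are composed and applied to a (batch, sources, channels, time) tensor of stems,
+# with the mixture rebuilt by summing over the sources (see train.py/solver.py):
+#
+#     augment = nn.Sequential(Shift(8192), FlipChannels(), FlipSign(), Remix(), Scale())
+#     sources = augment(sources)
+#     mix = sources.sum(dim=1)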
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/demucs.py b/AutoCoverTool/ref/music_remover/demucs/demucs/demucs.py
new file mode 100644
index 0000000..967c833
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/demucs.py
@@ -0,0 +1,447 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+
+import math
+import typing as tp
+
+import julius
+import torch
+from torch import nn
+from torch.nn import functional as F
+
+from .states import capture_init
+from .utils import center_trim, unfold
+from .transformer import LayerScale
+
+
+class BLSTM(nn.Module):
+    """
+    BiLSTM with the same number of hidden units as the input dim.
+    If `max_steps` is not None, the input will be split into overlapping
+    chunks and the LSTM applied separately on each chunk.
+    """
+    def __init__(self, dim, layers=1, max_steps=None, skip=False):
+        super().__init__()
+        assert max_steps is None or max_steps % 4 == 0
+        self.max_steps = max_steps
+        self.lstm = nn.LSTM(bidirectional=True, num_layers=layers, hidden_size=dim, input_size=dim)
+        self.linear = nn.Linear(2 * dim, dim)
+        self.skip = skip
+
+    def forward(self, x):
+        B, C, T = x.shape
+        y = x
+        framed = False
+        if self.max_steps is not None and T > self.max_steps:
+            width = self.max_steps
+            stride = width // 2
+            frames = unfold(x, width, stride)
+            nframes = frames.shape[2]
+            framed = True
+            x = frames.permute(0, 2, 1, 3).reshape(-1, C, width)
+
+        x = x.permute(2, 0, 1)
+
+        x = self.lstm(x)[0]
+        x = self.linear(x)
+        x = x.permute(1, 2, 0)
+        if framed:
+            out = []
+            frames = x.reshape(B, -1, C, width)
+            limit = stride // 2
+            for k in range(nframes):
+                if k == 0:
+                    out.append(frames[:, k, :, :-limit])
+                elif k == nframes - 1:
+                    out.append(frames[:, k, :, limit:])
+                else:
+                    out.append(frames[:, k, :, limit:-limit])
+            out = torch.cat(out, -1)
+            out = out[..., :T]
+            x = out
+        if self.skip:
+            x = x + y
+        return x
+
+
+def rescale_conv(conv, reference):
+    """Rescale the initial weight scale. It is unclear why it helps but it certainly does.
+    """
+    std = conv.weight.std().detach()
+    scale = (std / reference)**0.5
+    conv.weight.data /= scale
+    if conv.bias is not None:
+        conv.bias.data /= scale
+
+
+def rescale_module(module, reference):
+    for sub in module.modules():
+        if isinstance(sub, (nn.Conv1d, nn.ConvTranspose1d, nn.Conv2d, nn.ConvTranspose2d)):
+            rescale_conv(sub, reference)
+
+
+class DConv(nn.Module):
+    """
+    New residual branches in each encoder layer.
+    This alternates dilated convolutions, potentially with LSTMs and attention.
+    Also, before entering each residual branch, the dimension is projected on a smaller subspace,
+    e.g. of dim `channels // compress`.
+    """
+    def __init__(self, channels: int, compress: float = 4, depth: int = 2, init: float = 1e-4,
+                 norm=True, attn=False, heads=4, ndecay=4, lstm=False, gelu=True,
+                 kernel=3, dilate=True):
+        """
+        Args:
+            channels: input/output channels for residual branch.
+            compress: amount of channel compression inside the branch.
+            depth: number of layers in the residual branch. Each layer has its own
+                projection, and potentially LSTM and attention.
+            init: initial scale for LayerNorm.
+            norm: use GroupNorm.
+            attn: use LocalAttention.
+            heads: number of heads for the LocalAttention.
+            ndecay: number of decay controls in the LocalAttention.
+            lstm: use LSTM.
+            gelu: use GELU activation.
+            kernel: kernel size for the (dilated) convolutions.
+            dilate: if true, use dilation, increasing with the depth.
+        """
+
+        super().__init__()
+        assert kernel % 2 == 1
+        self.channels = channels
+        self.compress = compress
+        self.depth = abs(depth)
+        dilate = depth > 0
+
+        norm_fn: tp.Callable[[int], nn.Module]
+        norm_fn = lambda d: nn.Identity()  # noqa
+        if norm:
+            norm_fn = lambda d: nn.GroupNorm(1, d)  # noqa
+
+        hidden = int(channels / compress)
+
+        act: tp.Type[nn.Module]
+        if gelu:
+            act = nn.GELU
+        else:
+            act = nn.ReLU
+
+        self.layers = nn.ModuleList([])
+        for d in range(self.depth):
+            dilation = 2 ** d if dilate else 1
+            padding = dilation * (kernel // 2)
+            mods = [
+                nn.Conv1d(channels, hidden, kernel, dilation=dilation, padding=padding),
+                norm_fn(hidden), act(),
+                nn.Conv1d(hidden, 2 * channels, 1),
+                norm_fn(2 * channels), nn.GLU(1),
+                LayerScale(channels, init),
+            ]
+            if attn:
+                mods.insert(3, LocalState(hidden, heads=heads, ndecay=ndecay))
+            if lstm:
+                mods.insert(3, BLSTM(hidden, layers=2, max_steps=200, skip=True))
+            layer = nn.Sequential(*mods)
+            self.layers.append(layer)
+
+    def forward(self, x):
+        for layer in self.layers:
+            x = x + layer(x)
+        return x
+
+
+class LocalState(nn.Module):
+    """Local state allows attention based only on data (no positional embedding),
+    while setting a constraint on the time window (e.g. decaying penalty term).
+
+    Also includes a failed experiment with trying to provide some frequency-based attention.
+    """
+    def __init__(self, channels: int, heads: int = 4, nfreqs: int = 0, ndecay: int = 4):
+        super().__init__()
+        assert channels % heads == 0, (channels, heads)
+        self.heads = heads
+        self.nfreqs = nfreqs
+        self.ndecay = ndecay
+        self.content = nn.Conv1d(channels, channels, 1)
+        self.query = nn.Conv1d(channels, channels, 1)
+        self.key = nn.Conv1d(channels, channels, 1)
+        if nfreqs:
+            self.query_freqs = nn.Conv1d(channels, heads * nfreqs, 1)
+        if ndecay:
+            self.query_decay = nn.Conv1d(channels, heads * ndecay, 1)
+            # Initialize decay close to zero (there is a sigmoid), for maximum initial window.
+            self.query_decay.weight.data *= 0.01
+            assert self.query_decay.bias is not None  # stupid type checker
+            self.query_decay.bias.data[:] = -2
+        self.proj = nn.Conv1d(channels + heads * nfreqs, channels, 1)
+
+    def forward(self, x):
+        B, C, T = x.shape
+        heads = self.heads
+        indexes = torch.arange(T, device=x.device, dtype=x.dtype)
+        # left index are keys, right index are queries
+        delta = indexes[:, None] - indexes[None, :]
+
+        queries = self.query(x).view(B, heads, -1, T)
+        keys = self.key(x).view(B, heads, -1, T)
+        # t are keys, s are queries
+        dots = torch.einsum("bhct,bhcs->bhts", keys, queries)
+        dots /= keys.shape[2]**0.5
+        if self.nfreqs:
+            periods = torch.arange(1, self.nfreqs + 1, device=x.device, dtype=x.dtype)
+            freq_kernel = torch.cos(2 * math.pi * delta / periods.view(-1, 1, 1))
+            freq_q = self.query_freqs(x).view(B, heads, -1, T) / self.nfreqs ** 0.5
+            dots += torch.einsum("fts,bhfs->bhts", freq_kernel, freq_q)
+        if self.ndecay:
+            decays = torch.arange(1, self.ndecay + 1, device=x.device, dtype=x.dtype)
+            decay_q = self.query_decay(x).view(B, heads, -1, T)
+            decay_q = torch.sigmoid(decay_q) / 2
+            decay_kernel = - decays.view(-1, 1, 1) * delta.abs() / self.ndecay**0.5
+            dots += torch.einsum("fts,bhfs->bhts", decay_kernel, decay_q)
+
+        # Kill self reference.
+        dots.masked_fill_(torch.eye(T, device=dots.device, dtype=torch.bool), -100)
+        weights = torch.softmax(dots, dim=2)
+
+        content = self.content(x).view(B, heads, -1, T)
+        result = torch.einsum("bhts,bhct->bhcs", weights, content)
+        if self.nfreqs:
+            time_sig = torch.einsum("bhts,fts->bhfs", weights, freq_kernel)
+            result = torch.cat([result, time_sig], 2)
+        result = result.reshape(B, -1, T)
+        return x + self.proj(result)
+
+
+class Demucs(nn.Module):
+    @capture_init
+    def __init__(self,
+                 sources,
+                 # Channels
+                 audio_channels=2,
+                 channels=64,
+                 growth=2.,
+                 # Main structure
+                 depth=6,
+                 rewrite=True,
+                 lstm_layers=0,
+                 # Convolutions
+                 kernel_size=8,
+                 stride=4,
+                 context=1,
+                 # Activations
+                 gelu=True,
+                 glu=True,
+                 # Normalization
+                 norm_starts=4,
+                 norm_groups=4,
+                 # DConv residual branch
+                 dconv_mode=1,
+                 dconv_depth=2,
+                 dconv_comp=4,
+                 dconv_attn=4,
+                 dconv_lstm=4,
+                 dconv_init=1e-4,
+                 # Pre/post processing
+                 normalize=True,
+                 resample=True,
+                 # Weight init
+                 rescale=0.1,
+                 # Metadata
+                 samplerate=44100,
+                 segment=4 * 10):
+        """
+        Args:
+            sources (list[str]): list of source names.
+            audio_channels (int): stereo or mono.
+            channels (int): first convolution channels.
+            depth (int): number of layers in the encoder and in the decoder.
+            growth (float): multiply (resp. divide) the number of channels by that
+                for each layer of the encoder (resp. decoder).
+            rewrite (bool): add 1x1 convolution to each layer.
+            lstm_layers (int): number of lstm layers, 0 = no lstm. Deactivated
+                by default, as this is now replaced by the smaller and faster LSTMs
+                in the DConv branches.
+            kernel_size (int): kernel size for convolutions.
+            stride (int): stride for convolutions.
+            context (int): kernel size of the convolution in the
+                decoder before the transposed convolution. If > 1,
+                will provide some context from neighboring time steps.
+            gelu: use GELU activation function.
+            glu (bool): use glu instead of ReLU for the 1x1 rewrite conv.
+            norm_starts: layer at which group norm starts being used.
+                decoder layers are numbered in reverse order.
+            norm_groups: number of groups for group norm.
+            dconv_mode: if 1: dconv in encoder only, 2: decoder only, 3: both.
+            dconv_depth: depth of residual DConv branch.
+            dconv_comp: compression of DConv branch.
+            dconv_attn: adds attention layers in DConv branch starting at this layer.
+            dconv_lstm: adds a LSTM layer in DConv branch starting at this layer.
+            dconv_init: initial scale for the DConv branch LayerScale.
+            normalize (bool): normalizes the input audio on the fly, and scales back
+                the output by the same amount.
+            resample (bool): upsample x2 the input and downsample /2 the output.
+            rescale (float): rescale initial weights of convolutions
+                to get their standard deviation closer to `rescale`.
+            samplerate (int): stored as meta information for easing
+                future evaluations of the model.
+            segment (float): duration of the chunks of audio to ideally evaluate the model on.
+                This is used by `demucs.apply.apply_model`.
+        """
+
+        super().__init__()
+        self.audio_channels = audio_channels
+        self.sources = sources
+        self.kernel_size = kernel_size
+        self.context = context
+        self.stride = stride
+        self.depth = depth
+        self.resample = resample
+        self.channels = channels
+        self.normalize = normalize
+        self.samplerate = samplerate
+        self.segment = segment
+        self.encoder = nn.ModuleList()
+        self.decoder = nn.ModuleList()
+        self.skip_scales = nn.ModuleList()
+
+        if glu:
+            activation = nn.GLU(dim=1)
+            ch_scale = 2
+        else:
+            activation = nn.ReLU()
+            ch_scale = 1
+        if gelu:
+            act2 = nn.GELU
+        else:
+            act2 = nn.ReLU
+
+        in_channels = audio_channels
+        padding = 0
+        for index in range(depth):
+            norm_fn = lambda d: nn.Identity()  # noqa
+            if index >= norm_starts:
+                norm_fn = lambda d: nn.GroupNorm(norm_groups, d)  # noqa
+
+            encode = []
+            encode += [
+                nn.Conv1d(in_channels, channels, kernel_size, stride),
+                norm_fn(channels),
+                act2(),
+            ]
+            attn = index >= dconv_attn
+            lstm = index >= dconv_lstm
+            if dconv_mode & 1:
+                encode += [DConv(channels, depth=dconv_depth, init=dconv_init,
+                                 compress=dconv_comp, attn=attn, lstm=lstm)]
+            if rewrite:
+                encode += [
+                    nn.Conv1d(channels, ch_scale * channels, 1),
+                    norm_fn(ch_scale * channels), activation]
+            self.encoder.append(nn.Sequential(*encode))
+
+            decode = []
+            if index > 0:
+                out_channels = in_channels
+            else:
+                out_channels = len(self.sources) * audio_channels
+            if rewrite:
+                decode += [
+                    nn.Conv1d(channels, ch_scale * channels, 2 * context + 1, padding=context),
+                    norm_fn(ch_scale * channels), activation]
+            if dconv_mode & 2:
+                decode += [DConv(channels, depth=dconv_depth, init=dconv_init,
+                                 compress=dconv_comp, attn=attn, lstm=lstm)]
+            decode += [nn.ConvTranspose1d(channels, out_channels,
+                                          kernel_size, stride, padding=padding)]
+            if index > 0:
+                decode += [norm_fn(out_channels), act2()]
+            self.decoder.insert(0, nn.Sequential(*decode))
+            in_channels = channels
+            channels = int(growth * channels)
+
+        channels = in_channels
+        if lstm_layers:
+            self.lstm = BLSTM(channels, lstm_layers)
+        else:
+            self.lstm = None
+
+        if rescale:
+            rescale_module(self, reference=rescale)
+
+    def valid_length(self, length):
+        """
+        Return the nearest valid length to use with the model so that
+        there are no time steps left over in a convolution, e.g. for all
+        layers, size of the input - kernel_size % stride = 0.
+
+        Note that inputs are automatically padded if necessary to ensure that the output
+        has the same length as the input.
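+
+        For example (a worked illustration, not part of the upstream docstring):
+        with the defaults kernel_size=8, stride=4, depth=6 and resample=True,
+        a 1-second 44.1 kHz input is first doubled to 88200 samples, the encoder
+        reduces it to 21 time steps, the decoder expands back to 91476 samples,
+        and halving gives valid_length(44100) == 45738, i.e. 1638 samples of padding.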
+ """ + if self.resample: + length *= 2 + + for _ in range(self.depth): + length = math.ceil((length - self.kernel_size) / self.stride) + 1 + length = max(1, length) + + for idx in range(self.depth): + length = (length - 1) * self.stride + self.kernel_size + + if self.resample: + length = math.ceil(length / 2) + return int(length) + + def forward(self, mix): + x = mix + length = x.shape[-1] + + if self.normalize: + mono = mix.mean(dim=1, keepdim=True) + mean = mono.mean(dim=-1, keepdim=True) + std = mono.std(dim=-1, keepdim=True) + x = (x - mean) / (1e-5 + std) + else: + mean = 0 + std = 1 + + delta = self.valid_length(length) - length + x = F.pad(x, (delta // 2, delta - delta // 2)) + + if self.resample: + x = julius.resample_frac(x, 1, 2) + + saved = [] + for encode in self.encoder: + x = encode(x) + saved.append(x) + + if self.lstm: + x = self.lstm(x) + + for decode in self.decoder: + skip = saved.pop(-1) + skip = center_trim(skip, x) + x = decode(x + skip) + + if self.resample: + x = julius.resample_frac(x, 2, 1) + x = x * std + mean + x = center_trim(x, length) + x = x.view(x.size(0), len(self.sources), self.audio_channels, x.size(-1)) + return x + + def load_state_dict(self, state, strict=True): + # fix a mismatch with previous generation Demucs models. + for idx in range(self.depth): + for a in ['encoder', 'decoder']: + for b in ['bias', 'weight']: + new = f'{a}.{idx}.3.{b}' + old = f'{a}.{idx}.2.{b}' + if old in state and new not in state: + state[new] = state.pop(old) + super().load_state_dict(state, strict=strict) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/distrib.py b/AutoCoverTool/ref/music_remover/demucs/demucs/distrib.py new file mode 100644 index 0000000..370822e --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/distrib.py @@ -0,0 +1,100 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +"""Distributed training utilities. 
+""" +import logging +import pickle + +import numpy as np +import torch +from torch.utils.data.distributed import DistributedSampler +from torch.utils.data import DataLoader, Subset +from torch.nn.parallel.distributed import DistributedDataParallel + +from dora import distrib as dora_distrib + +logger = logging.getLogger(__name__) +rank = 0 +world_size = 1 + + +def init(): + global rank, world_size + if not torch.distributed.is_initialized(): + dora_distrib.init() + rank = dora_distrib.rank() + world_size = dora_distrib.world_size() + + +def average(metrics, count=1.): + if isinstance(metrics, dict): + keys, values = zip(*sorted(metrics.items())) + values = average(values, count) + return dict(zip(keys, values)) + if world_size == 1: + return metrics + tensor = torch.tensor(list(metrics) + [1], device='cuda', dtype=torch.float32) + tensor *= count + torch.distributed.all_reduce(tensor, op=torch.distributed.ReduceOp.SUM) + return (tensor[:-1] / tensor[-1]).cpu().numpy().tolist() + + +def wrap(model): + if world_size == 1: + return model + else: + return DistributedDataParallel( + model, + # find_unused_parameters=True, + device_ids=[torch.cuda.current_device()], + output_device=torch.cuda.current_device()) + + +def barrier(): + if world_size > 1: + torch.distributed.barrier() + + +def share(obj=None, src=0): + if world_size == 1: + return obj + size = torch.empty(1, device='cuda', dtype=torch.long) + if rank == src: + dump = pickle.dumps(obj) + size[0] = len(dump) + torch.distributed.broadcast(size, src=src) + # size variable is now set to the length of pickled obj in all processes + + if rank == src: + buffer = torch.from_numpy(np.frombuffer(dump, dtype=np.uint8).copy()).cuda() + else: + buffer = torch.empty(size[0].item(), device='cuda', dtype=torch.uint8) + torch.distributed.broadcast(buffer, src=src) + # buffer variable is now set to pickled obj in all processes + + if rank != src: + obj = pickle.loads(buffer.cpu().numpy().tobytes()) + logger.debug(f"Shared object of size {len(buffer)}") + return obj + + +def loader(dataset, *args, shuffle=False, klass=DataLoader, **kwargs): + """ + Create a dataloader properly in case of distributed training. + If a gradient is going to be computed you must set `shuffle=True`. + """ + if world_size == 1: + return klass(dataset, *args, shuffle=shuffle, **kwargs) + + if shuffle: + # train means we will compute backward, we use DistributedSampler + sampler = DistributedSampler(dataset) + # We ignore shuffle, DistributedSampler already shuffles + return klass(dataset, *args, **kwargs, sampler=sampler) + else: + # We make a manual shard, as DistributedSampler otherwise replicate some examples + dataset = Subset(dataset, list(range(rank, len(dataset), world_size))) + return klass(dataset, *args, shuffle=shuffle, **kwargs) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/ema.py b/AutoCoverTool/ref/music_remover/demucs/demucs/ema.py new file mode 100644 index 0000000..41e615a --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/ema.py @@ -0,0 +1,66 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. + +# Inspired from https://github.com/rwightman/pytorch-image-models +from contextlib import contextmanager + +import torch + +from .states import swap_state + + +class ModelEMA: + """ + Perform EMA on a model. You can switch to the EMA weights temporarily + with the `swap` method. 
+ + ema = ModelEMA(model) + with ema.swap(): + # compute valid metrics with averaged model. + """ + def __init__(self, model, decay=0.9999, unbias=True, device='cpu'): + self.decay = decay + self.model = model + self.state = {} + self.count = 0 + self.device = device + self.unbias = unbias + + self._init() + + def _init(self): + for key, val in self.model.state_dict().items(): + if val.dtype != torch.float32: + continue + device = self.device or val.device + if key not in self.state: + self.state[key] = val.detach().to(device, copy=True) + + def update(self): + if self.unbias: + self.count = self.count * self.decay + 1 + w = 1 / self.count + else: + w = 1 - self.decay + for key, val in self.model.state_dict().items(): + if val.dtype != torch.float32: + continue + device = self.device or val.device + self.state[key].mul_(1 - w) + self.state[key].add_(val.detach().to(device), alpha=w) + + @contextmanager + def swap(self): + with swap_state(self.model, self.state): + yield + + def state_dict(self): + return {'state': self.state, 'count': self.count} + + def load_state_dict(self, state): + self.count = state['count'] + for k, v in state['state'].items(): + self.state[k].copy_(v) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/evaluate.py b/AutoCoverTool/ref/music_remover/demucs/demucs/evaluate.py new file mode 100755 index 0000000..24e2994 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/evaluate.py @@ -0,0 +1,174 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. + +"""Test time evaluation, either using the original SDR from [Vincent et al. 2006] +or the newest SDR definition from the MDX 2021 competition (this one will +be reported as `nsdr` for `new sdr`). +""" + +from concurrent import futures +import logging + +from dora.log import LogProgress +import numpy as np +import musdb +import museval +import torch as th + +from .apply import apply_model +from .audio import convert_audio, save_audio +from . import distrib +from .utils import DummyPoolExecutor + + +logger = logging.getLogger(__name__) + + +def new_sdr(references, estimates): + """ + Compute the SDR according to the MDX challenge definition. + Adapted from AIcrowd/music-demixing-challenge-starter-kit (MIT license) + """ + assert references.dim() == 4 + assert estimates.dim() == 4 + delta = 1e-7 # avoid numerical errors + num = th.sum(th.square(references), dim=(2, 3)) + den = th.sum(th.square(references - estimates), dim=(2, 3)) + num += delta + den += delta + scores = 10 * th.log10(num / den) + return scores + + +def eval_track(references, estimates, win, hop, compute_sdr=True): + references = references.transpose(1, 2).double() + estimates = estimates.transpose(1, 2).double() + + new_scores = new_sdr(references.cpu()[None], estimates.cpu()[None])[0] + + if not compute_sdr: + return None, new_scores + else: + references = references.numpy() + estimates = estimates.numpy() + scores = museval.metrics.bss_eval( + references, estimates, + compute_permutation=False, + window=win, + hop=hop, + framewise_filters=False, + bsseval_sources_version=False)[:-1] + return scores, new_scores + + +def evaluate(solver, compute_sdr=False): + """ + Evaluate model using museval. + compute_sdr=False means using only the MDX definition of the SDR, which + is much faster to evaluate. 
+ """ + + args = solver.args + + output_dir = solver.folder / "results" + output_dir.mkdir(exist_ok=True, parents=True) + json_folder = solver.folder / "results/test" + json_folder.mkdir(exist_ok=True, parents=True) + + # we load tracks from the original musdb set + if args.test.nonhq is None: + test_set = musdb.DB(args.dset.musdb, subsets=["test"], is_wav=True) + else: + test_set = musdb.DB(args.test.nonhq, subsets=["test"], is_wav=False) + src_rate = args.dset.musdb_samplerate + + eval_device = 'cpu' + + model = solver.model + win = int(1. * model.samplerate) + hop = int(1. * model.samplerate) + + indexes = range(distrib.rank, len(test_set), distrib.world_size) + indexes = LogProgress(logger, indexes, updates=args.misc.num_prints, + name='Eval') + pendings = [] + + pool = futures.ProcessPoolExecutor if args.test.workers else DummyPoolExecutor + with pool(args.test.workers) as pool: + for index in indexes: + track = test_set.tracks[index] + + mix = th.from_numpy(track.audio).t().float() + if mix.dim() == 1: + mix = mix[None] + mix = mix.to(solver.device) + ref = mix.mean(dim=0) # mono mixture + mix = (mix - ref.mean()) / ref.std() + mix = convert_audio(mix, src_rate, model.samplerate, model.audio_channels) + estimates = apply_model(model, mix[None], + shifts=args.test.shifts, split=args.test.split, + overlap=args.test.overlap)[0] + estimates = estimates * ref.std() + ref.mean() + estimates = estimates.to(eval_device) + + references = th.stack( + [th.from_numpy(track.targets[name].audio).t() for name in model.sources]) + if references.dim() == 2: + references = references[:, None] + references = references.to(eval_device) + references = convert_audio(references, src_rate, + model.samplerate, model.audio_channels) + if args.test.save: + folder = solver.folder / "wav" / track.name + folder.mkdir(exist_ok=True, parents=True) + for name, estimate in zip(model.sources, estimates): + save_audio(estimate.cpu(), folder / (name + ".mp3"), model.samplerate) + + pendings.append((track.name, pool.submit( + eval_track, references, estimates, win=win, hop=hop, compute_sdr=compute_sdr))) + + pendings = LogProgress(logger, pendings, updates=args.misc.num_prints, + name='Eval (BSS)') + tracks = {} + for track_name, pending in pendings: + pending = pending.result() + scores, nsdrs = pending + tracks[track_name] = {} + for idx, target in enumerate(model.sources): + tracks[track_name][target] = {'nsdr': [float(nsdrs[idx])]} + if scores is not None: + (sdr, isr, sir, sar) = scores + for idx, target in enumerate(model.sources): + values = { + "SDR": sdr[idx].tolist(), + "SIR": sir[idx].tolist(), + "ISR": isr[idx].tolist(), + "SAR": sar[idx].tolist() + } + tracks[track_name][target].update(values) + + all_tracks = {} + for src in range(distrib.world_size): + all_tracks.update(distrib.share(tracks, src)) + + result = {} + metric_names = next(iter(all_tracks.values()))[model.sources[0]] + for metric_name in metric_names: + avg = 0 + avg_of_medians = 0 + for source in model.sources: + medians = [ + np.nanmedian(all_tracks[track][source][metric_name]) + for track in all_tracks.keys()] + mean = np.mean(medians) + median = np.median(medians) + result[metric_name.lower() + "_" + source] = mean + result[metric_name.lower() + "_med" + "_" + source] = median + avg += mean / len(model.sources) + avg_of_medians += median / len(model.sources) + result[metric_name.lower()] = avg + result[metric_name.lower() + "_med"] = avg_of_medians + return result diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/__init__.py 
b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/_explorers.py b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/_explorers.py new file mode 100644 index 0000000..f01d84f --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/_explorers.py @@ -0,0 +1,64 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +from dora import Explorer +import treetable as tt + + +class MyExplorer(Explorer): + test_metrics = ['nsdr', 'sdr_med'] + + def get_grid_metrics(self): + """Return the metrics that should be displayed in the tracking table. + """ + return [ + tt.group("train", [ + tt.leaf("epoch"), + tt.leaf("reco", ".3f"), + ], align=">"), + tt.group("valid", [ + tt.leaf("penalty", ".1f"), + tt.leaf("ms", ".1f"), + tt.leaf("reco", ".2%"), + tt.leaf("breco", ".2%"), + tt.leaf("b_nsdr", ".2f"), + # tt.leaf("b_nsdr_drums", ".2f"), + # tt.leaf("b_nsdr_bass", ".2f"), + # tt.leaf("b_nsdr_other", ".2f"), + # tt.leaf("b_nsdr_vocals", ".2f"), + ], align=">"), + tt.group("test", [ + tt.leaf(name, ".2f") + for name in self.test_metrics + ], align=">") + ] + + def process_history(self, history): + train = { + 'epoch': len(history), + } + valid = {} + test = {} + best_v_main = float('inf') + breco = float('inf') + for metrics in history: + train.update(metrics['train']) + valid.update(metrics['valid']) + if 'main' in metrics['valid']: + best_v_main = min(best_v_main, metrics['valid']['main']['loss']) + valid['bmain'] = best_v_main + valid['breco'] = min(breco, metrics['valid']['reco']) + breco = valid['breco'] + if (metrics['valid']['loss'] == metrics['valid']['best'] or + metrics['valid'].get('nsdr') == metrics['valid']['best']): + for k, v in metrics['valid'].items(): + if k.startswith('reco_'): + valid['b_' + k[len('reco_'):]] = v + if k.startswith('nsdr'): + valid[f'b_{k}'] = v + if 'test' in metrics: + test.update(metrics['test']) + metrics = history[-1] + return {"train": train, "valid": valid, "test": test} diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx.py b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx.py new file mode 100644 index 0000000..b35d8ab --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx.py @@ -0,0 +1,33 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +""" +Main training for the Track A MDX models. +""" + +from ._explorers import MyExplorer +from ..train import main + + +TRACK_A = ['0d19c1c6', '7ecf8ec1', 'c511e2ab', '7d865c68'] + + +@MyExplorer +def explorer(launcher): + launcher.slurm_( + gpus=8, + time=3 * 24 * 60, + partition='learnlab') + + # Reproduce results from MDX competition Track A + # This trains the first round of models. Once this is trained, + # you will need to schedule `mdx_refine`. 
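+    # Each Track A signature above names a fine-tuned XP: we resolve the parent
+    # XP it continued from, schedule that, and also schedule two DiffQ-quantized
+    # variants (`quant.diffq`) used for the smaller, compressed model bags.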
+    for sig in TRACK_A:
+        xp = main.get_xp_from_sig(sig)
+        parent = xp.cfg.continue_from
+        xp = main.get_xp_from_sig(parent)
+        launcher(xp.argv)
+        launcher(xp.argv, {'quant.diffq': 1e-4})
+        launcher(xp.argv, {'quant.diffq': 3e-4})
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx_extra.py b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx_extra.py
new file mode 100644
index 0000000..e32f7cd
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx_extra.py
@@ -0,0 +1,36 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+"""
+Main training for the Track B MDX models.
+"""
+
+from ._explorers import MyExplorer
+from ..train import main
+
+TRACK_B = ['e51eebcc', 'a1d90b5c', '5d2d6c55', 'cfa93e08']
+
+
+@MyExplorer
+def explorer(launcher):
+    launcher.slurm_(
+        gpus=8,
+        time=3 * 24 * 60,
+        partition='learnlab')
+
+    # Reproduce results from MDX competition Track B.
+    # This trains the base models; the DiffQ-quantized variants used in the
+    # final bag are scheduled directly below for the `extra_test` dataset.
+    for sig in TRACK_B:
+        while sig is not None:
+            xp = main.get_xp_from_sig(sig)
+            sig = xp.cfg.continue_from
+
+        for dset in ['extra44', 'extra_test']:
+            sub = launcher.bind(xp.argv, dset=dset)
+            sub()
+            if dset == 'extra_test':
+                sub({'quant.diffq': 1e-4})
+                sub({'quant.diffq': 3e-4})
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx_refine.py b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx_refine.py
new file mode 100644
index 0000000..496a879
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mdx_refine.py
@@ -0,0 +1,34 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+"""
+Refinement (second round of training) for the Track A MDX models.
+"""
+
+from ._explorers import MyExplorer
+from .mdx import TRACK_A
+from ..train import main
+
+
+@MyExplorer
+def explorer(launcher):
+    launcher.slurm_(
+        gpus=8,
+        time=3 * 24 * 60,
+        partition='learnlab')
+
+    # Reproduce results from MDX competition Track A
+    # WARNING: all the experiments in the `mdx` grid must have completed.
+    for sig in TRACK_A:
+        xp = main.get_xp_from_sig(sig)
+        launcher(xp.argv)
+        for diffq in [1e-4, 3e-4]:
+            xp_src = main.get_xp_from_sig(xp.cfg.continue_from)
+            q_argv = [f'quant.diffq={diffq}']
+            actual_src = main.get_xp(xp_src.argv + q_argv)
+            actual_src.link.load()
+            assert len(actual_src.link.history) == actual_src.cfg.epochs
+            argv = xp.argv + q_argv + [f'continue_from="{actual_src.sig}"']
+            launcher(argv)
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mmi.py b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mmi.py
new file mode 100644
index 0000000..f51e1b8
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mmi.py
@@ -0,0 +1,69 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
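+"""
+Grid for the `extra_mmi_goodclean` dataset: hdemucs / htdemucs variants and a
+(still experimental) sparse-attention configuration, as bound on the launcher below.
+"""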
+ +from ._explorers import MyExplorer +from dora import Launcher + + +@MyExplorer +def explorer(launcher: Launcher): + launcher.slurm_(gpus=8, time=3 * 24 * 60, partition="devlab,learnlab,learnfair") # 3 days + + sub = launcher.bind_( + { + "dset": "extra_mmi_goodclean", + "test.shifts": 0, + "model": "htdemucs", + "htdemucs.dconv_mode": 3, + "htdemucs.depth": 4, + "htdemucs.t_dropout": 0.02, + "htdemucs.t_layers": 5, + "max_batches": 800, + "ema.epoch": [0.9, 0.95], + "ema.batch": [0.9995, 0.9999], + "dset.segment": 10, + "batch_size": 32, + } + ) + sub({"model": "hdemucs"}) + sub({"model": "hdemucs", "dset": "extra44"}) + sub({"model": "hdemucs", "dset": "musdb44"}) + + sparse = { + 'batch_size': 3 * 8, + 'augment.remix.group_size': 3, + 'htdemucs.t_auto_sparsity': True, + 'htdemucs.t_sparse_self_attn': True, + 'htdemucs.t_sparse_cross_attn': True, + 'htdemucs.t_sparsity': 0.9, + "htdemucs.t_layers": 7 + } + + with launcher.job_array(): + for transf_layers in [5, 7]: + for bottom_channels in [0, 512]: + sub = launcher.bind({ + "htdemucs.t_layers": transf_layers, + "htdemucs.bottom_channels": bottom_channels, + }) + if bottom_channels == 0 and transf_layers == 5: + sub({"augment.remix.proba": 0.0}) + sub({ + "augment.repitch.proba": 0.0, + # when doing repitching, we trim the outut to align on the + # highest change of BPM. When removing repitching, + # we simulate it here to ensure the training context is the same. + # Another second is lost for all experiments due to the random + # shift augmentation. + "dset.segment": 10 * 0.88}) + elif bottom_channels == 512 and transf_layers == 5: + sub(dset="musdb44") + sub(dset="extra44") + # Sparse kernel XP, currently not released as kernels are still experimental. + sub(sparse, {'dset.segment': 15, "htdemucs.t_layers": 7}) + + for duration in [5, 10, 15]: + sub({"dset.segment": duration}) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mmi_ft.py b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mmi_ft.py new file mode 100644 index 0000000..10de9c8 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/mmi_ft.py @@ -0,0 +1,55 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. 
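+"""
+Per-source fine-tuning grid: each run continues from an already trained
+signature and uses a one-hot `weights` vector so that a single one of the four
+sources dominates the loss.
+"""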
+ +from ._explorers import MyExplorer +from dora import Launcher +from demucs import train + + +def get_sub(launcher, sig): + xp = train.main.get_xp_from_sig(sig) + sub = launcher.bind(xp.argv) + sub() + sub.bind_({ + 'continue_from': sig, + 'continue_best': True}) + return sub + + +@MyExplorer +def explorer(launcher: Launcher): + launcher.slurm_(gpus=4, time=3 * 24 * 60, partition="devlab,learnlab,learnfair") # 3 days + ft = { + 'optim.lr': 1e-4, + 'augment.remix.proba': 0, + 'augment.scale.proba': 0, + 'augment.shift_same': True, + 'htdemucs.t_weight_decay': 0.05, + 'batch_size': 8, + 'optim.clip_grad': 5, + 'optim.optim': 'adamw', + 'epochs': 50, + 'dset.wav2_valid': True, + 'ema.epoch': [], # let's make valid a bit faster + } + with launcher.job_array(): + for sig in ['2899e11a']: + sub = get_sub(launcher, sig) + sub.bind_(ft) + for segment in [15, 18]: + for source in range(4): + w = [0] * 4 + w[source] = 1 + sub({'weights': w, 'dset.segment': segment}) + + for sig in ['955717e8']: + sub = get_sub(launcher, sig) + sub.bind_(ft) + for segment in [10, 15]: + for source in range(4): + w = [0] * 4 + w[source] = 1 + sub({'weights': w, 'dset.segment': segment}) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/repro.py b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/repro.py new file mode 100644 index 0000000..c5eba72 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/repro.py @@ -0,0 +1,50 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +""" +Easier training for reproducibility +""" + +from ._explorers import MyExplorer + + +@MyExplorer +def explorer(launcher): + launcher.slurm_( + gpus=8, + time=3 * 24 * 60, + partition='devlab,learnlab') + + launcher.bind_({'ema.epoch': [0.9, 0.95]}) + launcher.bind_({'ema.batch': [0.9995, 0.9999]}) + launcher.bind_({'epochs': 600}) + + base = {'model': 'demucs', 'demucs.dconv_mode': 0, 'demucs.gelu': False, + 'demucs.lstm_layers': 2} + newt = {'model': 'demucs', 'demucs.normalize': True} + hdem = {'model': 'hdemucs'} + svd = {'svd.penalty': 1e-5, 'svd': 'base2'} + + with launcher.job_array(): + for model in [base, newt, hdem]: + sub = launcher.bind(model) + if model is base: + # Training the v2 Demucs on MusDB HQ + sub(epochs=360) + continue + + # those two will be used in the repro_mdx_a bag of models. + sub(svd) + sub(svd, seed=43) + if model == newt: + # Ablation study + sub() + abl = sub.bind(svd) + abl({'ema.epoch': [], 'ema.batch': []}) + abl({'demucs.dconv_lstm': 10}) + abl({'demucs.dconv_attn': 10}) + abl({'demucs.dconv_attn': 10, 'demucs.dconv_lstm': 10, 'demucs.lstm_layers': 2}) + abl({'demucs.dconv_mode': 0}) + abl({'demucs.gelu': False}) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/grids/repro_ft.py b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/repro_ft.py new file mode 100644 index 0000000..2399fcc --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/grids/repro_ft.py @@ -0,0 +1,46 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. 
+""" +Fine tuning experiments +""" + +from ._explorers import MyExplorer +from ..train import main + + +@MyExplorer +def explorer(launcher): + launcher.slurm_( + gpus=8, + time=300, + partition='devlab,learnlab') + + # Mus + launcher.slurm_(constraint='volta32gb') + + grid = "repro" + folder = main.dora.dir / "grids" / grid + + for sig in folder.iterdir(): + if not sig.is_symlink(): + continue + xp = main.get_xp_from_sig(sig) + xp.link.load() + if len(xp.link.history) != xp.cfg.epochs: + continue + sub = launcher.bind(xp.argv, [f'continue_from="{xp.sig}"']) + sub.bind_({'ema.epoch': [0.9, 0.95], 'ema.batch': [0.9995, 0.9999]}) + sub.bind_({'test.every': 1, 'test.sdr': True, 'epochs': 4}) + sub.bind_({'dset.segment': 28, 'dset.shift': 2}) + sub.bind_({'batch_size': 32}) + auto = {'dset': 'auto_mus'} + auto.update({'augment.remix.proba': 0, 'augment.scale.proba': 0, + 'augment.shift_same': True}) + sub.bind_(auto) + sub.bind_({'batch_size': 16}) + sub.bind_({'optim.lr': 1e-4}) + sub.bind_({'model_segment': 44}) + sub() diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/hdemucs.py b/AutoCoverTool/ref/music_remover/demucs/demucs/hdemucs.py new file mode 100644 index 0000000..c2e0ae7 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/hdemucs.py @@ -0,0 +1,784 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +""" +This code contains the spectrogram and Hybrid version of Demucs. +""" +from copy import deepcopy +import math +import typing as tp + +from openunmix.filtering import wiener +import torch +from torch import nn +from torch.nn import functional as F + +from .demucs import DConv, rescale_module +from .states import capture_init +from .spec import spectro, ispectro + + +def pad1d(x: torch.Tensor, paddings: tp.Tuple[int, int], mode: str = 'constant', value: float = 0.): + """Tiny wrapper around F.pad, just to allow for reflect padding on small input. + If this is the case, we insert extra 0 padding to the right before the reflection happen.""" + x0 = x + length = x.shape[-1] + padding_left, padding_right = paddings + if mode == 'reflect': + max_pad = max(padding_left, padding_right) + if length <= max_pad: + extra_pad = max_pad - length + 1 + extra_pad_right = min(padding_right, extra_pad) + extra_pad_left = extra_pad - extra_pad_right + paddings = (padding_left - extra_pad_left, padding_right - extra_pad_right) + x = F.pad(x, (extra_pad_left, extra_pad_right)) + out = F.pad(x, paddings, mode, value) + assert out.shape[-1] == length + padding_left + padding_right + if not (out[..., padding_left: padding_left + length] == x0).all(): + raise RuntimeError("pad1d err!") + # assert (out[..., padding_left: padding_left + length] == x0).all() + return out + + +class ScaledEmbedding(nn.Module): + """ + Boost learning rate for embeddings (with `scale`). + Also, can make embeddings continuous with `smooth`. + """ + def __init__(self, num_embeddings: int, embedding_dim: int, + scale: float = 10., smooth=False): + super().__init__() + self.embedding = nn.Embedding(num_embeddings, embedding_dim) + if smooth: + weight = torch.cumsum(self.embedding.weight.data, dim=0) + # when summing gaussian, overscale raises as sqrt(n), so we nornalize by that. 
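+            # (row n of the cumulative sum has variance ~ n, so dividing by
+            # sqrt(n) below keeps every embedding row at unit scale)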
+ weight = weight / torch.arange(1, num_embeddings + 1).to(weight).sqrt()[:, None] + self.embedding.weight.data[:] = weight + self.embedding.weight.data /= scale + self.scale = scale + + @property + def weight(self): + return self.embedding.weight * self.scale + + def forward(self, x): + out = self.embedding(x) * self.scale + return out + + +class HEncLayer(nn.Module): + def __init__(self, chin, chout, kernel_size=8, stride=4, norm_groups=1, empty=False, + freq=True, dconv=True, norm=True, context=0, dconv_kw={}, pad=True, + rewrite=True): + """Encoder layer. This used both by the time and the frequency branch. + + Args: + chin: number of input channels. + chout: number of output channels. + norm_groups: number of groups for group norm. + empty: used to make a layer with just the first conv. this is used + before merging the time and freq. branches. + freq: this is acting on frequencies. + dconv: insert DConv residual branches. + norm: use GroupNorm. + context: context size for the 1x1 conv. + dconv_kw: list of kwargs for the DConv class. + pad: pad the input. Padding is done so that the output size is + always the input size / stride. + rewrite: add 1x1 conv at the end of the layer. + """ + super().__init__() + norm_fn = lambda d: nn.Identity() # noqa + if norm: + norm_fn = lambda d: nn.GroupNorm(norm_groups, d) # noqa + if pad: + pad = kernel_size // 4 + else: + pad = 0 + klass = nn.Conv1d + self.freq = freq + self.kernel_size = kernel_size + self.stride = stride + self.empty = empty + self.norm = norm + self.pad = pad + if freq: + kernel_size = [kernel_size, 1] + stride = [stride, 1] + pad = [pad, 0] + klass = nn.Conv2d + self.conv = klass(chin, chout, kernel_size, stride, pad) + if self.empty: + return + self.norm1 = norm_fn(chout) + self.rewrite = None + if rewrite: + self.rewrite = klass(chout, 2 * chout, 1 + 2 * context, 1, context) + self.norm2 = norm_fn(2 * chout) + + self.dconv = None + if dconv: + self.dconv = DConv(chout, **dconv_kw) + + def forward(self, x, inject=None): + """ + `inject` is used to inject the result from the time branch into the frequency branch, + when both have the same stride. + """ + if not self.freq and x.dim() == 4: + B, C, Fr, T = x.shape + x = x.view(B, -1, T) + + if not self.freq: + le = x.shape[-1] + if not le % self.stride == 0: + x = F.pad(x, (0, self.stride - (le % self.stride))) + y = self.conv(x) + if self.empty: + return y + if inject is not None: + assert inject.shape[-1] == y.shape[-1], (inject.shape, y.shape) + if inject.dim() == 3 and y.dim() == 4: + inject = inject[:, :, None] + y = y + inject + y = F.gelu(self.norm1(y)) + if self.dconv: + if self.freq: + B, C, Fr, T = y.shape + y = y.permute(0, 2, 1, 3).reshape(-1, C, T) + y = self.dconv(y) + if self.freq: + y = y.view(B, Fr, C, T).permute(0, 2, 1, 3) + if self.rewrite: + z = self.norm2(self.rewrite(y)) + z = F.glu(z, dim=1) + else: + z = y + return z + + +class MultiWrap(nn.Module): + """ + Takes one layer and replicate it N times. each replica will act + on a frequency band. All is done so that if the N replica have the same weights, + then this is exactly equivalent to applying the original module on all frequencies. + + This is a bit over-engineered to avoid edge artifacts when splitting + the frequency bands, but it is possible the naive implementation would work as well... + """ + def __init__(self, layer, split_ratios): + """ + Args: + layer: module to clone, must be either HEncLayer or HDecLayer. + split_ratios: list of float indicating which ratio to keep for each band. 
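+                For instance, `split_ratios=[0.5]` creates two replicas of `layer`:
+                one acting on the lower half of the frequency bins and one on the
+                upper half (a trailing ratio of 1 is appended internally).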
+ """ + super().__init__() + self.split_ratios = split_ratios + self.layers = nn.ModuleList() + self.conv = isinstance(layer, HEncLayer) + assert not layer.norm + assert layer.freq + assert layer.pad + if not self.conv: + assert not layer.context_freq + for k in range(len(split_ratios) + 1): + lay = deepcopy(layer) + if self.conv: + lay.conv.padding = (0, 0) + else: + lay.pad = False + for m in lay.modules(): + if hasattr(m, 'reset_parameters'): + m.reset_parameters() + self.layers.append(lay) + + def forward(self, x, skip=None, length=None): + B, C, Fr, T = x.shape + + ratios = list(self.split_ratios) + [1] + start = 0 + outs = [] + for ratio, layer in zip(ratios, self.layers): + if self.conv: + pad = layer.kernel_size // 4 + if ratio == 1: + limit = Fr + frames = -1 + else: + limit = int(round(Fr * ratio)) + le = limit - start + if start == 0: + le += pad + frames = round((le - layer.kernel_size) / layer.stride + 1) + limit = start + (frames - 1) * layer.stride + layer.kernel_size + if start == 0: + limit -= pad + assert limit - start > 0, (limit, start) + assert limit <= Fr, (limit, Fr) + y = x[:, :, start:limit, :] + if start == 0: + y = F.pad(y, (0, 0, pad, 0)) + if ratio == 1: + y = F.pad(y, (0, 0, 0, pad)) + outs.append(layer(y)) + start = limit - layer.kernel_size + layer.stride + else: + if ratio == 1: + limit = Fr + else: + limit = int(round(Fr * ratio)) + last = layer.last + layer.last = True + + y = x[:, :, start:limit] + s = skip[:, :, start:limit] + out, _ = layer(y, s, None) + if outs: + outs[-1][:, :, -layer.stride:] += ( + out[:, :, :layer.stride] - layer.conv_tr.bias.view(1, -1, 1, 1)) + out = out[:, :, layer.stride:] + if ratio == 1: + out = out[:, :, :-layer.stride // 2, :] + if start == 0: + out = out[:, :, layer.stride // 2:, :] + outs.append(out) + layer.last = last + start = limit + out = torch.cat(outs, dim=2) + if not self.conv and not last: + out = F.gelu(out) + if self.conv: + return out + else: + return out, None + + +class HDecLayer(nn.Module): + def __init__(self, chin, chout, last=False, kernel_size=8, stride=4, norm_groups=1, empty=False, + freq=True, dconv=True, norm=True, context=1, dconv_kw={}, pad=True, + context_freq=True, rewrite=True): + """ + Same as HEncLayer but for decoder. See `HEncLayer` for documentation. 
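+        The extra `context_freq` flag controls the 1x1 rewrite convolution: when
+        False, its context window extends only along the time axis, not the
+        frequency axis (required by `MultiWrap`, which splits the frequency bands).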
+        """
+        super().__init__()
+        norm_fn = lambda d: nn.Identity()  # noqa
+        if norm:
+            norm_fn = lambda d: nn.GroupNorm(norm_groups, d)  # noqa
+        if pad:
+            pad = kernel_size // 4
+        else:
+            pad = 0
+        self.pad = pad
+        self.last = last
+        self.freq = freq
+        self.chin = chin
+        self.empty = empty
+        self.stride = stride
+        self.kernel_size = kernel_size
+        self.norm = norm
+        self.context_freq = context_freq
+        klass = nn.Conv1d
+        klass_tr = nn.ConvTranspose1d
+        if freq:
+            kernel_size = [kernel_size, 1]
+            stride = [stride, 1]
+            klass = nn.Conv2d
+            klass_tr = nn.ConvTranspose2d
+        self.conv_tr = klass_tr(chin, chout, kernel_size, stride)
+        self.norm2 = norm_fn(chout)
+        if self.empty:
+            return
+        self.rewrite = None
+        if rewrite:
+            if context_freq:
+                self.rewrite = klass(chin, 2 * chin, 1 + 2 * context, 1, context)
+            else:
+                self.rewrite = klass(chin, 2 * chin, [1, 1 + 2 * context], 1,
+                                     [0, context])
+            self.norm1 = norm_fn(2 * chin)
+
+        self.dconv = None
+        if dconv:
+            self.dconv = DConv(chin, **dconv_kw)
+
+    def forward(self, x, skip, length):
+        if self.freq and x.dim() == 3:
+            B, C, T = x.shape
+            x = x.view(B, self.chin, -1, T)
+
+        if not self.empty:
+            x = x + skip
+
+            if self.rewrite:
+                y = F.glu(self.norm1(self.rewrite(x)), dim=1)
+            else:
+                y = x
+            if self.dconv:
+                if self.freq:
+                    B, C, Fr, T = y.shape
+                    y = y.permute(0, 2, 1, 3).reshape(-1, C, T)
+                y = self.dconv(y)
+                if self.freq:
+                    y = y.view(B, Fr, C, T).permute(0, 2, 1, 3)
+        else:
+            y = x
+            assert skip is None
+        z = self.norm2(self.conv_tr(y))
+        if self.freq:
+            if self.pad:
+                z = z[..., self.pad:-self.pad, :]
+        else:
+            z = z[..., self.pad:self.pad + length]
+            assert z.shape[-1] == length, (z.shape[-1], length)
+        if not self.last:
+            z = F.gelu(z)
+        return z, y
+
+
+class HDemucs(nn.Module):
+    """
+    Spectrogram and hybrid Demucs model.
+    The spectrogram model has the same structure as Demucs, except the first few layers are over the
+    frequency axis, until there is only 1 frequency, and then it moves to time convolutions.
+    Frequency layers can still access information across time steps thanks to the DConv residual.
+
+    Hybrid models have a parallel time branch. At some layer, the time branch has the same stride
+    as the frequency branch and then the two are combined. The opposite happens in the decoder.
+
+    Models can either use naive iSTFT from masking, Wiener filtering ([Uhlich et al. 2017]),
+    or complex-as-channels (CaC) [Choi et al. 2020]. Wiener filtering is based on
+    the Open Unmix implementation [Stoter et al. 2019].
+
+    The loss is always in the temporal domain, obtained by backpropagating through the above
+    output methods and the iSTFT. This makes it easy to define hybrid models. However, it slightly
+    breaks Wiener filtering, as doing more iterations at test time will change the spectrogram
+    contribution without changing the one from the waveform, which leads to worse performance.
+    I tried using the residual option in the OpenUnmix Wiener implementation, but it didn't improve.
+    CaC, on the other hand, provides similar performance and works naturally with
+    hybrid models.
+
+    This model also uses frequency embeddings to improve the efficiency of convolutions
+    over the freq. axis, following [Isik et al. 2020] (https://arxiv.org/pdf/2008.04470.pdf).
+
+    Unlike classic Demucs, there is no resampling here, and normalization is always applied.
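+
+    A minimal usage sketch (the shapes below are an illustration, not part of
+    the original documentation):
+
+        >>> model = HDemucs(sources=["drums", "bass", "other", "vocals"])
+        >>> mix = torch.randn(1, 2, 10 * 44100)  # (batch, audio_channels, time)
+        >>> out = model(mix)                     # (batch, n_sources, audio_channels, time)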
+ """ + @capture_init + def __init__(self, + sources, + # Channels + audio_channels=2, + channels=48, + channels_time=None, + growth=2, + # STFT + nfft=4096, + wiener_iters=0, + end_iters=0, + wiener_residual=False, + cac=True, + # Main structure + depth=6, + rewrite=True, + hybrid=True, + hybrid_old=False, + # Frequency branch + multi_freqs=None, + multi_freqs_depth=2, + freq_emb=0.2, + emb_scale=10, + emb_smooth=True, + # Convolutions + kernel_size=8, + time_stride=2, + stride=4, + context=1, + context_enc=0, + # Normalization + norm_starts=4, + norm_groups=4, + # DConv residual branch + dconv_mode=1, + dconv_depth=2, + dconv_comp=4, + dconv_attn=4, + dconv_lstm=4, + dconv_init=1e-4, + # Weight init + rescale=0.1, + # Metadata + samplerate=44100, + segment=4 * 10): + """ + Args: + sources (list[str]): list of source names. + audio_channels (int): input/output audio channels. + channels (int): initial number of hidden channels. + channels_time: if not None, use a different `channels` value for the time branch. + growth: increase the number of hidden channels by this factor at each layer. + nfft: number of fft bins. Note that changing this require careful computation of + various shape parameters and will not work out of the box for hybrid models. + wiener_iters: when using Wiener filtering, number of iterations at test time. + end_iters: same but at train time. For a hybrid model, must be equal to `wiener_iters`. + wiener_residual: add residual source before wiener filtering. + cac: uses complex as channels, i.e. complex numbers are 2 channels each + in input and output. no further processing is done before ISTFT. + depth (int): number of layers in the encoder and in the decoder. + rewrite (bool): add 1x1 convolution to each layer. + hybrid (bool): make a hybrid time/frequency domain, otherwise frequency only. + hybrid_old: some models trained for MDX had a padding bug. This replicates + this bug to avoid retraining them. + multi_freqs: list of frequency ratios for splitting frequency bands with `MultiWrap`. + multi_freqs_depth: how many layers to wrap with `MultiWrap`. Only the outermost + layers will be wrapped. + freq_emb: add frequency embedding after the first frequency layer if > 0, + the actual value controls the weight of the embedding. + emb_scale: equivalent to scaling the embedding learning rate + emb_smooth: initialize the embedding with a smooth one (with respect to frequencies). + kernel_size: kernel_size for encoder and decoder layers. + stride: stride for encoder and decoder layers. + time_stride: stride for the final time layer, after the merge. + context: context for 1x1 conv in the decoder. + context_enc: context for 1x1 conv in the encoder. + norm_starts: layer at which group norm starts being used. + decoder layers are numbered in reverse order. + norm_groups: number of groups for group norm. + dconv_mode: if 1: dconv in encoder only, 2: decoder only, 3: both. + dconv_depth: depth of residual DConv branch. + dconv_comp: compression of DConv branch. + dconv_attn: adds attention layers in DConv branch starting at this layer. + dconv_lstm: adds a LSTM layer in DConv branch starting at this layer. + dconv_init: initial scale for the DConv branch LayerScale. 
+ rescale: weight recaling trick + + """ + super().__init__() + self.cac = cac + self.wiener_residual = wiener_residual + self.audio_channels = audio_channels + self.sources = sources + self.kernel_size = kernel_size + self.context = context + self.stride = stride + self.depth = depth + self.channels = channels + self.samplerate = samplerate + self.segment = segment + + self.nfft = nfft + self.hop_length = nfft // 4 + self.wiener_iters = wiener_iters + self.end_iters = end_iters + self.freq_emb = None + self.hybrid = hybrid + self.hybrid_old = hybrid_old + if hybrid_old: + assert hybrid, "hybrid_old must come with hybrid=True" + if hybrid: + assert wiener_iters == end_iters + + self.encoder = nn.ModuleList() + self.decoder = nn.ModuleList() + + if hybrid: + self.tencoder = nn.ModuleList() + self.tdecoder = nn.ModuleList() + + chin = audio_channels + chin_z = chin # number of channels for the freq branch + if self.cac: + chin_z *= 2 + chout = channels_time or channels + chout_z = channels + freqs = nfft // 2 + + for index in range(depth): + lstm = index >= dconv_lstm + attn = index >= dconv_attn + norm = index >= norm_starts + freq = freqs > 1 + stri = stride + ker = kernel_size + if not freq: + assert freqs == 1 + ker = time_stride * 2 + stri = time_stride + + pad = True + last_freq = False + if freq and freqs <= kernel_size: + ker = freqs + pad = False + last_freq = True + + kw = { + 'kernel_size': ker, + 'stride': stri, + 'freq': freq, + 'pad': pad, + 'norm': norm, + 'rewrite': rewrite, + 'norm_groups': norm_groups, + 'dconv_kw': { + 'lstm': lstm, + 'attn': attn, + 'depth': dconv_depth, + 'compress': dconv_comp, + 'init': dconv_init, + 'gelu': True, + } + } + kwt = dict(kw) + kwt['freq'] = 0 + kwt['kernel_size'] = kernel_size + kwt['stride'] = stride + kwt['pad'] = True + kw_dec = dict(kw) + multi = False + if multi_freqs and index < multi_freqs_depth: + multi = True + kw_dec['context_freq'] = False + + if last_freq: + chout_z = max(chout, chout_z) + chout = chout_z + + enc = HEncLayer(chin_z, chout_z, + dconv=dconv_mode & 1, context=context_enc, **kw) + if hybrid and freq: + tenc = HEncLayer(chin, chout, dconv=dconv_mode & 1, context=context_enc, + empty=last_freq, **kwt) + self.tencoder.append(tenc) + + if multi: + enc = MultiWrap(enc, multi_freqs) + self.encoder.append(enc) + if index == 0: + chin = self.audio_channels * len(self.sources) + chin_z = chin + if self.cac: + chin_z *= 2 + dec = HDecLayer(chout_z, chin_z, dconv=dconv_mode & 2, + last=index == 0, context=context, **kw_dec) + if multi: + dec = MultiWrap(dec, multi_freqs) + if hybrid and freq: + tdec = HDecLayer(chout, chin, dconv=dconv_mode & 2, empty=last_freq, + last=index == 0, context=context, **kwt) + self.tdecoder.insert(0, tdec) + self.decoder.insert(0, dec) + + chin = chout + chin_z = chout_z + chout = int(growth * chout) + chout_z = int(growth * chout_z) + if freq: + if freqs <= kernel_size: + freqs = 1 + else: + freqs //= stride + if index == 0 and freq_emb: + self.freq_emb = ScaledEmbedding( + freqs, chin_z, smooth=emb_smooth, scale=emb_scale) + self.freq_emb_scale = freq_emb + + if rescale: + rescale_module(self, reference=rescale) + + def _spec(self, x): + hl = self.hop_length + nfft = self.nfft + x0 = x # noqa + + if self.hybrid: + # We re-pad the signal in order to keep the property + # that the size of the output is exactly the size of the input + # divided by the stride (here hop_length), when divisible. + # This is achieved by padding by 1/4th of the kernel size (here nfft). 
+ # which is not supported by torch.stft. + # Having all convolution operations follow this convention allow to easily + # align the time and frequency branches later on. + assert hl == nfft // 4 + le = int(math.ceil(x.shape[-1] / hl)) + pad = hl // 2 * 3 + if not self.hybrid_old: + x = pad1d(x, (pad, pad + le * hl - x.shape[-1]), mode='reflect') + else: + x = pad1d(x, (pad, pad + le * hl - x.shape[-1])) + + z = spectro(x, nfft, hl)[..., :-1, :] + if self.hybrid: + assert z.shape[-1] == le + 4, (z.shape, x.shape, le) + z = z[..., 2:2+le] + return z + + def _ispec(self, z, length=None, scale=0): + hl = self.hop_length // (4 ** scale) + z = F.pad(z, (0, 0, 0, 1)) + if self.hybrid: + z = F.pad(z, (2, 2)) + pad = hl // 2 * 3 + if not self.hybrid_old: + le = hl * int(math.ceil(length / hl)) + 2 * pad + else: + le = hl * int(math.ceil(length / hl)) + x = ispectro(z, hl, length=le) + if not self.hybrid_old: + x = x[..., pad:pad + length] + else: + x = x[..., :length] + else: + x = ispectro(z, hl, length) + return x + + def _magnitude(self, z): + # return the magnitude of the spectrogram, except when cac is True, + # in which case we just move the complex dimension to the channel one. + if self.cac: + B, C, Fr, T = z.shape + m = torch.view_as_real(z).permute(0, 1, 4, 2, 3) + m = m.reshape(B, C * 2, Fr, T) + else: + m = z.abs() + return m + + def _mask(self, z, m): + # Apply masking given the mixture spectrogram `z` and the estimated mask `m`. + # If `cac` is True, `m` is actually a full spectrogram and `z` is ignored. + niters = self.wiener_iters + if self.cac: + B, S, C, Fr, T = m.shape + out = m.view(B, S, -1, 2, Fr, T).permute(0, 1, 2, 4, 5, 3) + out = torch.view_as_complex(out.contiguous()) + return out + if self.training: + niters = self.end_iters + if niters < 0: + z = z[:, None] + return z / (1e-8 + z.abs()) * m + else: + return self._wiener(m, z, niters) + + def _wiener(self, mag_out, mix_stft, niters): + # apply wiener filtering from OpenUnmix. + init = mix_stft.dtype + wiener_win_len = 300 + residual = self.wiener_residual + + B, S, C, Fq, T = mag_out.shape + mag_out = mag_out.permute(0, 4, 3, 2, 1) + mix_stft = torch.view_as_real(mix_stft.permute(0, 3, 2, 1)) + + outs = [] + for sample in range(B): + pos = 0 + out = [] + for pos in range(0, T, wiener_win_len): + frame = slice(pos, pos + wiener_win_len) + z_out = wiener( + mag_out[sample, frame], mix_stft[sample, frame], niters, + residual=residual) + out.append(z_out.transpose(-1, -2)) + outs.append(torch.cat(out, dim=0)) + out = torch.view_as_complex(torch.stack(outs, 0)) + out = out.permute(0, 4, 3, 2, 1).contiguous() + if residual: + out = out[:, :-1] + assert list(out.shape) == [B, S, C, Fq, T] + return out.to(init) + + def forward(self, mix): + x = mix + length = x.shape[-1] + + z = self._spec(mix) + mag = self._magnitude(z) + x = mag + + B, C, Fq, T = x.shape + + # unlike previous Demucs, we always normalize because it is easier. + mean = x.mean(dim=(1, 2, 3), keepdim=True) + std = x.std(dim=(1, 2, 3), keepdim=True) + x = (x - mean) / (1e-5 + std) + # x will be the freq. branch input. + + if self.hybrid: + # Prepare the time branch input. + xt = mix + meant = xt.mean(dim=(1, 2), keepdim=True) + stdt = xt.std(dim=(1, 2), keepdim=True) + xt = (xt - meant) / (1e-5 + stdt) + + # okay, this is a giant mess I know... + saved = [] # skip connections, freq. + saved_t = [] # skip connections, time. + lengths = [] # saved lengths to properly remove padding, freq branch. + lengths_t = [] # saved lengths for time branch. 
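+        # Walk down the U-Net: the time branch is encoded in parallel until its
+        # stride matches the frequency branch; its final (empty) encoder layer
+        # only applies a first conv, whose output is injected into the freq. branch.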
+ for idx, encode in enumerate(self.encoder): + lengths.append(x.shape[-1]) + inject = None + if self.hybrid and idx < len(self.tencoder): + # we have not yet merged branches. + lengths_t.append(xt.shape[-1]) + tenc = self.tencoder[idx] + xt = tenc(xt) + if not tenc.empty: + # save for skip connection + saved_t.append(xt) + else: + # tenc contains just the first conv., so that now time and freq. + # branches have the same shape and can be merged. + inject = xt + x = encode(x, inject) + if idx == 0 and self.freq_emb is not None: + # add frequency embedding to allow for non equivariant convolutions + # over the frequency axis. + frs = torch.arange(x.shape[-2], device=x.device) + emb = self.freq_emb(frs).t()[None, :, :, None].expand_as(x) + x = x + self.freq_emb_scale * emb + + saved.append(x) + + x = torch.zeros_like(x) + if self.hybrid: + xt = torch.zeros_like(x) + # initialize everything to zero (signal will go through u-net skips). + + for idx, decode in enumerate(self.decoder): + skip = saved.pop(-1) + x, pre = decode(x, skip, lengths.pop(-1)) + # `pre` contains the output just before final transposed convolution, + # which is used when the freq. and time branch separate. + + if self.hybrid: + offset = self.depth - len(self.tdecoder) + if self.hybrid and idx >= offset: + tdec = self.tdecoder[idx - offset] + length_t = lengths_t.pop(-1) + if tdec.empty: + assert pre.shape[2] == 1, pre.shape + pre = pre[:, :, 0] + xt, _ = tdec(pre, None, length_t) + else: + skip = saved_t.pop(-1) + xt, _ = tdec(xt, skip, length_t) + + # Let's make sure we used all stored skip connections. + assert len(saved) == 0 + assert len(lengths_t) == 0 + assert len(saved_t) == 0 + + S = len(self.sources) + x = x.view(B, S, -1, Fq, T) + x = x * std[:, None] + mean[:, None] + + zout = self._mask(z, x) + x = self._ispec(zout, length) + + if self.hybrid: + xt = xt.view(B, S, -1, length) + xt = xt * stdt[:, None] + meant[:, None] + x = xt + x + return x diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/htdemucs.py b/AutoCoverTool/ref/music_remover/demucs/demucs/htdemucs.py new file mode 100644 index 0000000..adc3713 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/htdemucs.py @@ -0,0 +1,648 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +# First author is Simon Rouard. +""" +This code contains the spectrogram and Hybrid version of Demucs. +""" +import math + +from openunmix.filtering import wiener +import torch +from torch import nn +from torch.nn import functional as F +from fractions import Fraction +from einops import rearrange + +from .transformer import CrossTransformerEncoder + +from .demucs import rescale_module +from .states import capture_init +from .spec import spectro, ispectro +from .hdemucs import pad1d, ScaledEmbedding, HEncLayer, MultiWrap, HDecLayer + + +class HTDemucs(nn.Module): + """ + Spectrogram and hybrid Demucs model. + The spectrogram model has the same structure as Demucs, except the first few layers are over the + frequency axis, until there is only 1 frequency, and then it moves to time convolutions. + Frequency layers can still access information across time steps thanks to the DConv residual. + + Hybrid model have a parallel time branch. At some layer, the time branch has the same stride + as the frequency branch and then the two are combined. The opposite happens in the decoder. 
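+
+    Compared to HDemucs, a cross-domain Transformer (`CrossTransformerEncoder`)
+    is applied at the bottleneck, letting the time and frequency branches
+    exchange information before decoding.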
+ + Models can either use naive iSTFT from masking, Wiener filtering ([Ulhih et al. 2017]), + or complex as channels (CaC) [Choi et al. 2020]. Wiener filtering is based on + Open Unmix implementation [Stoter et al. 2019]. + + The loss is always on the temporal domain, by backpropagating through the above + output methods and iSTFT. This allows to define hybrid models nicely. However, this breaks + a bit Wiener filtering, as doing more iteration at test time will change the spectrogram + contribution, without changing the one from the waveform, which will lead to worse performance. + I tried using the residual option in OpenUnmix Wiener implementation, but it didn't improve. + CaC on the other hand provides similar performance for hybrid, and works naturally with + hybrid models. + + This model also uses frequency embeddings are used to improve efficiency on convolutions + over the freq. axis, following [Isik et al. 2020] (https://arxiv.org/pdf/2008.04470.pdf). + + Unlike classic Demucs, there is no resampling here, and normalization is always applied. + """ + + @capture_init + def __init__( + self, + sources, + # Channels + audio_channels=2, + channels=48, + channels_time=None, + growth=2, + # STFT + nfft=4096, + wiener_iters=0, + end_iters=0, + wiener_residual=False, + cac=True, + # Main structure + depth=4, + rewrite=True, + # Frequency branch + multi_freqs=None, + multi_freqs_depth=3, + freq_emb=0.2, + emb_scale=10, + emb_smooth=True, + # Convolutions + kernel_size=8, + time_stride=2, + stride=4, + context=1, + context_enc=0, + # Normalization + norm_starts=4, + norm_groups=4, + # DConv residual branch + dconv_mode=1, + dconv_depth=2, + dconv_comp=8, + dconv_init=1e-3, + # Before the Transformer + bottom_channels=0, + # Transformer + t_layers=5, + t_emb="sin", + t_hidden_scale=4.0, + t_heads=8, + t_dropout=0.0, + t_max_positions=10000, + t_norm_in=True, + t_norm_in_group=False, + t_group_norm=False, + t_norm_first=True, + t_norm_out=True, + t_max_period=10000.0, + t_weight_decay=0.0, + t_lr=None, + t_layer_scale=True, + t_gelu=True, + t_weight_pos_embed=1.0, + t_sin_random_shift=0, + t_cape_mean_normalize=True, + t_cape_augment=True, + t_cape_glob_loc_scale=[5000.0, 1.0, 1.4], + t_sparse_self_attn=False, + t_sparse_cross_attn=False, + t_mask_type="diag", + t_mask_random_seed=42, + t_sparse_attn_window=500, + t_global_window=100, + t_sparsity=0.95, + t_auto_sparsity=False, + # ------ Particuliar parameters + t_cross_first=False, + # Weight init + rescale=0.1, + # Metadata + samplerate=44100, + segment=10, + use_train_segment=True, + ): + """ + Args: + sources (list[str]): list of source names. + audio_channels (int): input/output audio channels. + channels (int): initial number of hidden channels. + channels_time: if not None, use a different `channels` value for the time branch. + growth: increase the number of hidden channels by this factor at each layer. + nfft: number of fft bins. Note that changing this require careful computation of + various shape parameters and will not work out of the box for hybrid models. + wiener_iters: when using Wiener filtering, number of iterations at test time. + end_iters: same but at train time. For a hybrid model, must be equal to `wiener_iters`. + wiener_residual: add residual source before wiener filtering. + cac: uses complex as channels, i.e. complex numbers are 2 channels each + in input and output. no further processing is done before ISTFT. + depth (int): number of layers in the encoder and in the decoder. 
+ rewrite (bool): add 1x1 convolution to each layer. + multi_freqs: list of frequency ratios for splitting frequency bands with `MultiWrap`. + multi_freqs_depth: how many layers to wrap with `MultiWrap`. Only the outermost + layers will be wrapped. + freq_emb: add frequency embedding after the first frequency layer if > 0, + the actual value controls the weight of the embedding. + emb_scale: equivalent to scaling the embedding learning rate + emb_smooth: initialize the embedding with a smooth one (with respect to frequencies). + kernel_size: kernel_size for encoder and decoder layers. + stride: stride for encoder and decoder layers. + time_stride: stride for the final time layer, after the merge. + context: context for 1x1 conv in the decoder. + context_enc: context for 1x1 conv in the encoder. + norm_starts: layer at which group norm starts being used. + decoder layers are numbered in reverse order. + norm_groups: number of groups for group norm. + dconv_mode: if 1: dconv in encoder only, 2: decoder only, 3: both. + dconv_depth: depth of residual DConv branch. + dconv_comp: compression of DConv branch. + dconv_attn: adds attention layers in DConv branch starting at this layer. + dconv_lstm: adds a LSTM layer in DConv branch starting at this layer. + dconv_init: initial scale for the DConv branch LayerScale. + bottom_channels: if >0 it adds a linear layer (1x1 Conv) before and after the + transformer in order to change the number of channels + t_layers: number of layers in each branch (waveform and spec) of the transformer + t_emb: "sin", "cape" or "scaled" + t_hidden_scale: the hidden scale of the Feedforward parts of the transformer + for instance if C = 384 (the number of channels in the transformer) and + t_hidden_scale = 4.0 then the intermediate layer of the FFN has dimension + 384 * 4 = 1536 + t_heads: number of heads for the transformer + t_dropout: dropout in the transformer + t_max_positions: max_positions for the "scaled" positional embedding, only + useful if t_emb="scaled" + t_norm_in: (bool) norm before addinf positional embedding and getting into the + transformer layers + t_norm_in_group: (bool) if True while t_norm_in=True, the norm is on all the + timesteps (GroupNorm with group=1) + t_group_norm: (bool) if True, the norms of the Encoder Layers are on all the + timesteps (GroupNorm with group=1) + t_norm_first: (bool) if True the norm is before the attention and before the FFN + t_norm_out: (bool) if True, there is a GroupNorm (group=1) at the end of each layer + t_max_period: (float) denominator in the sinusoidal embedding expression + t_weight_decay: (float) weight decay for the transformer + t_lr: (float) specific learning rate for the transformer + t_layer_scale: (bool) Layer Scale for the transformer + t_gelu: (bool) activations of the transformer are GeLU if True, ReLU else + t_weight_pos_embed: (float) weighting of the positional embedding + t_cape_mean_normalize: (bool) if t_emb="cape", normalisation of positional embeddings + see: https://arxiv.org/abs/2106.03143 + t_cape_augment: (bool) if t_emb="cape", must be True during training and False + during the inference, see: https://arxiv.org/abs/2106.03143 + t_cape_glob_loc_scale: (list of 3 floats) if t_emb="cape", CAPE parameters + see: https://arxiv.org/abs/2106.03143 + t_sparse_self_attn: (bool) if True, the self attentions are sparse + t_sparse_cross_attn: (bool) if True, the cross-attentions are sparse (don't use it + unless you designed really specific masks) + t_mask_type: (str) can be "diag", "jmask", 
"random", "global" or any combination + with '_' between: i.e. "diag_jmask_random" (note that this is permutation + invariant i.e. "diag_jmask_random" is equivalent to "jmask_random_diag") + t_mask_random_seed: (int) if "random" is in t_mask_type, controls the seed + that generated the random part of the mask + t_sparse_attn_window: (int) if "diag" is in t_mask_type, for a query (i), and + a key (j), the mask is True id |i-j|<=t_sparse_attn_window + t_global_window: (int) if "global" is in t_mask_type, mask[:t_global_window, :] + and mask[:, :t_global_window] will be True + t_sparsity: (float) if "random" is in t_mask_type, t_sparsity is the sparsity + level of the random part of the mask. + t_cross_first: (bool) if True cross attention is the first layer of the + transformer (False seems to be better) + rescale: weight rescaling trick + use_train_segment: (bool) if True, the actual size that is used during the + training is used during inference. + """ + super().__init__() + self.cac = cac + self.wiener_residual = wiener_residual + self.audio_channels = audio_channels + self.sources = sources + self.kernel_size = kernel_size + self.context = context + self.stride = stride + self.depth = depth + self.bottom_channels = bottom_channels + self.channels = channels + self.samplerate = samplerate + self.segment = segment + self.use_train_segment = use_train_segment + self.nfft = nfft + self.hop_length = nfft // 4 + self.wiener_iters = wiener_iters + self.end_iters = end_iters + self.freq_emb = None + assert wiener_iters == end_iters + + self.encoder = nn.ModuleList() + self.decoder = nn.ModuleList() + + self.tencoder = nn.ModuleList() + self.tdecoder = nn.ModuleList() + + chin = audio_channels + chin_z = chin # number of channels for the freq branch + if self.cac: + chin_z *= 2 + chout = channels_time or channels + chout_z = channels + freqs = nfft // 2 + + for index in range(depth): + norm = index >= norm_starts + freq = freqs > 1 + stri = stride + ker = kernel_size + if not freq: + assert freqs == 1 + ker = time_stride * 2 + stri = time_stride + + pad = True + last_freq = False + if freq and freqs <= kernel_size: + ker = freqs + pad = False + last_freq = True + + kw = { + "kernel_size": ker, + "stride": stri, + "freq": freq, + "pad": pad, + "norm": norm, + "rewrite": rewrite, + "norm_groups": norm_groups, + "dconv_kw": { + "depth": dconv_depth, + "compress": dconv_comp, + "init": dconv_init, + "gelu": True, + }, + } + kwt = dict(kw) + kwt["freq"] = 0 + kwt["kernel_size"] = kernel_size + kwt["stride"] = stride + kwt["pad"] = True + kw_dec = dict(kw) + multi = False + if multi_freqs and index < multi_freqs_depth: + multi = True + kw_dec["context_freq"] = False + + if last_freq: + chout_z = max(chout, chout_z) + chout = chout_z + + enc = HEncLayer( + chin_z, chout_z, dconv=dconv_mode & 1, context=context_enc, **kw + ) + if freq: + tenc = HEncLayer( + chin, + chout, + dconv=dconv_mode & 1, + context=context_enc, + empty=last_freq, + **kwt + ) + self.tencoder.append(tenc) + + if multi: + enc = MultiWrap(enc, multi_freqs) + self.encoder.append(enc) + if index == 0: + chin = self.audio_channels * len(self.sources) + chin_z = chin + if self.cac: + chin_z *= 2 + dec = HDecLayer( + chout_z, + chin_z, + dconv=dconv_mode & 2, + last=index == 0, + context=context, + **kw_dec + ) + if multi: + dec = MultiWrap(dec, multi_freqs) + if freq: + tdec = HDecLayer( + chout, + chin, + dconv=dconv_mode & 2, + empty=last_freq, + last=index == 0, + context=context, + **kwt + ) + self.tdecoder.insert(0, tdec) + 
self.decoder.insert(0, dec) + + chin = chout + chin_z = chout_z + chout = int(growth * chout) + chout_z = int(growth * chout_z) + if freq: + if freqs <= kernel_size: + freqs = 1 + else: + freqs //= stride + if index == 0 and freq_emb: + self.freq_emb = ScaledEmbedding( + freqs, chin_z, smooth=emb_smooth, scale=emb_scale + ) + self.freq_emb_scale = freq_emb + + if rescale: + rescale_module(self, reference=rescale) + + transformer_channels = channels * growth ** (depth - 1) + if bottom_channels: + self.channel_upsampler = nn.Conv1d(transformer_channels, bottom_channels, 1) + self.channel_downsampler = nn.Conv1d( + bottom_channels, transformer_channels, 1 + ) + self.channel_upsampler_t = nn.Conv1d( + transformer_channels, bottom_channels, 1 + ) + self.channel_downsampler_t = nn.Conv1d( + bottom_channels, transformer_channels, 1 + ) + + transformer_channels = bottom_channels + + if t_layers > 0: + self.crosstransformer = CrossTransformerEncoder( + dim=transformer_channels, + emb=t_emb, + hidden_scale=t_hidden_scale, + num_heads=t_heads, + num_layers=t_layers, + cross_first=t_cross_first, + dropout=t_dropout, + max_positions=t_max_positions, + norm_in=t_norm_in, + norm_in_group=t_norm_in_group, + group_norm=t_group_norm, + norm_first=t_norm_first, + norm_out=t_norm_out, + max_period=t_max_period, + weight_decay=t_weight_decay, + lr=t_lr, + layer_scale=t_layer_scale, + gelu=t_gelu, + sin_random_shift=t_sin_random_shift, + weight_pos_embed=t_weight_pos_embed, + cape_mean_normalize=t_cape_mean_normalize, + cape_augment=t_cape_augment, + cape_glob_loc_scale=t_cape_glob_loc_scale, + sparse_self_attn=t_sparse_self_attn, + sparse_cross_attn=t_sparse_cross_attn, + mask_type=t_mask_type, + mask_random_seed=t_mask_random_seed, + sparse_attn_window=t_sparse_attn_window, + global_window=t_global_window, + sparsity=t_sparsity, + auto_sparsity=t_auto_sparsity, + ) + else: + self.crosstransformer = None + + def _spec(self, x): + hl = self.hop_length + nfft = self.nfft + x0 = x # noqa + + # We re-pad the signal in order to keep the property + # that the size of the output is exactly the size of the input + # divided by the stride (here hop_length), when divisible. + # This is achieved by padding by 1/4th of the kernel size (here nfft). + # which is not supported by torch.stft. + # Having all convolution operations follow this convention allow to easily + # align the time and frequency branches later on. + assert hl == nfft // 4 + le = int(math.ceil(x.shape[-1] / hl)) + pad = hl // 2 * 3 + x = pad1d(x, (pad, pad + le * hl - x.shape[-1]), mode="reflect") + + z = spectro(x, nfft, hl)[..., :-1, :] + assert z.shape[-1] == le + 4, (z.shape, x.shape, le) + z = z[..., 2: 2 + le] + return z + + def _ispec(self, z, length=None, scale=0): + hl = self.hop_length // (4**scale) + z = F.pad(z, (0, 0, 0, 1)) + z = F.pad(z, (2, 2)) + pad = hl // 2 * 3 + le = hl * int(math.ceil(length / hl)) + 2 * pad + x = ispectro(z, hl, length=le) + x = x[..., pad: pad + length] + return x + + def _magnitude(self, z): + # return the magnitude of the spectrogram, except when cac is True, + # in which case we just move the complex dimension to the channel one. + if self.cac: + B, C, Fr, T = z.shape + m = torch.view_as_real(z).permute(0, 1, 4, 2, 3) + m = m.reshape(B, C * 2, Fr, T) + else: + m = z.abs() + return m + + def _mask(self, z, m): + # Apply masking given the mixture spectrogram `z` and the estimated mask `m`. + # If `cac` is True, `m` is actually a full spectrogram and `z` is ignored. 
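+        # With CaC the network predicts the complex spectrogram directly, so the
+        # doubled channel dimension is simply folded back into (real, imag) pairs.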
+ niters = self.wiener_iters + if self.cac: + B, S, C, Fr, T = m.shape + out = m.view(B, S, -1, 2, Fr, T).permute(0, 1, 2, 4, 5, 3) + out = torch.view_as_complex(out.contiguous()) + return out + if self.training: + niters = self.end_iters + if niters < 0: + z = z[:, None] + return z / (1e-8 + z.abs()) * m + else: + return self._wiener(m, z, niters) + + def _wiener(self, mag_out, mix_stft, niters): + # apply wiener filtering from OpenUnmix. + init = mix_stft.dtype + wiener_win_len = 300 + residual = self.wiener_residual + + B, S, C, Fq, T = mag_out.shape + mag_out = mag_out.permute(0, 4, 3, 2, 1) + mix_stft = torch.view_as_real(mix_stft.permute(0, 3, 2, 1)) + + outs = [] + for sample in range(B): + pos = 0 + out = [] + for pos in range(0, T, wiener_win_len): + frame = slice(pos, pos + wiener_win_len) + z_out = wiener( + mag_out[sample, frame], + mix_stft[sample, frame], + niters, + residual=residual, + ) + out.append(z_out.transpose(-1, -2)) + outs.append(torch.cat(out, dim=0)) + out = torch.view_as_complex(torch.stack(outs, 0)) + out = out.permute(0, 4, 3, 2, 1).contiguous() + if residual: + out = out[:, :-1] + assert list(out.shape) == [B, S, C, Fq, T] + return out.to(init) + + def valid_length(self, length: int): + """ + Return a length that is appropriate for evaluation. + In our case, always return the training length, unless + it is smaller than the given length, in which case this + raises an error. + """ + if not self.use_train_segment: + return length + training_length = int(self.segment * self.samplerate) + if training_length < length: + raise ValueError( + f"Given length {length} is longer than " + f"training length {training_length}") + return training_length + + def forward(self, mix): + length = mix.shape[-1] + length_pre_pad = None + if self.use_train_segment: + if self.training: + self.segment = Fraction(mix.shape[-1], self.samplerate) + else: + training_length = int(self.segment * self.samplerate) + if mix.shape[-1] < training_length: + length_pre_pad = mix.shape[-1] + mix = F.pad(mix, (0, training_length - length_pre_pad)) + z = self._spec(mix) + mag = self._magnitude(z) + x = mag + + B, C, Fq, T = x.shape + + # unlike previous Demucs, we always normalize because it is easier. + mean = x.mean(dim=(1, 2, 3), keepdim=True) + std = x.std(dim=(1, 2, 3), keepdim=True) + x = (x - mean) / (1e-5 + std) + # x will be the freq. branch input. + + # Prepare the time branch input. + xt = mix + meant = xt.mean(dim=(1, 2), keepdim=True) + stdt = xt.std(dim=(1, 2), keepdim=True) + xt = (xt - meant) / (1e-5 + stdt) + + # okay, this is a giant mess I know... + saved = [] # skip connections, freq. + saved_t = [] # skip connections, time. + lengths = [] # saved lengths to properly remove padding, freq branch. + lengths_t = [] # saved lengths for time branch. + for idx, encode in enumerate(self.encoder): + lengths.append(x.shape[-1]) + inject = None + if idx < len(self.tencoder): + # we have not yet merged branches. + lengths_t.append(xt.shape[-1]) + tenc = self.tencoder[idx] + xt = tenc(xt) + if not tenc.empty: + # save for skip connection + saved_t.append(xt) + else: + # tenc contains just the first conv., so that now time and freq. + # branches have the same shape and can be merged. + inject = xt + x = encode(x, inject) + if idx == 0 and self.freq_emb is not None: + # add frequency embedding to allow for non equivariant convolutions + # over the frequency axis. 
+ frs = torch.arange(x.shape[-2], device=x.device) + emb = self.freq_emb(frs).t()[None, :, :, None].expand_as(x) + x = x + self.freq_emb_scale * emb + + saved.append(x) + if self.crosstransformer: + if self.bottom_channels: + b, c, f, t = x.shape + x = rearrange(x, "b c f t-> b c (f t)") + x = self.channel_upsampler(x) + x = rearrange(x, "b c (f t)-> b c f t", f=f) + xt = self.channel_upsampler_t(xt) + + x, xt = self.crosstransformer(x, xt) + + if self.bottom_channels: + x = rearrange(x, "b c f t-> b c (f t)") + x = self.channel_downsampler(x) + x = rearrange(x, "b c (f t)-> b c f t", f=f) + xt = self.channel_downsampler_t(xt) + + for idx, decode in enumerate(self.decoder): + skip = saved.pop(-1) + x, pre = decode(x, skip, lengths.pop(-1)) + # `pre` contains the output just before final transposed convolution, + # which is used when the freq. and time branch separate. + + offset = self.depth - len(self.tdecoder) + if idx >= offset: + tdec = self.tdecoder[idx - offset] + length_t = lengths_t.pop(-1) + if tdec.empty: + assert pre.shape[2] == 1, pre.shape + pre = pre[:, :, 0] + xt, _ = tdec(pre, None, length_t) + else: + skip = saved_t.pop(-1) + xt, _ = tdec(xt, skip, length_t) + + # Let's make sure we used all stored skip connections. + assert len(saved) == 0 + assert len(lengths_t) == 0 + assert len(saved_t) == 0 + + S = len(self.sources) + x = x.view(B, S, -1, Fq, T) + x = x * std[:, None] + mean[:, None] + + zout = self._mask(z, x) + if self.use_train_segment: + if self.training: + x = self._ispec(zout, length) + else: + x = self._ispec(zout, training_length) + else: + x = self._ispec(zout, length) + + if self.use_train_segment: + if self.training: + xt = xt.view(B, S, -1, length) + else: + xt = xt.view(B, S, -1, training_length) + else: + xt = xt.view(B, S, -1, length) + xt = xt * stdt[:, None] + meant[:, None] + x = xt + x + if length_pre_pad: + x = x[..., :length_pre_pad] + return x diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/pretrained.py b/AutoCoverTool/ref/music_remover/demucs/demucs/pretrained.py new file mode 100644 index 0000000..bb0ab00 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/pretrained.py @@ -0,0 +1,82 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +"""Loading pretrained models. +""" + +import logging +from pathlib import Path +import typing as tp + +from dora.log import fatal + +from .hdemucs import HDemucs +from .repo import RemoteRepo, LocalRepo, ModelOnlyRepo, BagOnlyRepo, AnyModelRepo, ModelLoadingError # noqa + +logger = logging.getLogger(__name__) +ROOT_URL = "https://dl.fbaipublicfiles.com/demucs/" +REMOTE_ROOT = Path(__file__).parent / 'remote' + +SOURCES = ["drums", "bass", "other", "vocals"] + + +def demucs_unittest(): + model = HDemucs(channels=4, sources=SOURCES) + return model + + +def add_model_flags(parser): + group = parser.add_mutually_exclusive_group(required=False) + group.add_argument("-s", "--sig", help="Locally trained XP signature.") + group.add_argument("-n", "--name", default="mdx_extra_q", + help="Pretrained model name or signature. 
Default is mdx_extra_q.") + parser.add_argument("--repo", type=Path, + help="Folder containing all pre-trained models for use with -n.") + + +def _parse_remote_files(remote_file_list) -> tp.Dict[str, str]: + root: str = '' + models: tp.Dict[str, str] = {} + for line in remote_file_list.read_text().split('\n'): + line = line.strip() + if line.startswith('#'): + continue + elif line.startswith('root:'): + root = line.split(':', 1)[1].strip() + else: + sig = line.split('-', 1)[0] + assert sig not in models + models[sig] = ROOT_URL + root + line + return models + + +def get_model(name: str, + repo: tp.Optional[Path] = None): + """`name` must be a bag of models name or a pretrained signature + from the remote AWS model repo or the specified local repo if `repo` is not None. + """ + if name == 'demucs_unittest': + return demucs_unittest() + model_repo: ModelOnlyRepo + if repo is None: + models = _parse_remote_files(REMOTE_ROOT / 'files.txt') + model_repo = RemoteRepo(models) + bag_repo = BagOnlyRepo(REMOTE_ROOT, model_repo) + else: + if not repo.is_dir(): + fatal(f"{repo} must exist and be a directory.") + model_repo = LocalRepo(repo) + bag_repo = BagOnlyRepo(repo, model_repo) + any_repo = AnyModelRepo(model_repo, bag_repo) + model = any_repo.get_model(name) + model.eval() + return model + + +def get_model_from_args(args): + """ + Load local model package or pre-trained model. + """ + return get_model(name=args.name, repo=args.repo) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/py.typed b/AutoCoverTool/ref/music_remover/demucs/demucs/py.typed new file mode 100644 index 0000000..e69de29 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/files.txt b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/files.txt new file mode 100644 index 0000000..7cb7c1a --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/files.txt @@ -0,0 +1,30 @@ +# MDX Models +root: mdx_final/ +0d19c1c6-0f06f20e.th +5d2d6c55-db83574e.th +7d865c68-3d5dd56b.th +7ecf8ec1-70f50cc9.th +a1d90b5c-ae9d2452.th +c511e2ab-fe698775.th +cfa93e08-61801ae1.th +e51eebcc-c1b80bdd.th +6b9c2ca1-3fd82607.th +b72baf4e-8778635e.th +42e558d4-196e0e1b.th +305bc58f-18378783.th +14fc6a69-a89dd0ee.th +464b36d7-e5a9386e.th +7fd6ef75-a905dd85.th +83fc094f-4a16d450.th +1ef250f1-592467ce.th +902315c2-b39ce9c9.th +9a6b4851-03af0aa6.th +fa0cb7f9-100d8bf4.th +# Hybrid Transformer models +root: hybrid_transformer/ +955717e8-8726e21a.th +f7e0c4bc-ba3fe64a.th +d12395a8-e57c48e6.th +92cfc3b6-ef3bcb9c.th +04573f0d-f3cf25b2.th +75fc33f5-1941ce65.th \ No newline at end of file diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/hdemucs_mmi.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/hdemucs_mmi.yaml new file mode 100644 index 0000000..0ea0891 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/hdemucs_mmi.yaml @@ -0,0 +1,2 @@ +models: ['75fc33f5'] +segment: 44 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/htdemucs.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/htdemucs.yaml new file mode 100644 index 0000000..0d5f208 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/htdemucs.yaml @@ -0,0 +1 @@ +models: ['955717e8'] diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/htdemucs_ft.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/htdemucs_ft.yaml new file mode 100644 index 0000000..ba5c69c --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/htdemucs_ft.yaml @@ -0,0 +1,7 @@ 
+models: ['f7e0c4bc', 'd12395a8', '92cfc3b6', '04573f0d'] +weights: [ + [1., 0., 0., 0.], + [0., 1., 0., 0.], + [0., 0., 1., 0.], + [0., 0., 0., 1.], +] \ No newline at end of file diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx.yaml new file mode 100644 index 0000000..4e81a50 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx.yaml @@ -0,0 +1,8 @@ +models: ['0d19c1c6', '7ecf8ec1', 'c511e2ab', '7d865c68'] +weights: [ + [1., 1., 0., 0.], + [0., 1., 0., 0.], + [1., 0., 1., 1.], + [1., 0., 1., 1.], +] +segment: 44 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_extra.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_extra.yaml new file mode 100644 index 0000000..847bf66 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_extra.yaml @@ -0,0 +1,2 @@ +models: ['e51eebcc', 'a1d90b5c', '5d2d6c55', 'cfa93e08'] +segment: 44 \ No newline at end of file diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_extra_q.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_extra_q.yaml new file mode 100644 index 0000000..87702bc --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_extra_q.yaml @@ -0,0 +1,2 @@ +models: ['83fc094f', '464b36d7', '14fc6a69', '7fd6ef75'] +segment: 44 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_q.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_q.yaml new file mode 100644 index 0000000..827d2c6 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/mdx_q.yaml @@ -0,0 +1,8 @@ +models: ['6b9c2ca1', 'b72baf4e', '42e558d4', '305bc58f'] +weights: [ + [1., 1., 0., 0.], + [0., 1., 0., 0.], + [1., 0., 1., 1.], + [1., 0., 1., 1.], +] +segment: 44 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a.yaml new file mode 100644 index 0000000..691abc2 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a.yaml @@ -0,0 +1,2 @@ +models: ['9a6b4851', '1ef250f1', 'fa0cb7f9', '902315c2'] +segment: 44 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a_hybrid_only.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a_hybrid_only.yaml new file mode 100644 index 0000000..78eb8e0 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a_hybrid_only.yaml @@ -0,0 +1,2 @@ +models: ['fa0cb7f9', '902315c2', 'fa0cb7f9', '902315c2'] +segment: 44 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a_time_only.yaml b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a_time_only.yaml new file mode 100644 index 0000000..d5d16ea --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/remote/repro_mdx_a_time_only.yaml @@ -0,0 +1,2 @@ +models: ['9a6b4851', '9a6b4851', '1ef250f1', '1ef250f1'] +segment: 44 diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/repitch.py b/AutoCoverTool/ref/music_remover/demucs/demucs/repitch.py new file mode 100644 index 0000000..d23d2bc --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/repitch.py @@ -0,0 +1,86 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. 
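+# Editorial usage sketch (values mirror the defaults below; the external
+# `soundstretch` binary must be installed):
+#
+#   dataset = RepitchedWrapper(dataset, proba=0.2, max_pitch=2, vocals=[3])
+#   streams = dataset[0]  # occasionally pitch/tempo shifted, cropped to a common length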
+"""Utility for on the fly pitch/tempo change for data augmentation.""" + +import random +import subprocess as sp +import tempfile + +import torch +import torchaudio as ta + +from .audio import save_audio + + +class RepitchedWrapper: + """ + Wrap a dataset to apply online change of pitch / tempo. + """ + def __init__(self, dataset, proba=0.2, max_pitch=2, max_tempo=12, + tempo_std=5, vocals=[3], same=True): + self.dataset = dataset + self.proba = proba + self.max_pitch = max_pitch + self.max_tempo = max_tempo + self.tempo_std = tempo_std + self.same = same + self.vocals = vocals + + def __len__(self): + return len(self.dataset) + + def __getitem__(self, index): + streams = self.dataset[index] + in_length = streams.shape[-1] + out_length = int((1 - 0.01 * self.max_tempo) * in_length) + + if random.random() < self.proba: + outs = [] + for idx, stream in enumerate(streams): + if idx == 0 or not self.same: + delta_pitch = random.randint(-self.max_pitch, self.max_pitch) + delta_tempo = random.gauss(0, self.tempo_std) + delta_tempo = min(max(-self.max_tempo, delta_tempo), self.max_tempo) + stream = repitch( + stream, + delta_pitch, + delta_tempo, + voice=idx in self.vocals) + outs.append(stream[:, :out_length]) + streams = torch.stack(outs) + else: + streams = streams[..., :out_length] + return streams + + +def repitch(wav, pitch, tempo, voice=False, quick=False, samplerate=44100): + """ + tempo is a relative delta in percentage, so tempo=10 means tempo at 110%! + pitch is in semi tones. + Requires `soundstretch` to be installed, see + https://www.surina.net/soundtouch/soundstretch.html + """ + infile = tempfile.NamedTemporaryFile(suffix=".wav") + outfile = tempfile.NamedTemporaryFile(suffix=".wav") + save_audio(wav, infile.name, samplerate, clip='clamp') + command = [ + "soundstretch", + infile.name, + outfile.name, + f"-pitch={pitch}", + f"-tempo={tempo:.6f}", + ] + if quick: + command += ["-quick"] + if voice: + command += ["-speech"] + try: + sp.run(command, capture_output=True, check=True) + except sp.CalledProcessError as error: + raise RuntimeError(f"Could not change bpm because {error.stderr.decode('utf-8')}") + wav, sr = ta.load(outfile.name) + assert sr == samplerate + return wav diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/repo.py b/AutoCoverTool/ref/music_remover/demucs/demucs/repo.py new file mode 100644 index 0000000..a7645be --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/repo.py @@ -0,0 +1,148 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +"""Represents a model repository, including pre-trained models and bags of models. +A repo can either be the main remote repository stored in AWS, or a local repository +with your own models. 
+""" + +from hashlib import sha256 +from pathlib import Path +import typing as tp + +import torch +import yaml + +from .apply import BagOfModels, Model +from .states import load_model + + +AnyModel = tp.Union[Model, BagOfModels] + + +class ModelLoadingError(RuntimeError): + pass + + +def check_checksum(path: Path, checksum: str): + sha = sha256() + with open(path, 'rb') as file: + while True: + buf = file.read(2**20) + if not buf: + break + sha.update(buf) + actual_checksum = sha.hexdigest()[:len(checksum)] + if actual_checksum != checksum: + raise ModelLoadingError(f'Invalid checksum for file {path}, ' + f'expected {checksum} but got {actual_checksum}') + + +class ModelOnlyRepo: + """Base class for all model only repos. + """ + def has_model(self, sig: str) -> bool: + raise NotImplementedError() + + def get_model(self, sig: str) -> Model: + raise NotImplementedError() + + +class RemoteRepo(ModelOnlyRepo): + def __init__(self, models: tp.Dict[str, str]): + self._models = models + + def has_model(self, sig: str) -> bool: + return sig in self._models + + def get_model(self, sig: str) -> Model: + try: + url = self._models[sig] + except KeyError: + raise ModelLoadingError(f'Could not find a pre-trained model with signature {sig}.') + pkg = torch.hub.load_state_dict_from_url( + url, map_location='cpu', check_hash=True) # type: ignore + return load_model(pkg) + + +class LocalRepo(ModelOnlyRepo): + def __init__(self, root: Path): + self.root = root + self.scan() + + def scan(self): + self._models = {} + self._checksums = {} + for file in self.root.iterdir(): + if file.suffix == '.th': + if '-' in file.stem: + xp_sig, checksum = file.stem.split('-') + self._checksums[xp_sig] = checksum + else: + xp_sig = file.stem + if xp_sig in self._models: + raise ModelLoadingError( + f'Duplicate pre-trained model exist for signature {xp_sig}. ' + 'Please delete all but one.') + self._models[xp_sig] = file + + def has_model(self, sig: str) -> bool: + return sig in self._models + + def get_model(self, sig: str) -> Model: + try: + file = self._models[sig] + except KeyError: + raise ModelLoadingError(f'Could not find pre-trained model with signature {sig}.') + if sig in self._checksums: + check_checksum(file, self._checksums[sig]) + return load_model(file) + + +class BagOnlyRepo: + """Handles only YAML files containing bag of models, leaving the actual + model loading to some Repo. 
+ """ + def __init__(self, root: Path, model_repo: ModelOnlyRepo): + self.root = root + self.model_repo = model_repo + self.scan() + + def scan(self): + self._bags = {} + for file in self.root.iterdir(): + if file.suffix == '.yaml': + self._bags[file.stem] = file + + def has_model(self, name: str) -> bool: + return name in self._bags + + def get_model(self, name: str) -> BagOfModels: + try: + yaml_file = self._bags[name] + except KeyError: + raise ModelLoadingError(f'{name} is neither a single pre-trained model or ' + 'a bag of models.') + bag = yaml.safe_load(open(yaml_file)) + signatures = bag['models'] + models = [self.model_repo.get_model(sig) for sig in signatures] + weights = bag.get('weights') + segment = bag.get('segment') + return BagOfModels(models, weights, segment) + + +class AnyModelRepo: + def __init__(self, model_repo: ModelOnlyRepo, bag_repo: BagOnlyRepo): + self.model_repo = model_repo + self.bag_repo = bag_repo + + def has_model(self, name_or_sig: str) -> bool: + return self.model_repo.has_model(name_or_sig) or self.bag_repo.has_model(name_or_sig) + + def get_model(self, name_or_sig: str) -> AnyModel: + if self.model_repo.has_model(name_or_sig): + return self.model_repo.get_model(name_or_sig) + else: + return self.bag_repo.get_model(name_or_sig) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/separate.py b/AutoCoverTool/ref/music_remover/demucs/demucs/separate.py new file mode 100644 index 0000000..1560a44 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/separate.py @@ -0,0 +1,217 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +import time +import argparse +import sys +from pathlib import Path +import subprocess + +from dora.log import fatal +import torch as th +import torchaudio as ta + +from .apply import apply_model, BagOfModels +from .audio import AudioFile, convert_audio, save_audio +from .pretrained import get_model_from_args, add_model_flags, ModelLoadingError + + +def load_track(track, audio_channels, samplerate): + errors = {} + wav = None + + try: + wav = AudioFile(track).read( + streams=0, + samplerate=samplerate, + channels=audio_channels) + except FileNotFoundError: + errors['ffmpeg'] = 'FFmpeg is not installed.' + except subprocess.CalledProcessError: + errors['ffmpeg'] = 'FFmpeg could not read the file.' + + if wav is None: + try: + wav, sr = ta.load(str(track)) + except RuntimeError as err: + errors['torchaudio'] = err.args[0] + else: + wav = convert_audio(wav, sr, samplerate, audio_channels) + + if wav is None: + print(f"Could not load file {track}. " + "Maybe it is not a supported file format? ") + for backend, error in errors.items(): + print(f"When trying to load using {backend}, got the following error: {error}") + sys.exit(1) + return wav + + +def main(): + parser = argparse.ArgumentParser("demucs.separate", + description="Separate the sources for the given tracks") + parser.add_argument("tracks", nargs='+', type=Path, default=[], help='Path to tracks') + add_model_flags(parser) + parser.add_argument("-v", "--verbose", action="store_true") + parser.add_argument("-o", + "--out", + type=Path, + default=Path("separated"), + help="Folder where to put extracted tracks. A subfolder " + "with the model name will be created.") + parser.add_argument("--filename", + default="{track}/{stem}.{ext}", + help="Set the name of output file. 
\n" + 'Use "{track}", "{trackext}", "{stem}", "{ext}" to use ' + "variables of track name without extension, track extension, " + "stem name and default output file extension. \n" + 'Default is "{track}/{stem}.{ext}".') + parser.add_argument("-d", + "--device", + default="cuda" if th.cuda.is_available() else "cpu", + help="Device to use, default is cuda if available else cpu") + parser.add_argument("--shifts", + default=1, + type=int, + help="Number of random shifts for equivariant stabilization." + "Increase separation time but improves quality for Demucs. 10 was used " + "in the original paper.") + parser.add_argument("--overlap", + default=0.25, + type=float, + help="Overlap between the splits.") + split_group = parser.add_mutually_exclusive_group() + split_group.add_argument("--no-split", + action="store_false", + dest="split", + default=True, + help="Doesn't split audio in chunks. " + "This can use large amounts of memory.") + split_group.add_argument("--segment", type=int, + help="Set split size of each chunk. " + "This can help save memory of graphic card. ") + parser.add_argument("--two-stems", + dest="stem", metavar="STEM", + help="Only separate audio into {STEM} and no_{STEM}. ") + group = parser.add_mutually_exclusive_group() + group.add_argument("--int24", action="store_true", + help="Save wav output as 24 bits wav.") + group.add_argument("--float32", action="store_true", + help="Save wav output as float32 (2x bigger).") + parser.add_argument("--clip-mode", default="rescale", choices=["rescale", "clamp"], + help="Strategy for avoiding clipping: rescaling entire signal " + "if necessary (rescale) or hard clipping (clamp).") + parser.add_argument("--mp3", action="store_true", + help="Convert the output wavs to mp3.") + parser.add_argument("--mp3-bitrate", + default=320, + type=int, + help="Bitrate of converted mp3.") + parser.add_argument("-j", "--jobs", + default=0, + type=int, + help="Number of jobs. This can increase memory usage but will " + "be much faster when multiple cores are available.") + + args = parser.parse_args() + print(args) + + st = time.time() + try: + model = get_model_from_args(args) + except ModelLoadingError as error: + fatal(error.args[0]) + + print("load data spent time={}".format(time.time() - st)) + st = time.time() + + if args.segment is not None and args.segment < 8: + fatal("Segment must greater than 8. ") + + if '..' in args.filename.replace("\\", "/").split("/"): + fatal('".." must not appear in filename. ') + + if isinstance(model, BagOfModels): + print(f"Selected model is a bag of {len(model.models)} models. " + "You will see that many progress bars per track.") + if args.segment is not None: + for sub in model.models: + sub.segment = args.segment + else: + if args.segment is not None: + model.segment = args.segment + + model.cpu() + model.eval() + + if args.stem is not None and args.stem not in model.sources: + fatal( + 'error: stem "{stem}" is not in selected model. STEM must be one of {sources}.'.format( + stem=args.stem, sources=', '.join(model.sources))) + out = args.out / args.name + out.mkdir(parents=True, exist_ok=True) + print(f"Separated tracks will be stored in {out.resolve()}") + for track in args.tracks: + if not track.exists(): + print( + f"File {track} does not exist. 
+                "please try again after surrounding the entire path with quotes \"\".",
+                file=sys.stderr)
+            continue
+        print(f"Separating track {track}")
+        st = time.time()
+        wav = load_track(track, model.audio_channels, model.samplerate)
+        print("load track spent = {}".format(time.time() - st))
+
+        st = time.time()
+        ref = wav.mean(0)
+        wav = (wav - ref.mean()) / ref.std()
+        # wav[None] adds a batch dimension: [2, xxx] -> [1, 2, xxx]
+        sources = apply_model(model, wav[None], device=args.device, shifts=args.shifts,
+                              split=args.split, overlap=args.overlap, progress=True,
+                              num_workers=args.jobs)[0]
+        sources = sources * ref.std() + ref.mean()
+        print("apply_model spent = {}".format(time.time() - st))
+
+        if args.mp3:
+            ext = "mp3"
+        else:
+            ext = "wav"
+        kwargs = {
+            'samplerate': model.samplerate,
+            'bitrate': args.mp3_bitrate,
+            'clip': args.clip_mode,
+            'as_float': args.float32,
+            'bits_per_sample': 24 if args.int24 else 16,
+        }
+        if args.stem is None:
+            for source, name in zip(sources, model.sources):
+                st = time.time()
+                stem = out / args.filename.format(track=track.name.rsplit(".", 1)[0],
+                                                  trackext=track.name.rsplit(".", 1)[-1],
+                                                  stem=name, ext=ext)
+                stem.parent.mkdir(parents=True, exist_ok=True)
+                save_audio(source, str(stem), **kwargs)
+                print("save_audio spent = {}".format(time.time() - st))
+        else:
+            sources = list(sources)
+            stem = out / args.filename.format(track=track.name.rsplit(".", 1)[0],
+                                              trackext=track.name.rsplit(".", 1)[-1],
+                                              stem=args.stem, ext=ext)
+            stem.parent.mkdir(parents=True, exist_ok=True)
+            save_audio(sources.pop(model.sources.index(args.stem)), str(stem), **kwargs)
+            # Warning: after popping the stem, the selected stem is no longer in the list 'sources'
+            other_stem = th.zeros_like(sources[0])
+            for i in sources:
+                other_stem += i
+            stem = out / args.filename.format(track=track.name.rsplit(".", 1)[0],
+                                              trackext=track.name.rsplit(".", 1)[-1],
+                                              stem="no_"+args.stem, ext=ext)
+            stem.parent.mkdir(parents=True, exist_ok=True)
+            save_audio(other_stem, str(stem), **kwargs)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/solver.py b/AutoCoverTool/ref/music_remover/demucs/demucs/solver.py
new file mode 100644
index 0000000..ced824a
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/solver.py
@@ -0,0 +1,405 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+"""Main training loop."""
+
+import logging
+
+from dora import get_xp
+from dora.utils import write_and_rename
+from dora.log import LogProgress, bold
+import torch
+import torch.nn.functional as F
+
+from . import augment, distrib, states, pretrained
+from .apply import apply_model
+from .ema import ModelEMA
+from .evaluate import evaluate, new_sdr
+from .svd import svd_penalty
+from .utils import pull_metric, EMA
+
+logger = logging.getLogger(__name__)
+
+
+def _summary(metrics):
+    return " | ".join(f"{key.capitalize()}={val}" for key, val in metrics.items())
+
+
+class Solver(object):
+    def __init__(self, loaders, model, optimizer, args):
+        self.args = args
+        self.loaders = loaders
+
+        self.model = model
+        self.optimizer = optimizer
+        self.quantizer = states.get_quantizer(self.model, args.quant, self.optimizer)
+        self.dmodel = distrib.wrap(model)
+        self.device = next(iter(self.model.parameters())).device
+
+        # Exponential moving average of the model, either updated every batch or epoch.
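+        # (Illustrative only: e.g. args.ema.batch = [0.9995] would create a single
+        # per-batch EMA copy; that value is an example, not a preset.)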
+ # The best model from all the EMAs and the original one is kept based on the valid + # loss for the final best model. + self.emas = {'batch': [], 'epoch': []} + for kind in self.emas.keys(): + decays = getattr(args.ema, kind) + device = self.device if kind == 'batch' else 'cpu' + if decays: + for decay in decays: + self.emas[kind].append(ModelEMA(self.model, decay, device=device)) + + # data augment + augments = [augment.Shift(shift=int(args.dset.samplerate * args.dset.shift), + same=args.augment.shift_same)] + if args.augment.flip: + augments += [augment.FlipChannels(), augment.FlipSign()] + for aug in ['scale', 'remix']: + kw = getattr(args.augment, aug) + if kw.proba: + augments.append(getattr(augment, aug.capitalize())(**kw)) + self.augment = torch.nn.Sequential(*augments) + + xp = get_xp() + self.folder = xp.folder + # Checkpoints + self.checkpoint_file = xp.folder / 'checkpoint.th' + self.best_file = xp.folder / 'best.th' + logger.debug("Checkpoint will be saved to %s", self.checkpoint_file.resolve()) + self.best_state = None + self.best_changed = False + + self.link = xp.link + self.history = self.link.history + + self._reset() + + def _serialize(self, epoch): + package = {} + package['state'] = self.model.state_dict() + package['optimizer'] = self.optimizer.state_dict() + package['history'] = self.history + package['best_state'] = self.best_state + package['args'] = self.args + for kind, emas in self.emas.items(): + for k, ema in enumerate(emas): + package[f'ema_{kind}_{k}'] = ema.state_dict() + with write_and_rename(self.checkpoint_file) as tmp: + torch.save(package, tmp) + + save_every = self.args.save_every + if save_every and (epoch + 1) % save_every == 0 and epoch + 1 != self.args.epochs: + with write_and_rename(self.folder / f'checkpoint_{epoch + 1}.th') as tmp: + torch.save(package, tmp) + + if self.best_changed: + # Saving only the latest best model. 
+ with write_and_rename(self.best_file) as tmp: + package = states.serialize_model(self.model, self.args) + package['state'] = self.best_state + torch.save(package, tmp) + self.best_changed = False + + def _reset(self): + """Reset state of the solver, potentially using checkpoint.""" + if self.checkpoint_file.exists(): + logger.info(f'Loading checkpoint model: {self.checkpoint_file}') + package = torch.load(self.checkpoint_file, 'cpu') + self.model.load_state_dict(package['state']) + self.optimizer.load_state_dict(package['optimizer']) + self.history[:] = package['history'] + self.best_state = package['best_state'] + for kind, emas in self.emas.items(): + for k, ema in enumerate(emas): + ema.load_state_dict(package[f'ema_{kind}_{k}']) + elif self.args.continue_pretrained: + model = pretrained.get_model( + name=self.args.continue_pretrained, + repo=self.args.pretrained_repo) + self.model.load_state_dict(model.state_dict()) + elif self.args.continue_from: + name = 'checkpoint.th' + root = self.folder.parent + cf = root / str(self.args.continue_from) / name + logger.info("Loading from %s", cf) + package = torch.load(cf, 'cpu') + self.best_state = package['best_state'] + if self.args.continue_best: + self.model.load_state_dict(package['best_state'], strict=False) + else: + self.model.load_state_dict(package['state'], strict=False) + if self.args.continue_opt: + self.optimizer.load_state_dict(package['optimizer']) + + def _format_train(self, metrics: dict) -> dict: + """Formatting for train/valid metrics.""" + losses = { + 'loss': format(metrics['loss'], ".4f"), + 'reco': format(metrics['reco'], ".4f"), + } + if 'nsdr' in metrics: + losses['nsdr'] = format(metrics['nsdr'], ".3f") + if self.quantizer is not None: + losses['ms'] = format(metrics['ms'], ".2f") + if 'grad' in metrics: + losses['grad'] = format(metrics['grad'], ".4f") + if 'best' in metrics: + losses['best'] = format(metrics['best'], '.4f') + if 'bname' in metrics: + losses['bname'] = metrics['bname'] + if 'penalty' in metrics: + losses['penalty'] = format(metrics['penalty'], ".4f") + if 'hloss' in metrics: + losses['hloss'] = format(metrics['hloss'], ".4f") + return losses + + def _format_test(self, metrics: dict) -> dict: + """Formatting for test metrics.""" + losses = {} + if 'sdr' in metrics: + losses['sdr'] = format(metrics['sdr'], '.3f') + if 'nsdr' in metrics: + losses['nsdr'] = format(metrics['nsdr'], '.3f') + for source in self.model.sources: + key = f'sdr_{source}' + if key in metrics: + losses[key] = format(metrics[key], '.3f') + key = f'nsdr_{source}' + if key in metrics: + losses[key] = format(metrics[key], '.3f') + return losses + + def train(self): + # Optimizing the model + if self.history: + logger.info("Replaying metrics from previous run") + for epoch, metrics in enumerate(self.history): + formatted = self._format_train(metrics['train']) + logger.info( + bold(f'Train Summary | Epoch {epoch + 1} | {_summary(formatted)}')) + formatted = self._format_train(metrics['valid']) + logger.info( + bold(f'Valid Summary | Epoch {epoch + 1} | {_summary(formatted)}')) + if 'test' in metrics: + formatted = self._format_test(metrics['test']) + if formatted: + logger.info(bold(f"Test Summary | Epoch {epoch + 1} | {_summary(formatted)}")) + + epoch = 0 + for epoch in range(len(self.history), self.args.epochs): + # Train one epoch + self.model.train() # Turn on BatchNorm & Dropout + metrics = {} + logger.info('-' * 70) + logger.info("Training...") + metrics['train'] = self._run_one_epoch(epoch) + formatted = 
self._format_train(metrics['train']) + logger.info( + bold(f'Train Summary | Epoch {epoch + 1} | {_summary(formatted)}')) + + # Cross validation + logger.info('-' * 70) + logger.info('Cross validation...') + self.model.eval() # Turn off Batchnorm & Dropout + with torch.no_grad(): + valid = self._run_one_epoch(epoch, train=False) + bvalid = valid + bname = 'main' + state = states.copy_state(self.model.state_dict()) + metrics['valid'] = {} + metrics['valid']['main'] = valid + key = self.args.test.metric + for kind, emas in self.emas.items(): + for k, ema in enumerate(emas): + with ema.swap(): + valid = self._run_one_epoch(epoch, train=False) + name = f'ema_{kind}_{k}' + metrics['valid'][name] = valid + a = valid[key] + b = bvalid[key] + if key.startswith('nsdr'): + a = -a + b = -b + if a < b: + bvalid = valid + state = ema.state + bname = name + metrics['valid'].update(bvalid) + metrics['valid']['bname'] = bname + + valid_loss = metrics['valid'][key] + mets = pull_metric(self.link.history, f'valid.{key}') + [valid_loss] + if key.startswith('nsdr'): + best_loss = max(mets) + else: + best_loss = min(mets) + metrics['valid']['best'] = best_loss + if self.args.svd.penalty > 0: + kw = dict(self.args.svd) + kw.pop('penalty') + with torch.no_grad(): + penalty = svd_penalty(self.model, exact=True, **kw) + metrics['valid']['penalty'] = penalty + + formatted = self._format_train(metrics['valid']) + logger.info( + bold(f'Valid Summary | Epoch {epoch + 1} | {_summary(formatted)}')) + + # Save the best model + if valid_loss == best_loss or self.args.dset.train_valid: + logger.info(bold('New best valid loss %.4f'), valid_loss) + self.best_state = states.copy_state(state) + self.best_changed = True + + # Eval model every `test.every` epoch or on last epoch + should_eval = (epoch + 1) % self.args.test.every == 0 + is_last = epoch == self.args.epochs - 1 + # # Tries to detect divergence in a reliable way and finish job + # # not to waste compute. + # # Commented out as this was super specific to the MDX competition. 
+ # reco = metrics['valid']['main']['reco'] + # div = epoch >= 180 and reco > 0.18 + # div = div or epoch >= 100 and reco > 0.25 + # div = div and self.args.optim.loss == 'l1' + # if div: + # logger.warning("Finishing training early because valid loss is too high.") + # is_last = True + if should_eval or is_last: + # Evaluate on the testset + logger.info('-' * 70) + logger.info('Evaluating on the test set...') + # We switch to the best known model for testing + if self.args.test.best: + state = self.best_state + else: + state = states.copy_state(self.model.state_dict()) + compute_sdr = self.args.test.sdr and is_last + with states.swap_state(self.model, state): + with torch.no_grad(): + metrics['test'] = evaluate(self, compute_sdr=compute_sdr) + formatted = self._format_test(metrics['test']) + logger.info(bold(f"Test Summary | Epoch {epoch + 1} | {_summary(formatted)}")) + self.link.push_metrics(metrics) + + if distrib.rank == 0: + # Save model each epoch + self._serialize(epoch) + logger.debug("Checkpoint saved to %s", self.checkpoint_file.resolve()) + if is_last: + break + + def _run_one_epoch(self, epoch, train=True): + args = self.args + data_loader = self.loaders['train'] if train else self.loaders['valid'] + if distrib.world_size > 1 and train: + data_loader.sampler.set_epoch(epoch) + + label = ["Valid", "Train"][train] + name = label + f" | Epoch {epoch + 1}" + total = len(data_loader) + if args.max_batches: + total = min(total, args.max_batches) + logprog = LogProgress(logger, data_loader, total=total, + updates=self.args.misc.num_prints, name=name) + averager = EMA() + + for idx, sources in enumerate(logprog): + sources = sources.to(self.device) + if train: + sources = self.augment(sources) + mix = sources.sum(dim=1) + else: + mix = sources[:, 0] + sources = sources[:, 1:] + + if not train and self.args.valid_apply: + estimate = apply_model(self.model, mix, split=self.args.test.split, overlap=0) + else: + estimate = self.dmodel(mix) + if train and hasattr(self.model, 'transform_target'): + sources = self.model.transform_target(mix, sources) + assert estimate.shape == sources.shape, (estimate.shape, sources.shape) + dims = tuple(range(2, sources.dim())) + + if args.optim.loss == 'l1': + loss = F.l1_loss(estimate, sources, reduction='none') + loss = loss.mean(dims).mean(0) + reco = loss + elif args.optim.loss == 'mse': + loss = F.mse_loss(estimate, sources, reduction='none') + loss = loss.mean(dims) + reco = loss**0.5 + reco = reco.mean(0) + else: + raise ValueError(f"Invalid loss {self.args.loss}") + weights = torch.tensor(args.weights).to(sources) + loss = (loss * weights).sum() / weights.sum() + + ms = 0 + if self.quantizer is not None: + ms = self.quantizer.model_size() + if args.quant.diffq: + loss += args.quant.diffq * ms + + losses = {} + losses['reco'] = (reco * weights).sum() / weights.sum() + losses['ms'] = ms + + if not train: + nsdrs = new_sdr(sources, estimate.detach()).mean(0) + total = 0 + for source, nsdr, w in zip(self.model.sources, nsdrs, weights): + losses[f'nsdr_{source}'] = nsdr + total += w * nsdr + losses['nsdr'] = total / weights.sum() + + if train and args.svd.penalty > 0: + kw = dict(args.svd) + kw.pop('penalty') + penalty = svd_penalty(self.model, **kw) + losses['penalty'] = penalty + loss += args.svd.penalty * penalty + + losses['loss'] = loss + + for k, source in enumerate(self.model.sources): + losses[f'reco_{source}'] = reco[k] + + # optimize model in training mode + if train: + loss.backward() + grad_norm = 0 + grads = [] + for p in 
self.model.parameters():
+                    if p.grad is not None:
+                        grad_norm += p.grad.data.norm()**2
+                        grads.append(p.grad.data)
+                losses['grad'] = grad_norm ** 0.5
+                if args.optim.clip_grad:
+                    torch.nn.utils.clip_grad_norm_(
+                        self.model.parameters(),
+                        args.optim.clip_grad)
+
+                if self.args.flag == 'uns':
+                    for n, p in self.model.named_parameters():
+                        if p.grad is None:
+                            print('no grad', n)
+                self.optimizer.step()
+                self.optimizer.zero_grad()
+                for ema in self.emas['batch']:
+                    ema.update()
+            losses = averager(losses)
+            logs = self._format_train(losses)
+            logprog.update(**logs)
+            # Just in case, clear some memory
+            del loss, estimate, reco, ms
+            if args.max_batches == idx:
+                break
+            if self.args.debug and train:
+                break
+            if self.args.flag == 'debug':
+                break
+        if train:
+            for ema in self.emas['epoch']:
+                ema.update()
+        return distrib.average(losses, idx + 1)
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/spec.py b/AutoCoverTool/ref/music_remover/demucs/demucs/spec.py
new file mode 100644
index 0000000..3fa9835
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/spec.py
@@ -0,0 +1,41 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+"""Convenience wrapper to perform STFT and iSTFT"""
+
+import torch as th
+
+
+def spectro(x, n_fft=512, hop_length=None, pad=0):
+    *other, length = x.shape
+    x = x.reshape(-1, length)
+    z = th.stft(x,
+                n_fft * (1 + pad),
+                hop_length or n_fft // 4,
+                window=th.hann_window(n_fft).to(x),
+                win_length=n_fft,
+                normalized=True,
+                center=True,
+                return_complex=True,
+                pad_mode='reflect')
+    _, freqs, frame = z.shape
+    return z.view(*other, freqs, frame)
+
+
+def ispectro(z, hop_length=None, length=None, pad=0):
+    *other, freqs, frames = z.shape
+    n_fft = 2 * freqs - 2
+    z = z.view(-1, freqs, frames)
+    win_length = n_fft // (1 + pad)
+    x = th.istft(z,
+                 n_fft,
+                 hop_length,
+                 window=th.hann_window(win_length).to(z.real),
+                 win_length=win_length,
+                 normalized=True,
+                 length=length,
+                 center=True)
+    _, length = x.shape
+    return x.view(*other, length)
diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/states.py b/AutoCoverTool/ref/music_remover/demucs/demucs/states.py
new file mode 100644
index 0000000..71f229a
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/demucs/states.py
@@ -0,0 +1,148 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+"""
+Utilities to save and load models.
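+
+A typical round trip, as a sketch (the path is a placeholder; `training_args` is
+assumed to be the usual OmegaConf config, and `serialize_model` relies on classes
+whose `__init__` is wrapped with `capture_init` below):
+
+    model = load_model('checkpoint.th')            # path or already-loaded dict
+    pkg = serialize_model(model, training_args)
+    save_with_checksum(pkg, Path('out/model.th'))  # writes out/model-<sha8>.th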
+""" +from contextlib import contextmanager + +import functools +import hashlib +import inspect +import io +from pathlib import Path +import warnings + +from omegaconf import OmegaConf +from diffq import DiffQuantizer, UniformQuantizer, restore_quantized_state +import torch + + +def get_quantizer(model, args, optimizer=None): + """Return the quantizer given the XP quantization args.""" + quantizer = None + if args.diffq: + quantizer = DiffQuantizer( + model, min_size=args.min_size, group_size=args.group_size) + if optimizer is not None: + quantizer.setup_optimizer(optimizer) + elif args.qat: + quantizer = UniformQuantizer( + model, bits=args.qat, min_size=args.min_size) + return quantizer + + +def load_model(path_or_package, strict=False): + """Load a model from the given serialized model, either given as a dict (already loaded) + or a path to a file on disk.""" + if isinstance(path_or_package, dict): + package = path_or_package + elif isinstance(path_or_package, (str, Path)): + with warnings.catch_warnings(): + warnings.simplefilter("ignore") + path = path_or_package + package = torch.load(path, 'cpu') + else: + raise ValueError(f"Invalid type for {path_or_package}.") + + klass = package["klass"] + args = package["args"] + kwargs = package["kwargs"] + + if strict: + model = klass(*args, **kwargs) + else: + sig = inspect.signature(klass) + for key in list(kwargs): + if key not in sig.parameters: + warnings.warn("Dropping inexistant parameter " + key) + del kwargs[key] + model = klass(*args, **kwargs) + + state = package["state"] + + set_state(model, state) + return model + + +def get_state(model, quantizer, half=False): + """Get the state from a model, potentially with quantization applied. + If `half` is True, model are stored as half precision, which shouldn't impact performance + but half the state size.""" + if quantizer is None: + dtype = torch.half if half else None + state = {k: p.data.to(device='cpu', dtype=dtype) for k, p in model.state_dict().items()} + else: + state = quantizer.get_quantized_state() + state['__quantized'] = True + return state + + +def set_state(model, state, quantizer=None): + """Set the state on a given model.""" + if state.get('__quantized'): + if quantizer is not None: + quantizer.restore_quantized_state(model, state['quantized']) + else: + restore_quantized_state(model, state) + else: + model.load_state_dict(state) + return state + + +def save_with_checksum(content, path): + """Save the given value on disk, along with a sha256 hash. 
+ Should be used with the output of either `serialize_model` or `get_state`.""" + buf = io.BytesIO() + torch.save(content, buf) + sig = hashlib.sha256(buf.getvalue()).hexdigest()[:8] + + path = path.parent / (path.stem + "-" + sig + path.suffix) + path.write_bytes(buf.getvalue()) + + +def serialize_model(model, training_args, quantizer=None, half=True): + args, kwargs = model._init_args_kwargs + klass = model.__class__ + + state = get_state(model, quantizer, half) + return { + 'klass': klass, + 'args': args, + 'kwargs': kwargs, + 'state': state, + 'training_args': OmegaConf.to_container(training_args, resolve=True), + } + + +def copy_state(state): + return {k: v.cpu().clone() for k, v in state.items()} + + +@contextmanager +def swap_state(model, state): + """ + Context manager that swaps the state of a model, e.g: + + # model is in old state + with swap_state(model, new_state): + # model in new state + # model back to old state + """ + old_state = copy_state(model.state_dict()) + model.load_state_dict(state, strict=False) + try: + yield + finally: + model.load_state_dict(old_state) + + +def capture_init(init): + @functools.wraps(init) + def __init__(self, *args, **kwargs): + self._init_args_kwargs = (args, kwargs) + init(self, *args, **kwargs) + + return __init__ diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/svd.py b/AutoCoverTool/ref/music_remover/demucs/demucs/svd.py new file mode 100644 index 0000000..59ab603 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/svd.py @@ -0,0 +1,83 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +"""Ways to make the model stronger.""" +import random +import torch + + +def power_iteration(m, niters=1, bs=1): + """This is the power method. batch size is used to try multiple starting point in parallel.""" + assert m.dim() == 2 + assert m.shape[0] == m.shape[1] + dim = m.shape[0] + b = torch.randn(dim, bs, device=m.device, dtype=m.dtype) + + for _ in range(niters): + n = m.mm(b) + norm = n.norm(dim=0, keepdim=True) + b = n / (1e-10 + norm) + + return norm.mean() + + +# We need a shared RNG to make sure all the distributed worker will skip the penalty together, +# as otherwise we wouldn't get any speed up. +penalty_rng = random.Random(1234) + + +def svd_penalty(model, min_size=0.1, dim=1, niters=2, powm=False, convtr=True, + proba=1, conv_only=False, exact=False, bs=1): + """ + Penalty on the largest singular value for a layer. + Args: + - model: model to penalize + - min_size: minimum size in MB of a layer to penalize. + - dim: projection dimension for the svd_lowrank. Higher is better but slower. + - niters: number of iterations in the algorithm used by svd_lowrank. + - powm: use power method instead of lowrank SVD, my own experience + is that it is both slower and less stable. + - convtr: when True, differentiate between Conv and Transposed Conv. + this is kept for compatibility with older experiments. + - proba: probability to apply the penalty. + - conv_only: only apply to conv and conv transposed, not LSTM + (might not be reliable for other models than Demucs). + - exact: use exact SVD (slow but useful at validation). + - bs: batch_size for power method. + """ + total = 0 + if penalty_rng.random() > proba: + return 0. 
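+
+    # Descriptive note: when the penalty does fire, the `total / proba` at the
+    # end of this function rescales it so the expected penalty is unchanged.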
+ + for m in model.modules(): + for name, p in m.named_parameters(recurse=False): + if p.numel() / 2**18 < min_size: + continue + if convtr: + if isinstance(m, (torch.nn.ConvTranspose1d, torch.nn.ConvTranspose2d)): + if p.dim() in [3, 4]: + p = p.transpose(0, 1).contiguous() + if p.dim() == 3: + p = p.view(len(p), -1) + elif p.dim() == 4: + p = p.view(len(p), -1) + elif p.dim() == 1: + continue + elif conv_only: + continue + assert p.dim() == 2, (name, p.shape) + if exact: + estimate = torch.svd(p, compute_uv=False)[1].pow(2).max() + elif powm: + a, b = p.shape + if a < b: + n = p.mm(p.t()) + else: + n = p.t().mm(p) + estimate = power_iteration(n, niters, bs) + else: + estimate = torch.svd_lowrank(p, dim, niters)[1][0].pow(2) + total += estimate + return total / proba diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/train.py b/AutoCoverTool/ref/music_remover/demucs/demucs/train.py new file mode 100644 index 0000000..6cc0256 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/train.py @@ -0,0 +1,243 @@ +#!/usr/bin/env python3 +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +"""Main training script entry point""" + +import logging +import os +from pathlib import Path +import sys + +from dora import hydra_main +import hydra +from hydra.core.global_hydra import GlobalHydra +from omegaconf import OmegaConf +import torch +from torch import nn +from torch.utils.data import ConcatDataset + +from . import distrib +from .wav import get_wav_datasets, get_musdb_wav_datasets +from .demucs import Demucs +from .hdemucs import HDemucs +from .htdemucs import HTDemucs +from .repitch import RepitchedWrapper +from .solver import Solver +from .states import capture_init +from .utils import random_subset + +logger = logging.getLogger(__name__) + + +class TorchHDemucsWrapper(nn.Module): + """Wrapper around torchaudio HDemucs implementation to provide the proper metadata + for model evaluation. 
+ See https://pytorch.org/audio/stable/tutorials/hybrid_demucs_tutorial.html""" + + @capture_init + def __init__(self, **kwargs): + super().__init__() + try: + from torchaudio.models import HDemucs as TorchHDemucs + except ImportError: + raise ImportError("Please upgrade torchaudio for using its implementation of HDemucs") + self.samplerate = kwargs.pop('samplerate') + self.segment = kwargs.pop('segment') + self.sources = kwargs['sources'] + self.torch_hdemucs = TorchHDemucs(**kwargs) + + def forward(self, mix): + return self.torch_hdemucs.forward(mix) + + +def get_model(args): + extra = { + 'sources': list(args.dset.sources), + 'audio_channels': args.dset.channels, + 'samplerate': args.dset.samplerate, + 'segment': args.model_segment or 4 * args.dset.segment, + } + klass = { + 'demucs': Demucs, + 'hdemucs': HDemucs, + 'htdemucs': HTDemucs, + 'torch_hdemucs': TorchHDemucsWrapper, + }[args.model] + kw = OmegaConf.to_container(getattr(args, args.model), resolve=True) + model = klass(**extra, **kw) + return model + + +def get_optimizer(model, args): + seen_params = set() + other_params = [] + groups = [] + for n, module in model.named_modules(): + if hasattr(module, "make_optim_group"): + group = module.make_optim_group() + params = set(group["params"]) + assert params.isdisjoint(seen_params) + seen_params |= set(params) + groups.append(group) + for param in model.parameters(): + if param not in seen_params: + other_params.append(param) + groups.insert(0, {"params": other_params}) + parameters = groups + if args.optim.optim == "adam": + return torch.optim.Adam( + parameters, + lr=args.optim.lr, + betas=(args.optim.momentum, args.optim.beta2), + weight_decay=args.optim.weight_decay, + ) + elif args.optim.optim == "adamw": + return torch.optim.AdamW( + parameters, + lr=args.optim.lr, + betas=(args.optim.momentum, args.optim.beta2), + weight_decay=args.optim.weight_decay, + ) + else: + raise ValueError("Invalid optimizer %s", args.optim.optimizer) + + +def get_datasets(args): + train_set, valid_set = get_musdb_wav_datasets(args.dset) + if args.dset.wav: + extra_train_set, extra_valid_set = get_wav_datasets(args.dset) + if len(args.dset.sources) <= 4: + train_set = ConcatDataset([train_set, extra_train_set]) + valid_set = ConcatDataset([valid_set, extra_valid_set]) + else: + train_set = extra_train_set + valid_set = extra_valid_set + + if args.dset.wav2: + extra_train_set, extra_valid_set = get_wav_datasets(args.dset, "wav2") + weight = args.dset.wav2_weight + if weight is not None: + b = len(train_set) + e = len(extra_train_set) + reps = max(1, round(e / b * (1 / weight - 1))) + else: + reps = 1 + train_set = ConcatDataset([train_set] * reps + [extra_train_set]) + if args.dset.wav2_valid: + if weight is not None: + b = len(valid_set) + n_kept = int(round(weight * b / (1 - weight))) + valid_set = ConcatDataset( + [valid_set, random_subset(extra_valid_set, n_kept)] + ) + else: + valid_set = ConcatDataset([valid_set, extra_valid_set]) + if args.dset.valid_samples is not None: + valid_set = random_subset(valid_set, args.dset.valid_samples) + return train_set, valid_set + + +def get_solver(args, model_only=False): + distrib.init() + + torch.manual_seed(args.seed) + model = get_model(args) + if args.misc.show: + logger.info(model) + mb = sum(p.numel() for p in model.parameters()) * 4 / 2**20 + logger.info('Size: %.1f MB', mb) + if hasattr(model, 'valid_length'): + field = model.valid_length(1) + logger.info('Field: %.1f ms', field / args.dset.samplerate * 1000) + sys.exit(0) + + # torch also 
initialize cuda seed if available + if torch.cuda.is_available(): + model.cuda() + + # optimizer + optimizer = get_optimizer(model, args) + + assert args.batch_size % distrib.world_size == 0 + args.batch_size //= distrib.world_size + + if model_only: + return Solver(None, model, optimizer, args) + + train_set, valid_set = get_datasets(args) + + if args.augment.repitch.proba: + vocals = [] + if 'vocals' in args.dset.sources: + vocals.append(args.dset.sources.index('vocals')) + else: + logger.warning('No vocal source found') + if args.augment.repitch.proba: + train_set = RepitchedWrapper(train_set, vocals=vocals, **args.augment.repitch) + + logger.info("train/valid set size: %d %d", len(train_set), len(valid_set)) + train_loader = distrib.loader( + train_set, batch_size=args.batch_size, shuffle=True, + num_workers=args.misc.num_workers, drop_last=True) + if args.dset.full_cv: + valid_loader = distrib.loader( + valid_set, batch_size=1, shuffle=False, + num_workers=args.misc.num_workers) + else: + valid_loader = distrib.loader( + valid_set, batch_size=args.batch_size, shuffle=False, + num_workers=args.misc.num_workers, drop_last=True) + loaders = {"train": train_loader, "valid": valid_loader} + + # Construct Solver + return Solver(loaders, model, optimizer, args) + + +def get_solver_from_sig(sig, model_only=False): + inst = GlobalHydra.instance() + hyd = None + if inst.is_initialized(): + hyd = inst.hydra + inst.clear() + xp = main.get_xp_from_sig(sig) + if hyd is not None: + inst.clear() + inst.initialize(hyd) + + with xp.enter(stack=True): + return get_solver(xp.cfg, model_only) + + +@hydra_main(config_path="../conf", config_name="config") +def main(args): + global __file__ + __file__ = hydra.utils.to_absolute_path(__file__) + for attr in ["musdb", "wav", "metadata"]: + val = getattr(args.dset, attr) + if val is not None: + setattr(args.dset, attr, hydra.utils.to_absolute_path(val)) + + os.environ["OMP_NUM_THREADS"] = "1" + os.environ["MKL_NUM_THREADS"] = "1" + + if args.misc.verbose: + logger.setLevel(logging.DEBUG) + + logger.info("For logs, checkpoints and samples check %s", os.getcwd()) + logger.debug(args) + from dora import get_xp + logger.debug(get_xp().cfg) + + solver = get_solver(args) + solver.train() + + +if '_DORA_TEST_PATH' in os.environ: + main.dora.dir = Path(os.environ['_DORA_TEST_PATH']) + + +if __name__ == "__main__": + main() diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/transformer.py b/AutoCoverTool/ref/music_remover/demucs/demucs/transformer.py new file mode 100644 index 0000000..56a465b --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/transformer.py @@ -0,0 +1,839 @@ +# Copyright (c) 2019-present, Meta, Inc. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +# First author is Simon Rouard. 
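+# Editorial shape note: create_sin_embedding below returns embeddings in TBC
+# layout, e.g. create_sin_embedding(length=100, dim=512) has shape (100, 1, 512);
+# they are meant to be added to activations (weighted by `weight_pos_embed` in
+# CrossTransformerEncoder).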
+ +import random +import typing as tp + +import torch +import torch.nn as nn +import torch.nn.functional as F +import numpy as np +import math +from einops import rearrange + + +def create_sin_embedding( + length: int, dim: int, shift: int = 0, device="cpu", max_period=10000 +): + # We aim for TBC format + assert dim % 2 == 0 + pos = shift + torch.arange(length, device=device).view(-1, 1, 1) + half_dim = dim // 2 + adim = torch.arange(dim // 2, device=device).view(1, 1, -1) + phase = pos / (max_period ** (adim / (half_dim - 1))) + return torch.cat( + [ + torch.cos(phase), + torch.sin(phase), + ], + dim=-1, + ) + + +def create_2d_sin_embedding(d_model, height, width, device="cpu", max_period=10000): + """ + :param d_model: dimension of the model + :param height: height of the positions + :param width: width of the positions + :return: d_model*height*width position matrix + """ + if d_model % 4 != 0: + raise ValueError( + "Cannot use sin/cos positional encoding with " + "odd dimension (got dim={:d})".format(d_model) + ) + pe = torch.zeros(d_model, height, width) + # Each dimension use half of d_model + d_model = int(d_model / 2) + div_term = torch.exp( + torch.arange(0.0, d_model, 2) * -(math.log(max_period) / d_model) + ) + pos_w = torch.arange(0.0, width).unsqueeze(1) + pos_h = torch.arange(0.0, height).unsqueeze(1) + pe[0:d_model:2, :, :] = ( + torch.sin(pos_w * div_term).transpose(0, 1).unsqueeze(1).repeat(1, height, 1) + ) + pe[1:d_model:2, :, :] = ( + torch.cos(pos_w * div_term).transpose(0, 1).unsqueeze(1).repeat(1, height, 1) + ) + pe[d_model::2, :, :] = ( + torch.sin(pos_h * div_term).transpose(0, 1).unsqueeze(2).repeat(1, 1, width) + ) + pe[d_model + 1:: 2, :, :] = ( + torch.cos(pos_h * div_term).transpose(0, 1).unsqueeze(2).repeat(1, 1, width) + ) + + return pe[None, :].to(device) + + +def create_sin_embedding_cape( + length: int, + dim: int, + batch_size: int, + mean_normalize: bool, + augment: bool, # True during training + max_global_shift: float = 0.0, # delta max + max_local_shift: float = 0.0, # epsilon max + max_scale: float = 1.0, + device: str = "cpu", + max_period: float = 10000.0, +): + # We aim for TBC format + assert dim % 2 == 0 + pos = 1.0 * torch.arange(length).view(-1, 1, 1) # (length, 1, 1) + pos = pos.repeat(1, batch_size, 1) # (length, batch_size, 1) + if mean_normalize: + pos -= torch.nanmean(pos, dim=0, keepdim=True) + + if augment: + delta = np.random.uniform( + -max_global_shift, +max_global_shift, size=[1, batch_size, 1] + ) + delta_local = np.random.uniform( + -max_local_shift, +max_local_shift, size=[length, batch_size, 1] + ) + log_lambdas = np.random.uniform( + -np.log(max_scale), +np.log(max_scale), size=[1, batch_size, 1] + ) + pos = (pos + delta + delta_local) * np.exp(log_lambdas) + + pos = pos.to(device) + + half_dim = dim // 2 + adim = torch.arange(dim // 2, device=device).view(1, 1, -1) + phase = pos / (max_period ** (adim / (half_dim - 1))) + return torch.cat( + [ + torch.cos(phase), + torch.sin(phase), + ], + dim=-1, + ).float() + + +def get_causal_mask(length): + pos = torch.arange(length) + return pos > pos[:, None] + + +def get_elementary_mask( + T1, + T2, + mask_type, + sparse_attn_window, + global_window, + mask_random_seed, + sparsity, + device, +): + """ + When the input of the Decoder has length T1 and the output T2 + The mask matrix has shape (T2, T1) + """ + assert mask_type in ["diag", "jmask", "random", "global"] + + if mask_type == "global": + mask = torch.zeros(T2, T1, dtype=torch.bool) + mask[:, :global_window] = True + 
line_window = int(global_window * T2 / T1) + mask[:line_window, :] = True + + if mask_type == "diag": + + mask = torch.zeros(T2, T1, dtype=torch.bool) + rows = torch.arange(T2)[:, None] + cols = ( + (T1 / T2 * rows + torch.arange(-sparse_attn_window, sparse_attn_window + 1)) + .long() + .clamp(0, T1 - 1) + ) + mask.scatter_(1, cols, torch.ones(1, dtype=torch.bool).expand_as(cols)) + + elif mask_type == "jmask": + mask = torch.zeros(T2 + 2, T1 + 2, dtype=torch.bool) + rows = torch.arange(T2 + 2)[:, None] + t = torch.arange(0, int((2 * T1) ** 0.5 + 1)) + t = (t * (t + 1) / 2).int() + t = torch.cat([-t.flip(0)[:-1], t]) + cols = (T1 / T2 * rows + t).long().clamp(0, T1 + 1) + mask.scatter_(1, cols, torch.ones(1, dtype=torch.bool).expand_as(cols)) + mask = mask[1:-1, 1:-1] + + elif mask_type == "random": + gene = torch.Generator(device=device) + gene.manual_seed(mask_random_seed) + mask = ( + torch.rand(T1 * T2, generator=gene, device=device).reshape(T2, T1) + > sparsity + ) + + mask = mask.to(device) + return mask + + +def get_mask( + T1, + T2, + mask_type, + sparse_attn_window, + global_window, + mask_random_seed, + sparsity, + device, +): + """ + Return a SparseCSRTensor mask that is a combination of elementary masks + mask_type can be a combination of multiple masks: for instance "diag_jmask_random" + """ + from xformers.sparse import SparseCSRTensor + # create a list + mask_types = mask_type.split("_") + + all_masks = [ + get_elementary_mask( + T1, + T2, + mask, + sparse_attn_window, + global_window, + mask_random_seed, + sparsity, + device, + ) + for mask in mask_types + ] + + final_mask = torch.stack(all_masks).sum(axis=0) > 0 + + return SparseCSRTensor.from_dense(final_mask[None]) + + +class ScaledEmbedding(nn.Module): + def __init__( + self, + num_embeddings: int, + embedding_dim: int, + scale: float = 1.0, + boost: float = 3.0, + ): + super().__init__() + self.embedding = nn.Embedding(num_embeddings, embedding_dim) + self.embedding.weight.data *= scale / boost + self.boost = boost + + @property + def weight(self): + return self.embedding.weight * self.boost + + def forward(self, x): + return self.embedding(x) * self.boost + + +class LayerScale(nn.Module): + """Layer scale from [Touvron et al 2021] (https://arxiv.org/pdf/2103.17239.pdf). + This rescales diagonaly residual outputs close to 0 initially, then learnt. 
+ """ + + def __init__(self, channels: int, init: float = 0, channel_last=False): + """ + channel_last = False corresponds to (B, C, T) tensors + channel_last = True corresponds to (T, B, C) tensors + """ + super().__init__() + self.channel_last = channel_last + self.scale = nn.Parameter(torch.zeros(channels, requires_grad=True)) + self.scale.data[:] = init + + def forward(self, x): + if self.channel_last: + return self.scale * x + else: + return self.scale[:, None] * x + + +class MyGroupNorm(nn.GroupNorm): + def __init__(self, *args, **kwargs): + super().__init__(*args, **kwargs) + + def forward(self, x): + """ + x: (B, T, C) + if num_groups=1: Normalisation on all T and C together for each B + """ + x = x.transpose(1, 2) + return super().forward(x).transpose(1, 2) + + +class MyTransformerEncoderLayer(nn.TransformerEncoderLayer): + def __init__( + self, + d_model, + nhead, + dim_feedforward=2048, + dropout=0.1, + activation=F.relu, + group_norm=0, + norm_first=False, + norm_out=False, + layer_norm_eps=1e-5, + layer_scale=False, + init_values=1e-4, + device=None, + dtype=None, + sparse=False, + mask_type="diag", + mask_random_seed=42, + sparse_attn_window=500, + global_window=50, + auto_sparsity=False, + sparsity=0.95, + batch_first=False, + ): + factory_kwargs = {"device": device, "dtype": dtype} + super().__init__( + d_model=d_model, + nhead=nhead, + dim_feedforward=dim_feedforward, + dropout=dropout, + activation=activation, + layer_norm_eps=layer_norm_eps, + batch_first=batch_first, + norm_first=norm_first, + device=device, + dtype=dtype, + ) + self.sparse = sparse + self.auto_sparsity = auto_sparsity + if sparse: + if not auto_sparsity: + self.mask_type = mask_type + self.sparse_attn_window = sparse_attn_window + self.global_window = global_window + self.sparsity = sparsity + if group_norm: + self.norm1 = MyGroupNorm(int(group_norm), d_model, eps=layer_norm_eps, **factory_kwargs) + self.norm2 = MyGroupNorm(int(group_norm), d_model, eps=layer_norm_eps, **factory_kwargs) + + self.norm_out = None + if self.norm_first & norm_out: + self.norm_out = MyGroupNorm(num_groups=int(norm_out), num_channels=d_model) + self.gamma_1 = ( + LayerScale(d_model, init_values, True) if layer_scale else nn.Identity() + ) + self.gamma_2 = ( + LayerScale(d_model, init_values, True) if layer_scale else nn.Identity() + ) + + if sparse: + self.self_attn = MultiheadAttention( + d_model, nhead, dropout=dropout, batch_first=batch_first, + auto_sparsity=sparsity if auto_sparsity else 0, + ) + self.__setattr__("src_mask", torch.zeros(1, 1)) + self.mask_random_seed = mask_random_seed + + def forward(self, src, src_mask=None, src_key_padding_mask=None): + """ + if batch_first = False, src shape is (T, B, C) + the case where batch_first=True is not covered + """ + device = src.device + x = src + T, B, C = x.shape + if self.sparse and not self.auto_sparsity: + assert src_mask is None + src_mask = self.src_mask + if src_mask.shape[-1] != T: + src_mask = get_mask( + T, + T, + self.mask_type, + self.sparse_attn_window, + self.global_window, + self.mask_random_seed, + self.sparsity, + device, + ) + self.__setattr__("src_mask", src_mask) + + if self.norm_first: + x = x + self.gamma_1( + self._sa_block(self.norm1(x), src_mask, src_key_padding_mask) + ) + x = x + self.gamma_2(self._ff_block(self.norm2(x))) + + if self.norm_out: + x = self.norm_out(x) + else: + x = self.norm1( + x + self.gamma_1(self._sa_block(x, src_mask, src_key_padding_mask)) + ) + x = self.norm2(x + self.gamma_2(self._ff_block(x))) + + return x + + +class 
CrossTransformerEncoderLayer(nn.Module): + def __init__( + self, + d_model: int, + nhead: int, + dim_feedforward: int = 2048, + dropout: float = 0.1, + activation=F.relu, + layer_norm_eps: float = 1e-5, + layer_scale: bool = False, + init_values: float = 1e-4, + norm_first: bool = False, + group_norm: bool = False, + norm_out: bool = False, + sparse=False, + mask_type="diag", + mask_random_seed=42, + sparse_attn_window=500, + global_window=50, + sparsity=0.95, + auto_sparsity=None, + device=None, + dtype=None, + batch_first=False, + ): + factory_kwargs = {"device": device, "dtype": dtype} + super().__init__() + + self.sparse = sparse + self.auto_sparsity = auto_sparsity + if sparse: + if not auto_sparsity: + self.mask_type = mask_type + self.sparse_attn_window = sparse_attn_window + self.global_window = global_window + self.sparsity = sparsity + + self.cross_attn: nn.Module + self.cross_attn = nn.MultiheadAttention( + d_model, nhead, dropout=dropout, batch_first=batch_first) + # Implementation of Feedforward model + self.linear1 = nn.Linear(d_model, dim_feedforward, **factory_kwargs) + self.dropout = nn.Dropout(dropout) + self.linear2 = nn.Linear(dim_feedforward, d_model, **factory_kwargs) + + self.norm_first = norm_first + self.norm1: nn.Module + self.norm2: nn.Module + self.norm3: nn.Module + if group_norm: + self.norm1 = MyGroupNorm(int(group_norm), d_model, eps=layer_norm_eps, **factory_kwargs) + self.norm2 = MyGroupNorm(int(group_norm), d_model, eps=layer_norm_eps, **factory_kwargs) + self.norm3 = MyGroupNorm(int(group_norm), d_model, eps=layer_norm_eps, **factory_kwargs) + else: + self.norm1 = nn.LayerNorm(d_model, eps=layer_norm_eps, **factory_kwargs) + self.norm2 = nn.LayerNorm(d_model, eps=layer_norm_eps, **factory_kwargs) + self.norm3 = nn.LayerNorm(d_model, eps=layer_norm_eps, **factory_kwargs) + + self.norm_out = None + if self.norm_first & norm_out: + self.norm_out = MyGroupNorm(num_groups=int(norm_out), num_channels=d_model) + + self.gamma_1 = ( + LayerScale(d_model, init_values, True) if layer_scale else nn.Identity() + ) + self.gamma_2 = ( + LayerScale(d_model, init_values, True) if layer_scale else nn.Identity() + ) + + self.dropout1 = nn.Dropout(dropout) + self.dropout2 = nn.Dropout(dropout) + + # Legacy string support for activation function. 
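+        # (e.g. activation="relu" or "gelu" is mapped to the matching
+        # torch.nn.functional callable by _get_activation_fn below;
+        # any other name raises a RuntimeError.)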
+ if isinstance(activation, str): + self.activation = self._get_activation_fn(activation) + else: + self.activation = activation + + if sparse: + self.cross_attn = MultiheadAttention( + d_model, nhead, dropout=dropout, batch_first=batch_first, + auto_sparsity=sparsity if auto_sparsity else 0) + if not auto_sparsity: + self.__setattr__("mask", torch.zeros(1, 1)) + self.mask_random_seed = mask_random_seed + + def forward(self, q, k, mask=None): + """ + Args: + q: tensor of shape (T, B, C) + k: tensor of shape (S, B, C) + mask: tensor of shape (T, S) + + """ + device = q.device + T, B, C = q.shape + S, B, C = k.shape + if self.sparse and not self.auto_sparsity: + assert mask is None + mask = self.mask + if mask.shape[-1] != S or mask.shape[-2] != T: + mask = get_mask( + S, + T, + self.mask_type, + self.sparse_attn_window, + self.global_window, + self.mask_random_seed, + self.sparsity, + device, + ) + self.__setattr__("mask", mask) + + if self.norm_first: + x = q + self.gamma_1(self._ca_block(self.norm1(q), self.norm2(k), mask)) + x = x + self.gamma_2(self._ff_block(self.norm3(x))) + if self.norm_out: + x = self.norm_out(x) + else: + x = self.norm1(q + self.gamma_1(self._ca_block(q, k, mask))) + x = self.norm2(x + self.gamma_2(self._ff_block(x))) + + return x + + # self-attention block + def _ca_block(self, q, k, attn_mask=None): + x = self.cross_attn(q, k, k, attn_mask=attn_mask, need_weights=False)[0] + return self.dropout1(x) + + # feed forward block + def _ff_block(self, x): + x = self.linear2(self.dropout(self.activation(self.linear1(x)))) + return self.dropout2(x) + + def _get_activation_fn(self, activation): + if activation == "relu": + return F.relu + elif activation == "gelu": + return F.gelu + + raise RuntimeError("activation should be relu/gelu, not {}".format(activation)) + + +# ----------------- MULTI-BLOCKS MODELS: ----------------------- + + +class CrossTransformerEncoder(nn.Module): + def __init__( + self, + dim: int, + emb: str = "sin", + hidden_scale: float = 4.0, + num_heads: int = 8, + num_layers: int = 6, + cross_first: bool = False, + dropout: float = 0.0, + max_positions: int = 1000, + norm_in: bool = True, + norm_in_group: bool = False, + group_norm: int = False, + norm_first: bool = False, + norm_out: bool = False, + max_period: float = 10000.0, + weight_decay: float = 0.0, + lr: tp.Optional[float] = None, + layer_scale: bool = False, + gelu: bool = True, + sin_random_shift: int = 0, + weight_pos_embed: float = 1.0, + cape_mean_normalize: bool = True, + cape_augment: bool = True, + cape_glob_loc_scale: list = [5000.0, 1.0, 1.4], + sparse_self_attn: bool = False, + sparse_cross_attn: bool = False, + mask_type: str = "diag", + mask_random_seed: int = 42, + sparse_attn_window: int = 500, + global_window: int = 50, + auto_sparsity: bool = False, + sparsity: float = 0.95, + ): + super().__init__() + """ + """ + assert dim % num_heads == 0 + + hidden_dim = int(dim * hidden_scale) + + self.num_layers = num_layers + # classic parity = 1 means that if idx%2 == 1 there is a + # classical encoder else there is a cross encoder + self.classic_parity = 1 if cross_first else 0 + self.emb = emb + self.max_period = max_period + self.weight_decay = weight_decay + self.weight_pos_embed = weight_pos_embed + self.sin_random_shift = sin_random_shift + if emb == "cape": + self.cape_mean_normalize = cape_mean_normalize + self.cape_augment = cape_augment + self.cape_glob_loc_scale = cape_glob_loc_scale + if emb == "scaled": + self.position_embeddings = ScaledEmbedding(max_positions, dim, 
scale=0.2) + + self.lr = lr + + activation: tp.Any = F.gelu if gelu else F.relu + + self.norm_in: nn.Module + self.norm_in_t: nn.Module + if norm_in: + self.norm_in = nn.LayerNorm(dim) + self.norm_in_t = nn.LayerNorm(dim) + elif norm_in_group: + self.norm_in = MyGroupNorm(int(norm_in_group), dim) + self.norm_in_t = MyGroupNorm(int(norm_in_group), dim) + else: + self.norm_in = nn.Identity() + self.norm_in_t = nn.Identity() + + # spectrogram layers + self.layers = nn.ModuleList() + # temporal layers + self.layers_t = nn.ModuleList() + + kwargs_common = { + "d_model": dim, + "nhead": num_heads, + "dim_feedforward": hidden_dim, + "dropout": dropout, + "activation": activation, + "group_norm": group_norm, + "norm_first": norm_first, + "norm_out": norm_out, + "layer_scale": layer_scale, + "mask_type": mask_type, + "mask_random_seed": mask_random_seed, + "sparse_attn_window": sparse_attn_window, + "global_window": global_window, + "sparsity": sparsity, + "auto_sparsity": auto_sparsity, + "batch_first": True, + } + + kwargs_classic_encoder = dict(kwargs_common) + kwargs_classic_encoder.update({ + "sparse": sparse_self_attn, + }) + kwargs_cross_encoder = dict(kwargs_common) + kwargs_cross_encoder.update({ + "sparse": sparse_cross_attn, + }) + + for idx in range(num_layers): + if idx % 2 == self.classic_parity: + + self.layers.append(MyTransformerEncoderLayer(**kwargs_classic_encoder)) + self.layers_t.append( + MyTransformerEncoderLayer(**kwargs_classic_encoder) + ) + + else: + self.layers.append(CrossTransformerEncoderLayer(**kwargs_cross_encoder)) + + self.layers_t.append( + CrossTransformerEncoderLayer(**kwargs_cross_encoder) + ) + + def forward(self, x, xt): + B, C, Fr, T1 = x.shape + pos_emb_2d = create_2d_sin_embedding( + C, Fr, T1, x.device, self.max_period + ) # (1, C, Fr, T1) + pos_emb_2d = rearrange(pos_emb_2d, "b c fr t1 -> b (t1 fr) c") + x = rearrange(x, "b c fr t1 -> b (t1 fr) c") + x = self.norm_in(x) + x = x + self.weight_pos_embed * pos_emb_2d + + B, C, T2 = xt.shape + xt = rearrange(xt, "b c t2 -> b t2 c") # now T2, B, C + pos_emb = self._get_pos_embedding(T2, B, C, x.device) + pos_emb = rearrange(pos_emb, "t2 b c -> b t2 c") + xt = self.norm_in_t(xt) + xt = xt + self.weight_pos_embed * pos_emb + + for idx in range(self.num_layers): + if idx % 2 == self.classic_parity: + x = self.layers[idx](x) + xt = self.layers_t[idx](xt) + else: + old_x = x + x = self.layers[idx](x, xt) + xt = self.layers_t[idx](xt, old_x) + + x = rearrange(x, "b (t1 fr) c -> b c fr t1", t1=T1) + xt = rearrange(xt, "b t2 c -> b c t2") + return x, xt + + def _get_pos_embedding(self, T, B, C, device): + if self.emb == "sin": + shift = random.randrange(self.sin_random_shift + 1) + pos_emb = create_sin_embedding( + T, C, shift=shift, device=device, max_period=self.max_period + ) + elif self.emb == "cape": + if self.training: + pos_emb = create_sin_embedding_cape( + T, + C, + B, + device=device, + max_period=self.max_period, + mean_normalize=self.cape_mean_normalize, + augment=self.cape_augment, + max_global_shift=self.cape_glob_loc_scale[0], + max_local_shift=self.cape_glob_loc_scale[1], + max_scale=self.cape_glob_loc_scale[2], + ) + else: + pos_emb = create_sin_embedding_cape( + T, + C, + B, + device=device, + max_period=self.max_period, + mean_normalize=self.cape_mean_normalize, + augment=False, + ) + + elif self.emb == "scaled": + pos = torch.arange(T, device=device) + pos_emb = self.position_embeddings(pos)[:, None] + + return pos_emb + + def make_optim_group(self): + group = {"params": list(self.parameters()), 
"weight_decay": self.weight_decay} + if self.lr is not None: + group["lr"] = self.lr + return group + + +# Attention Modules + + +class MultiheadAttention(nn.Module): + def __init__( + self, + embed_dim, + num_heads, + dropout=0.0, + bias=True, + add_bias_kv=False, + add_zero_attn=False, + kdim=None, + vdim=None, + batch_first=False, + auto_sparsity=None, + ): + super().__init__() + assert auto_sparsity is not None, "sanity check" + self.num_heads = num_heads + self.q = torch.nn.Linear(embed_dim, embed_dim, bias=bias) + self.k = torch.nn.Linear(embed_dim, embed_dim, bias=bias) + self.v = torch.nn.Linear(embed_dim, embed_dim, bias=bias) + self.attn_drop = torch.nn.Dropout(dropout) + self.proj = torch.nn.Linear(embed_dim, embed_dim, bias) + self.proj_drop = torch.nn.Dropout(dropout) + self.batch_first = batch_first + self.auto_sparsity = auto_sparsity + + def forward( + self, + query, + key, + value, + key_padding_mask=None, + need_weights=True, + attn_mask=None, + average_attn_weights=True, + ): + + if not self.batch_first: # N, B, C + query = query.permute(1, 0, 2) # B, N_q, C + key = key.permute(1, 0, 2) # B, N_k, C + value = value.permute(1, 0, 2) # B, N_k, C + B, N_q, C = query.shape + B, N_k, C = key.shape + + q = ( + self.q(query) + .reshape(B, N_q, self.num_heads, C // self.num_heads) + .permute(0, 2, 1, 3) + ) + q = q.flatten(0, 1) + k = ( + self.k(key) + .reshape(B, N_k, self.num_heads, C // self.num_heads) + .permute(0, 2, 1, 3) + ) + k = k.flatten(0, 1) + v = ( + self.v(value) + .reshape(B, N_k, self.num_heads, C // self.num_heads) + .permute(0, 2, 1, 3) + ) + v = v.flatten(0, 1) + + if self.auto_sparsity: + assert attn_mask is None + x = dynamic_sparse_attention(q, k, v, sparsity=self.auto_sparsity) + else: + x = scaled_dot_product_attention(q, k, v, attn_mask, dropout=self.attn_drop) + x = x.reshape(B, self.num_heads, N_q, C // self.num_heads) + + x = x.transpose(1, 2).reshape(B, N_q, C) + x = self.proj(x) + x = self.proj_drop(x) + if not self.batch_first: + x = x.permute(1, 0, 2) + return x, None + + +def scaled_query_key_softmax(q, k, att_mask): + from xformers.ops import masked_matmul + q = q / (k.size(-1)) ** 0.5 + att = masked_matmul(q, k.transpose(-2, -1), att_mask) + att = torch.nn.functional.softmax(att, -1) + return att + + +def scaled_dot_product_attention(q, k, v, att_mask, dropout): + att = scaled_query_key_softmax(q, k, att_mask=att_mask) + att = dropout(att) + y = att @ v + return y + + +def _compute_buckets(x, R): + qq = torch.einsum('btf,bfhi->bhti', x, R) + qq = torch.cat([qq, -qq], dim=-1) + buckets = qq.argmax(dim=-1) + + return buckets.permute(0, 2, 1).byte().contiguous() + + +def dynamic_sparse_attention(query, key, value, sparsity, infer_sparsity=True, attn_bias=None): + # assert False, "The code for the custom sparse kernel is not ready for release yet." 
+ from xformers.ops import find_locations, sparse_memory_efficient_attention + n_hashes = 32 + proj_size = 4 + query, key, value = [x.contiguous() for x in [query, key, value]] + with torch.no_grad(): + R = torch.randn(1, query.shape[-1], n_hashes, proj_size // 2, device=query.device) + bucket_query = _compute_buckets(query, R) + bucket_key = _compute_buckets(key, R) + row_offsets, column_indices = find_locations( + bucket_query, bucket_key, sparsity, infer_sparsity) + return sparse_memory_efficient_attention( + query, key, value, row_offsets, column_indices, attn_bias) diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/utils.py b/AutoCoverTool/ref/music_remover/demucs/demucs/utils.py new file mode 100755 index 0000000..38ef120 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/utils.py @@ -0,0 +1,141 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. + +from collections import defaultdict +from contextlib import contextmanager +import math +import os +import tempfile +import typing as tp + +import torch +from torch.nn import functional as F +from torch.utils.data import Subset + + +def unfold(a, kernel_size, stride): + """Given input of size [*OT, T], output Tensor of size [*OT, F, K] + with K the kernel size, by extracting frames with the given stride. + + This will pad the input so that `F = ceil(T / K)`. + + see https://github.com/pytorch/pytorch/issues/60466 + """ + *shape, length = a.shape + n_frames = math.ceil(length / stride) + tgt_length = (n_frames - 1) * stride + kernel_size + a = F.pad(a, (0, tgt_length - length)) + strides = list(a.stride()) + assert strides[-1] == 1, 'data should be contiguous' + strides = strides[:-1] + [stride, 1] + return a.as_strided([*shape, n_frames, kernel_size], strides) + + +def center_trim(tensor: torch.Tensor, reference: tp.Union[torch.Tensor, int]): + """ + Center trim `tensor` with respect to `reference`, along the last dimension. + `reference` can also be a number, representing the length to trim to. + If the size difference != 0 mod 2, the extra sample is removed on the right side. + """ + ref_size: int + if isinstance(reference, torch.Tensor): + ref_size = reference.size(-1) + else: + ref_size = reference + delta = tensor.size(-1) - ref_size + if delta < 0: + raise ValueError("tensor must be larger than reference. " f"Delta is {delta}.") + if delta: + tensor = tensor[..., delta // 2:-(delta - delta // 2)] + return tensor + + +def pull_metric(history: tp.List[dict], name: str): + out = [] + for metrics in history: + metric = metrics + for part in name.split("."): + metric = metric[part] + out.append(metric) + return out + + +def EMA(beta: float = 1): + """ + Exponential Moving Average callback. + Returns a single function that can be called to repeatidly update the EMA + with a dict of metrics. The callback will return + the new averaged dict of metrics. + + Note that for `beta=1`, this is just plain averaging. 
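+
+    Illustrative usage (example added for clarity, not from upstream):
+
+        ema = EMA(beta=0.9)
+        ema({"loss": 1.0})  # -> {"loss": 1.0}
+        ema({"loss": 0.0})  # -> {"loss": ~0.47}, a weighted running average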
+ """ + fix: tp.Dict[str, float] = defaultdict(float) + total: tp.Dict[str, float] = defaultdict(float) + + def _update(metrics: dict, weight: float = 1) -> dict: + nonlocal total, fix + for key, value in metrics.items(): + total[key] = total[key] * beta + weight * float(value) + fix[key] = fix[key] * beta + weight + return {key: tot / fix[key] for key, tot in total.items()} + return _update + + +def sizeof_fmt(num: float, suffix: str = 'B'): + """ + Given `num` bytes, return human readable size. + Taken from https://stackoverflow.com/a/1094933 + """ + for unit in ['', 'Ki', 'Mi', 'Gi', 'Ti', 'Pi', 'Ei', 'Zi']: + if abs(num) < 1024.0: + return "%3.1f%s%s" % (num, unit, suffix) + num /= 1024.0 + return "%.1f%s%s" % (num, 'Yi', suffix) + + +@contextmanager +def temp_filenames(count: int, delete=True): + names = [] + try: + for _ in range(count): + names.append(tempfile.NamedTemporaryFile(delete=False).name) + yield names + finally: + if delete: + for name in names: + os.unlink(name) + + +def random_subset(dataset, max_samples: int, seed: int = 42): + if max_samples >= len(dataset): + return dataset + + generator = torch.Generator().manual_seed(seed) + perm = torch.randperm(len(dataset), generator=generator) + return Subset(dataset, perm[:max_samples].tolist()) + + +class DummyPoolExecutor: + class DummyResult: + def __init__(self, func, *args, **kwargs): + self.func = func + self.args = args + self.kwargs = kwargs + + def result(self): + return self.func(*self.args, **self.kwargs) + + def __init__(self, workers=0): + pass + + def submit(self, func, *args, **kwargs): + return DummyPoolExecutor.DummyResult(func, *args, **kwargs) + + def __enter__(self): + return self + + def __exit__(self, exc_type, exc_value, exc_tb): + return diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/wav.py b/AutoCoverTool/ref/music_remover/demucs/demucs/wav.py new file mode 100644 index 0000000..a0e2dd4 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/wav.py @@ -0,0 +1,243 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +"""Loading wav based datasets, including MusdbHQ.""" + +from collections import OrderedDict +import hashlib +import math +import json +import os +from pathlib import Path +import tqdm + +import musdb +import julius +import torch as th +from torch import distributed +import torchaudio as ta +from torch.nn import functional as F + +from .audio import convert_audio_channels +from . 
import distrib + +MIXTURE = "mixture" +EXT = ".wav" + + +def _track_metadata(track, sources, normalize=True, ext=EXT): + track_length = None + track_samplerate = None + mean = 0 + std = 1 + for source in sources + [MIXTURE]: + file = track / f"{source}{ext}" + try: + info = ta.info(str(file)) + except RuntimeError: + print(file) + raise + length = info.num_frames + if track_length is None: + track_length = length + track_samplerate = info.sample_rate + elif track_length != length: + raise ValueError( + f"Invalid length for file {file}: " + f"expecting {track_length} but got {length}.") + elif info.sample_rate != track_samplerate: + raise ValueError( + f"Invalid sample rate for file {file}: " + f"expecting {track_samplerate} but got {info.sample_rate}.") + if source == MIXTURE and normalize: + try: + wav, _ = ta.load(str(file)) + except RuntimeError: + print(file) + raise + wav = wav.mean(0) + mean = wav.mean().item() + std = wav.std().item() + + return {"length": length, "mean": mean, "std": std, "samplerate": track_samplerate} + + +def build_metadata(path, sources, normalize=True, ext=EXT): + """ + Build the metadata for `Wavset`. + + Args: + path (str or Path): path to dataset. + sources (list[str]): list of sources to look for. + normalize (bool): if True, loads full track and store normalization + values based on the mixture file. + ext (str): extension of audio files (default is .wav). + """ + + meta = {} + path = Path(path) + pendings = [] + from concurrent.futures import ThreadPoolExecutor + with ThreadPoolExecutor(8) as pool: + for root, folders, files in os.walk(path, followlinks=True): + root = Path(root) + if root.name.startswith('.') or folders or root == path: + continue + name = str(root.relative_to(path)) + pendings.append((name, pool.submit(_track_metadata, root, sources, normalize, ext))) + # meta[name] = _track_metadata(root, sources, normalize, ext) + for name, pending in tqdm.tqdm(pendings, ncols=120): + meta[name] = pending.result() + return meta + + +class Wavset: + def __init__( + self, + root, metadata, sources, + segment=None, shift=None, normalize=True, + samplerate=44100, channels=2, ext=EXT): + """ + Waveset (or mp3 set for that matter). Can be used to train + with arbitrary sources. Each track should be one folder inside of `path`. + The folder should contain files named `{source}.{ext}`. + + Args: + root (Path or str): root folder for the dataset. + metadata (dict): output from `build_metadata`. + sources (list[str]): list of source names. + segment (None or float): segment length in seconds. If `None`, returns entire tracks. + shift (None or float): stride in seconds bewteen samples. + normalize (bool): normalizes input audio, **based on the metadata content**, + i.e. the entire track is normalized, not individual extracts. + samplerate (int): target sample rate. if the file sample rate + is different, it will be resampled on the fly. + channels (int): target nb of channels. if different, will be + changed onthe fly. + ext (str): extension for audio files (default is .wav). + + samplerate and channels are converted on the fly. 
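+
+        Illustrative usage (example added for clarity, not from upstream):
+
+            sources = ["drums", "bass", "other", "vocals"]
+            meta = build_metadata(root, sources)
+            dset = Wavset(root, meta, sources, segment=10, shift=1)
+            example = dset[0]  # tensor of shape (len(sources), channels, time)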
+ """ + self.root = Path(root) + self.metadata = OrderedDict(metadata) + self.segment = segment + self.shift = shift or segment + self.normalize = normalize + self.sources = sources + self.channels = channels + self.samplerate = samplerate + self.ext = ext + self.num_examples = [] + for name, meta in self.metadata.items(): + track_duration = meta['length'] / meta['samplerate'] + if segment is None or track_duration < segment: + examples = 1 + else: + examples = int(math.ceil((track_duration - self.segment) / self.shift) + 1) + self.num_examples.append(examples) + + def __len__(self): + return sum(self.num_examples) + + def get_file(self, name, source): + return self.root / name / f"{source}{self.ext}" + + def __getitem__(self, index): + for name, examples in zip(self.metadata, self.num_examples): + if index >= examples: + index -= examples + continue + meta = self.metadata[name] + num_frames = -1 + offset = 0 + if self.segment is not None: + offset = int(meta['samplerate'] * self.shift * index) + num_frames = int(math.ceil(meta['samplerate'] * self.segment)) + wavs = [] + for source in self.sources: + file = self.get_file(name, source) + wav, _ = ta.load(str(file), frame_offset=offset, num_frames=num_frames) + wav = convert_audio_channels(wav, self.channels) + wavs.append(wav) + + example = th.stack(wavs) + example = julius.resample_frac(example, meta['samplerate'], self.samplerate) + if self.normalize: + example = (example - meta['mean']) / meta['std'] + if self.segment: + length = int(self.segment * self.samplerate) + example = example[..., :length] + example = F.pad(example, (0, length - example.shape[-1])) + return example + + +def get_wav_datasets(args, name='wav'): + """Extract the wav datasets from the XP arguments.""" + path = getattr(args, name) + sig = hashlib.sha1(str(path).encode()).hexdigest()[:8] + metadata_file = Path(args.metadata) / ('wav_' + sig + ".json") + train_path = Path(path) / "train" + valid_path = Path(path) / "valid" + if not metadata_file.is_file() and distrib.rank == 0: + metadata_file.parent.mkdir(exist_ok=True, parents=True) + train = build_metadata(train_path, args.sources) + valid = build_metadata(valid_path, args.sources) + json.dump([train, valid], open(metadata_file, "w")) + if distrib.world_size > 1: + distributed.barrier() + train, valid = json.load(open(metadata_file)) + if args.full_cv: + kw_cv = {} + else: + kw_cv = {'segment': args.segment, 'shift': args.shift} + train_set = Wavset(train_path, train, args.sources, + segment=args.segment, shift=args.shift, + samplerate=args.samplerate, channels=args.channels, + normalize=args.normalize) + valid_set = Wavset(valid_path, valid, [MIXTURE] + list(args.sources), + samplerate=args.samplerate, channels=args.channels, + normalize=args.normalize, **kw_cv) + return train_set, valid_set + + +def _get_musdb_valid(): + # Return musdb valid set. 
+ import yaml + setup_path = Path(musdb.__path__[0]) / 'configs' / 'mus.yaml' + setup = yaml.safe_load(open(setup_path, 'r')) + return setup['validation_tracks'] + + +def get_musdb_wav_datasets(args): + """Extract the musdb dataset from the XP arguments.""" + sig = hashlib.sha1(str(args.musdb).encode()).hexdigest()[:8] + metadata_file = Path(args.metadata) / ('musdb_' + sig + ".json") + root = Path(args.musdb) / "train" + if not metadata_file.is_file() and distrib.rank == 0: + metadata_file.parent.mkdir(exist_ok=True, parents=True) + metadata = build_metadata(root, args.sources) + json.dump(metadata, open(metadata_file, "w")) + if distrib.world_size > 1: + distributed.barrier() + metadata = json.load(open(metadata_file)) + + valid_tracks = _get_musdb_valid() + if args.train_valid: + metadata_train = metadata + else: + metadata_train = {name: meta for name, meta in metadata.items() if name not in valid_tracks} + metadata_valid = {name: meta for name, meta in metadata.items() if name in valid_tracks} + if args.full_cv: + kw_cv = {} + else: + kw_cv = {'segment': args.segment, 'shift': args.shift} + train_set = Wavset(root, metadata_train, args.sources, + segment=args.segment, shift=args.shift, + samplerate=args.samplerate, channels=args.channels, + normalize=args.normalize) + valid_set = Wavset(root, metadata_valid, [MIXTURE] + list(args.sources), + samplerate=args.samplerate, channels=args.channels, + normalize=args.normalize, **kw_cv) + return train_set, valid_set diff --git a/AutoCoverTool/ref/music_remover/demucs/demucs/wdemucs.py b/AutoCoverTool/ref/music_remover/demucs/demucs/wdemucs.py new file mode 100644 index 0000000..60ec8d0 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/demucs/wdemucs.py @@ -0,0 +1,9 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. +# For compat +from .hdemucs import HDemucs + +WDemucs = HDemucs diff --git a/AutoCoverTool/ref/music_remover/demucs/docs/linux.md b/AutoCoverTool/ref/music_remover/demucs/docs/linux.md new file mode 100644 index 0000000..482ab5d --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/docs/linux.md @@ -0,0 +1,28 @@ +# Linux support for Demucs + +If your distribution has at least Python 3.7, and you just wish to separate +tracks with Demucs, not train it, you can just run + +```bash +pip3 install --user -U demucs +# Then anytime you want to use demucs, just do +python3 -m demucs -d cpu PATH_TO_AUDIO_FILE_1 +# If you have added the user specific pip bin/ folder to your path, you can also do +demucs -d cpu PATH_TO_AUDIO_FILE_1 +``` + +If Python is too old, or you want to be able to train, I recommend [installing Miniconda][miniconda], with Python 3.7 or more. + +```bash +conda activate +pip3 install -U demucs +# Then anytime you want to use demucs, first do conda activate, then +demucs -d cpu PATH_TO_AUDIO_FILE_1 +``` + +Of course, you can also use a specific env for Demucs. + +**Important, torchaudio 0.12 update:** Torchaudio no longer supports decoding mp3s without ffmpeg installed. You must have ffmpeg installed, either through Anaconda (`conda install ffmpeg -c conda-forge`) or as a distribution package (e.g. `sudo apt-get install ffmpeg`). 
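+
+If you are unsure whether ffmpeg is visible from your environment, running `ffmpeg -version` from the same shell is a quick sanity check (an illustrative tip, not from the original docs).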
+
+
+[miniconda]: https://docs.conda.io/en/latest/miniconda.html#linux-installers
diff --git a/AutoCoverTool/ref/music_remover/demucs/docs/mac.md b/AutoCoverTool/ref/music_remover/demucs/docs/mac.md
new file mode 100644
index 0000000..6e6c3d0
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/docs/mac.md
@@ -0,0 +1,28 @@
+# Mac OS X support for Demucs
+
+If you have a sufficiently recent version of OS X, you can just run
+
+```bash
+python3 -m pip install --user -U demucs
+# Then anytime you want to use demucs, just do
+python3 -m demucs -d cpu PATH_TO_AUDIO_FILE_1
+# If you have added the user specific pip bin/ folder to your path, you can also do
+demucs -d cpu PATH_TO_AUDIO_FILE_1
+```
+
+If you do not already have Anaconda installed or much experience with the terminal on Mac OS X, here are some detailed instructions:
+
+1. Download [Anaconda 3.8 (or more recent) 64-bit for macOS][anaconda].
+2. Open [Anaconda Prompt in macOS][prompt].
+3. Follow these commands:
+```bash
+conda activate
+pip3 install -U demucs
+# Then anytime you want to use demucs, first do conda activate, then
+demucs -d cpu PATH_TO_AUDIO_FILE_1
+```
+
+**Important, torchaudio 0.12 update:** Torchaudio no longer supports decoding mp3s without ffmpeg installed. You must have ffmpeg installed, either through Anaconda (`conda install ffmpeg -c conda-forge`) or with Homebrew for instance (`brew install ffmpeg`).
+
+[anaconda]: https://www.anaconda.com/distribution/#download-section
+[prompt]: https://docs.anaconda.com/anaconda/user-guide/getting-started/#open-nav-mac
diff --git a/AutoCoverTool/ref/music_remover/demucs/docs/mdx.md b/AutoCoverTool/ref/music_remover/demucs/docs/mdx.md
new file mode 100644
index 0000000..2a20f9c
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/docs/mdx.md
@@ -0,0 +1,73 @@
+# Music DemiXing challenge (MDX)
+
+If you want to use Demucs for the [MDX challenge](https://www.aicrowd.com/challenges/music-demixing-challenge-ismir-2021),
+please follow the instructions hereafter.
+
+## Installing Demucs
+
+Follow the instructions from the [main README](https://github.com/facebookresearch/demucs#requirements)
+in order to set up Demucs using Anaconda. You will need the full setup for training, including soundstretch.
+
+## Getting MusDB-HQ
+
+Download [MusDB-HQ](https://zenodo.org/record/3338373) to some folder and unzip it.
+
+## Training Demucs
+
+Train Demucs (you might need to change the batch size depending on the number of GPUs available).
+It seems 48 channels are enough to get the best performance on MusDB-HQ, and training will be faster
+and less memory demanding. In any case, the 64 channel version times out on the challenge.
+```bash
+./run.py --channels=48 --batch_size 64 --musdb=PATH_TO_MUSDB --is_wav [EXTRA_FLAGS]
+```
+
+### Post training
+
+Once the training is completed, a new model file will be exported in `models/`.
+
+You can look at the SDR on the MusDB dataset using `python result_table.py`.
+
+
+### Evaluate and export a model before training is over
+
+If you want to export a model before training is complete, use the following command:
+```bash
+python -m demucs [ALL EXACT TRAINING FLAGS] --save_model
+```
+You can also pass the `--half` flag, in order to save weights in half precision. This will halve the model size and won't impact SDR.
+
+Once this is done, you can partially evaluate a model with
+```bash
+./run.py --test NAME_OF_MODEL.th --musdb=PATH_TO_MUSDB --is_wav
+```
+
+**Note:** `NAME_OF_MODEL.th` is given relative to the models folder (given by `--models`, defaults to `models/`), so don't include the folder in the name.
+
+
+### Training smaller models
+
+If you want to quickly test an idea, I would recommend training a 16 kHz model and checking whether things work there, before training the full 44.1 kHz model. You can train one of those with
+```bash
+./run.py --channels=32 --samplerate 16000 --samples 160000 --data_stride 16000 --depth=5 --batch_size 64 --repitch=0 --musdb=PATH_TO_MUSDB --is_wav [EXTRA_FLAGS]
+```
+(repitch must be turned off, because things will break at 16 kHz).
+
+## Submitting your model
+
+1. Git clone [the Music Demixing Challenge - Starter Kit - Demucs Edition](https://github.com/adefossez/music-demixing-challenge-starter-kit).
+2. Inside the starter kit, create a `models/` folder and copy over the trained model from the Demucs repo (renaming it, for instance, to `my_model.th`).
+3. Inside the `test_demuc.py` file, change the function `prediction_setup`: comment out the loading
+of the pre-trained model, and uncomment the code to load your own model.
+4. Edit the file `aicrowd.json` with your username.
+5. Install [git-lfs](https://git-lfs.github.com/). Then run
+
+```bash
+git lfs install
+git add models/
+git add -u .
+git commit -m "My Demucs submission"
+```
+6. Follow the [submission instructions](https://github.com/AIcrowd/music-demixing-challenge-starter-kit/blob/master/docs/SUBMISSION.md).
+
+Best of luck 🤞
diff --git a/AutoCoverTool/ref/music_remover/demucs/docs/release.md b/AutoCoverTool/ref/music_remover/demucs/docs/release.md
new file mode 100644
index 0000000..b5343ca
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/docs/release.md
@@ -0,0 +1,80 @@
+# Release notes for Demucs
+
+
+## V4.0.0a, TBC
+
+Added the Hybrid Transformer Demucs model.
+
+Added support for the [Torchaudio implementation of HDemucs](https://pytorch.org/audio/main/tutorials/hybrid_demucs_tutorial.html), thanks @skim0514.
+
+## V3.0.6, 16th of November 2022
+
+Option to customize the output path of stems (@CarlGao4).
+
+Fixed a bug in pad1d that occasionally led to failures.
+
+## V3.0.5, 17th of August 2022
+
+Added a `--segment` flag to customize the segment length and use less memory (thanks @CarlGao4).
+
+Fixed a reflect padding bug on small inputs.
+
+Compatible with PyTorch 1.12.
+
+## V3.0.4, 24th of February 2022
+
+Added an option to split into two stems (i.e. vocals vs. non-vocals), thanks to @CarlGao4.
+
+Added `--float32`, `--int24` and `--clip-mode` options to customize how output stems are saved.
+
+## V3.0.3, 2nd of December 2021
+
+Fixed a bug in the weights used for different sources. Thanks @keunwoochoi for the report and fix.
+
+Drastically improved memory usage on GPU for long files. Thanks a lot @famzah for providing this.
+
+Added multithreaded evaluation on CPU (`-j` option).
+
+(v3.0.2 had a bug with the CPU pool and is skipped.)
+
+## V3.0.1, 12th of November 2021
+
+Release of Demucs v3, featuring hybrid domain separation and much more.
+This drops support for Conv-Tasnet and training on the non-HQ MusDB dataset.
+There is no version 3.0.0 because I messed up.
+
+## V2.0.2, 26th of May 2021
+
+- Fix in Tasnet (PR #178)
+- Use ffmpeg in priority when available instead of torchaudio, to avoid a small shift in MP3 data.
+- Other minor fixes.
+
+## v2.0.1, 11th of May 2021
+
+MusDB HQ support added. Custom wav dataset support added.
+Minor changes: there was an issue with padding when reading mp3s with torchaudio; to limit it,
+Demucs now uses ffmpeg in priority and falls back to torchaudio.
+Replaced the pre-trained demucs model with one trained on a more recent codebase.
+
+## v2.0.0, 28th of April 2021
+
+This is a big release, with a lot of breaking changes. You will likely
+need to install Demucs from scratch.
+
+
+
+- Demucs now supports on the fly resampling by a factor of 2.
+This improves SDR by almost 0.3 points.
+- Random scaling of each source added (from Uhlich et al. 2017).
+- Random pitch and tempo augmentation added, from [Cohen-Hadria et al. 2019].
+- With extra augmentation, the best performing Demucs model now has only 64 channels
+instead of 100, so model size goes from 2.4GB to 1GB. Also SDR is up from 5.6 to 6.3 when trained only on MusDB.
+- Quantized model using [DiffQ](https://github.com/facebookresearch/diffq) has been added. Model size is 150MB, with no loss in quality as far as I, or the metrics,
+can tell.
+- Pretrained models are now using the TorchHub interface.
+- Overlap mode for separation, to limit inconsistencies at
+ frame boundaries, with a linear transition over the overlap. Overlap is currently
+ at 25%. Note that this is only done for separation, not training, because
+ I added it quite late to the code. For Conv-TasNet this can improve
+ SDR quite a bit (+0.3 points, to 6.0).
+- PyPI hosting, for separation, not training!
diff --git a/AutoCoverTool/ref/music_remover/demucs/docs/training.md b/AutoCoverTool/ref/music_remover/demucs/docs/training.md
new file mode 100644
index 0000000..87e73ca
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/docs/training.md
@@ -0,0 +1,290 @@
+# Training (Hybrid) Demucs
+
+## Install all the dependencies
+
+You should install all the dependencies either with Anaconda (using the env file `environment-cuda.yml`)
+or with `pip`, using `requirements.txt`.
+
+## Datasets
+
+### MusDB HQ
+
+Note that we do not support MusDB non-HQ training anymore.
+Get the [Musdb HQ](https://zenodo.org/record/3338373) dataset, and update the path to it in two places:
+- The `dset.musdb` key inside `conf/config.yaml`.
+- The variable `MUSDB_PATH` inside `tools/automix.py`.
+
+### Create the fine tuning datasets
+
+**This is only for the MDX 2021 competition models**
+
+I use fine tuning on a dataset crafted by remixing songs in a musically plausible way.
+The automix script will make sure that BPM, first beat and pitches are aligned.
+In the file `tools/automix.py`, edit `OUTPATH` to suit your setup, as well as the `MUSDB_PATH`
+to point to your copy of MusDB HQ. Then run
+
+```bash
+export NUMBA_NUM_THREADS=1; python3 -m tools.automix
+```
+
+**Important:** the script will show many errors; those are normal. They just indicate when two stems
+ do not match due to BPM or musical scale differences.
+
+Finally, edit the file `conf/dset/auto_mus.yaml` and set `dset.wav` to the value of `OUTPATH`.
+
+If you have a custom dataset, you can also uncomment the lines `dset2 = ...` and
+`dset3 = ...` to add your custom wav data and the test set of MusDB for Track B models.
+You can then replace the paths in `conf/dset/auto_extra.yaml`, `conf/dset/auto_extra_test.yaml`
+and `conf/dset/aetl.yaml` (this last one uses 10 mixes instead of 6 for each song).
+
+### Dataset metadata cache
+
+Datasets are scanned the first time they are used to determine the files and their durations.
+If you change a dataset and need a rescan, just delete the `metadata` folder.
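+
+If you ever need to rebuild this cache by hand, here is a minimal sketch (added for illustration; the paths and output filename are placeholders) using the `build_metadata` helper from `demucs/wav.py`:
+
+```python
+import json
+from pathlib import Path
+
+from demucs.wav import build_metadata
+
+sources = ["drums", "bass", "other", "vocals"]
+meta = build_metadata(Path("/path/to/musdbhq/train"), sources)
+# Assumes the metadata/ folder already exists.
+json.dump(meta, open("metadata/manual_rescan.json", "w"))
+```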
+
+## A short intro to Dora
+
+I use [Dora][dora] to manage all of the experiments (XPs). You should have a look at the Dora README
+to learn about the tool. Here is a quick summary of what to know:
+
+- An XP is a unique set of hyper-parameters with a given signature. The signature is a hash of
+  those hyper-parameters. I will always refer to an XP by its signature, e.g. `9357e12e`.
+  We will see later that you can retrieve the hyper-params and re-run it in a single command.
+- In fact, the hash is defined as a delta between the base config and the one obtained with
+  the config overrides you passed from the command line.
+  **This means you must never change the `conf/**.yaml` files directly**,
+  except for editing things like paths. Changing the default values in the config files means
+  the XP signature won't reflect that change, and wrong checkpoints might be reused.
+  I know, this is annoying, but the reason is that otherwise, any change to the config file would
+  mean that all XPs run so far would see their signature change.
+
+### Dora commands
+
+Run `tar xvf outputs.tar.gz`. This will initialize the Dora XP repository, so that Dora knows
+which hyper-params match a signature like `9357e12e`. Once you have done that, you should be able
+to run the following:
+
+```bash
+dora info -f 81de367c # this will show the hyper-parameters used by a specific XP.
+                      # Be careful: some overrides might be present twice, and the right-most one
+                      # will give you the right value for it.
+dora run -d -f 81de367c # run an XP with the hyper-parameters from XP 81de367c.
+                        # `-d` is for distributed, it will use all available GPUs.
+dora run -d -f 81de367c hdemucs.channels=32 # start from the config of XP 81de367c but change some hyper-params.
+                                            # This will give you a new XP with a new signature (here 3fe9c332).
+```
+
+An XP runs from a specific folder based on its signature, by default under the `outputs/` folder.
+You can safely interrupt a training and resume it; it will reuse any existing checkpoint, as it will
+reuse the same folder.
+If you made some change to the code and need to ignore a previous checkpoint, you can use `dora run --clear [RUN ARGS]`.
+
+If you have a Slurm cluster, you can also use the `dora grid` command, e.g. `dora grid mdx`.
+Please refer to the [Dora documentation][dora] for more information.
+
+## Hyper parameters
+
+Have a look at [conf/config.yaml](../conf/config.yaml) for a list of all the hyper-parameters you can override.
+If you are not familiar with [Hydra](https://github.com/facebookresearch/hydra), go check out their page
+to get familiar with how to provide overrides for your trainings.
+
+
+## Model architecture
+
+A number of architectures are supported. You can select one with `model=NAME`, and have a look
+in [conf/config.yaml](../conf/config.yaml) for each architecture's specific hyperparams.
+Those specific params will always be prefixed with the architecture name when passing the override
+from the command line or in grid files. Here is the list of models:
+
+- demucs: original time-only Demucs.
+- hdemucs: Hybrid Demucs (v3).
+- torch_hdemucs: same as Hybrid Demucs, but using the [torchaudio official implementation](https://pytorch.org/audio/stable/tutorials/hybrid_demucs_tutorial.html).
+- htdemucs: Hybrid Transformer Demucs (v4).
+
+### Storing config in files
+
+As mentioned earlier, you should never change the base config files. However, you can use Hydra config groups
+in order to store variants you often use.
+If you want to create a new variant combining multiple hyper-params,
+copy the file `conf/variant/example.yaml` to `conf/variant/my_variant.yaml`, and then you can use it with
+
+```bash
+dora train -d variant=my_variant
+```
+
+Once you have started training models with this file, you should no longer edit it.
+
+
+## Fine tuning
+
+Once a first model is trained, you can fine tune it with other settings (e.g. the automix dataset) with
+
+```bash
+dora run -d -f 81de367c continue_from=81de367c dset=auto_mus variant=finetune
+```
+
+Note that you need both `-f 81de367c` and `continue_from=81de367c`. The first one indicates
+that the hyper-params of `81de367c` should be used as a starting point for the config.
+The second indicates that the weights from `81de367c` should be used as a starting point for the solver.
+
+
+## Model evaluation
+
+Your model will be evaluated automatically with the new SDR definition from MDX every 20 epochs.
+Old style SDR (which is quite slow) will only be computed at the end of training.
+
+## Model Export
+
+
+In order to use your models with other commands (such as the `demucs` command for separation) you must
+export them. For that, run
+
+```bash
+python3 -m tools.export 9357e12e [OTHER SIGS ...] # replace with the appropriate signatures.
+```
+
+The models will be stored under `release_models/`. You can use them with the `demucs` separation command with the following flags:
+```bash
+demucs --repo ./release_models -n 9357e12e my_track.mp3
+```
+
+### Bag of models
+
+If you want to combine multiple models, potentially with different weights for each source, you can copy
+`demucs/remote/mdx.yaml` to `./release_models/my_bag.yaml`. You can then edit the list of models (all models used should have been exported first) and the weights per source and model (a list of lists, the outer list over models, the inner list over sources). You can then use your bag of models as
+
+```bash
+demucs --repo ./release_models -n my_bag my_track.mp3
+```
+
+## Evaluating pre-trained models
+
+You can evaluate any pre-trained model or bag of models using the following command:
+```bash
+python3 -m tools.test_pretrained -n NAME_OF_MODEL [EXTRA ARGS]
+```
+where `NAME_OF_MODEL` is either the name of the bag (e.g. `mdx`, `repro_mdx_a`),
+or a single Dora signature of one of the models in the bag. You can pass `EXTRA ARGS` to customize
+the test options, like the number of random shifts (e.g. `test.shifts=2`). This will compute the old-style
+SDR and can take quite a bit of time.
+
+For custom models that were trained locally, you will need to indicate that you wish
+to use the local model repository, with the `--repo ./release_models` flag, e.g.,
+```bash
+python3 -m tools.test_pretrained --repo ./release_models -n my_bag
+```
+
+
+## API to retrieve the model
+
+You can retrieve officially released models in Python using the following API:
+```python
+from demucs import pretrained
+from demucs.apply import apply_model
+bag = pretrained.get_model('htdemucs') # for a bag of models or a named model
+                                       # (which is just a bag with 1 model).
+model = pretrained.get_model('955717e8') # using the signature for single models.
+
+bag.models # list of individual models
+stems = apply_model(model, mix) # apply the model to the given mix.
+```
+
+## Model Zoo
+
+### Hybrid Transformer Demucs
+
+The configurations for the Hybrid Transformer models are available in:
+
+```shell
+dora grid mmi --dry_run --init
+dora grid mmi_ft --dry_run --init # fine tuned on each source.
+```
+
+We release in particular `955717e8`, a Hybrid Transformer Demucs using 5 layers, 512 channels and a 10 second training segment length. We also release its fine tuned version, with one model
+for each source: `f7e0c4bc`, `d12395a8`, `92cfc3b6`, `04573f0d` (drums, bass, other, vocals).
+The model `955717e8` is also named `htdemucs`, while the bag of models is provided
+as `htdemucs_ft`.
+
+We also release `75fc33f5`, a regular Hybrid Demucs trained on the same dataset,
+available as `hdemucs_mmi`.
+
+
+
+### Models from the MDX Competition 2021
+
+
+Here is a short description of the models used for the MDX submission, either Track A (MusDB HQ only)
+or Track B (extra training data allowed). Training happens in two stages, with the second stage
+being the fine tuning on the automix-generated dataset.
+All the fine tuned models are available on our AWS repository
+(you can retrieve them with `demucs.pretrained.get_model(SIG)`). The bags of models are available
+by doing `demucs.pretrained.get_model(NAME)` with `NAME` being either `mdx` (for Track A) or `mdx_extra`
+(for Track B).
+
+#### Track A
+
+The 4 models are:
+
+- `0d19c1c6`: fine-tuned on the automix dataset from `9357e12e`
+- `7ecf8ec1`: fine-tuned on the automix dataset from `e312f349`
+- `c511e2ab`: fine-tuned on the automix dataset from `81de367c`
+- `7d865c68`: fine-tuned on the automix dataset from `80a68df8`
+
+The 4 initial models (before fine tuning) are:
+
+- `9357e12e`: 64ch time domain only improved Demucs, with new residual branches, group norm,
+  and singular value penalty.
+- `e312f349`: 64ch time domain only improved Demucs, with new residual branches, group norm,
+  and singular value penalty, trained with a loss that focuses only on drums and bass.
+- `81de367c`: 48ch hybrid model, with residual branches, group norm,
+  singular value penalty and amplitude spectrogram.
+- `80a68df8`: same as b5559babb but using CaC and a different
+  random seed, as well as different weights per frequency band in the outermost layers.
+
+The hybrid models are combined with equal weights for all sources except for the bass.
+`0d19c1c6` (time domain) is used for both drums and bass. `7ecf8ec1` is used only for the bass.
+
+You can see all the hyper-parameters at once (one common line for all shared hyper-params, then only
+the hyper-parameters that differ), along with the DiffQ variants that are used for the `mdx_q` models, with:
+```
+dora grid mdx --dry_run --init
+dora grid mdx_q --dry_run --init
+```
+
+#### Track B
+
+- `e51eebcc`
+- `a1d90b5c`
+- `5d2d6c55`
+- `cfa93e08`
+
+All the models are 48ch hybrid demucs with different random seeds. Two of them
+use CaC, and two use amplitude spectrograms with masking.
+All the models are combined with equal weights for all sources.
+
+Things are a bit messy for Track B: there was a lot of fine tuning
+over different datasets. I won't describe the entire genealogy of models here,
+but all the information can be accessed with the `dora info -f SIG` command.
+
+Similarly, you can run the following (the output will contain a few extra lines, for training without the MusDB test set, and extra DiffQ XPs):
+```
+dora grid mdx_extra --dry_run --init
+```
+
+### Reproducibility and Ablation
+
+I updated the paper to report numbers with a more homogeneous setup than the one used for the competition.
+On MusDB HQ, I still need to use a combination of time only and hybrid models to achieve the best performance.
+The experiments are provided in the grids [repro.py](../demucs/grids/repro.py) and
+[repro_ft.py](../demucs/grids/repro_ft.py) for the fine tuning on the realistic mix datasets.
+
+The new bag of models reaches an SDR of 7.64 (vs. 7.68 for the original track A model). It uses
+2 time only models trained with residual branches, local attention and the SVD penalty,
+along with 2 hybrid models, with the same features, and using the CaC representation.
+We average the performance of all the models with the same weight over all sources, unlike
+what was done for the original track A model. We trained for 600 epochs, against 360 before.
+
+The new bag of models is available as part of the pretrained models as `repro_mdx_a`.
+The time only bag is named `repro_mdx_a_time_only`, and the hybrid only one `repro_mdx_a_hybrid_only`.
+Check out the paper for more information on the training.
+
+[dora]: https://github.com/facebookresearch/dora
diff --git a/AutoCoverTool/ref/music_remover/demucs/docs/windows.md b/AutoCoverTool/ref/music_remover/demucs/docs/windows.md
new file mode 100644
index 0000000..36ec05d
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/docs/windows.md
@@ -0,0 +1,58 @@
+# Windows support for Demucs
+
+## Installation and usage
+
+Parts of the code are untested on Windows (in particular, training a new model). If you don't have much experience with Anaconda, Python or the shell, here are more detailed instructions. Note that **Demucs is not supported on 32-bit systems** (as PyTorch is not available there).
+
+- First install Anaconda with **Python 3.7** or more recent, which you can find [here][install].
+- Start the [Anaconda prompt][prompt].
+
+Then, all commands that follow must be run from this prompt.
+
+### If you want to use your GPU
+
+If you have a graphics card made by Nvidia with more than 6 GiB of memory, you can separate tracks with GPU acceleration. To achieve this, you must install PyTorch with CUDA. If PyTorch was already installed (you already installed Demucs for instance), first run `python.exe -m pip uninstall torch torchaudio`.
+Then visit the [PyTorch Home Page](https://pytorch.org/get-started/locally/) and follow the guide on it to install with CUDA support.
+
+### Installation
+
+Start the Anaconda prompt, and run the following:
+```
+conda install -c conda-forge ffmpeg
+python.exe -m pip install -U demucs PySoundFile
+```
+
+### Upgrade
+
+To upgrade Demucs, simply run `python.exe -m pip install -U demucs`, from the Anaconda prompt.
+
+### Usage
+
+Then to use Demucs, just start the **Anaconda prompt** and run:
+```
+demucs -d cpu "PATH_TO_AUDIO_FILE_1" ["PATH_TO_AUDIO_FILE_2" ...]
+```
+The `"` around the filename are required if the path contains spaces.
+The separated files will be under `C:\Users\YOUR_USERNAME\demucs\separated\demucs\`.
+
+
+### Separating an entire folder
+
+You can use the following command to separate an entire folder of mp3s for instance (replace the extension `.mp3` if need be for other file types):
+```
+cd FOLDER
+for %i in (*.mp3) do (demucs -d cpu "%i")
+```
+
+
+## Potential errors
+
+If you have an error saying that `mkl_intel_thread.dll` cannot be found, you can try to first run
+`conda install -c defaults intel-openmp -f`. Then try again to run the `demucs` command. If it still doesn't work, you can try to run first `set CONDA_DLL_SEARCH_MODIFICATION_ENABLE=1`, then again the `demucs` command and hopefully it will work 🙏.
+
+**If you get a permission error**, please try starting the Anaconda Prompt as administrator.
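+
+When debugging GPU issues, it can also help to confirm that PyTorch actually sees your graphics card, e.g. with `python.exe -c "import torch; print(torch.cuda.is_available())"` (an illustrative check, not from the original docs).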
+
+
+[install]: https://www.anaconda.com/distribution/#windows
+[prompt]: https://docs.anaconda.com/anaconda/user-guide/getting-started/#open-prompt-win
diff --git a/AutoCoverTool/ref/music_remover/demucs/environment-cpu.yml b/AutoCoverTool/ref/music_remover/demucs/environment-cpu.yml
new file mode 100644
index 0000000..f921d56
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/environment-cpu.yml
@@ -0,0 +1,28 @@
+name: demucs
+
+channels:
+  - pytorch
+  - conda-forge
+
+dependencies:
+  - python>=3.7,<3.10
+  - ffmpeg>=4.2
+  - pytorch>=1.8.1
+  - torchaudio>=0.8
+  - tqdm>=4.36
+  - pip
+  - pip:
+    - diffq>=0.2
+    - dora-search
+    - einops
+    - hydra-colorlog>=1.1
+    - hydra-core>=1.1
+    - julius>=0.2.3
+    - lameenc>=1.2
+    - openunmix
+    - musdb>=0.4.0
+    - museval>=0.4.0
+    - soundfile
+    - submitit
+    - treetable>=0.2.3
+
diff --git a/AutoCoverTool/ref/music_remover/demucs/environment-cuda.yml b/AutoCoverTool/ref/music_remover/demucs/environment-cuda.yml
new file mode 100644
index 0000000..abbd258
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/environment-cuda.yml
@@ -0,0 +1,28 @@
+name: demucs
+
+channels:
+  - pytorch
+  - conda-forge
+
+dependencies:
+  - python>=3.7,<3.10
+  - ffmpeg>=4.2
+  - pytorch>=1.8.1
+  - torchaudio>=0.8
+  - cudatoolkit>=10
+  - tqdm>=4.36
+  - pip
+  - pip:
+    - diffq>=0.2
+    - dora-search
+    - einops
+    - hydra-colorlog>=1.1
+    - hydra-core>=1.1
+    - julius>=0.2.3
+    - lameenc>=1.2
+    - openunmix
+    - musdb>=0.4.0
+    - museval>=0.4.0
+    - soundfile
+    - submitit
+    - treetable>=0.2.3
diff --git a/AutoCoverTool/ref/music_remover/demucs/hubconf.py b/AutoCoverTool/ref/music_remover/demucs/hubconf.py
new file mode 100644
index 0000000..4e64777
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/hubconf.py
@@ -0,0 +1,11 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+
+dependencies = ['dora-search', 'diffq', 'julius', 'lameenc', 'openunmix', 'pyyaml',
+                'torch', 'torchaudio', 'tqdm']
+
+from demucs.pretrained import get_model
+
diff --git a/AutoCoverTool/ref/music_remover/demucs/mypy.ini b/AutoCoverTool/ref/music_remover/demucs/mypy.ini
new file mode 100644
index 0000000..c4e17f1
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/mypy.ini
@@ -0,0 +1,5 @@
+[mypy]
+
+[mypy-treetable,torchaudio.*,diffq,yaml,tqdm,lameenc,musdb,museval,openunmix.*,einops,xformers.*]
+ignore_missing_imports = True
+
diff --git a/AutoCoverTool/ref/music_remover/demucs/outputs.tar.gz b/AutoCoverTool/ref/music_remover/demucs/outputs.tar.gz
new file mode 100644
index 0000000..51933ac
Binary files /dev/null and b/AutoCoverTool/ref/music_remover/demucs/outputs.tar.gz differ
diff --git a/AutoCoverTool/ref/music_remover/demucs/readme.txt b/AutoCoverTool/ref/music_remover/demucs/readme.txt
new file mode 100644
index 0000000..7a33a51
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/readme.txt
@@ -0,0 +1,21 @@
+Music separation tool
+
+Overview:
+    demucs source repository: https://github.com/facebookresearch/demucs
+    This code was pulled directly from the repository above, using the main branch as of Mon Nov 21.
+
+Main changes:
+    Added the separate_interface.py wrapper, which takes an audio file and generates the accompaniment file.
+
+Environment setup:
+    1. Basic GPU environment setup:
+       https://phabricator.ushow.media/w/%E9%9F%B3%E8%A7%86%E9%A2%91%E7%BB%84%E6%96%87%E6%A1%A3/%E7%8E%AF%E5%A2%83%E5%AE%89%E8%A3%85/gpu%E7%8E%AF%E5%A2%83%E5%AE%89%E8%A3%85/
+    2. Install the demucs environment:
+       conda create -n demucs python==3.7
+    3. Install the standard_audio binary:
+       the source lives at av_cv_research/tools/music_remover/standard_audio;
+       after building and installing, place it at /opt/soft/bin/standard_audio
+
+Quick start (server side):
+    python3 separate_interface.py xishuashua.mp4 xishuashua.m4a
+    xishuashua.mp4 is 3 min 36 s long; the average runtime over 3 runs is 27.33 s
diff --git a/AutoCoverTool/ref/music_remover/demucs/requirements.txt b/AutoCoverTool/ref/music_remover/demucs/requirements.txt
new file mode 100644
index 0000000..c263020
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/requirements.txt
@@ -0,0 +1,19 @@
+# please make sure you already have a pytorch install that is cuda enabled!
+dora-search
+diffq>=0.2.1
+einops
+flake8
+hydra-colorlog>=1.1
+hydra-core>=1.1
+julius>=0.2.3
+lameenc>=1.2
+museval
+mypy
+openunmix
+pyyaml
+submitit
+torch>=1.8.1
+torchaudio>=0.8
+tqdm
+treetable
+soundfile>=0.10.3;sys_platform=="win32"
diff --git a/AutoCoverTool/ref/music_remover/demucs/requirements_minimal.txt b/AutoCoverTool/ref/music_remover/demucs/requirements_minimal.txt
new file mode 100644
index 0000000..f1ccb05
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/requirements_minimal.txt
@@ -0,0 +1,11 @@
+# please make sure you already have a pytorch install that is cuda enabled!
+dora-search
+diffq>=0.2.1
+einops
+julius>=0.2.3
+lameenc>=1.2
+openunmix
+pyyaml
+torch>=1.8.1
+torchaudio>=0.8
+tqdm
diff --git a/AutoCoverTool/ref/music_remover/demucs/setup.cfg b/AutoCoverTool/ref/music_remover/demucs/setup.cfg
new file mode 100644
index 0000000..d54d56a
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/setup.cfg
@@ -0,0 +1,8 @@
+[pep8]
+max-line-length = 100
+
+[flake8]
+max-line-length = 100
+
+[yapf]
+column_limit = 100
diff --git a/AutoCoverTool/ref/music_remover/demucs/setup.py b/AutoCoverTool/ref/music_remover/demucs/setup.py
new file mode 100644
index 0000000..dc3de9d
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/setup.py
@@ -0,0 +1,75 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+# author: adefossez
+# Inspired by https://github.com/kennethreitz/setup.py
+
+from pathlib import Path
+
+from setuptools import setup
+
+
+NAME = 'demucs'
+DESCRIPTION = 'Music source separation in the waveform domain.'
+
+URL = 'https://github.com/facebookresearch/demucs'
+EMAIL = 'defossez@fb.com'
+AUTHOR = 'Alexandre Défossez'
+REQUIRES_PYTHON = '>=3.7.0'
+
+HERE = Path(__file__).parent
+
+# Get version without explicitly loading the module.
+for line in open('demucs/__init__.py'): + line = line.strip() + if '__version__' in line: + context = {} + exec(line, context) + VERSION = context['__version__'] + + +def load_requirements(name): + required = [i.strip() for i in open(HERE / name)] + required = [i for i in required if not i.startswith('#')] + return required + + +REQUIRED = load_requirements('requirements_minimal.txt') +ALL_REQUIRED = load_requirements('requirements.txt') + +try: + with open(HERE / "README.md", encoding='utf-8') as f: + long_description = '\n' + f.read() +except FileNotFoundError: + long_description = DESCRIPTION + +setup( + name=NAME, + version=VERSION, + description=DESCRIPTION, + long_description=long_description, + long_description_content_type='text/markdown', + author=AUTHOR, + author_email=EMAIL, + python_requires=REQUIRES_PYTHON, + url=URL, + packages=['demucs'], + extras_require={ + 'dev': ALL_REQUIRED, + }, + install_requires=REQUIRED, + include_package_data=True, + entry_points={ + 'console_scripts': ['demucs=demucs.separate:main'], + }, + license='MIT License', + classifiers=[ + # Trove classifiers + # Full list: https://pypi.python.org/pypi?%3Aaction=list_classifiers + 'License :: OSI Approved :: MIT License', + 'Topic :: Multimedia :: Sound/Audio', + 'Topic :: Scientific/Engineering :: Artificial Intelligence', + ], +) diff --git a/AutoCoverTool/ref/music_remover/demucs/test.mp3 b/AutoCoverTool/ref/music_remover/demucs/test.mp3 new file mode 100644 index 0000000..668604d Binary files /dev/null and b/AutoCoverTool/ref/music_remover/demucs/test.mp3 differ diff --git a/AutoCoverTool/ref/music_remover/demucs/tools/__init__.py b/AutoCoverTool/ref/music_remover/demucs/tools/__init__.py new file mode 100644 index 0000000..a7b735c --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/tools/__init__.py @@ -0,0 +1,5 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. diff --git a/AutoCoverTool/ref/music_remover/demucs/tools/automix.py b/AutoCoverTool/ref/music_remover/demucs/tools/automix.py new file mode 100644 index 0000000..91400b1 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/tools/automix.py @@ -0,0 +1,343 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. + +""" +This script creates realistic mixes with stems from different songs. +In particular, it will align BPM, sync up the first beat and perform pitch +shift to maximize pitches overlap. +In order to limit artifacts, only parts that can be mixed with less than 15% +tempo shift, and 3 semitones of pitch shift are mixed together. 
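+As a concrete illustration of these limits (MAX_TEMPO = 0.15 and MAX_PITCH = 3,
+defined below): for a 100 BPM reference stem, a candidate qualifies only if one
+of its octave scalings (x1/4 ... x4) lands between roughly 87 and 118 BPM, and
+only if the best chroma alignment needs at most 3 semitones of shift.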
+""" +from collections import namedtuple +from concurrent.futures import ProcessPoolExecutor +import hashlib +from pathlib import Path +import random +import shutil +import tqdm +import pickle + +from librosa.beat import beat_track +from librosa.feature import chroma_cqt +import numpy as np +import torch +from torch.nn import functional as F + +from dora.utils import try_load +from demucs.audio import save_audio +from demucs.repitch import repitch +from demucs.pretrained import SOURCES +from demucs.wav import build_metadata, Wavset, _get_musdb_valid + + +MUSDB_PATH = '/checkpoint/defossez/datasets/musdbhq' +EXTRA_WAV_PATH = "/checkpoint/defossez/datasets/allstems_44" +# WARNING: OUTPATH will be completely erased. +OUTPATH = Path.home() / 'tmp/demucs_mdx/automix_musdb/' +CACHE = Path.home() / 'tmp/automix_cache' # cache BPM and pitch information. +CHANNELS = 2 +SR = 44100 +MAX_PITCH = 3 # maximum allowable pitch shift in semi tones +MAX_TEMPO = 0.15 # maximum allowable tempo shift + + +Spec = namedtuple("Spec", "tempo onsets kr track index") + + +def rms(wav, window=10000): + """efficient rms computed for each time step over a given window.""" + half = window // 2 + window = 2 * half + 1 + wav = F.pad(wav, (half, half)) + tot = wav.pow(2).cumsum(dim=-1) + return ((tot[..., window - 1:] - tot[..., :-window + 1]) / window).sqrt() + + +def analyse_track(dset, index): + """analyse track, extract bpm and distribution of notes from the bass line.""" + track = dset[index] + mix = track.sum(0).mean(0) + ref = mix.std() + + starts = (abs(mix) >= 1e-2 * ref).float().argmax().item() + track = track[..., starts:] + + cache = CACHE / dset.sig + cache.mkdir(exist_ok=True, parents=True) + + cache_file = cache / f"{index}.pkl" + cached = None + if cache_file.exists(): + cached = try_load(cache_file) + if cached is not None: + tempo, events, hist_kr = cached + + if cached is None: + drums = track[0].mean(0) + if drums.std() > 1e-2 * ref: + tempo, events = beat_track(drums.numpy(), units='time', sr=SR) + else: + print("failed drums", drums.std(), ref) + return None, track + + bass = track[1].mean(0) + r = rms(bass) + peak = r.max() + mask = r >= 0.05 * peak + bass = bass[mask] + if bass.std() > 1e-2 * ref: + kr = torch.from_numpy(chroma_cqt(bass.numpy(), sr=SR)) + hist_kr = (kr.max(dim=0, keepdim=True)[0] == kr).float().mean(1) + else: + print("failed bass", bass.std(), ref) + return None, track + + pickle.dump([tempo, events, hist_kr], open(cache_file, 'wb')) + spec = Spec(tempo, events, hist_kr, track, index) + return spec, None + + +def best_pitch_shift(kr_a, kr_b): + """find the best pitch shift between two chroma distributions.""" + deltas = [] + for p in range(12): + deltas.append((kr_a - kr_b).abs().mean()) + kr_b = kr_b.roll(1, 0) + + ps = np.argmin(deltas) + if ps > 6: + ps = ps - 12 + return ps + + +def align_stems(stems): + """Align the first beats of the stems. + This is a naive implementation. A grid with a time definition 10ms is defined and + each beat onset is represented as a gaussian over this grid. + Then, we try each possible time shift to make two grids align the best. + We repeat for all sources. 
+ """ + sources = len(stems) + width = 5e-3 # grid of 10ms + limit = 5 + std = 2 + x = torch.arange(-limit, limit + 1, 1).float() + gauss = torch.exp(-x**2 / (2 * std**2)) + + grids = [] + for wav, onsets in stems: + le = wav.shape[-1] + dur = le / SR + grid = torch.zeros(int(le / width / SR)) + for onset in onsets: + pos = int(onset / width) + if onset >= dur - 1: + continue + if onset < 1: + continue + grid[pos - limit:pos + limit + 1] += gauss + grids.append(grid) + + shifts = [0] + for s in range(1, sources): + max_shift = int(4 / width) + dots = [] + for shift in range(-max_shift, max_shift): + other = grids[s] + ref = grids[0] + if shift >= 0: + other = other[shift:] + else: + ref = ref[shift:] + le = min(len(other), len(ref)) + dots.append((ref[:le].dot(other[:le]), int(shift * width * SR))) + + _, shift = max(dots) + shifts.append(-shift) + + outs = [] + new_zero = min(shifts) + for (wav, _), shift in zip(stems, shifts): + offset = shift - new_zero + wav = F.pad(wav, (offset, 0)) + outs.append(wav) + + le = min(x.shape[-1] for x in outs) + + outs = [w[..., :le] for w in outs] + return torch.stack(outs) + + +def find_candidate(spec_ref, catalog, pitch_match=True): + """Given reference track, this finds a track in the catalog that + is a potential match (pitch and tempo delta must be within the allowable limits). + """ + candidates = list(catalog) + random.shuffle(candidates) + + for spec in candidates: + ok = False + for scale in [1/4, 1/2, 1, 2, 4]: + tempo = spec.tempo * scale + delta_tempo = spec_ref.tempo / tempo - 1 + if abs(delta_tempo) < MAX_TEMPO: + ok = True + break + if not ok: + print(delta_tempo, spec_ref.tempo, spec.tempo, "FAILED TEMPO") + # too much of a tempo difference + continue + spec = spec._replace(tempo=tempo) + + ps = 0 + if pitch_match: + ps = best_pitch_shift(spec_ref.kr, spec.kr) + if abs(ps) > MAX_PITCH: + print("Failed pitch", ps) + # too much pitch difference + continue + return spec, delta_tempo, ps + + +def get_part(spec, source, dt, dp): + """Apply given delta of tempo and delta of pitch to a stem.""" + wav = spec.track[source] + if dt or dp: + wav = repitch(wav, dp, dt * 100, samplerate=SR, voice=source == 3) + spec = spec._replace(onsets=spec.onsets / (1 + dt)) + return wav, spec + + +def build_track(ref_index, catalog): + """Given the reference track index and a catalog of track, builds + a completely new track. One of the source at random from the ref track will + be kept and other sources will be drawn from the catalog. 
+ """ + order = list(range(len(SOURCES))) + random.shuffle(order) + + stems = [None] * len(order) + indexes = [None] * len(order) + origs = [None] * len(order) + dps = [None] * len(order) + dts = [None] * len(order) + + first = order[0] + spec_ref = catalog[ref_index] + stems[first] = (spec_ref.track[first], spec_ref.onsets) + indexes[first] = ref_index + origs[first] = spec_ref.track[first] + dps[first] = 0 + dts[first] = 0 + + pitch_match = order != 0 + + for src in order[1:]: + spec, dt, dp = find_candidate(spec_ref, catalog, pitch_match=pitch_match) + if not pitch_match: + spec_ref = spec_ref._replace(kr=spec.kr) + pitch_match = True + dps[src] = dp + dts[src] = dt + wav, spec = get_part(spec, src, dt, dp) + stems[src] = (wav, spec.onsets) + indexes[src] = spec.index + origs.append(spec.track[src]) + print("FINAL CHOICES", ref_index, indexes, dps, dts) + stems = align_stems(stems) + return stems, origs + + +def get_musdb_dataset(part='train'): + root = Path(MUSDB_PATH) / part + ext = '.wav' + metadata = build_metadata(root, SOURCES, ext=ext, normalize=False) + valid_tracks = _get_musdb_valid() + metadata_train = {name: meta for name, meta in metadata.items() if name not in valid_tracks} + train_set = Wavset( + root, metadata_train, SOURCES, samplerate=SR, channels=CHANNELS, + normalize=False, ext=ext) + sig = hashlib.sha1(str(root).encode()).hexdigest()[:8] + train_set.sig = sig + return train_set + + +def get_wav_dataset(): + root = Path(EXTRA_WAV_PATH) + ext = '.wav' + metadata = _build_metadata(root, SOURCES, ext=ext, normalize=False) + train_set = Wavset( + root, metadata, SOURCES, samplerate=SR, channels=CHANNELS, + normalize=False, ext=ext) + sig = hashlib.sha1(str(root).encode()).hexdigest()[:8] + train_set.sig = sig + return train_set + + +def main(): + random.seed(4321) + if OUTPATH.exists(): + shutil.rmtree(OUTPATH) + OUTPATH.mkdir(exist_ok=True, parents=True) + (OUTPATH / 'train').mkdir(exist_ok=True, parents=True) + (OUTPATH / 'valid').mkdir(exist_ok=True, parents=True) + out = OUTPATH / 'train' + + dset = get_musdb_dataset() + # dset2 = get_wav_dataset() + # dset3 = get_musdb_dataset('test') + dset2 = None + dset3 = None + pendings = [] + copies = 6 + copies_rej = 2 + + with ProcessPoolExecutor(20) as pool: + for index in range(len(dset)): + pendings.append(pool.submit(analyse_track, dset, index)) + + if dset2: + for index in range(len(dset2)): + pendings.append(pool.submit(analyse_track, dset2, index)) + if dset3: + for index in range(len(dset3)): + pendings.append(pool.submit(analyse_track, dset3, index)) + + catalog = [] + rej = 0 + for pending in tqdm.tqdm(pendings, ncols=120): + spec, track = pending.result() + if spec is not None: + catalog.append(spec) + else: + mix = track.sum(0) + for copy in range(copies_rej): + folder = out / f'rej_{rej}_{copy}' + folder.mkdir() + save_audio(mix, folder / "mixture.wav", SR) + for stem, source in zip(track, SOURCES): + save_audio(stem, folder / f"{source}.wav", SR, clip='clamp') + rej += 1 + + for copy in range(copies): + for index in range(len(catalog)): + track, origs = build_track(index, catalog) + mix = track.sum(0) + mx = mix.abs().max() + scale = max(1, 1.01 * mx) + mix = mix / scale + track = track / scale + folder = out / f'{copy}_{index}' + folder.mkdir() + save_audio(mix, folder / "mixture.wav", SR) + for stem, source, orig in zip(track, SOURCES, origs): + save_audio(stem, folder / f"{source}.wav", SR, clip='clamp') + # save_audio(stem.std() * orig / (1e-6 + orig.std()), folder / f"{source}_orig.wav", + # SR, 
clip='clamp') + + +if __name__ == '__main__': + main() diff --git a/AutoCoverTool/ref/music_remover/demucs/tools/bench.py b/AutoCoverTool/ref/music_remover/demucs/tools/bench.py new file mode 100644 index 0000000..edf6ceb --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/tools/bench.py @@ -0,0 +1,78 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. + +""" +benchmarking script, useful to check for OOM, reasonable train time, +and for the MDX competion, estimate if we will match the time limit.""" +from contextlib import contextmanager +import logging +import sys +import time +import torch + +from demucs.train import get_solver, main +from demucs.apply import apply_model + +logging.basicConfig(level=logging.INFO, stream=sys.stderr) + + +class Result: + pass + + +@contextmanager +def bench(): + import gc + gc.collect() + torch.cuda.reset_max_memory_allocated() + torch.cuda.empty_cache() + result = Result() + # before = torch.cuda.memory_allocated() + before = 0 + begin = time.time() + try: + yield result + finally: + torch.cuda.synchronize() + mem = (torch.cuda.max_memory_allocated() - before) / 2 ** 20 + tim = time.time() - begin + result.mem = mem + result.tim = tim + + +xp = main.get_xp_from_sig(sys.argv[1]) +xp = main.get_xp(xp.argv + sys.argv[2:]) +with xp.enter(): + solver = get_solver(xp.cfg) + if getattr(solver.model, 'use_train_segment', False): + batch = solver.augment(next(iter(solver.loaders['train']))) + solver.model.segment = Fraction(batch.shape[-1], solver.model.samplerate) + train_segment = solver.model.segment + solver.model.eval() + model = solver.model + model.cuda() + x = torch.randn(2, xp.cfg.dset.channels, int(10 * model.samplerate), device='cuda') + with bench() as res: + y = model(x) + y.sum().backward() + del y + for p in model.parameters(): + p.grad = None + print(f"FB: {res.mem:.1f} MB, {res.tim * 1000:.1f} ms") + + x = torch.randn(1, xp.cfg.dset.channels, int(model.segment * model.samplerate), device='cuda') + with bench() as res: + with torch.no_grad(): + y = model(x) + del y + print(f"FV: {res.mem:.1f} MB, {res.tim * 1000:.1f} ms") + + model.cpu() + torch.set_num_threads(1) + test = torch.randn(1, xp.cfg.dset.channels, model.samplerate * 40) + b = time.time() + apply_model(model, test, split=True, shifts=1) + print("CPU 40 sec:", time.time() - b) diff --git a/AutoCoverTool/ref/music_remover/demucs/tools/convert.py b/AutoCoverTool/ref/music_remover/demucs/tools/convert.py new file mode 100644 index 0000000..6c23222 --- /dev/null +++ b/AutoCoverTool/ref/music_remover/demucs/tools/convert.py @@ -0,0 +1,152 @@ +# Copyright (c) Meta, Inc. and its affiliates. +# All rights reserved. +# +# This source code is licensed under the license found in the +# LICENSE file in the root directory of this source tree. + +# Script to convert option names and model args from the dev branch to +# the cleanup release one. There should be no reaso to use that anymore. 
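+#
+# Illustrative example of the rewriting (argv values hypothetical): an old
+# dev-branch argv such as
+#   ['demucs.norm=gn', 'power.penalty=0']
+# would be turned by transform() into
+#   ['svd.penalty=0']
+# since 'demucs.norm=gn' is dropped via TO_REMOVE and the 'power' prefix is
+# renamed to 'svd' via TO_REPLACE below.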
+ +import argparse +import io +import json +from pathlib import Path +import subprocess as sp + +import torch + +from demucs import train, pretrained, states + +DEV_REPO = Path.home() / 'tmp/release_demucs_mdx' + + +TO_REMOVE = [ + 'demucs.dconv_kw.gelu=True', + 'demucs.dconv_kw.nfreqs=0', + 'demucs.dconv_kw.nfreqs=0', + 'demucs.dconv_kw.version=4', + 'demucs.norm=gn', + 'wdemucs.nice=True', + 'wdemucs.good=True', + 'wdemucs.freq_emb=-0.2', + 'special=True', + 'special=False', +] + +TO_REPLACE = [ + ('power', 'svd'), + ('wdemucs', 'hdemucs'), + ('hdemucs.hybrid=True', 'hdemucs.hybrid_old=True'), + ('hdemucs.hybrid=2', 'hdemucs.hybrid=True'), +] + +TO_INJECT = [ + ('model=hdemucs', ['hdemucs.cac=False']), + ('model=hdemucs', ['hdemucs.norm_starts=999']), +] + + +def get_original_argv(sig): + return json.load(open(Path(DEV_REPO) / f'outputs/xps/{sig}/.argv.json')) + + +def transform(argv, mappings, verbose=False): + for rm in TO_REMOVE: + while rm in argv: + argv.remove(rm) + + for old, new in TO_REPLACE: + argv[:] = [a.replace(old, new) for a in argv] + + for condition, args in TO_INJECT: + if condition in argv: + argv[:] = args + argv + + for idx, arg in enumerate(argv): + if 'continue_from=' in arg: + dep_sig = arg.split('=')[1] + if dep_sig.startswith('"'): + dep_sig = eval(dep_sig) + if verbose: + print("Need to recursively convert dependency XP", dep_sig) + new_sig = convert(dep_sig, mappings, verbose).sig + argv[idx] = f'continue_from="{new_sig}"' + + +def convert(sig, mappings, verbose=False): + argv = get_original_argv(sig) + if verbose: + print("Original argv", argv) + transform(argv, mappings, verbose) + if verbose: + print("New argv", argv) + xp = train.main.get_xp(argv) + train.main.init_xp(xp) + if verbose: + print("Mapping", sig, "->", xp.sig) + mappings[sig] = xp.sig + return xp + + +def _eval_old(old_sig, x): + script = ( + 'from demucs import pretrained; import torch; import sys; import io; ' + 'buf = io.BytesIO(sys.stdin.buffer.read()); ' + 'x = torch.load(buf); m = pretrained.load_pretrained_model(' + f'"{old_sig}"); torch.save(m(x), sys.stdout.buffer)') + + buf = io.BytesIO() + torch.save(x, buf) + proc = sp.run( + ['python3', '-c', script], input=buf.getvalue(), capture_output=True, cwd=DEV_REPO) + if proc.returncode != 0: + print("Error", proc.stderr.decode()) + assert False + + buf = io.BytesIO(proc.stdout) + return torch.load(buf) + + +def compare(old_sig, model): + test = torch.randn(1, 2, 44100 * 10) + old_out = _eval_old(old_sig, test) + out = model(test) + + delta = 20 * torch.log10((out - old_out).norm() / out.norm()).item() + return delta + + +def main(): + torch.manual_seed(1234) + parser = argparse.ArgumentParser('convert') + parser.add_argument('sigs', nargs='*') + parser.add_argument('-o', '--output', type=Path, default=Path('release_models')) + parser.add_argument('-d', '--dump', action='store_true') + parser.add_argument('-c', '--compare', action='store_true') + parser.add_argument('-v', '--verbose', action='store_true') + args = parser.parse_args() + + args.output.mkdir(exist_ok=True, parents=True) + mappings = {} + for sig in args.sigs: + xp = convert(sig, mappings, args.verbose) + if args.dump or args.compare: + old_pkg = pretrained._load_package(sig, old=True) + model = train.get_model(xp.cfg) + model.load_state_dict(old_pkg['state']) + if args.dump: + pkg = states.serialize_model(model, xp.cfg) + states.save_with_checksum(pkg, args.output / f'{xp.sig}.th') + if args.compare: + delta = compare(sig, model) + print("Delta for", sig, xp.sig, delta) + + 
mappings[sig] = xp.sig
+
+    print("FINAL MAPPINGS")
+    for old, new in mappings.items():
+        print(old, " ", new)
+
+
+if __name__ == '__main__':
+    main()
diff --git a/AutoCoverTool/ref/music_remover/demucs/tools/export.py b/AutoCoverTool/ref/music_remover/demucs/tools/export.py
new file mode 100644
index 0000000..7dfce10
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/tools/export.py
@@ -0,0 +1,71 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+
+"""Export a trained model from the full checkpoint (with optimizer etc.) to
+a final checkpoint, with only the model itself. The model is always stored as
+half float to gain space, and because this has zero impact on the final loss.
+When DiffQ was used for training, the model will actually be quantized and bitpacked."""
+from argparse import ArgumentParser
+from fractions import Fraction
+import logging
+from pathlib import Path
+import sys
+import torch
+
+from demucs import train
+from demucs.states import serialize_model, save_with_checksum
+
+
+logger = logging.getLogger(__name__)
+
+
+def main():
+    logging.basicConfig(level=logging.INFO, stream=sys.stderr)
+
+    parser = ArgumentParser("tools.export", description="Export trained models from XP sigs.")
+    parser.add_argument('signatures', nargs='*', help='XP signatures.')
+    parser.add_argument('-o', '--out', type=Path, default=Path("release_models"),
+                        help="Path where to store release models (default release_models)")
+    parser.add_argument('-s', '--sign', action='store_true',
+                        help='Add sha256 prefix checksum to the filename.')
+
+    args = parser.parse_args()
+    args.out.mkdir(exist_ok=True, parents=True)
+
+    for sig in args.signatures:
+        xp = train.main.get_xp_from_sig(sig)
+        name = train.main.get_name(xp)
+        logger.info('Handling %s/%s', sig, name)
+
+        out_path = args.out / (sig + ".th")
+
+        solver = train.get_solver_from_sig(sig)
+        if len(solver.history) < solver.args.epochs:
+            logger.warning(
+                'Model %s has fewer epochs than expected (%d / %d)',
+                sig, len(solver.history), solver.args.epochs)
+
+        solver.model.load_state_dict(solver.best_state)
+        pkg = serialize_model(solver.model, solver.args, solver.quantizer, half=True)
+        if getattr(solver.model, 'use_train_segment', False):
+            batch = solver.augment(next(iter(solver.loaders['train'])))
+            pkg['kwargs']['segment'] = Fraction(batch.shape[-1], solver.model.samplerate)
+            print("Override", pkg['kwargs']['segment'])
+        valid, test = None, None
+        for m in solver.history:
+            if 'valid' in m:
+                valid = m['valid']
+            if 'test' in m:
+                test = m['test']
+        pkg['metrics'] = (valid, test)
+        if args.sign:
+            save_with_checksum(pkg, out_path)
+        else:
+            torch.save(pkg, out_path)
+
+
+if __name__ == '__main__':
+    main()
diff --git a/AutoCoverTool/ref/music_remover/demucs/tools/test_pretrained.py b/AutoCoverTool/ref/music_remover/demucs/tools/test_pretrained.py
new file mode 100644
index 0000000..3f4648d
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/demucs/tools/test_pretrained.py
@@ -0,0 +1,43 @@
+# Copyright (c) Meta, Inc. and its affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the license found in the
+# LICENSE file in the root directory of this source tree.
+
+# Script to evaluate pretrained models.
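+# A hypothetical invocation (model name and override are illustrative; the
+# exact model flags come from pretrained.add_model_flags() below):
+#   python3 -m tools.test_pretrained -n mdx_extra test.shifts=2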
+
+from argparse import ArgumentParser
+import logging
+import sys
+
+import torch
+
+from demucs import train, pretrained, evaluate
+
+
+def main():
+    torch.set_num_threads(1)
+    logging.basicConfig(stream=sys.stderr, level=logging.INFO)
+    parser = ArgumentParser("tools.test_pretrained",
+                            description="Evaluate pre-trained models or bags of models "
+                                        "on MusDB.")
+    pretrained.add_model_flags(parser)
+    parser.add_argument('overrides', nargs='*',
+                        help='Extra overrides, e.g. test.shifts=2.')
+    args = parser.parse_args()
+
+    xp = train.main.get_xp(args.overrides)
+    with xp.enter():
+        solver = train.get_solver(xp.cfg)
+
+        model = pretrained.get_model_from_args(args)
+        solver.model = model.to(solver.device)
+        solver.model.eval()
+
+        with torch.no_grad():
+            results = evaluate.evaluate(solver, xp.cfg.test.sdr)
+        print(results)
+
+
+if __name__ == '__main__':
+    main()
diff --git a/AutoCoverTool/ref/music_remover/demucs/xishuashua.mp4 b/AutoCoverTool/ref/music_remover/demucs/xishuashua.mp4
new file mode 100644
index 0000000..a30c7ba
Binary files /dev/null and b/AutoCoverTool/ref/music_remover/demucs/xishuashua.mp4 differ
diff --git a/AutoCoverTool/ref/music_remover/readme.txt b/AutoCoverTool/ref/music_remover/readme.txt
new file mode 100644
index 0000000..7a33a51
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/readme.txt
@@ -0,0 +1,21 @@
+Music separation tool
+
+Overview:
+    demucs source: https://github.com/facebookresearch/demucs
+    This code was pulled directly from the repository above, at the main-branch snapshot of Mon Nov 21.
+
+Main changes:
+    Added the separate_interface.py wrapper, which takes an audio file and generates the accompaniment file.
+
+Environment setup:
+    1. Base GPU environment:
+        https://phabricator.ushow.media/w/%E9%9F%B3%E8%A7%86%E9%A2%91%E7%BB%84%E6%96%87%E6%A1%A3/%E7%8E%AF%E5%A2%83%E5%AE%89%E8%A3%85/gpu%E7%8E%AF%E5%A2%83%E5%AE%89%E8%A3%85/
+    2. Install the demucs environment
+        conda create -n demucs python==3.7
+    3. Install the standard_audio binary
+        The code lives at: av_cv_research/tools/music_remover/standard_audio
+        After building, place the binary at /opt/soft/bin/standard_audio
+
+Quick start (server side):
+    python3 separate_interface.py xishuashua.mp4 xishuashua.m4a
+    xishuashua.mp4 is 3 min 36 s long; the average over 3 runs is 27.33 s
diff --git a/AutoCoverTool/ref/music_remover/separate_interface.py b/AutoCoverTool/ref/music_remover/separate_interface.py
new file mode 100644
index 0000000..ea3bb73
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/separate_interface.py
@@ -0,0 +1,103 @@
+"""
+External interface for separation.
+"""
+
+import os
+import sys
+import time
+import shutil
+import logging
+
+from demucs.pretrained import get_model
+from demucs.separate import *
+
+# Third-party binaries
+gs_standard_audio_exe = "/opt/soft/bin/standard_audio"
+gs_ffmpeg_exe = "ffmpeg"
+
+# Global configuration
+logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')
+
+# Error codes
+ERR_CODE_SUCCESS = 0
+ERR_CODE_INPUT_FILE_NOT_EXISTS = 1
+
+
+class SeparateInterface:
+    """
+    External interface of the separator; produces the vocal and accompaniment files.
+    """
+
+    def __init__(self):
+        sp_start = time.time()
+        # After evaluation, this model version gives the best quality at a reasonable speed.
+        # Compared against mdx_extra_q and htdemucs_ft:
+        # mdx_extra_q runs as fast as mdx_extra, but preserves backing harmonies less well.
+        # htdemucs_ft takes 1.6x as long as mdx_extra; on some songs it removes vocals more
+        # thoroughly, but it does not keep harmonies as intact as mdx_extra | see the opening
+        # harmony section of xishuashua for details.
+        self.model = get_model('mdx_extra')
+        self.tmp_dir = os.path.join("/tmp/separate")
+        if not os.path.exists(self.tmp_dir):
+            os.makedirs(self.tmp_dir)
+        logging.info("SeparateInterface: load model spent = {}".format(time.time() - sp_start))
+
+    def process_logic(self, cid, cache_dir, in_file, vocal_out_file, acc_out_file, dev='cuda'):
+        model = self.model
+        sp_start = time.time()
+        wav = load_track(in_file, model.audio_channels, model.samplerate)
+        logging.info("--------load_track:cid={},sp={}".format(cid, time.time() - sp_start))
+
+        # Model inference
+        sp_start = time.time()
+        ref = wav.mean(0)
+        wav = (wav - ref.mean()) / ref.std()
+        # wav[None] -> add one dimension: [2, xxx] -> [1, 2, xxx]
+        sources = apply_model(model, wav[None], device=dev, shifts=1, split=True, overlap=0.25, progress=True,
+                              num_workers=0)[0]
+        sources = sources * ref.std() + ref.mean()
+        logging.info("--------apply_model:cid={},sp={}".format(cid, time.time() - sp_start))
+
+        # Save the vocals; sum the remaining stems into the accompaniment
+        sources = list(sources)
+        vocals = sources.pop(model.sources.index("vocals"))
+        if vocals is not None:
+            save_audio(vocals, vocal_out_file, samplerate=model.samplerate)
+        other_stem = th.zeros_like(sources[0])
+        for sc in sources:
+            other_stem += sc
+        if acc_out_file is not None:
+            save_audio(other_stem, acc_out_file, samplerate=model.samplerate)
+
+        if vocal_out_file is not None:
+            if not os.path.exists(vocal_out_file):
+                return False
+        if acc_out_file is not None:
+            if not os.path.exists(acc_out_file):
+                return False
+        return True
+
+    def process(self, cid, in_file, vocal_out_file, acc_out_file, dev='cuda'):
+        if not os.path.exists(in_file):
+            return ERR_CODE_INPUT_FILE_NOT_EXISTS
+
+        st_time = time.time()
+        logging.info("--------process:cid={},{},{},{}".format(cid, in_file, vocal_out_file, acc_out_file))
+        cache_dir = os.path.join(self.tmp_dir, str(cid))
+        if os.path.exists(cache_dir):
+            shutil.rmtree(cache_dir)
+        os.makedirs(cache_dir)
+        # Core processing logic
+        ret = self.process_logic(cid, cache_dir, in_file, vocal_out_file, acc_out_file, dev)
+        shutil.rmtree(cache_dir)
+        logging.info(
+            "--------finish:cid={},{},{},{}|{}|{}|sp={}\n\n".format(cid, in_file, vocal_out_file, acc_out_file,
+                                                                    dev, ret, time.time() - st_time))
+        return ret
+
+#
+# if __name__ == '__main__':
+#     si = SeparateInterface()
+#     in_f = sys.argv[1]
+#     out_f = sys.argv[2]
+#     dev = sys.argv[3]  # cuda or cpu
+#     for i in range(0, 3):
+#         si.process(str(1), in_f, out_f, dev)
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/CMakeLists.txt b/AutoCoverTool/ref/music_remover/standard_audio/CMakeLists.txt
new file mode 100644
index 0000000..5afa477
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/CMakeLists.txt
@@ -0,0 +1,16 @@
+cmake_minimum_required(VERSION 2.8)
+project(standard_audio)
+
+set(LIBRARY_OUTPUT_PATH ${PROJECT_SOURCE_DIR}/lib)
+set(CMAKE_CXX_STANDARD 11)
+
+
+include_directories(ref/alimter/inc)
+include_directories(ref/waves/inc)
+include_directories(ref/ebur128/inc)
+
+AUX_SOURCE_DIRECTORY(ref/alimter/src DIR_ALIMTER_SRCS)
+AUX_SOURCE_DIRECTORY(ref/waves/src DIR_WAVES_SRCS)
+AUX_SOURCE_DIRECTORY(ref/ebur128/src DIR_EBUR128_SRCS)
+
+add_executable(standard_audio main.cpp ${DIR_ALIMTER_SRCS} ${DIR_EBUR128_SRCS} ${DIR_WAVES_SRCS})
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/main.cpp b/AutoCoverTool/ref/music_remover/standard_audio/main.cpp
new file mode 100644
index 0000000..b448e0d
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/main.cpp
@@ -0,0 +1,126 @@
+//
+// Created by yangjianli on 2022/12/5.
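+// Reads a WAV file, measures its EBU R128 integrated loudness, applies the
+// gain needed to reach the -14.57 dB baseline (DEFAULT_BASELINE_DB), and runs
+// a limiter to avoid clipping before writing the output.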
+//
+#include "WaveFile.h"
+#include "alimiter.h"
+#include "ebur128.h"
+
+#include <sys/time.h>
+#include <cmath>
+#include <cstdio>
+
+#define PROC_LEN 1024
+#define DEFAULT_BASELINE_DB (float)-14.57f
+
+// Inputs: channels, sample rate, source data, data length.
+// Outputs: integrated loudness (dB) and the gain factor needed to reach the target loudness.
+int ebur128_whole(int channel, int sample_rate, short *data, const int len, double &gated_loudness, double &gain)
+{
+    ebur128_state *st = NULL;
+    st = ebur128_init(channel, sample_rate, EBUR128_MODE_I);
+    if (NULL == st)
+    {
+        return -1;
+    }
+    int pos = 0;
+    int temp_length = 0;
+    int ret;
+
+    while (pos < len)
+    {
+        temp_length = PROC_LEN;
+        if (len - pos < PROC_LEN)
+        {
+            temp_length = len - pos;
+        }
+        ret = ebur128_add_frames_short(st, data + pos, temp_length / channel);
+        if (ret != 0)
+        {
+            return -2;
+        }
+        pos += temp_length;
+    }
+
+    gated_loudness = -1;
+    ebur128_loudness_global(st, &gated_loudness);
+    float db = (DEFAULT_BASELINE_DB - gated_loudness) / 20.f;
+    gain = pow(10, db);
+    printf("gated_loudness = %f db = %f gain = %f\n", gated_loudness, db, gain);
+    ebur128_destroy(&st);
+    return 0;
+}
+
+
+int main(int argc, char *argv[])
+{
+    struct timeval start;
+    struct timeval end;
+
+    if (argc < 3)
+    {
+        printf("example: ./exe in_wav out_wav!\n");
+        return -1;
+    }
+
+    gettimeofday(&start, NULL);
+
+    CWaveFile wave_file = CWaveFile(argv[1], false);
+    if (!wave_file.GetStatus())
+    {
+        printf("%s is not wav\n", argv[1]);
+        return -1;
+    }
+    int32_t sample_rate = wave_file.GetSampleRate();
+    int32_t channel = wave_file.GetChannels();
+    int32_t len = wave_file.GetTotalFrames() * channel;
+    short *buffer = new short[len];
+    wave_file.ReadFrameAsS16(buffer, wave_file.GetTotalFrames());
+
+    gettimeofday(&end, NULL);
+    printf("load_data|spend_time=%f\n", (end.tv_sec - start.tv_sec) * 1000.0 + (end.tv_usec - start.tv_usec) / 1000.0);
+
+    // Measure the loudness and the gain factor we expect to apply
+    double gated_loudness = -1;
+    double gain = -1;
+    int err = ebur128_whole(channel, sample_rate, buffer, len, gated_loudness, gain);
+    if (err != 0 || gain == -1)
+    {
+        printf("%s ebur128 err=%d\n", argv[1], err);
+        return -1;
+    }
+    gettimeofday(&end, NULL);
+    printf("ebur128_whole|spend_time=%f\n", (end.tv_sec - start.tv_sec) * 1000.0 + (end.tv_usec - start.tv_usec) / 1000.0);
+
+
+    // Apply the gain, with a limiter to prevent clipping
+    CWaveFile out_file = CWaveFile(argv[2], true);
+    out_file.SetSampleFormat(SF_IEEE_FLOAT);
+    out_file.SetSampleRate(sample_rate);
+    out_file.SetChannels(channel);
+    out_file.SetupDone();
+
+    SUPERSOUND::Alimiter alimiter;
+    alimiter.SetParam(sample_rate, channel);
+    int step = 1024;
+    float* tmp_buffer = new float[step];
+    for(int i = 0; i < len; i+=step)
+    {
+        int cur_step = step;
+        if (i + cur_step > len)
+        {
+            cur_step = len - i;
+        }
+
+        for(int j = 0; j < cur_step; j++)
+        {
+            tmp_buffer[j] = float(buffer[i+j] / 32768.0 * gain);
+        }
+        alimiter.Filter(tmp_buffer, tmp_buffer, cur_step);
+        out_file.WriteFrame(tmp_buffer, cur_step / channel);
+    }
+
+    delete[] tmp_buffer;
+    delete[] buffer;
+    gettimeofday(&end, NULL);
+    printf("finish|spend_time=%f\n", (end.tv_sec - start.tv_sec) * 1000.0 + (end.tv_usec - start.tv_usec) / 1000.0);
+    return 0;
+}
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/CMakeLists.txt b/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/CMakeLists.txt
new file mode 100644
index 0000000..9748c4d
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/CMakeLists.txt
@@ -0,0 +1,3 @@
+include_directories(inc)
+AUX_SOURCE_DIRECTORY(src DIR_ALIMTER_SRCS)
+add_library(alimiter ${DIR_ALIMTER_SRCS})
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/inc/alimiter.h b/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/inc/alimiter.h
new file mode 100755
index 0000000..8022d39
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/inc/alimiter.h
@@ -0,0 +1,99 @@
+
+/***************************************************************************
+* email : yijiangyang@tencent.com *
+***************************************************************************/
+
+//+ ----------------------------------------------------+
+//+                    _oo0oo_                          +
+//+                   o8888888o                         +
+//+                   88" . "88                         +
+//+                   (| -_- |)                         +
+//+                   0\  =  /0                         +
+//+                 ___/`---'\___                       +
+//+               .' \\|     |// '.                     +
+//+              / \\|||  :  |||// \                    +
+//+             / _||||| -:- |||||- \                   +
+//+            |   | \\\  -  /// |   |                  +
+//+            | \_|  ''\---/''  |_/ |                  +
+//+            \  .-\__  '-'  ___/-. /                  +
+//+          ___'. .'  /--.--\  `. .'___                +
+//+       ."" '<  `.___\_<|>_/___.' >' "".              +
+//+      | | :  `- \`.;`\ _ /`;.`/ - ` : | |            +
+//+      \  \ `_.   \_ __\ /__ _/   .-` /  /            +
+//+  =====`-.____`.___ \_____/___.-`___.-'=====         +
+//+                    `=---='                          +
+//+                                                     +
+//+                                                     +
+//+  ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~        +
+//+                                                     +
+//+           Buddha bless: no bugs, ever               +
+//+ ----------------------------------------------------+
+
+// Implements the limiter from FFmpeg; it is friendly to the spectrum, but compresses rather aggressively.
+
+#ifndef __ALIMITER_H__
+#define __ALIMITER_H__
+
+#include <stdint.h>
+#define ERROR_SUPERSOUND_SUCCESS 0
+#define ERROR_SUPERSOUND_PARAM -1
+#define ERROR_SUPERSOUND_MEMORY -2
+typedef struct AudioLimiterContext
+{
+    float limit;
+    float attack;
+    float release;
+    float att;
+    float level_in;
+    float level_out;
+    int32_t auto_release;
+    int32_t auto_level;
+    float asc;
+    int32_t asc_c;
+    int32_t asc_pos;
+    float asc_coeff;
+
+    float *buffer;
+    int32_t buffer_size;
+    int32_t buffer_max_size;
+    int32_t pos;
+    int32_t *nextpos;
+    float *nextdelta;
+
+    float delta;
+    int32_t nextiter;
+    int32_t nextlen;
+    int32_t asc_changed;
+}AudioLimiterContext;
+
+namespace SUPERSOUND
+{
+
+
+class Alimiter
+{
+public:
+    Alimiter();
+    ~Alimiter();
+
+public:
+    void Flush();
+    int32_t GetLatecy();
+    int32_t SetParam(int32_t fs, int32_t channels);
+    void Filter(float * input, float * output, int32_t num);
+
+private:
+    void Uninit();
+    int32_t config_input();
+    float get_rdelta(AudioLimiterContext *s, float release, int sample_rate, float peak, float limit, float patt, int asc);
+
+private:
+    AudioLimiterContext m_alimiterCtx;
+    int m_nChannels;
+    int m_nFs;
+};
+
+
+}
+
+#endif /* __ALIMITER_H__ */
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/src/alimiter.cpp b/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/src/alimiter.cpp
new file mode 100755
index 0000000..abbd622
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/alimter/src/alimiter.cpp
@@ -0,0 +1,306 @@
+
+#include "alimiter.h"
+#include <string.h>
+#include <math.h>
+#include <stdio.h>
+#include <new>
+
+#define MAX(a,b) (((a) > (b)) ? (a) : (b))
+#define MIN(a,b) (((a) < (b)) ?
(a) : (b)) +#define MIDDLE(x, y, z) ((x)<(y)?((y)<(z)?(y):(x)<(z)?(z):(x)):((y)>(z)?(y):(x)>(z)?(z):(x))) +#define SAFE_DELETE_PTR(ptr) \ +{ \ + if(ptr) \ + { \ + delete [] ptr; \ + ptr = NULL; \ + } \ +} + +namespace SUPERSOUND +{ + + +Alimiter::Alimiter() +{ + memset(&m_alimiterCtx, 0, sizeof(m_alimiterCtx)); + + m_nChannels = 0; + m_nFs = 0; + + Flush(); +} + +Alimiter::~Alimiter() +{ + Uninit(); +} + +void Alimiter::Flush() +{ + float * buffer = m_alimiterCtx.buffer; + float * nextdelta = m_alimiterCtx.nextdelta; + int32_t * nextpos = m_alimiterCtx.nextpos; + int32_t buffer_max_size = m_alimiterCtx.buffer_max_size; + int32_t buffer_size = m_alimiterCtx.buffer_size; + + if(buffer) + memset(buffer, 0, sizeof(float) * buffer_max_size); + if(nextdelta) + memset(nextdelta, 0, sizeof(float) * buffer_max_size); + if(nextpos) + memset(nextpos, -1, sizeof(float) * buffer_max_size); + + memset(&m_alimiterCtx, 0, sizeof(m_alimiterCtx)); + + m_alimiterCtx.level_in = 1; + m_alimiterCtx.level_out = 32000 / 32768.0; + m_alimiterCtx.limit = 1; + m_alimiterCtx.attack = 5; + m_alimiterCtx.release = 50; + m_alimiterCtx.auto_release = 0; + m_alimiterCtx.asc_coeff = 0.5; + m_alimiterCtx.auto_level = 1; + + m_alimiterCtx.attack /= 1000; + m_alimiterCtx.release /= 1000; + m_alimiterCtx.att = 1; + m_alimiterCtx.asc_pos = -1; + m_alimiterCtx.asc_coeff = pow(0.5f, m_alimiterCtx.asc_coeff - 0.5f) * 2 * -1; + + m_alimiterCtx.buffer = buffer; + m_alimiterCtx.nextdelta = nextdelta; + m_alimiterCtx.nextpos = nextpos; + m_alimiterCtx.buffer_max_size = buffer_max_size; + m_alimiterCtx.buffer_size = buffer_size; +} + +int32_t Alimiter::GetLatecy() +{ + return m_alimiterCtx.buffer_size / m_nChannels; +} + +int32_t Alimiter::SetParam( int32_t fs, int32_t channels ) +{ + if((fs == m_nFs) && (channels == m_nChannels)) + return ERROR_SUPERSOUND_SUCCESS; + + m_nChannels = channels; + m_nFs = fs; + + return config_input(); +} + +void Alimiter::Filter( float * input, float * output, int32_t num ) +{ + num = num / m_nChannels; + int channels = m_nChannels; + int buffer_size = m_alimiterCtx.buffer_size; + float * buffer = m_alimiterCtx.buffer; + float release = m_alimiterCtx.release; + float limit = m_alimiterCtx.limit; + float * nextdelta = m_alimiterCtx.nextdelta; + float level = m_alimiterCtx.auto_level ? 1 / limit : 1; + float level_out = m_alimiterCtx.level_out; + float level_in = m_alimiterCtx.level_in; + int *nextpos = m_alimiterCtx.nextpos; + + float * buf; + float * dst; + float * src; + int n, c, i; + AudioLimiterContext * s = &m_alimiterCtx; + + dst = output; + src = input; + + for (n = 0; n < num; n++) { + float peak = 0; + + for (c = 0; c < channels; c++) { + float sample = src[c] * level_in; + + buffer[s->pos + c] = sample; + peak = MAX(peak, fabs(sample)); + } + + if (s->auto_release && peak > limit) { + s->asc += peak; + s->asc_c++; + } + + if (peak > limit) { + float patt = MIN(limit / peak, 1); + float rdelta = get_rdelta(s, release, m_nFs, + peak, limit, patt, 0); + float delta = (limit / peak - s->att) / buffer_size * channels; + int found = 0; + + if (delta < s->delta) { + s->delta = delta; + nextpos[0] = s->pos; + nextpos[1] = -1; + nextdelta[0] = rdelta; + s->nextlen = 1; + s->nextiter= 0; + } else { + for (i = s->nextiter; i < s->nextiter + s->nextlen; i++) { + int j = i % buffer_size; + float ppeak, pdelta; + + ppeak = fabs(buffer[nextpos[j]]) > fabs(buffer[nextpos[j] + 1]) ? 
+ fabs(buffer[nextpos[j]]) : fabs(buffer[nextpos[j] + 1]); + pdelta = (limit / peak - limit / ppeak) / (((buffer_size - nextpos[j] + s->pos) % buffer_size) / channels); + if (pdelta < nextdelta[j]) { + nextdelta[j] = pdelta; + found = 1; + break; + } + } + if (found) { + s->nextlen = i - s->nextiter + 1; + nextpos[(s->nextiter + s->nextlen) % buffer_size] = s->pos; + nextdelta[(s->nextiter + s->nextlen) % buffer_size] = rdelta; + nextpos[(s->nextiter + s->nextlen + 1) % buffer_size] = -1; + s->nextlen++; + } + } + } + + buf = &s->buffer[(s->pos + channels) % buffer_size]; + peak = 0; + for (c = 0; c < channels; c++) { + float sample = buf[c]; + + peak = MAX(peak, fabs(sample)); + } + + if (s->pos == s->asc_pos && !s->asc_changed) + s->asc_pos = -1; + + if (s->auto_release && s->asc_pos == -1 && peak > limit) { + s->asc -= peak; + s->asc_c--; + } + + s->att += s->delta; + + for (c = 0; c < channels; c++) + dst[c] = buf[c] * s->att; + + if ((s->pos + channels) % buffer_size == nextpos[s->nextiter]) { + if (s->auto_release) { + s->delta = get_rdelta(s, release, m_nFs, + peak, limit, s->att, 1); + if (s->nextlen > 1) { + int pnextpos = nextpos[(s->nextiter + 1) % buffer_size]; + float ppeak = fabs(buffer[pnextpos]) > fabs(buffer[pnextpos + 1]) ? + fabs(buffer[pnextpos]) : + fabs(buffer[pnextpos + 1]); + float pdelta = (limit / ppeak - s->att) / + (((buffer_size + pnextpos - + ((s->pos + channels) % buffer_size)) % + buffer_size) / channels); + if (pdelta < s->delta) + s->delta = pdelta; + } + } else { + s->delta = nextdelta[s->nextiter]; + s->att = limit / peak; + } + + s->nextlen -= 1; + nextpos[s->nextiter] = -1; + s->nextiter = (s->nextiter + 1) % buffer_size; + } + + if (s->att > 1.) { + s->att = 1.; + s->delta = 0.; + s->nextiter = 0; + s->nextlen = 0; + nextpos[0] = -1; + } + + if (s->att <= 0.) { + s->att = 0.000001f; + s->delta = (1 - s->att) / (m_nFs * release); + } + + if (s->att != 1 && (1 - s->att) < 0.000001f) + s->att = 1; + + if (s->delta != 0 && fabs(s->delta) < 0.000001f) + s->delta = 0; + + for (c = 0; c < channels; c++) + dst[c] = MIDDLE(dst[c], -limit, limit) * level * level_out; + + s->pos = (s->pos + channels) % buffer_size; + src += channels; + dst += channels; + } +} + +void Alimiter::Uninit() +{ + SAFE_DELETE_PTR(m_alimiterCtx.buffer); + SAFE_DELETE_PTR(m_alimiterCtx.nextdelta); + SAFE_DELETE_PTR(m_alimiterCtx.nextpos); +} + +int32_t Alimiter::config_input() +{ + int obuffer_size = int(m_nFs * m_nChannels * 100 / 1000. 
+ m_nChannels);
+    if(obuffer_size < m_nChannels)
+        return ERROR_SUPERSOUND_PARAM;
+
+    if(obuffer_size > m_alimiterCtx.buffer_max_size)
+    {
+        SAFE_DELETE_PTR(m_alimiterCtx.buffer);
+        m_alimiterCtx.buffer = new(std::nothrow) float[obuffer_size];
+        if(m_alimiterCtx.buffer == NULL)
+            return ERROR_SUPERSOUND_MEMORY;
+        memset(m_alimiterCtx.buffer, 0, sizeof(float) * obuffer_size);
+
+        SAFE_DELETE_PTR(m_alimiterCtx.nextdelta);
+        m_alimiterCtx.nextdelta = new(std::nothrow) float[obuffer_size];
+        if(m_alimiterCtx.nextdelta == NULL)
+            return ERROR_SUPERSOUND_MEMORY;
+        memset(m_alimiterCtx.nextdelta, 0, sizeof(float) * obuffer_size);
+
+        SAFE_DELETE_PTR(m_alimiterCtx.nextpos);
+        m_alimiterCtx.nextpos = new(std::nothrow) int32_t[obuffer_size];
+        if(m_alimiterCtx.nextpos == NULL)
+            return ERROR_SUPERSOUND_MEMORY;
+        memset(m_alimiterCtx.nextpos, -1, obuffer_size*sizeof(int32_t));
+
+        m_alimiterCtx.buffer_max_size = obuffer_size;
+    }
+
+    m_alimiterCtx.buffer_size = int(m_nFs * m_alimiterCtx.attack * m_nChannels);
+    m_alimiterCtx.buffer_size -= m_alimiterCtx.buffer_size % m_nChannels;
+
+    return ERROR_SUPERSOUND_SUCCESS;
+}
+
+float Alimiter::get_rdelta( AudioLimiterContext *s, float release, int sample_rate, float peak, float limit, float patt, int asc )
+{
+    float rdelta = (1 - patt) / (sample_rate * release);
+
+    if (asc && s->auto_release && s->asc_c > 0) {
+        float a_att = limit / (s->asc_coeff * s->asc) * (float)s->asc_c;
+
+        if (a_att > patt) {
+            float delta = MAX((a_att - patt) / (sample_rate * release), rdelta / 10);
+
+            if (delta < rdelta)
+                rdelta = delta;
+        }
+    }
+
+    return rdelta;
+}
+
+
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/CMakeLists.txt b/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/CMakeLists.txt
new file mode 100644
index 0000000..18a5a86
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/CMakeLists.txt
@@ -0,0 +1,3 @@
+include_directories(inc)
+AUX_SOURCE_DIRECTORY(src DIR_EBUR128_SRCS)
+add_library(ebur128 ${DIR_EBUR128_SRCS})
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/inc/ebur128.h b/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/inc/ebur128.h
new file mode 100755
index 0000000..faa66c6
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/inc/ebur128.h
@@ -0,0 +1,425 @@
+/* See COPYING file for copyright and license details. */
+
+#ifndef EBUR128_H_
+#define EBUR128_H_
+
+/** \file ebur128.h
+ *  \brief libebur128 - a library for loudness measurement according to
+ *         the EBU R128 standard.
+ */
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+#define EBUR128_VERSION_MAJOR 1
+#define EBUR128_VERSION_MINOR 2
+#define EBUR128_VERSION_PATCH 4
+
+#include <stddef.h> /* for size_t */
+
+/** \enum channel
+ *  Use these values when setting the channel map with ebur128_set_channel().
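+ *  (For example, ebur128_set_channel(st, 2, EBUR128_CENTER) marks the third
+ *  channel, index 2, as the center channel.)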
+ *  See definitions in ITU R-REC-BS 1770-4
+ */
+enum channel {
+  EBUR128_UNUSED = 0,     /**< unused channel (for example LFE channel) */
+  EBUR128_LEFT   = 1,
+  EBUR128_Mp030  = 1,     /**< itu M+030 */
+  EBUR128_RIGHT  = 2,
+  EBUR128_Mm030  = 2,     /**< itu M-030 */
+  EBUR128_CENTER = 3,
+  EBUR128_Mp000  = 3,     /**< itu M+000 */
+  EBUR128_LEFT_SURROUND  = 4,
+  EBUR128_Mp110  = 4,     /**< itu M+110 */
+  EBUR128_RIGHT_SURROUND = 5,
+  EBUR128_Mm110  = 5,     /**< itu M-110 */
+  EBUR128_DUAL_MONO,      /**< a channel that is counted twice */
+  EBUR128_MpSC,           /**< itu M+SC */
+  EBUR128_MmSC,           /**< itu M-SC */
+  EBUR128_Mp060,          /**< itu M+060 */
+  EBUR128_Mm060,          /**< itu M-060 */
+  EBUR128_Mp090,          /**< itu M+090 */
+  EBUR128_Mm090,          /**< itu M-090 */
+  EBUR128_Mp135,          /**< itu M+135 */
+  EBUR128_Mm135,          /**< itu M-135 */
+  EBUR128_Mp180,          /**< itu M+180 */
+  EBUR128_Up000,          /**< itu U+000 */
+  EBUR128_Up030,          /**< itu U+030 */
+  EBUR128_Um030,          /**< itu U-030 */
+  EBUR128_Up045,          /**< itu U+045 */
+  EBUR128_Um045,          /**< itu U-045 */
+  EBUR128_Up090,          /**< itu U+090 */
+  EBUR128_Um090,          /**< itu U-090 */
+  EBUR128_Up110,          /**< itu U+110 */
+  EBUR128_Um110,          /**< itu U-110 */
+  EBUR128_Up135,          /**< itu U+135 */
+  EBUR128_Um135,          /**< itu U-135 */
+  EBUR128_Up180,          /**< itu U+180 */
+  EBUR128_Tp000,          /**< itu T+000 */
+  EBUR128_Bp000,          /**< itu B+000 */
+  EBUR128_Bp045,          /**< itu B+045 */
+  EBUR128_Bm045           /**< itu B-045 */
+};
+
+/** \enum error
+ *  Error return values.
+ */
+enum error {
+  EBUR128_SUCCESS = 0,
+  EBUR128_ERROR_NOMEM,
+  EBUR128_ERROR_INVALID_MODE,
+  EBUR128_ERROR_INVALID_CHANNEL_INDEX,
+  EBUR128_ERROR_NO_CHANGE
+};
+
+/** \enum mode
+ *  Use these values in ebur128_init (or'ed). Try to use the lowest possible
+ *  modes that suit your needs, as performance will be better.
+ */
+enum mode {
+  /** can call ebur128_loudness_momentary */
+  EBUR128_MODE_M           = (1 << 0),
+  /** can call ebur128_loudness_shortterm */
+  EBUR128_MODE_S           = (1 << 1) | EBUR128_MODE_M,
+  /** can call ebur128_loudness_global_* and ebur128_relative_threshold */
+  EBUR128_MODE_I           = (1 << 2) | EBUR128_MODE_M,
+  /** can call ebur128_loudness_range */
+  EBUR128_MODE_LRA         = (1 << 3) | EBUR128_MODE_S,
+  /** can call ebur128_sample_peak */
+  EBUR128_MODE_SAMPLE_PEAK = (1 << 4) | EBUR128_MODE_M,
+  /** can call ebur128_true_peak */
+  EBUR128_MODE_TRUE_PEAK   = (1 << 5) | EBUR128_MODE_M
+                                      | EBUR128_MODE_SAMPLE_PEAK,
+  /** uses histogram algorithm to calculate loudness */
+  EBUR128_MODE_HISTOGRAM   = (1 << 6)
+};
+
+/** forward declaration of ebur128_state_internal */
+struct ebur128_state_internal;
+
+/** \brief Contains information about the state of a loudness measurement.
+ *
+ *  You should not need to modify this struct directly.
+ */
+typedef struct {
+  int mode;                           /**< The current mode. */
+  unsigned int channels;              /**< The number of channels. */
+  unsigned long samplerate;           /**< The sample rate. */
+  struct ebur128_state_internal* d;   /**< Internal state. */
+} ebur128_state;
+
+/** \brief Get library version number. Do not pass null pointers here.
+ *
+ *  @param major major version number of library
+ *  @param minor minor version number of library
+ *  @param patch patch version number of library
+ */
+void ebur128_get_version(int* major, int* minor, int* patch);
+
+/** \brief Initialize library state.
+ *
+ *  @param channels the number of channels.
+ *  @param samplerate the sample rate.
+ *  @param mode see the mode enum for possible values.
+ *  @return an initialized library state, or NULL on error.
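+ *
+ *  Example (stereo at 44.1 kHz with integrated-loudness mode, as used by the
+ *  standard_audio tool in this repo):
+ *    ebur128_state* st = ebur128_init(2, 44100, EBUR128_MODE_I);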
+ */ +ebur128_state* ebur128_init(unsigned int channels, + unsigned long samplerate, + int mode); + +/** \brief Destroy library state. + * + * @param st pointer to a library state. + */ +void ebur128_destroy(ebur128_state** st); + +/** \brief Set channel type. + * + * The default is: + * - 0 -> EBUR128_LEFT + * - 1 -> EBUR128_RIGHT + * - 2 -> EBUR128_CENTER + * - 3 -> EBUR128_UNUSED + * - 4 -> EBUR128_LEFT_SURROUND + * - 5 -> EBUR128_RIGHT_SURROUND + * + * @param st library state. + * @param channel_number zero based channel index. + * @param value channel type from the "channel" enum. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_CHANNEL_INDEX if invalid channel index. + */ +int ebur128_set_channel(ebur128_state* st, + unsigned int channel_number, + int value); + +/** \brief Change library parameters. + * + * Note that the channel map will be reset when setting a different number of + * channels. The current unfinished block will be lost. + * + * @param st library state. + * @param channels new number of channels. + * @param samplerate new sample rate. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_NOMEM on memory allocation error. The state will be + * invalid and must be destroyed. + * - EBUR128_ERROR_NO_CHANGE if channels and sample rate were not changed. + */ +int ebur128_change_parameters(ebur128_state* st, + unsigned int channels, + unsigned long samplerate); + +/** \brief Set the maximum window duration. + * + * Set the maximum duration that will be used for ebur128_window_loudness(). + * Note that this destroys the current content of the audio buffer. + * + * @param st library state. + * @param window duration of the window in ms. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_NOMEM on memory allocation error. The state will be + * invalid and must be destroyed. + * - EBUR128_ERROR_NO_CHANGE if window duration not changed. + */ +int ebur128_set_max_window(ebur128_state* st, unsigned long window); + +/** \brief Set the maximum history. + * + * Set the maximum history that will be stored for loudness integration. + * More history provides more accurate results, but requires more resources. + * + * Applies to ebur128_loudness_range() and ebur128_loudness_global() when + * EBUR128_MODE_HISTOGRAM is not set. + * + * Default is ULONG_MAX (at least ~50 days). + * Minimum is 3000ms for EBUR128_MODE_LRA and 400ms for EBUR128_MODE_M. + * + * @param st library state. + * @param history duration of history in ms. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_NO_CHANGE if history not changed. + */ +int ebur128_set_max_history(ebur128_state* st, unsigned long history); + +/** \brief Add frames to be processed. + * + * @param st library state. + * @param src array of source frames. Channels must be interleaved. + * @param frames number of frames. Not number of samples! + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_NOMEM on memory allocation error. + */ +int ebur128_add_frames_short(ebur128_state* st, + const short* src, + size_t frames); +/** \brief See \ref ebur128_add_frames_short */ +int ebur128_add_frames_int(ebur128_state* st, + const int* src, + size_t frames); +/** \brief See \ref ebur128_add_frames_short */ +int ebur128_add_frames_float(ebur128_state* st, + const float* src, + size_t frames); +/** \brief See \ref ebur128_add_frames_short */ +int ebur128_add_frames_double(ebur128_state* st, + const double* src, + size_t frames); + +/** \brief Get global integrated loudness in LUFS. 
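+ *
+ *  (Typical call sequence, as in ebur128_whole() in this repo's
+ *  standard_audio/main.cpp: ebur128_init(), ebur128_add_frames_short() in a
+ *  loop, then ebur128_loudness_global() and ebur128_destroy().)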
+ * + * @param st library state. + * @param out integrated loudness in LUFS. -HUGE_VAL if result is negative + * infinity. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_I" has not been set. + */ +int ebur128_loudness_global(ebur128_state* st, double* out); +/** \brief Get global integrated loudness in LUFS across multiple instances. + * + * @param sts array of library states. + * @param size length of sts + * @param out integrated loudness in LUFS. -HUGE_VAL if result is negative + * infinity. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_I" has not been set. + */ +int ebur128_loudness_global_multiple(ebur128_state** sts, + size_t size, + double* out); + +/** \brief Get momentary loudness (last 400ms) in LUFS. + * + * @param st library state. + * @param out momentary loudness in LUFS. -HUGE_VAL if result is negative + * infinity. + * @return + * - EBUR128_SUCCESS on success. + */ +int ebur128_loudness_momentary(ebur128_state* st, double* out); +/** \brief Get short-term loudness (last 3s) in LUFS. + * + * @param st library state. + * @param out short-term loudness in LUFS. -HUGE_VAL if result is negative + * infinity. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_S" has not been set. + */ +int ebur128_loudness_shortterm(ebur128_state* st, double* out); + +/** \brief Get loudness of the specified window in LUFS. + * + * window must not be larger than the current window set in st. + * The current window can be changed by calling ebur128_set_max_window(). + * + * @param st library state. + * @param window window in ms to calculate loudness. + * @param out loudness in LUFS. -HUGE_VAL if result is negative infinity. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if window larger than current window in st. + */ +int ebur128_loudness_window(ebur128_state* st, + unsigned long window, + double* out); + +/** \brief Get loudness range (LRA) of programme in LU. + * + * Calculates loudness range according to EBU 3342. + * + * @param st library state. + * @param out loudness range (LRA) in LU. Will not be changed in case of + * error. EBUR128_ERROR_NOMEM or EBUR128_ERROR_INVALID_MODE will be + * returned in this case. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_NOMEM in case of memory allocation error. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_LRA" has not been set. + */ +int ebur128_loudness_range(ebur128_state* st, double* out); +/** \brief Get loudness range (LRA) in LU across multiple instances. + * + * Calculates loudness range according to EBU 3342. + * + * @param sts array of library states. + * @param size length of sts + * @param out loudness range (LRA) in LU. Will not be changed in case of + * error. EBUR128_ERROR_NOMEM or EBUR128_ERROR_INVALID_MODE will be + * returned in this case. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_NOMEM in case of memory allocation error. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_LRA" has not been set. + */ +int ebur128_loudness_range_multiple(ebur128_state** sts, + size_t size, + double* out); + +/** \brief Get maximum sample peak from all frames that have been processed. 
+ * + * The equation to convert to dBFS is: 20 * log10(out) + * + * @param st library state + * @param channel_number channel to analyse + * @param out maximum sample peak in float format (1.0 is 0 dBFS) + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_SAMPLE_PEAK" has not + * been set. + * - EBUR128_ERROR_INVALID_CHANNEL_INDEX if invalid channel index. + */ +int ebur128_sample_peak(ebur128_state* st, + unsigned int channel_number, + double* out); + +/** \brief Get maximum sample peak from the last call to add_frames(). + * + * The equation to convert to dBFS is: 20 * log10(out) + * + * @param st library state + * @param channel_number channel to analyse + * @param out maximum sample peak in float format (1.0 is 0 dBFS) + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_SAMPLE_PEAK" has not + * been set. + * - EBUR128_ERROR_INVALID_CHANNEL_INDEX if invalid channel index. + */ +int ebur128_prev_sample_peak(ebur128_state* st, + unsigned int channel_number, + double* out); + +/** \brief Get maximum true peak from all frames that have been processed. + * + * Uses an implementation defined algorithm to calculate the true peak. Do not + * try to compare resulting values across different versions of the library, + * as the algorithm may change. + * + * The current implementation uses a custom polyphase FIR interpolator to + * calculate true peak. Will oversample 4x for sample rates < 96000 Hz, 2x for + * sample rates < 192000 Hz and leave the signal unchanged for 192000 Hz. + * + * The equation to convert to dBTP is: 20 * log10(out) + * + * @param st library state + * @param channel_number channel to analyse + * @param out maximum true peak in float format (1.0 is 0 dBTP) + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_TRUE_PEAK" has not + * been set. + * - EBUR128_ERROR_INVALID_CHANNEL_INDEX if invalid channel index. + */ +int ebur128_true_peak(ebur128_state* st, + unsigned int channel_number, + double* out); + +/** \brief Get maximum true peak from the last call to add_frames(). + * + * Uses an implementation defined algorithm to calculate the true peak. Do not + * try to compare resulting values across different versions of the library, + * as the algorithm may change. + * + * The current implementation uses a custom polyphase FIR interpolator to + * calculate true peak. Will oversample 4x for sample rates < 96000 Hz, 2x for + * sample rates < 192000 Hz and leave the signal unchanged for 192000 Hz. + * + * The equation to convert to dBTP is: 20 * log10(out) + * + * @param st library state + * @param channel_number channel to analyse + * @param out maximum true peak in float format (1.0 is 0 dBTP) + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_TRUE_PEAK" has not + * been set. + * - EBUR128_ERROR_INVALID_CHANNEL_INDEX if invalid channel index. + */ +int ebur128_prev_true_peak(ebur128_state* st, + unsigned int channel_number, + double* out); + +/** \brief Get relative threshold in LUFS. + * + * @param st library state + * @param out relative threshold in LUFS. + * @return + * - EBUR128_SUCCESS on success. + * - EBUR128_ERROR_INVALID_MODE if mode "EBUR128_MODE_I" has not + * been set. 
+ */
+int ebur128_relative_threshold(ebur128_state* st, double* out);
+#ifdef __cplusplus
+}
+#endif
+
+#endif /* EBUR128_H_ */
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/src/ebur128.c b/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/src/ebur128.c
new file mode 100755
index 0000000..6c10f1e
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/ebur128/src/ebur128.c
@@ -0,0 +1,1333 @@
+/* See COPYING file for copyright and license details. */
+
+#include "ebur128.h"
+
+#include <float.h>
+#include <limits.h>
+#include <math.h> /* You may have to define _USE_MATH_DEFINES if you use MSVC */
+#include <stdio.h>
+#include <stdlib.h>
+
+/* This can be replaced by any BSD-like queue implementation. */
+#include <sys/queue.h>
+
+#define CHECK_ERROR(condition, errorcode, goto_point) \
+  if ((condition)) {                                  \
+    errcode = (errorcode);                            \
+    goto goto_point;                                  \
+  }
+
+STAILQ_HEAD(ebur128_double_queue, ebur128_dq_entry);
+struct ebur128_dq_entry {
+  double z;
+  STAILQ_ENTRY(ebur128_dq_entry) entries;
+};
+
+#define ALMOST_ZERO 0.000001
+
+typedef struct {         /* Data structure for polyphase FIR interpolator */
+  unsigned int factor;   /* Interpolation factor of the interpolator */
+  unsigned int taps;     /* Taps (prefer odd to increase zero coeffs) */
+  unsigned int channels; /* Number of channels */
+  unsigned int delay;    /* Size of delay buffer */
+  struct {
+    unsigned int count;  /* Number of coefficients in this subfilter */
+    unsigned int* index; /* Delay index of corresponding filter coeff */
+    double* coeff;       /* List of subfilter coefficients */
+  }* filter;             /* List of subfilters (one for each factor) */
+  float** z;             /* List of delay buffers (one for each channel) */
+  unsigned int zi;       /* Current delay buffer index */
+} interpolator;
+
+struct ebur128_state_internal {
+  /** Filtered audio data (used as ring buffer). */
+  double* audio_data;
+  /** Size of audio_data array. */
+  size_t audio_data_frames;
+  /** Current index for audio_data. */
+  size_t audio_data_index;
+  /** How many frames are needed for a gating block. Will correspond to 400ms
+   *  of audio at initialization, and 100ms after the first block (75% overlap
+   *  as specified in the 2011 revision of BS1770). */
+  unsigned long needed_frames;
+  /** The channel map. Has as many elements as there are channels. */
+  int* channel_map;
+  /** How many samples fit in 100ms (rounded). */
+  unsigned long samples_in_100ms;
+  /** BS.1770 filter coefficients (numerator). */
+  double b[5];
+  /** BS.1770 filter coefficients (denominator). */
+  double a[5];
+  /** BS.1770 filter state. */
+  double v[5][5];
+  /** Linked list of block energies. */
+  struct ebur128_double_queue block_list;
+  unsigned long block_list_max;
+  unsigned long block_list_size;
+  /** Linked list of 3s-block energies, used to calculate LRA. */
+  struct ebur128_double_queue short_term_block_list;
+  unsigned long st_block_list_max;
+  unsigned long st_block_list_size;
+  int use_histogram;
+  unsigned long *block_energy_histogram;
+  unsigned long *short_term_block_energy_histogram;
+  /** Keeps track of when a new short term block is needed. */
+  size_t short_term_frame_counter;
+  /** Maximum sample peak, one per channel */
+  double* sample_peak;
+  double* prev_sample_peak;
+  /** Maximum true peak, one per channel */
+  double* true_peak;
+  double* prev_true_peak;
+  interpolator* interp;
+  float* resampler_buffer_input;
+  size_t resampler_buffer_input_frames;
+  float* resampler_buffer_output;
+  size_t resampler_buffer_output_frames;
+  /** The maximum window duration in ms.
*/ + unsigned long window; + unsigned long history; +}; + +static double relative_gate = -10.0; + +/* Those will be calculated when initializing the library */ +static double relative_gate_factor; +static double minus_twenty_decibels; +static double histogram_energies[1000]; +static double histogram_energy_boundaries[1001]; + +static interpolator* interp_create(unsigned int taps, unsigned int factor, unsigned int channels) { + interpolator* interp = calloc(1, sizeof(interpolator)); + unsigned int j = 0; + + interp->taps = taps; + interp->factor = factor; + interp->channels = channels; + interp->delay = (interp->taps + interp->factor - 1) / interp->factor; + + /* Initialize the filter memory + * One subfilter per interpolation factor. */ + interp->filter = calloc(interp->factor, sizeof(*interp->filter)); + for (j = 0; j < interp->factor; j++) { + interp->filter[j].index = calloc(interp->delay, sizeof(unsigned int)); + interp->filter[j].coeff = calloc(interp->delay, sizeof(double)); + } + /* One delay buffer per channel. */ + interp->z = calloc(interp->channels, sizeof(float*)); + for (j = 0; j < interp->channels; j++) { + interp->z[j] = calloc( interp->delay, sizeof(float) ); + } + + /* Calculate the filter coefficients */ + for (j = 0; j < interp->taps; j++) { + /* Calculate sinc */ + double m = (double)j - (double)(interp->taps - 1) / 2.0; + double c = 1.0; + if (fabs(m) > ALMOST_ZERO) { + c = sin(m * M_PI / interp->factor) / (m * M_PI / interp->factor); + } + /* Apply Hanning window */ + c *= 0.5 * (1 - cos(2 * M_PI * j / (interp->taps - 1))); + + if (fabs(c) > ALMOST_ZERO) { /* Ignore any zero coeffs. */ + /* Put the coefficient into the correct subfilter */ + unsigned int f = j % interp->factor; + unsigned int t = interp->filter[f].count++; + interp->filter[f].coeff[t] = c; + interp->filter[f].index[t] = j / interp->factor; + } + } + return interp; +} + +static void interp_destroy(interpolator* interp) { + unsigned int j = 0; + if (!interp) { + return; + } + for (j = 0; j < interp->factor; j++) { + free(interp->filter[j].index); + free(interp->filter[j].coeff); + } + free(interp->filter); + for (j = 0; j < interp->channels; j++) { + free(interp->z[j]); + } + free(interp->z); + free(interp); +} + +static size_t interp_process(interpolator* interp, size_t frames, float* in, float* out) { + size_t frame = 0; + unsigned int chan = 0; + unsigned int f = 0; + unsigned int t = 0; + unsigned int out_stride = interp->channels * interp->factor; + float* outp = 0; + double acc = 0; + double c = 0; + + for (frame = 0; frame < frames; frame++) { + for (chan = 0; chan < interp->channels; chan++) { + /* Add sample to delay buffer */ + interp->z[chan][interp->zi] = *in++; + /* Apply coefficients */ + outp = out + chan; + for (f = 0; f < interp->factor; f++) { + acc = 0.0; + for (t = 0; t < interp->filter[f].count; t++) { + int i = (int)interp->zi - (int)interp->filter[f].index[t]; + if (i < 0) { + i += interp->delay; + } + c = interp->filter[f].coeff[t]; + acc += interp->z[chan][i] * c; + } + *outp = (float)acc; + outp += interp->channels; + } + } + out += out_stride; + interp->zi++; + if (interp->zi == interp->delay) { + interp->zi = 0; + } + } + + return frames * interp->factor; +} + +static void ebur128_init_filter(ebur128_state* st) { + int i, j; + + double f0 = 1681.974450955533; + double G = 3.999843853973347; + double Q = 0.7071752369554196; + + double K = tan(M_PI * f0 / (double) st->samplerate); + double Vh = pow(10.0, G / 20.0); + double Vb = pow(Vh, 0.4996667741545416); + + double pb[3] = 
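+  /* What follows (a reading of the surrounding code, not of the BS.1770
+   * text itself): the K-weighting pre-filter is designed as two biquads, a
+   * high shelf (pb/pa) and a high-pass (rb/ra), both mapped to the actual
+   * sample rate through the bilinear-transform variable
+   * K = tan(pi * f0 / fs).  The two stages are then convolved into one
+   * 5-coefficient direct-form filter, b = pb conv rb and a = pa conv ra
+   * (polynomial multiplication), which is what gets stored in st->d->b
+   * and st->d->a. */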
{0.0, 0.0, 0.0}; + double pa[3] = {1.0, 0.0, 0.0}; + double rb[3] = {1.0, -2.0, 1.0}; + double ra[3] = {1.0, 0.0, 0.0}; + + double a0 = 1.0 + K / Q + K * K ; + pb[0] = (Vh + Vb * K / Q + K * K) / a0; + pb[1] = 2.0 * (K * K - Vh) / a0; + pb[2] = (Vh - Vb * K / Q + K * K) / a0; + pa[1] = 2.0 * (K * K - 1.0) / a0; + pa[2] = (1.0 - K / Q + K * K) / a0; + + /* fprintf(stderr, "%.14f %.14f %.14f %.14f %.14f\n", + b1[0], b1[1], b1[2], a1[1], a1[2]); */ + + f0 = 38.13547087602444; + Q = 0.5003270373238773; + K = tan(M_PI * f0 / (double) st->samplerate); + + ra[1] = 2.0 * (K * K - 1.0) / (1.0 + K / Q + K * K); + ra[2] = (1.0 - K / Q + K * K) / (1.0 + K / Q + K * K); + + /* fprintf(stderr, "%.14f %.14f\n", a2[1], a2[2]); */ + + st->d->b[0] = pb[0] * rb[0]; + st->d->b[1] = pb[0] * rb[1] + pb[1] * rb[0]; + st->d->b[2] = pb[0] * rb[2] + pb[1] * rb[1] + pb[2] * rb[0]; + st->d->b[3] = pb[1] * rb[2] + pb[2] * rb[1]; + st->d->b[4] = pb[2] * rb[2]; + + st->d->a[0] = pa[0] * ra[0]; + st->d->a[1] = pa[0] * ra[1] + pa[1] * ra[0]; + st->d->a[2] = pa[0] * ra[2] + pa[1] * ra[1] + pa[2] * ra[0]; + st->d->a[3] = pa[1] * ra[2] + pa[2] * ra[1]; + st->d->a[4] = pa[2] * ra[2]; + + for (i = 0; i < 5; ++i) { + for (j = 0; j < 5; ++j) { + st->d->v[i][j] = 0.0; + } + } +} + +static int ebur128_init_channel_map(ebur128_state* st) { + size_t i; + st->d->channel_map = (int*) malloc(st->channels * sizeof(int)); + if (!st->d->channel_map) { + return EBUR128_ERROR_NOMEM; + } + if (st->channels == 4) { + st->d->channel_map[0] = EBUR128_LEFT; + st->d->channel_map[1] = EBUR128_RIGHT; + st->d->channel_map[2] = EBUR128_LEFT_SURROUND; + st->d->channel_map[3] = EBUR128_RIGHT_SURROUND; + } else if (st->channels == 5) { + st->d->channel_map[0] = EBUR128_LEFT; + st->d->channel_map[1] = EBUR128_RIGHT; + st->d->channel_map[2] = EBUR128_CENTER; + st->d->channel_map[3] = EBUR128_LEFT_SURROUND; + st->d->channel_map[4] = EBUR128_RIGHT_SURROUND; + } else { + for (i = 0; i < st->channels; ++i) { + switch (i) { + case 0: st->d->channel_map[i] = EBUR128_LEFT; break; + case 1: st->d->channel_map[i] = EBUR128_RIGHT; break; + case 2: st->d->channel_map[i] = EBUR128_CENTER; break; + case 3: st->d->channel_map[i] = EBUR128_UNUSED; break; + case 4: st->d->channel_map[i] = EBUR128_LEFT_SURROUND; break; + case 5: st->d->channel_map[i] = EBUR128_RIGHT_SURROUND; break; + default: st->d->channel_map[i] = EBUR128_UNUSED; break; + } + } + } + return EBUR128_SUCCESS; +} + +static int ebur128_init_resampler(ebur128_state* st) { + int errcode = EBUR128_SUCCESS; + + if (st->samplerate < 96000) { + st->d->interp = interp_create(49, 4, st->channels); + CHECK_ERROR(!st->d->interp, EBUR128_ERROR_NOMEM, exit) + } else if (st->samplerate < 192000) { + st->d->interp = interp_create(49, 2, st->channels); + CHECK_ERROR(!st->d->interp, EBUR128_ERROR_NOMEM, exit) + } else { + st->d->resampler_buffer_input = NULL; + st->d->resampler_buffer_output = NULL; + st->d->interp = NULL; + goto exit; + } + + st->d->resampler_buffer_input_frames = st->d->samples_in_100ms * 4; + st->d->resampler_buffer_input = malloc(st->d->resampler_buffer_input_frames * + st->channels * + sizeof(float)); + CHECK_ERROR(!st->d->resampler_buffer_input, EBUR128_ERROR_NOMEM, free_interp) + + st->d->resampler_buffer_output_frames = + st->d->resampler_buffer_input_frames * + st->d->interp->factor; + st->d->resampler_buffer_output = malloc + (st->d->resampler_buffer_output_frames * + st->channels * + sizeof(float)); + CHECK_ERROR(!st->d->resampler_buffer_output, EBUR128_ERROR_NOMEM, free_input) + + return 
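+  /* Note on the interpolator factors chosen above: a 49-tap polyphase FIR
+   * oversamples 4x below 96 kHz and 2x below 192 kHz, so the true-peak
+   * scan always evaluates the signal on a grid of at least ~176 kHz
+   * (e.g. 44100 Hz * 4 = 176400 Hz); at 192 kHz and above the signal is
+   * used as-is and no resampler buffers are allocated. */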
errcode; + +free_interp: + interp_destroy(st->d->interp); + st->d->interp = NULL; +free_input: + free(st->d->resampler_buffer_input); + st->d->resampler_buffer_input = NULL; +exit: + return errcode; +} + +static void ebur128_destroy_resampler(ebur128_state* st) { + free(st->d->resampler_buffer_input); + st->d->resampler_buffer_input = NULL; + free(st->d->resampler_buffer_output); + st->d->resampler_buffer_output = NULL; + interp_destroy(st->d->interp); + st->d->interp = NULL; +} + +void ebur128_get_version(int* major, int* minor, int* patch) { + *major = EBUR128_VERSION_MAJOR; + *minor = EBUR128_VERSION_MINOR; + *patch = EBUR128_VERSION_PATCH; +} + +ebur128_state* ebur128_init(unsigned int channels, + unsigned long samplerate, + int mode) { + int result; + int errcode; + ebur128_state* st; + unsigned int i; + size_t j; + + if (channels == 0 || samplerate < 5) { + return NULL; + } + + st = (ebur128_state*) malloc(sizeof(ebur128_state)); + CHECK_ERROR(!st, 0, exit) + st->d = (struct ebur128_state_internal*) + malloc(sizeof(struct ebur128_state_internal)); + CHECK_ERROR(!st->d, 0, free_state) + st->channels = channels; + errcode = ebur128_init_channel_map(st); + CHECK_ERROR(errcode, 0, free_internal) + + st->d->sample_peak = (double*) malloc(channels * sizeof(double)); + CHECK_ERROR(!st->d->sample_peak, 0, free_channel_map) + st->d->prev_sample_peak = (double*) malloc(channels * sizeof(double)); + CHECK_ERROR(!st->d->prev_sample_peak, 0, free_sample_peak) + st->d->true_peak = (double*) malloc(channels * sizeof(double)); + CHECK_ERROR(!st->d->true_peak, 0, free_prev_sample_peak) + st->d->prev_true_peak = (double*) malloc(channels * sizeof(double)); + CHECK_ERROR(!st->d->prev_true_peak, 0, free_true_peak) + for (i = 0; i < channels; ++i) { + st->d->sample_peak[i] = 0.0; + st->d->prev_sample_peak[i] = 0.0; + st->d->true_peak[i] = 0.0; + st->d->prev_true_peak[i] = 0.0; + } + + st->d->use_histogram = mode & EBUR128_MODE_HISTOGRAM ? 
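+  /* Histogram mode (selected here) trades the unbounded block lists for
+   * two fixed arrays of 1000 energy bins, each 0.1 LU wide, so memory use
+   * stays constant for arbitrarily long streams at the cost of quantizing
+   * block loudness to the bin width. */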
1 : 0; + st->d->history = ULONG_MAX; + st->samplerate = samplerate; + st->d->samples_in_100ms = (st->samplerate + 5) / 10; + st->mode = mode; + if ((mode & EBUR128_MODE_S) == EBUR128_MODE_S) { + st->d->window = 3000; + } else if ((mode & EBUR128_MODE_M) == EBUR128_MODE_M) { + st->d->window = 400; + } else { + goto free_prev_true_peak; + } + st->d->audio_data_frames = st->samplerate * st->d->window / 1000; + if (st->d->audio_data_frames % st->d->samples_in_100ms) { + /* round up to multiple of samples_in_100ms */ + st->d->audio_data_frames = st->d->audio_data_frames + + st->d->samples_in_100ms + - (st->d->audio_data_frames % st->d->samples_in_100ms); + } + st->d->audio_data = (double*) malloc(st->d->audio_data_frames * + st->channels * + sizeof(double)); + CHECK_ERROR(!st->d->audio_data, 0, free_true_peak) + for (j = 0; j < st->d->audio_data_frames * st->channels; ++j) { + st->d->audio_data[j] = 0.0; + } + + ebur128_init_filter(st); + + if (st->d->use_histogram) { + st->d->block_energy_histogram = malloc(1000 * sizeof(unsigned long)); + CHECK_ERROR(!st->d->block_energy_histogram, 0, free_audio_data) + for (i = 0; i < 1000; ++i) { + st->d->block_energy_histogram[i] = 0; + } + } else { + st->d->block_energy_histogram = NULL; + } + if (st->d->use_histogram) { + st->d->short_term_block_energy_histogram = malloc(1000 * sizeof(unsigned long)); + CHECK_ERROR(!st->d->short_term_block_energy_histogram, 0, free_block_energy_histogram) + for (i = 0; i < 1000; ++i) { + st->d->short_term_block_energy_histogram[i] = 0; + } + } else { + st->d->short_term_block_energy_histogram = NULL; + } + STAILQ_INIT(&st->d->block_list); + st->d->block_list_size = 0; + st->d->block_list_max = st->d->history / 100; + STAILQ_INIT(&st->d->short_term_block_list); + st->d->st_block_list_size = 0; + st->d->st_block_list_max = st->d->history / 3000; + st->d->short_term_frame_counter = 0; + + result = ebur128_init_resampler(st); + CHECK_ERROR(result, 0, free_short_term_block_energy_histogram) + + /* the first block needs 400ms of audio data */ + st->d->needed_frames = st->d->samples_in_100ms * 4; + /* start at the beginning of the buffer */ + st->d->audio_data_index = 0; + + /* initialize static constants */ + relative_gate_factor = pow(10.0, relative_gate / 10.0); + minus_twenty_decibels = pow(10.0, -20.0 / 10.0); + histogram_energy_boundaries[0] = pow(10.0, (-70.0 + 0.691) / 10.0); + if (st->d->use_histogram) { + for (i = 0; i < 1000; ++i) { + histogram_energies[i] = pow(10.0, ((double) i / 10.0 - 69.95 + 0.691) / 10.0); + } + for (i = 1; i < 1001; ++i) { + histogram_energy_boundaries[i] = pow(10.0, ((double) i / 10.0 - 70.0 + 0.691) / 10.0); + } + } + + return st; + +free_short_term_block_energy_histogram: + free(st->d->short_term_block_energy_histogram); +free_block_energy_histogram: + free(st->d->block_energy_histogram); +free_audio_data: + free(st->d->audio_data); +free_prev_true_peak: + free(st->d->prev_true_peak); +free_true_peak: + free(st->d->true_peak); +free_prev_sample_peak: + free(st->d->prev_sample_peak); +free_sample_peak: + free(st->d->sample_peak); +free_channel_map: + free(st->d->channel_map); +free_internal: + free(st->d); +free_state: + free(st); +exit: + return NULL; +} + +void ebur128_destroy(ebur128_state** st) { + struct ebur128_dq_entry* entry; + free((*st)->d->block_energy_histogram); + free((*st)->d->short_term_block_energy_histogram); + free((*st)->d->audio_data); + free((*st)->d->channel_map); + free((*st)->d->sample_peak); + free((*st)->d->prev_sample_peak); + free((*st)->d->true_peak); + 
free((*st)->d->prev_true_peak); + while (!STAILQ_EMPTY(&(*st)->d->block_list)) { + entry = STAILQ_FIRST(&(*st)->d->block_list); + STAILQ_REMOVE_HEAD(&(*st)->d->block_list, entries); + free(entry); + } + while (!STAILQ_EMPTY(&(*st)->d->short_term_block_list)) { + entry = STAILQ_FIRST(&(*st)->d->short_term_block_list); + STAILQ_REMOVE_HEAD(&(*st)->d->short_term_block_list, entries); + free(entry); + } + ebur128_destroy_resampler(*st); + free((*st)->d); + free(*st); + *st = NULL; +} + +static void ebur128_check_true_peak(ebur128_state* st, size_t frames) { + size_t c, i, frames_out; + + frames_out = interp_process(st->d->interp, frames, + st->d->resampler_buffer_input, + st->d->resampler_buffer_output); + + for (i = 0; i < frames_out; ++i) { + for (c = 0; c < st->channels; ++c) { + float val = st->d->resampler_buffer_output[i * st->channels + c]; + + if (val > st->d->prev_true_peak[c]) { + st->d->prev_true_peak[c] = val; + } else if (-val > st->d->prev_true_peak[c]) { + st->d->prev_true_peak[c] = -val; + } + } + } +} + +#ifdef __SSE2_MATH__ +#include +#define TURN_ON_FTZ \ + unsigned int mxcsr = _mm_getcsr(); \ + _mm_setcsr(mxcsr | _MM_FLUSH_ZERO_ON); +#define TURN_OFF_FTZ _mm_setcsr(mxcsr); +#define FLUSH_MANUALLY +#else +#warning "manual FTZ is being used, please enable SSE2 (-msse2 -mfpmath=sse)" +#define TURN_ON_FTZ +#define TURN_OFF_FTZ +#define FLUSH_MANUALLY \ + st->d->v[ci][4] = fabs(st->d->v[ci][4]) < DBL_MIN ? 0.0 : st->d->v[ci][4]; \ + st->d->v[ci][3] = fabs(st->d->v[ci][3]) < DBL_MIN ? 0.0 : st->d->v[ci][3]; \ + st->d->v[ci][2] = fabs(st->d->v[ci][2]) < DBL_MIN ? 0.0 : st->d->v[ci][2]; \ + st->d->v[ci][1] = fabs(st->d->v[ci][1]) < DBL_MIN ? 0.0 : st->d->v[ci][1]; +#endif + +#define EBUR128_FILTER(type, min_scale, max_scale) \ +static void ebur128_filter_##type(ebur128_state* st, const type* src, \ + size_t frames) { \ + static double scaling_factor = \ + -((double) (min_scale)) > (double) (max_scale) ? 
\ + -((double) (min_scale)) : (double) (max_scale); \ + double* audio_data = st->d->audio_data + st->d->audio_data_index; \ + size_t i, c; \ + \ + TURN_ON_FTZ \ + \ + if ((st->mode & EBUR128_MODE_SAMPLE_PEAK) == EBUR128_MODE_SAMPLE_PEAK) { \ + for (c = 0; c < st->channels; ++c) { \ + double max = 0.0; \ + for (i = 0; i < frames; ++i) { \ + if (src[i * st->channels + c] > max) { \ + max = src[i * st->channels + c]; \ + } else if (-src[i * st->channels + c] > max) { \ + max = -1.0 * src[i * st->channels + c]; \ + } \ + } \ + max /= scaling_factor; \ + if (max > st->d->prev_sample_peak[c]) st->d->prev_sample_peak[c] = max; \ + } \ + } \ + if ((st->mode & EBUR128_MODE_TRUE_PEAK) == EBUR128_MODE_TRUE_PEAK && \ + st->d->interp) { \ + for (c = 0; c < st->channels; ++c) { \ + for (i = 0; i < frames; ++i) { \ + st->d->resampler_buffer_input[i * st->channels + c] = \ + (float) (src[i * st->channels + c] / scaling_factor); \ + } \ + } \ + ebur128_check_true_peak(st, frames); \ + } \ + for (c = 0; c < st->channels; ++c) { \ + int ci = st->d->channel_map[c] - 1; \ + if (ci < 0) continue; \ + else if (ci == EBUR128_DUAL_MONO - 1) ci = 0; /*dual mono */ \ + for (i = 0; i < frames; ++i) { \ + st->d->v[ci][0] = (double) (src[i * st->channels + c] / scaling_factor) \ + - st->d->a[1] * st->d->v[ci][1] \ + - st->d->a[2] * st->d->v[ci][2] \ + - st->d->a[3] * st->d->v[ci][3] \ + - st->d->a[4] * st->d->v[ci][4]; \ + audio_data[i * st->channels + c] = \ + st->d->b[0] * st->d->v[ci][0] \ + + st->d->b[1] * st->d->v[ci][1] \ + + st->d->b[2] * st->d->v[ci][2] \ + + st->d->b[3] * st->d->v[ci][3] \ + + st->d->b[4] * st->d->v[ci][4]; \ + st->d->v[ci][4] = st->d->v[ci][3]; \ + st->d->v[ci][3] = st->d->v[ci][2]; \ + st->d->v[ci][2] = st->d->v[ci][1]; \ + st->d->v[ci][1] = st->d->v[ci][0]; \ + } \ + FLUSH_MANUALLY \ + } \ + TURN_OFF_FTZ \ +} +EBUR128_FILTER(short, SHRT_MIN, SHRT_MAX) +EBUR128_FILTER(int, INT_MIN, INT_MAX) +EBUR128_FILTER(float, -1.0f, 1.0f) +EBUR128_FILTER(double, -1.0, 1.0) + +static double ebur128_energy_to_loudness(double energy) { + return 10 * (log(energy) / log(10.0)) - 0.691; +} + +static size_t find_histogram_index(double energy) { + size_t index_min = 0; + size_t index_max = 1000; + size_t index_mid; + + do { + index_mid = (index_min + index_max) / 2; + if (energy >= histogram_energy_boundaries[index_mid]) { + index_min = index_mid; + } else { + index_max = index_mid; + } + } while (index_max - index_min != 1); + + return index_min; +} + +static int ebur128_calc_gating_block(ebur128_state* st, size_t frames_per_block, + double* optional_output) { + size_t i, c; + double sum = 0.0; + double channel_sum; + for (c = 0; c < st->channels; ++c) { + if (st->d->channel_map[c] == EBUR128_UNUSED) { + continue; + } + channel_sum = 0.0; + if (st->d->audio_data_index < frames_per_block * st->channels) { + for (i = 0; i < st->d->audio_data_index / st->channels; ++i) { + channel_sum += st->d->audio_data[i * st->channels + c] * + st->d->audio_data[i * st->channels + c]; + } + for (i = st->d->audio_data_frames - + (frames_per_block - + st->d->audio_data_index / st->channels); + i < st->d->audio_data_frames; ++i) { + channel_sum += st->d->audio_data[i * st->channels + c] * + st->d->audio_data[i * st->channels + c]; + } + } else { + for (i = st->d->audio_data_index / st->channels - frames_per_block; + i < st->d->audio_data_index / st->channels; + ++i) { + channel_sum += st->d->audio_data[i * st->channels + c] * + st->d->audio_data[i * st->channels + c]; + } + } + if (st->d->channel_map[c] == EBUR128_Mp110 || + 
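+      /* Channel weighting as in the BS.1770 summation: the surround
+       * channels matched below get a gain of 1.41 (about +1.5 dB) before
+       * the energies are summed, and a channel tagged dual mono is
+       * counted twice. */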
st->d->channel_map[c] == EBUR128_Mm110 || + st->d->channel_map[c] == EBUR128_Mp060 || + st->d->channel_map[c] == EBUR128_Mm060 || + st->d->channel_map[c] == EBUR128_Mp090 || + st->d->channel_map[c] == EBUR128_Mm090) { + channel_sum *= 1.41; + } else if (st->d->channel_map[c] == EBUR128_DUAL_MONO) { + channel_sum *= 2.0; + } + sum += channel_sum; + } + sum /= (double) frames_per_block; + if (optional_output) { + *optional_output = sum; + return EBUR128_SUCCESS; + } else if (sum >= histogram_energy_boundaries[0]) { + if (st->d->use_histogram) { + ++st->d->block_energy_histogram[find_histogram_index(sum)]; + } else { + struct ebur128_dq_entry* block; + if (st->d->block_list_size == st->d->block_list_max) { + block = STAILQ_FIRST(&st->d->block_list); + STAILQ_REMOVE_HEAD(&st->d->block_list, entries); + } else { + block = (struct ebur128_dq_entry*) malloc(sizeof(struct ebur128_dq_entry)); + if (!block) { + return EBUR128_ERROR_NOMEM; + } + st->d->block_list_size++; + } + block->z = sum; + STAILQ_INSERT_TAIL(&st->d->block_list, block, entries); + } + return EBUR128_SUCCESS; + } else { + return EBUR128_SUCCESS; + } +} + +int ebur128_set_channel(ebur128_state* st, + unsigned int channel_number, + int value) { + if (channel_number >= st->channels) { + return 1; + } + if (value == EBUR128_DUAL_MONO && + (st->channels != 1 || channel_number != 0)) { + fprintf(stderr, "EBUR128_DUAL_MONO only works with mono files!\n"); + return 1; + } + st->d->channel_map[channel_number] = value; + return 0; +} + +int ebur128_change_parameters(ebur128_state* st, + unsigned int channels, + unsigned long samplerate) { + int errcode = EBUR128_SUCCESS; + size_t j; + + if (channels == 0 || samplerate < 5) { + return EBUR128_ERROR_NOMEM; + } + + if (channels == st->channels && + samplerate == st->samplerate) { + return EBUR128_ERROR_NO_CHANGE; + } + + free(st->d->audio_data); + st->d->audio_data = NULL; + + if (channels != st->channels) { + unsigned int i; + + free(st->d->channel_map); st->d->channel_map = NULL; + free(st->d->sample_peak); st->d->sample_peak = NULL; + free(st->d->prev_sample_peak); st->d->prev_sample_peak = NULL; + free(st->d->true_peak); st->d->true_peak = NULL; + free(st->d->prev_true_peak); st->d->prev_true_peak = NULL; + st->channels = channels; + + errcode = ebur128_init_channel_map(st); + CHECK_ERROR(errcode, EBUR128_ERROR_NOMEM, exit) + + st->d->sample_peak = (double*) malloc(channels * sizeof(double)); + CHECK_ERROR(!st->d->sample_peak, EBUR128_ERROR_NOMEM, exit) + st->d->prev_sample_peak = (double*) malloc(channels * sizeof(double)); + CHECK_ERROR(!st->d->prev_sample_peak, EBUR128_ERROR_NOMEM, exit) + st->d->true_peak = (double*) malloc(channels * sizeof(double)); + CHECK_ERROR(!st->d->true_peak, EBUR128_ERROR_NOMEM, exit) + st->d->prev_true_peak = (double*) malloc(channels * sizeof(double)); + CHECK_ERROR(!st->d->prev_true_peak, EBUR128_ERROR_NOMEM, exit) + for (i = 0; i < channels; ++i) { + st->d->sample_peak[i] = 0.0; + st->d->prev_sample_peak[i] = 0.0; + st->d->true_peak[i] = 0.0; + st->d->prev_true_peak[i] = 0.0; + } + } + if (samplerate != st->samplerate) { + st->samplerate = samplerate; + st->d->samples_in_100ms = (st->samplerate + 5) / 10; + ebur128_init_filter(st); + } + st->d->audio_data_frames = st->samplerate * st->d->window / 1000; + if (st->d->audio_data_frames % st->d->samples_in_100ms) { + /* round up to multiple of samples_in_100ms */ + st->d->audio_data_frames = st->d->audio_data_frames + + st->d->samples_in_100ms + - (st->d->audio_data_frames % st->d->samples_in_100ms); + } + 
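+  /* Worked example of the rounding above, assuming fs = 44056 Hz and a
+   * 400 ms window: samples_in_100ms = (44056 + 5) / 10 = 4406, and
+   * 44056 * 400 / 1000 = 17622 frames, which is not a multiple of 4406,
+   * so the buffer is rounded up to 4 * 4406 = 17624 frames. */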
st->d->audio_data = (double*) malloc(st->d->audio_data_frames * + st->channels * + sizeof(double)); + CHECK_ERROR(!st->d->audio_data, EBUR128_ERROR_NOMEM, exit) + for (j = 0; j < st->d->audio_data_frames * st->channels; ++j) { + st->d->audio_data[j] = 0.0; + } + + ebur128_destroy_resampler(st); + errcode = ebur128_init_resampler(st); + CHECK_ERROR(errcode, EBUR128_ERROR_NOMEM, exit) + + /* the first block needs 400ms of audio data */ + st->d->needed_frames = st->d->samples_in_100ms * 4; + /* start at the beginning of the buffer */ + st->d->audio_data_index = 0; + /* reset short term frame counter */ + st->d->short_term_frame_counter = 0; + +exit: + return errcode; +} + +int ebur128_set_max_window(ebur128_state* st, unsigned long window) +{ + int errcode = EBUR128_SUCCESS; + size_t j; + + if ((st->mode & EBUR128_MODE_S) == EBUR128_MODE_S && window < 3000) { + window = 3000; + } else if ((st->mode & EBUR128_MODE_M) == EBUR128_MODE_M && window < 400) { + window = 400; + } + if (window == st->d->window) { + return EBUR128_ERROR_NO_CHANGE; + } + + st->d->window = window; + free(st->d->audio_data); + st->d->audio_data = NULL; + st->d->audio_data_frames = st->samplerate * st->d->window / 1000; + if (st->d->audio_data_frames % st->d->samples_in_100ms) { + /* round up to multiple of samples_in_100ms */ + st->d->audio_data_frames = st->d->audio_data_frames + + st->d->samples_in_100ms + - (st->d->audio_data_frames % st->d->samples_in_100ms); + } + st->d->audio_data = (double*) malloc(st->d->audio_data_frames * + st->channels * + sizeof(double)); + CHECK_ERROR(!st->d->audio_data, EBUR128_ERROR_NOMEM, exit) + for (j = 0; j < st->d->audio_data_frames * st->channels; ++j) { + st->d->audio_data[j] = 0.0; + } + + /* the first block needs 400ms of audio data */ + st->d->needed_frames = st->d->samples_in_100ms * 4; + /* start at the beginning of the buffer */ + st->d->audio_data_index = 0; + /* reset short term frame counter */ + st->d->short_term_frame_counter = 0; + +exit: + return errcode; +} + +int ebur128_set_max_history(ebur128_state* st, unsigned long history) +{ + if ((st->mode & EBUR128_MODE_LRA) == EBUR128_MODE_LRA && history < 3000) { + history = 3000; + } else if ((st->mode & EBUR128_MODE_M) == EBUR128_MODE_M && history < 400) { + history = 400; + } + if (history == st->d->history) { + return EBUR128_ERROR_NO_CHANGE; + } + st->d->history = history; + st->d->block_list_max = st->d->history / 100; + st->d->st_block_list_max = st->d->history / 3000; + while (st->d->block_list_size > st->d->block_list_max) { + struct ebur128_dq_entry* block = STAILQ_FIRST(&st->d->block_list); + STAILQ_REMOVE_HEAD(&st->d->block_list, entries); + free(block); + st->d->block_list_size--; + } + while (st->d->st_block_list_size > st->d->st_block_list_max) { + struct ebur128_dq_entry* block = STAILQ_FIRST(&st->d->short_term_block_list); + STAILQ_REMOVE_HEAD(&st->d->short_term_block_list, entries); + free(block); + st->d->st_block_list_size--; + } + return EBUR128_SUCCESS; +} + +static int ebur128_energy_shortterm(ebur128_state* st, double* out); +#define EBUR128_ADD_FRAMES(type) \ +int ebur128_add_frames_##type(ebur128_state* st, \ + const type* src, size_t frames) { \ + size_t src_index = 0; \ + unsigned int c = 0; \ + for (c = 0; c < st->channels; c++) { \ + st->d->prev_sample_peak[c] = 0.0; \ + st->d->prev_true_peak[c] = 0.0; \ + } \ + while (frames > 0) { \ + if (frames >= st->d->needed_frames) { \ + ebur128_filter_##type(st, src + src_index, st->d->needed_frames); \ + src_index += st->d->needed_frames * st->channels; 
\ + frames -= st->d->needed_frames; \ + st->d->audio_data_index += st->d->needed_frames * st->channels; \ + /* calculate the new gating block */ \ + if ((st->mode & EBUR128_MODE_I) == EBUR128_MODE_I) { \ + if (ebur128_calc_gating_block(st, st->d->samples_in_100ms * 4, NULL)) {\ + return EBUR128_ERROR_NOMEM; \ + } \ + } \ + if ((st->mode & EBUR128_MODE_LRA) == EBUR128_MODE_LRA) { \ + st->d->short_term_frame_counter += st->d->needed_frames; \ + if (st->d->short_term_frame_counter == st->d->samples_in_100ms * 30) { \ + struct ebur128_dq_entry* block; \ + double st_energy; \ + if (ebur128_energy_shortterm(st, &st_energy) == EBUR128_SUCCESS && \ + st_energy >= histogram_energy_boundaries[0]) { \ + if (st->d->use_histogram) { \ + ++st->d->short_term_block_energy_histogram[ \ + find_histogram_index(st_energy)];\ + } else { \ + if (st->d->st_block_list_size == st->d->st_block_list_max) { \ + block = STAILQ_FIRST(&st->d->short_term_block_list); \ + STAILQ_REMOVE_HEAD(&st->d->short_term_block_list, entries); \ + } else { \ + block = (struct ebur128_dq_entry*) \ + malloc(sizeof(struct ebur128_dq_entry)); \ + if (!block) return EBUR128_ERROR_NOMEM; \ + st->d->st_block_list_size++; \ + } \ + block->z = st_energy; \ + STAILQ_INSERT_TAIL(&st->d->short_term_block_list, \ + block, entries); \ + } \ + } \ + st->d->short_term_frame_counter = st->d->samples_in_100ms * 20; \ + } \ + } \ + /* 100ms are needed for all blocks besides the first one */ \ + st->d->needed_frames = st->d->samples_in_100ms; \ + /* reset audio_data_index when buffer full */ \ + if (st->d->audio_data_index == st->d->audio_data_frames * st->channels) {\ + st->d->audio_data_index = 0; \ + } \ + } else { \ + ebur128_filter_##type(st, src + src_index, frames); \ + st->d->audio_data_index += frames * st->channels; \ + if ((st->mode & EBUR128_MODE_LRA) == EBUR128_MODE_LRA) { \ + st->d->short_term_frame_counter += frames; \ + } \ + st->d->needed_frames -= frames; \ + frames = 0; \ + } \ + } \ + for (c = 0; c < st->channels; c++) { \ + if (st->d->prev_sample_peak[c] > st->d->sample_peak[c]) { \ + st->d->sample_peak[c] = st->d->prev_sample_peak[c]; \ + } \ + if (st->d->prev_true_peak[c] > st->d->true_peak[c]) { \ + st->d->true_peak[c] = st->d->prev_true_peak[c]; \ + } \ + } \ + return EBUR128_SUCCESS; \ +} +EBUR128_ADD_FRAMES(short) +EBUR128_ADD_FRAMES(int) +EBUR128_ADD_FRAMES(float) +EBUR128_ADD_FRAMES(double) + +static int ebur128_calc_relative_threshold(ebur128_state* st, + size_t* above_thresh_counter, + double* relative_threshold) { + struct ebur128_dq_entry* it; + size_t i; + + if (st->d->use_histogram) { + for (i = 0; i < 1000; ++i) { + *relative_threshold += st->d->block_energy_histogram[i] * + histogram_energies[i]; + *above_thresh_counter += st->d->block_energy_histogram[i]; + } + } else { + STAILQ_FOREACH(it, &st->d->block_list, entries) { + ++*above_thresh_counter; + *relative_threshold += it->z; + } + } + + return EBUR128_SUCCESS; +} + +static int ebur128_gated_loudness(ebur128_state** sts, size_t size, + double* out) { + struct ebur128_dq_entry* it; + double gated_loudness = 0.0; + double relative_threshold = 0.0; + size_t above_thresh_counter = 0; + size_t i, j, start_index; + + for (i = 0; i < size; i++) { + if (sts[i] && (sts[i]->mode & EBUR128_MODE_I) != EBUR128_MODE_I) { + return EBUR128_ERROR_INVALID_MODE; + } + } + + for (i = 0; i < size; i++) { + if (!sts[i]) { + continue; + } + ebur128_calc_relative_threshold(sts[i], &above_thresh_counter, &relative_threshold); + } + if (!above_thresh_counter) { + *out = -HUGE_VAL; + return 
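+  /* The rest of this function is the second stage of the BS.1770 gating:
+   * the mean energy of all blocks that passed the absolute gate (-70 LUFS)
+   * defines a relative threshold 10 LU lower
+   * (relative_gate_factor = 10^(-10/10) = 0.1); integrated loudness is
+   * then the mean of the blocks above that threshold, converted with
+   * loudness = -0.691 + 10 * log10(energy). */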
EBUR128_SUCCESS; + } + + relative_threshold /= (double)above_thresh_counter; + relative_threshold *= relative_gate_factor; + + above_thresh_counter = 0; + if (relative_threshold < histogram_energy_boundaries[0]) { + start_index = 0; + } else { + start_index = find_histogram_index(relative_threshold); + if (relative_threshold > histogram_energies[start_index]) { + ++start_index; + } + } + for (i = 0; i < size; i++) { + if (!sts[i]) { + continue; + } + if (sts[i]->d->use_histogram) { + for (j = start_index; j < 1000; ++j) { + gated_loudness += sts[i]->d->block_energy_histogram[j] * + histogram_energies[j]; + above_thresh_counter += sts[i]->d->block_energy_histogram[j]; + } + } else { + STAILQ_FOREACH(it, &sts[i]->d->block_list, entries) { + if (it->z >= relative_threshold) { + ++above_thresh_counter; + gated_loudness += it->z; + } + } + } + } + if (!above_thresh_counter) { + *out = -HUGE_VAL; + return EBUR128_SUCCESS; + } + gated_loudness /= (double) above_thresh_counter; + *out = ebur128_energy_to_loudness(gated_loudness); + return EBUR128_SUCCESS; +} + +int ebur128_relative_threshold(ebur128_state* st, double* out) { + double relative_threshold = 0.0; + size_t above_thresh_counter = 0; + + if ((st->mode & EBUR128_MODE_I) != EBUR128_MODE_I) { + return EBUR128_ERROR_INVALID_MODE; + } + + ebur128_calc_relative_threshold(st, &above_thresh_counter, &relative_threshold); + + if (!above_thresh_counter) { + *out = -70.0; + return EBUR128_SUCCESS; + } + + relative_threshold /= (double)above_thresh_counter; + relative_threshold *= relative_gate_factor; + + *out = ebur128_energy_to_loudness(relative_threshold); + return EBUR128_SUCCESS; +} + +int ebur128_loudness_global(ebur128_state* st, double* out) { + return ebur128_gated_loudness(&st, 1, out); +} + +int ebur128_loudness_global_multiple(ebur128_state** sts, size_t size, + double* out) { + return ebur128_gated_loudness(sts, size, out); +} + +static int ebur128_energy_in_interval(ebur128_state* st, + size_t interval_frames, + double* out) { + if (interval_frames > st->d->audio_data_frames) { + return EBUR128_ERROR_INVALID_MODE; + } + ebur128_calc_gating_block(st, interval_frames, out); + return EBUR128_SUCCESS; +} + +static int ebur128_energy_shortterm(ebur128_state* st, double* out) { + return ebur128_energy_in_interval(st, st->d->samples_in_100ms * 30, out); +} + +int ebur128_loudness_momentary(ebur128_state* st, double* out) { + double energy; + int error = ebur128_energy_in_interval(st, st->d->samples_in_100ms * 4, + &energy); + if (error) { + return error; + } else if (energy <= 0.0) { + *out = -HUGE_VAL; + return EBUR128_SUCCESS; + } + *out = ebur128_energy_to_loudness(energy); + return EBUR128_SUCCESS; +} + +int ebur128_loudness_shortterm(ebur128_state* st, double* out) { + double energy; + int error = ebur128_energy_shortterm(st, &energy); + if (error) { + return error; + } else if (energy <= 0.0) { + *out = -HUGE_VAL; + return EBUR128_SUCCESS; + } + *out = ebur128_energy_to_loudness(energy); + return EBUR128_SUCCESS; +} + +int ebur128_loudness_window(ebur128_state* st, + unsigned long window, + double* out) { + double energy; + size_t interval_frames = st->samplerate * window / 1000; + int error = ebur128_energy_in_interval(st, interval_frames, &energy); + if (error) { + return error; + } else if (energy <= 0.0) { + *out = -HUGE_VAL; + return EBUR128_SUCCESS; + } + *out = ebur128_energy_to_loudness(energy); + return EBUR128_SUCCESS; +} + +static int ebur128_double_cmp(const void *p1, const void *p2) { + const double* d1 = (const double*) 
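+  /* Ascending comparator for qsort().  The LRA code below sorts the 3 s
+   * short-term block energies, drops everything below the absolute gate
+   * and below -20 dB relative to the gated mean (minus_twenty_decibels =
+   * 10^(-20/10) = 0.01), and reports the spread between the 10th and 95th
+   * percentiles in LU, following EBU Tech 3342. */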
p1; + const double* d2 = (const double*) p2; + return (*d1 > *d2) - (*d1 < *d2); +} + +/* EBU - TECH 3342 */ +int ebur128_loudness_range_multiple(ebur128_state** sts, size_t size, + double* out) { + size_t i, j; + struct ebur128_dq_entry* it; + double* stl_vector; + size_t stl_size; + double* stl_relgated; + size_t stl_relgated_size; + double stl_power, stl_integrated; + /* High and low percentile energy */ + double h_en, l_en; + int use_histogram = 0; + + for (i = 0; i < size; ++i) { + if (sts[i]) { + if ((sts[i]->mode & EBUR128_MODE_LRA) != EBUR128_MODE_LRA) { + return EBUR128_ERROR_INVALID_MODE; + } + if (i == 0 && sts[i]->mode & EBUR128_MODE_HISTOGRAM) { + use_histogram = 1; + } else if (use_histogram != !!(sts[i]->mode & EBUR128_MODE_HISTOGRAM)) { + return EBUR128_ERROR_INVALID_MODE; + } + } + } + + if (use_histogram) { + unsigned long hist[1000] = { 0 }; + size_t percentile_low, percentile_high; + size_t index; + + stl_size = 0; + stl_power = 0.0; + for (i = 0; i < size; ++i) { + if (!sts[i]) { + continue; + } + for (j = 0; j < 1000; ++j) { + hist[j] += sts[i]->d->short_term_block_energy_histogram[j]; + stl_size += sts[i]->d->short_term_block_energy_histogram[j]; + stl_power += sts[i]->d->short_term_block_energy_histogram[j] + * histogram_energies[j]; + } + } + if (!stl_size) { + *out = 0.0; + return EBUR128_SUCCESS; + } + + stl_power /= stl_size; + stl_integrated = minus_twenty_decibels * stl_power; + + if (stl_integrated < histogram_energy_boundaries[0]) { + index = 0; + } else { + index = find_histogram_index(stl_integrated); + if (stl_integrated > histogram_energies[index]) { + ++index; + } + } + stl_size = 0; + for (j = index; j < 1000; ++j) { + stl_size += hist[j]; + } + if (!stl_size) { + *out = 0.0; + return EBUR128_SUCCESS; + } + + percentile_low = (size_t) ((stl_size - 1) * 0.1 + 0.5); + percentile_high = (size_t) ((stl_size - 1) * 0.95 + 0.5); + + stl_size = 0; + j = index; + while (stl_size <= percentile_low) { + stl_size += hist[j++]; + } + l_en = histogram_energies[j - 1]; + while (stl_size <= percentile_high) { + stl_size += hist[j++]; + } + h_en = histogram_energies[j - 1]; + *out = ebur128_energy_to_loudness(h_en) - ebur128_energy_to_loudness(l_en); + return EBUR128_SUCCESS; + + } else { + stl_size = 0; + for (i = 0; i < size; ++i) { + if (!sts[i]) { + continue; + } + STAILQ_FOREACH(it, &sts[i]->d->short_term_block_list, entries) { + ++stl_size; + } + } + if (!stl_size) { + *out = 0.0; + return EBUR128_SUCCESS; + } + stl_vector = (double*) malloc(stl_size * sizeof(double)); + if (!stl_vector) { + return EBUR128_ERROR_NOMEM; + } + + j = 0; + for (i = 0; i < size; ++i) { + if (!sts[i]) { + continue; + } + STAILQ_FOREACH(it, &sts[i]->d->short_term_block_list, entries) { + stl_vector[j] = it->z; + ++j; + } + } + qsort(stl_vector, stl_size, sizeof(double), ebur128_double_cmp); + stl_power = 0.0; + for (i = 0; i < stl_size; ++i) { + stl_power += stl_vector[i]; + } + stl_power /= (double) stl_size; + stl_integrated = minus_twenty_decibels * stl_power; + + stl_relgated = stl_vector; + stl_relgated_size = stl_size; + while (stl_relgated_size > 0 && *stl_relgated < stl_integrated) { + ++stl_relgated; + --stl_relgated_size; + } + + if (stl_relgated_size) { + h_en = stl_relgated[(size_t) ((stl_relgated_size - 1) * 0.95 + 0.5)]; + l_en = stl_relgated[(size_t) ((stl_relgated_size - 1) * 0.1 + 0.5)]; + free(stl_vector); + *out = ebur128_energy_to_loudness(h_en) - ebur128_energy_to_loudness(l_en); + return EBUR128_SUCCESS; + } else { + free(stl_vector); + *out = 0.0; + return 
EBUR128_SUCCESS; + } + } +} + +int ebur128_loudness_range(ebur128_state* st, double* out) { + return ebur128_loudness_range_multiple(&st, 1, out); +} + +int ebur128_sample_peak(ebur128_state* st, + unsigned int channel_number, + double* out) { + if ((st->mode & EBUR128_MODE_SAMPLE_PEAK) != EBUR128_MODE_SAMPLE_PEAK) { + return EBUR128_ERROR_INVALID_MODE; + } else if (channel_number >= st->channels) { + return EBUR128_ERROR_INVALID_CHANNEL_INDEX; + } + *out = st->d->sample_peak[channel_number]; + return EBUR128_SUCCESS; +} + +int ebur128_prev_sample_peak(ebur128_state* st, + unsigned int channel_number, + double* out) { + if ((st->mode & EBUR128_MODE_SAMPLE_PEAK) != EBUR128_MODE_SAMPLE_PEAK) { + return EBUR128_ERROR_INVALID_MODE; + } else if (channel_number >= st->channels) { + return EBUR128_ERROR_INVALID_CHANNEL_INDEX; + } + *out = st->d->prev_sample_peak[channel_number]; + return EBUR128_SUCCESS; +} + +int ebur128_true_peak(ebur128_state* st, + unsigned int channel_number, + double* out) { + if ((st->mode & EBUR128_MODE_TRUE_PEAK) != EBUR128_MODE_TRUE_PEAK) { + return EBUR128_ERROR_INVALID_MODE; + } else if (channel_number >= st->channels) { + return EBUR128_ERROR_INVALID_CHANNEL_INDEX; + } + *out = st->d->true_peak[channel_number] > st->d->sample_peak[channel_number] + ? st->d->true_peak[channel_number] + : st->d->sample_peak[channel_number]; + return EBUR128_SUCCESS; +} + +int ebur128_prev_true_peak(ebur128_state* st, + unsigned int channel_number, + double* out) { + if ((st->mode & EBUR128_MODE_TRUE_PEAK) != EBUR128_MODE_TRUE_PEAK) { + return EBUR128_ERROR_INVALID_MODE; + } else if (channel_number >= st->channels) { + return EBUR128_ERROR_INVALID_CHANNEL_INDEX; + } + *out = st->d->prev_true_peak[channel_number] + > st->d->prev_sample_peak[channel_number] + ? 
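+  /* As in ebur128_true_peak() above, the per-call sample peak acts as a
+   * floor for the reported true peak.  Converting the linear result to
+   * dBTP is 20 * log10(out); e.g. out = 0.5 reads as roughly -6.02 dBTP. */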
st->d->prev_true_peak[channel_number]
+             : st->d->prev_sample_peak[channel_number];
+  return EBUR128_SUCCESS;
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/CMakeLists.txt b/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/CMakeLists.txt
new file mode 100644
index 0000000..3045b00
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/CMakeLists.txt
@@ -0,0 +1,3 @@
+include_directories(inc)
+AUX_SOURCE_DIRECTORY(src DIR_WAVES_SRCS)
+add_library(waves ${DIR_WAVES_SRCS})
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/inc/ExtraMono.h b/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/inc/ExtraMono.h
new file mode 100755
index 0000000..280fab0
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/inc/ExtraMono.h
@@ -0,0 +1,230 @@
+
+#include <stdio.h>
+#include <string.h>
+#include <string>
+
+#define SIZE_LONG 4
+#define SIZE_SHORT 2
+
+#define SIZE_FLAG 4
+#define FMT_TAG 0x0001
+
+#define BITS_PER_BYTE 8
+
+#ifndef AFS_CMPL_MAX_WAV
+#define AFS_CMPL_MAX_WAV 15360000 // 16 minutes of audio (960 * 16000)
+#endif
+
+//+---------------------------------------------------------------------------+
+//+ Read one little-endian 32-bit value from the file
+//+---------------------------------------------------------------------------+
+unsigned long fa_read_u32(FILE* fp)
+{
+    unsigned long cx;
+    unsigned char temp[SIZE_LONG];
+
+    fread(temp, sizeof(unsigned char), SIZE_LONG, fp);
+    cx = (unsigned long)temp[0];
+    cx |= (unsigned long)temp[1] << 8;
+    cx |= (unsigned long)temp[2] << 16;
+    cx |= (unsigned long)temp[3] << 24;
+    return cx;
+}
+
+//+---------------------------------------------------------------------------+
+//+ Read one little-endian 16-bit value from the file
+//+---------------------------------------------------------------------------+
+unsigned short fa_read_u16(FILE *fp)
+{
+    unsigned short cx;
+    unsigned char temp[SIZE_SHORT];
+
+    fread(temp, sizeof(unsigned char), SIZE_SHORT, fp);
+    cx = temp[0] | (temp[1] * 256);
+    return cx;
+}
+
+int GetWaveHeadLen(const char* pszFile, unsigned short &channels, int &nPos, int &nLength)
+{
+    //+---------------------------------------------------------------------------+
+    //+ Read the WAVE header info
+    //+---------------------------------------------------------------------------+
+    unsigned char temp[SIZE_FLAG];
+    unsigned short bits_per_sample;
+    unsigned long x_size;
+    unsigned long n_skip;
+
+    unsigned short format;
+    //unsigned short channels;
+    unsigned long sample_rate;
+    unsigned short block_align;
+    unsigned long data_size;
+    int nCnt = 0;
+
+    /* Read the common header fields */
+    FILE* pWavFile = fopen(pszFile, "rb");
+    if ( pWavFile == NULL )
+    {
+        printf("Input file can not be opened!\n");
+        return -1;
+    }
+
+    fseek(pWavFile, 0, SEEK_END);
+    nLength = ftell(pWavFile);
+    fseek(pWavFile, 0, SEEK_SET);
+
+    // Check that the resource tag is "RIFF"
+    fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    if ( memcmp(temp, "RIFF", (size_t)SIZE_FLAG) != 0 )
+    {
+        fprintf(stderr, "Resource flag is not RIFF!\n");
+        fclose(pWavFile);
+
+        return -1;
+    }
+    nCnt += SIZE_FLAG;
+
+    fseek(pWavFile, SIZE_LONG, SEEK_CUR);
+    nCnt += SIZE_LONG;
+
+    // Check that the file tag is "WAVE"
+    fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    if ( memcmp(temp, "WAVE", (size_t)SIZE_FLAG) != 0 )
+    {
+        fprintf(stderr, "File flag is not WAVE\n");
+        fclose(pWavFile);
+
+        return -1;
+    }
+    nCnt += SIZE_FLAG;
+
+    // Check that the format tag is "fmt "
+    fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    if ( memcmp(temp, "fmt ", (size_t)SIZE_FLAG) != 0 )
+    {
+        fprintf(stderr, "Format flag is not FMT!\n");
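+        /* For orientation (standard RIFF layout, not specific to this
+         * file): bytes 0-3 are "RIFF", 4-7 the chunk size, 8-11 "WAVE",
+         * followed by a "fmt " sub-chunk (tag, size, wFormatTag,
+         * nChannels, nSamplesPerSec, nAvgBytesPerSec, nBlockAlign,
+         * wBitsPerSample) and eventually a "data" sub-chunk holding the
+         * sample bytes; that is the sequence this parser walks. */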
+        fclose(pWavFile);
+
+        return -1;
+    }
+    nCnt += SIZE_FLAG;
+
+    x_size = fa_read_u32(pWavFile);
+    nCnt += SIZE_LONG;
+
+    // Check that the encoding format is 0x0001 (PCM)
+    format = fa_read_u16(pWavFile);
+    nCnt += SIZE_SHORT;
+    if ( format != FMT_TAG )
+    {
+        fprintf(stderr, "Encoding format is not 0x0001!\n");
+        fclose(pWavFile);
+
+        return -1;
+    }
+
+    // Read the channel count and sample rate
+    channels = fa_read_u16(pWavFile);
+    sample_rate = fa_read_u32(pWavFile);
+
+    fseek(pWavFile, SIZE_LONG, SEEK_CUR);
+
+    // Read the block align and bits per sample
+    block_align = fa_read_u16(pWavFile);
+    bits_per_sample = fa_read_u16(pWavFile);
+
+    /* Skip any extra bytes of the fmt chunk */
+    x_size -= (4*SIZE_SHORT + 2*SIZE_LONG);
+    if ( x_size != 0 )
+    {
+        fseek(pWavFile, x_size, SEEK_CUR);
+    }
+
+    // Read the data size
+    fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    while ( memcmp(temp, "data", SIZE_FLAG) != 0 )
+    {
+        n_skip = fa_read_u32(pWavFile);
+        fseek(pWavFile, n_skip, SEEK_CUR);
+
+        fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    }
+
+    data_size = fa_read_u32(pWavFile);
+    fclose(pWavFile);
+
+    //+---------------------------------------------------------------------------+
+    //+ Return the length of the WAVE header
+    //+---------------------------------------------------------------------------+
+    nPos = nCnt;
+    int nHeadLength = nLength - data_size;
+    return nHeadLength;
+}
+
+bool ExtraMono(const std::string &sInput, const std::string &sOutput)
+{
+    FILE *pFile = fopen(sInput.c_str(), "rb");
+    if ( NULL == pFile )
+    {
+        printf("Fopen Error %s", sInput.c_str());
+        return false;
+    }
+
+    FILE *pFile2 = fopen(sOutput.c_str(), "wb");
+    if ( NULL == pFile2 )
+    {
+        printf("Fopen2 Error %s", sOutput.c_str());
+        fclose(pFile);
+        return false;
+    }
+
+    short *pBuf = new short[AFS_CMPL_MAX_WAV];
+    int nLen = 0;
+
+    nLen = fread(pBuf, sizeof(short), AFS_CMPL_MAX_WAV, pFile);
+    if ( nLen <= 0 )
+    {
+        perror("Fread Error!");
+        delete [] pBuf;
+        fclose(pFile);
+        fclose(pFile2);
+        return false;
+    }
+
+    unsigned short channels = 0;
+    int nPos;
+    int nLength;
+    int nHeadByte = GetWaveHeadLen(sInput.c_str(), channels, nPos, nLength);
+    int nHeadShort = nHeadByte / 2;
+
+    if (channels == 1)
+    {
+        // Mono input: copy the samples after the header unchanged
+        fwrite(pBuf + nHeadShort, sizeof(short), nLen - nHeadShort, pFile2);
+    }
+    else
+    {
+        // Stereo input: set the channel count in the copied header to 1
+        // and keep only every second sample (the left channel)
+        short *pBuf2 = new short[AFS_CMPL_MAX_WAV];
+        memcpy(pBuf2, pBuf, nHeadShort * sizeof(short));
+        pBuf2[nPos] = 1;
+
+        unsigned char tmp[2];
+        memcpy(tmp, &pBuf2[nPos], 2);
+
+        pBuf2[nPos] = static_cast<short>(tmp[0] | tmp[1] * 256);
+
+        short *pWav = pBuf + nHeadShort;
+        nLen -= nHeadShort;
+
+        int halfnlen = nLen / 2;
+        for (int i = 0; i < halfnlen; i++)
+        {
+            pBuf2[nHeadShort + i] = *(pWav + i * 2);
+        }
+        // Write the header plus the mono samples actually produced
+        fwrite(pBuf2, sizeof(short), halfnlen + nHeadShort, pFile2);
+
+        delete [] pBuf2;
+        pBuf2 = NULL;
+    }
+
+    delete [] pBuf;
+    pBuf = NULL;
+
+    fclose(pFile);
+    fclose(pFile2);
+    return true;
+}
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/inc/WaveFile.h b/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/inc/WaveFile.h
new file mode 100755
index 0000000..8b57806
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/inc/WaveFile.h
@@ -0,0 +1,74 @@
+#ifndef WAVE_FILE_H
+#define WAVE_FILE_H
+
+#include <stdio.h>
+#include <stdint.h>
+
+
+typedef enum SAMPLE_FORMAT
+{
+    SF_U8 = 8,
+    SF_S16 = 16,
+    SF_S24 = 24,
+    SF_S32 = 32,
+    SF_IEEE_FLOAT = 0x100 + 32,
+    SF_IEEE_DOUBLE = 0x100 + 64,
+    SF_MAX,
+} SAMPLE_FORMAT;
+
+/* Main processing object **/
+class CWaveFile
+{
+public:
+    /* Construct with a file name and whether to read or write **/
+    CWaveFile(const char* Filename, bool Write);
+    virtual ~CWaveFile();
+
+public:
+    int GetChannels();
+    int GetSampleRate();
+    double GetDuration(); // in seconds
+    uint32_t GetChannelMask();
+    void SetChannels(int Channels);
+    void SetSampleRate(int SampleRate);
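+    /* A usage sketch for this class (illustrative only; the file name
+     * "in.wav" and the stereo frame buffer are assumptions, not part of
+     * the API):
+     *
+     *   CWaveFile wav("in.wav", false);   // false = open for reading
+     *   if (wav.GetStatus()) {
+     *       short frame[2];
+     *       while (wav.ReadFrameAsS16(frame, 1)) {
+     *           // process one interleaved frame here
+     *       }
+     *   }
+     */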
+    void SetSampleFormat(SAMPLE_FORMAT Format);
+    void SetChannelMask(uint32_t Mask);
+    void Stat();
+    void SetupDone();
+    bool ReadFrameAsS16(short* FrameSamples, int Frames = 1);
+    bool ReadFrameAsDouble(double* FrameSamples, int Frames = 1);
+    bool ReadFrameAsfloat(float* FrameSamples, int Frames = 1);
+    void WriteRaw(void* Raw, int Size);
+    void WriteFrame(uint8_t* FrameSamples, int Frames = 1);
+    void WriteFrame(short* FrameSamples, int Frames = 1);
+    void WriteFrame(int32_t* FrameSamples, int Frames = 1);
+    void WriteFrameS24(int32_t* FrameSamples, int Frames = 1);
+    void WriteFrame(double* FrameSamples, int Frames = 1);
+    void WriteFrame(float* FrameSamples, int Frames = 1);
+    void Seek(int FramePos, int Where = SEEK_SET);
+    bool GetStatus();
+    SAMPLE_FORMAT GetFormat();
+    int GetTotalFrames();
+    int GetFramesRead();
+
+
+protected:
+    FILE* File;
+    int Channels;               /* Number of channels **/
+    int SampleRate;             /* Sample rate **/
+    SAMPLE_FORMAT Format;       /* Sample format (precision) **/
+    int SampleSize;             // Measured in Bits
+    unsigned int FrameStartPos; /* Start position of the audio data **/
+    unsigned long TotalFrames;  /* Total frame count; for 16-bit mono one short is one frame **/
+    unsigned long FramesRead;
+    double Duration;            /* Duration in seconds **/
+
+    bool ReadOnly;              /* Reading or writing **/
+
+    uint32_t ChannelMask;
+
+    bool m_bOK;                 /* Whether the file was opened successfully **/
+};
+
+
+#endif
\ No newline at end of file
diff --git a/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/src/WaveFile.cpp b/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/src/WaveFile.cpp
new file mode 100755
index 0000000..1a47272
--- /dev/null
+++ b/AutoCoverTool/ref/music_remover/standard_audio/ref/waves/src/WaveFile.cpp
@@ -0,0 +1,818 @@
+
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <stdint.h>
+
+#if WIN32
+#else
+#include <unistd.h>
+#endif
+
+#include "WaveFile.h"
+
+#define SPEAKER_FRONT_LEFT 0x1
+#define SPEAKER_FRONT_RIGHT 0x2
+#define SPEAKER_FRONT_CENTER 0x4
+#define SPEAKER_LOW_FREQUENCY 0x8
+#define SPEAKER_BACK_LEFT 0x10
+#define SPEAKER_BACK_RIGHT 0x20
+#define SPEAKER_FRONT_LEFT_OF_CENTER 0x40
+#define SPEAKER_FRONT_RIGHT_OF_CENTER 0x80
+#define SPEAKER_BACK_CENTER 0x100
+#define SPEAKER_SIDE_LEFT 0x200
+#define SPEAKER_SIDE_RIGHT 0x400
+#define SPEAKER_TOP_CENTER 0x800
+#define SPEAKER_TOP_FRONT_LEFT 0x1000
+#define SPEAKER_TOP_FRONT_CENTER 0x2000
+#define SPEAKER_TOP_FRONT_RIGHT 0x4000
+#define SPEAKER_TOP_BACK_LEFT 0x8000
+#define SPEAKER_TOP_BACK_CENTER 0x10000
+#define SPEAKER_TOP_BACK_RIGHT 0x20000
+#define SPEAKER_RESERVED 0x80000000
+
+
+#define SPEAKER_REAR_CENTER_SURROUND SPEAKER_BACK_CENTER
+
+#define DCA_MONO 0
+#define DCA_CHANNEL 1
+#define DCA_STEREO 2
+#define DCA_STEREO_SUMDIFF 3
+#define DCA_STEREO_TOTAL 4
+#define DCA_3F 5
+#define DCA_2F1R 6
+#define DCA_3F1R 7
+#define DCA_2F2R 8
+#define DCA_3F2R 9
+#define DCA_4F2R 10
+
+#define DCA_DOLBY 101 /* FIXME */
+
+#define DCA_CHANNEL_MAX DCA_3F2R /* We don't handle anything above that */
+#define DCA_CHANNEL_BITS 6
+#define DCA_CHANNEL_MASK 0x3F
+
+#define DCA_LFE 0x80
+#define DCA_ADJUST_LEVEL 0x100
+
+#define WAVE_FORMAT_PCM 0x0001
+#define WAVE_FORMAT_IEEE_FLOAT 0x0003
+#define WAVE_FORMAT_EXTENSIBLE 0xFFFE
+
+static uint8_t wav_header[] = {
+    'R', 'I', 'F', 'F', 0xfc, 0xff, 0xff, 0xff, 'W', 'A', 'V', 'E',
+    'f', 'm', 't', ' ', 16, 0, 0, 0,
+    WAVE_FORMAT_PCM, WAVE_FORMAT_PCM >> 8,
+    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0,
+    'd', 'a', 't', 'a', 0xd8, 0xff, 0xff, 0xff
+};
+
+static uint8_t wavmulti_header[] = {
+    'R', 'I', 'F', 'F', 0xf0, 0xff, 0xff, 0xff, 'W', 'A', 'V', 'E',
+    'f', 'm', 't', ' ', 40, 0, 0, 0,
+    (uint8_t)(WAVE_FORMAT_EXTENSIBLE & 0xFF), WAVE_FORMAT_EXTENSIBLE >> 8,
+    0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 32, 0, 22, 0,
+    0, 0, 0, 0, 0, 0,
+    WAVE_FORMAT_IEEE_FLOAT, WAVE_FORMAT_IEEE_FLOAT >> 8,
+    0, 0, 0, 0, 0x10, 0x00, 0x80, 0, 0, 0xaa, 0, 0x38, 0x9b, 0x71,
+    'd', 'a', 't', 'a', 0xb4, 0xff, 0xff, 0xff
+};
+
+static void store4 (uint8_t * buf, int value)
+{
+    buf[0] = value;
+    buf[1] = value >> 8;
+    buf[2] = value >> 16;
+    buf[3] = value >> 24;
+}
+
+static void store2 (uint8_t * buf, int value)
+{
+    buf[0] = value;
+    buf[1] = value >> 8;
+}
+
+
+static uint32_t find_chunk(FILE * file, const uint8_t chunk_id[4])
+{
+    uint8_t buffer[8];
+    while (1) {
+        size_t chunksize;
+        size_t s = fread(buffer, 1, 8, file);
+        if (s < 8)
+            return 0;
+        chunksize = (uint32_t)buffer[4] | ((uint32_t)buffer[5] << 8) |
+            ((uint32_t)buffer[6] << 16) | ((uint32_t)buffer[7] << 24);
+        if (!memcmp(buffer, chunk_id, 4))
+            return chunksize;
+        fseek(file, chunksize, SEEK_CUR);
+    }
+}
+
+
+CWaveFile::CWaveFile(const char* Filename, bool Write)
+    : Duration(0), ReadOnly(false), m_bOK(false)
+{
+    Channels = 0;
+
+    /* Open the file **/
+    File = fopen(Filename, Write ? "wb" : "rb");
+    if ( !File )
+        return;
+
+    /* Set the initial parameters for writing **/
+    if ( Write )
+    {
+        SampleRate = 44100;
+        Channels = 2;
+        Format = SF_S16;
+        SampleSize = 16;
+        ChannelMask = 0;
+        m_bOK = true;
+        return;
+    }
+
+    ReadOnly = true;
+
+    size_t s;
+    uint8_t buffer[8];
+    uint8_t *fmt = NULL;
+    uint32_t v;
+    uint32_t avg_bps;
+    uint32_t block_align;
+    unsigned short FormatType;
+    unsigned short SampleType;
+
+    static const uint8_t riff[4] = { 'R', 'I', 'F', 'F' };
+    static const uint8_t wave[4] = { 'W', 'A', 'V', 'E' };
+    static const uint8_t fmt_[4] = { 'f', 'm', 't', ' ' };
+    static const uint8_t data[4] = { 'd', 'a', 't', 'a' };
+
+    /* The first four bytes must be "RIFF" **/
+    s = fread(buffer, 1, 8, File);
+    if (s < 8)
+        goto err2;
+
+    if (memcmp(buffer, riff, 4))
+        goto err2;
+
+    /* Bytes 8~12 must be "WAVE" **/
+    /* TODO: check size (in buffer[4..8]) */
+    s = fread(buffer, 1, 4, File);
+    if (s < 4)
+        goto err2;
+
+    if (memcmp(buffer, wave, 4))
+        goto err2;
+
+    s = find_chunk(File, fmt_);
+    if ( s != 16 && s != 18 && s != 40 )
+        goto err2;
+
+    fmt = (uint8_t*)malloc(s);
+    if (!fmt)
+        goto err2;
+
+    if (fread(fmt, 1, s, File) != s)
+        goto err3;
+
+    /* wFormatTag */
+    v = (uint32_t)fmt[0] | ((uint32_t)fmt[1] << 8);
+    if (v != WAVE_FORMAT_PCM && v != WAVE_FORMAT_IEEE_FLOAT && v != WAVE_FORMAT_EXTENSIBLE)
+        goto err3;
+
+    FormatType = v;
+
+    if (s == 40 && 0xfffe == v)
+    {
+        // fmt begins at 0x14 of the wave file
+        v = *(unsigned short*)&fmt[0x2C - 0x14];
+    }
+
+    SampleType = v;
+
+    /* wChannels */
+    v = (uint32_t)fmt[2] | ((uint32_t)fmt[3] << 8);
+
+    Channels = v;
+
+    if (v < 1 || v > 32)
+        goto err3;
+
+    /* dwSamplesPerSec */
+    SampleRate = (uint32_t)fmt[4] | ((uint32_t)fmt[5] << 8) |
+        ((uint32_t)fmt[6] << 16) | ((uint32_t)fmt[7] << 24);
+
+    /* dwAvgBytesPerSec */
+    avg_bps = (uint32_t)fmt[8] | ((uint32_t)fmt[9] << 8) |
+        ((uint32_t)fmt[10] << 16) | ((uint32_t)fmt[11] << 24);
+
+    /* wBlockAlign */
+    block_align = (uint32_t)fmt[12] | ((uint32_t)fmt[13] << 8);
+
+    /* wBitsPerSample */
+    SampleSize = (uint32_t)fmt[14] | ((uint32_t)fmt[15] << 8);
+    if (SampleSize != 8 && SampleSize != 16 && SampleSize != 32 && SampleSize != 24 && SampleSize != 64)
+        goto err3;
+
+    switch (SampleSize)
+    {
+    case 8:
+        Format = SF_U8;
+        break;
+    case 16:
+        Format = SF_S16;
+        break;
+    case 24:
+        Format = SF_S24;
+        break;
+    case 32:
+    {
+        if (SampleType == WAVE_FORMAT_IEEE_FLOAT)
+            Format = SF_IEEE_FLOAT;
+        else
+            Format = SF_S32;
+
+    }
+        break;
+    case 64:
+        if (SampleType != WAVE_FORMAT_IEEE_FLOAT)
+            goto err3;
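+        /* Concrete numbers for the header arithmetic used here: 16-bit
+         * stereo at 44100 Hz gives block_align = 2 * (16 / 8) = 4 bytes
+         * per frame and avg_bps = 4 * 44100 = 176400 bytes/s, which is
+         * exactly what the two consistency checks below enforce. */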
Format = SF_IEEE_DOUBLE; + break; + } + + + // Handle 24-bit samples individually +#if 0 + if (SampleSize == 24 && Channels <= 2) + { + int ba24 = Channels * (SampleSize / 8); // Align to 4x + + ba24 = (ba24 + 3) / 4 * 4; + + if (block_align != ba24) + goto err3; + } + else +#endif + { + if (block_align != Channels * (SampleSize / 8)) + goto err3; + } + + if (avg_bps != block_align * SampleRate) + goto err3; + + v = find_chunk(File, data); + + if (v == 0 || v % block_align != 0) + goto err3; + + TotalFrames = v / block_align; + + FramesRead = 0; + + if (FormatType == WAVE_FORMAT_EXTENSIBLE) + { + ChannelMask = *(unsigned int*)(&fmt[0x14]); + } + else + { + ChannelMask = 0; + } + + FrameStartPos = ftell(File); + + free(fmt); + m_bOK = true; + return; + +err3: + free(fmt); +err2: + fclose(File); + + File = NULL; +} + +bool CWaveFile::GetStatus() +{ + return m_bOK; +} + +SAMPLE_FORMAT CWaveFile::GetFormat() +{ + return Format; +} + +int CWaveFile::GetTotalFrames() +{ + return TotalFrames; +} + +int CWaveFile::GetFramesRead() +{ + return FramesRead; +} + +CWaveFile::~CWaveFile() +{ + if (File != NULL) + { + if (!ReadOnly) + { + unsigned int Size = ftell(File) - FrameStartPos;// 44; + + fseek(File, FrameStartPos - 4, SEEK_SET); + fwrite(&Size, 4, 1, File); + + Size += FrameStartPos - 8; + + fseek(File, 4, SEEK_SET); + fwrite(&Size, 4, 1, File); + } + + fclose(File); + } +} + +int CWaveFile::GetSampleRate() +{ + return SampleRate; +} + +void CWaveFile::SetSampleRate(int SampleRate) +{ + this->SampleRate = SampleRate; +} + +void CWaveFile::SetupDone() +{ + unsigned char Header[68]; + + fseek(File, 0, SEEK_SET); + + SampleSize = Format & 0xFF; + + if (ChannelMask) + { + memcpy(Header, wavmulti_header, sizeof(wavmulti_header)); + + if (Format < SF_IEEE_FLOAT) + { + // store2(Header + 20, WAVE_FORMAT_PCM); + store2(Header + 44, WAVE_FORMAT_PCM); + } + + store2(Header + 22, Channels); + store4(Header + 24, SampleRate); + store4(Header + 28, SampleSize / 8 * SampleRate * Channels); + store2(Header + 32, SampleSize / 8 * Channels); + store2(Header + 34, SampleSize / 8 * 8); + + store2(Header + 38, SampleSize / 8 * 8); + store4(Header + 40, ChannelMask); + + fwrite(Header, sizeof(wavmulti_header), 1, File); + } + else + { + memcpy(Header, wav_header, sizeof(wav_header)); + + if (Format >= SF_IEEE_FLOAT) + { + store2(Header + 20, WAVE_FORMAT_IEEE_FLOAT); + } + + store2(Header + 22, Channels); + store4(Header + 24, SampleRate); + store4(Header + 28, SampleSize / 8 * SampleRate * Channels); + store2(Header + 32, SampleSize / 8 * Channels); + store2(Header + 34, SampleSize / 8 * 8); + + fwrite(Header, sizeof(wav_header), 1, File); + } + + + FrameStartPos = ftell(File); +} + + +void CWaveFile::Seek(int FramePos, int Where) +{ + // Ignoring Where + + fseek(File, FrameStartPos + FramePos * Channels* (SampleSize / 8), Where); + + FramesRead = FramePos; + +} + +int CWaveFile::GetChannels() +{ + return Channels; +} + +void CWaveFile::SetChannels(int Channels) +{ + this->Channels = Channels; +} + +void CWaveFile::SetSampleFormat(SAMPLE_FORMAT Format) +{ + this->Format = Format; +} + +uint32_t CWaveFile::GetChannelMask() +{ + return ChannelMask; +} + +void CWaveFile::SetChannelMask(uint32_t Mask) +{ + ChannelMask = Mask; +} + +bool CWaveFile::ReadFrameAsS16(short* FrameSamples, int Frames) +{ + if (FramesRead >= TotalFrames) + return false; + + FramesRead += Frames; + + switch (Format) + { + case SF_U8: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short 
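+                /* Conversion math used by these readers: U8 becomes S16
+                 * as (x - 128) << 8, S24 keeps its top 16 bits via
+                 * DirectSample >> 8 (0x7FFFFF -> 0x7FFF), S32 via >> 16,
+                 * and float/double samples are scaled by 32768. */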
DirectSample = 0; + if (1 == fread(&DirectSample, 1, 1, File)) + { + FrameSamples[ch + frame*Channels] = (DirectSample - 128) << 8; + } + else + { + return false; + } + } + } + return true; + } + case SF_S16: + return Frames == fread(FrameSamples, sizeof(FrameSamples[0])*Channels, Frames, File); + case SF_S24: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + unsigned int DirectSample = 0; + if (1 == fread(&DirectSample, 3, 1, File)) + { + FrameSamples[ch + frame*Channels] = (short)(unsigned short)(DirectSample >> 8); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S32: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + unsigned int DirectSample = 0; + if (1 == fread(&DirectSample, 4, 1, File)) + { + FrameSamples[ch + frame*Channels] = (short)(unsigned short)(DirectSample >> 16); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_IEEE_FLOAT: + { + float DirectSamples[32]; + + if (Frames == fread(DirectSamples, sizeof(DirectSamples[0]) * Channels, Frames, File)) + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + FrameSamples[ch + frame*Channels] = (short)(DirectSamples[ch + frame*Channels] * 32768); + } + } + return true; + } + return false; + } + case SF_IEEE_DOUBLE: + { + double DirectSamples[32]; + + if (Frames == fread(DirectSamples, sizeof(DirectSamples[0]) * Channels, Frames, File)) + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + FrameSamples[ch + frame*Channels] = (short)(DirectSamples[ch + frame*Channels] * 32768); + } + } + return true; + } + return false; + } + } + return false; +} + +bool CWaveFile::ReadFrameAsfloat(float* FrameSamples, int Frames) +{ + if (FramesRead >= TotalFrames) + return false; + + FramesRead += Frames; + + switch (Format) + { + case SF_U8: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 1, 1, File)) + { + FrameSamples[ch + frame*Channels] = (DirectSample - 128) / 128.0; // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S16: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 2, 1, File)) + { + FrameSamples[ch + frame*Channels] = DirectSample / 32768.0; // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S24: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + uint32_t DirectSample = 0; + if (1 == fread(&DirectSample, 3, 1, File)) + { + FrameSamples[ch + frame*Channels] = ((int32_t)((uint32_t)(DirectSample << 8))) / + (double)(((uint32_t)(1 << 31))); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S32: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + uint32_t DirectSample = 0; + if (1 == fread(&DirectSample, 4, 1, File)) + { + FrameSamples[ch + frame*Channels] = ((int32_t)((uint32_t)(DirectSample))) / + (double)(((uint32_t)(1 << 31))); // (short)(DirectSample * 32767.0 / ((1 
<< 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_IEEE_FLOAT: + { + float DirectSamples[32]; + + if (Frames == fread(DirectSamples, sizeof(DirectSamples[0]) * Channels, Frames, File)) + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + FrameSamples[ch + frame*Channels] = (double)(DirectSamples[ch + frame*Channels]); + } + } + return true; + } + return false; + } + case SF_IEEE_DOUBLE: + { + if (Frames == fread(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File)) + { + return true; + } + return false; + } + } + return false; +} + +bool CWaveFile::ReadFrameAsDouble(double* FrameSamples, int Frames) +{ + if (FramesRead >= TotalFrames) + return false; + + FramesRead += Frames; + + switch (Format) + { + case SF_U8: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 1, 1, File)) + { + FrameSamples[ch + frame*Channels] = (DirectSample - 128) / 128.0; // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S16: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 2, 1, File)) + { + FrameSamples[ch + frame*Channels] = DirectSample / 32768.0; // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S24: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + uint32_t DirectSample = 0; + if (1 == fread(&DirectSample, 3, 1, File)) + { + FrameSamples[ch + frame*Channels] = ((int32_t)((uint32_t)(DirectSample << 8))) / + (double)(((uint32_t)(1 << 31))); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S32: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + uint32_t DirectSample = 0; + if (1 == fread(&DirectSample, 4, 1, File)) + { + FrameSamples[ch + frame*Channels] = ((int32_t)((uint32_t)(DirectSample ))) / + (double)(((uint32_t)(1 << 31))); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_IEEE_FLOAT: + { + float DirectSamples[32]; + + if (Frames == fread(DirectSamples, sizeof(DirectSamples[0]) * Channels, Frames, File)) + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + FrameSamples[ch + frame*Channels] = (double)(DirectSamples[ch + frame*Channels]); + } + } + return true; + } + return false; + } + case SF_IEEE_DOUBLE: + { + if (Frames == fread(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File)) + { + return true; + } + return false; + } + } + return false; +} + +void CWaveFile::WriteRaw(void* Raw, int Size) +{ + fwrite(Raw, Size, 1, File); +} + + +void CWaveFile::WriteFrame(uint8_t* FrameSamples, int Frames) +{ + fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File); +} + +void CWaveFile::WriteFrame(short* FrameSamples, int Frames) +{ + fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File); +} + +void CWaveFile::WriteFrame(int32_t* FrameSamples, int Frames) +{ + fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File); +} + +void CWaveFile::WriteFrameS24(int32_t* FrameSamples, int Frames) +{ + for (int c = 0; c 
< Channels * Frames; c++)   /* iterate over all Frames * Channels samples, writing the low three bytes of each 32-bit sample (little-endian S24 packing) */
+    {
+        fwrite(&FrameSamples[c], 3, 1, File);
+    }
+}
+
+void CWaveFile::WriteFrame(double* FrameSamples, int Frames)
+{
+    fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File);
+}
+
+void CWaveFile::WriteFrame(float* FrameSamples, int Frames)
+{
+    fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File);
+}
+
+
+double CWaveFile::GetDuration()
+{
+    return Duration;
+}
diff --git a/AutoCoverTool/ref/pic_au_tools/main.py b/AutoCoverTool/ref/pic_au_tools/main.py
new file mode 100644
index 0000000..6db2a4d
--- /dev/null
+++ b/AutoCoverTool/ref/pic_au_tools/main.py
@@ -0,0 +1,16 @@
+# This is a sample Python script.
+
+# Press Shift+F10 to execute it or replace it with your code.
+# Double-press Shift to search everywhere for classes, files, tool windows, actions, and settings.
+
+
+def print_hi(name):
+    # Use a breakpoint in the code line below to debug your script.
+    print(f'Hi, {name}')  # Press Ctrl+F8 to toggle the breakpoint.
+
+
+# Press the green button in the gutter to run the script.
+if __name__ == '__main__':
+    print_hi('PyCharm')
+
+# See https://www.jetbrains.com/help/pycharm/ for PyCharm help
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/click_apply.png b/AutoCoverTool/ref/pic_au_tools/picture/click_apply.png
new file mode 100644
index 0000000..4a4692e
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/click_apply.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/click_library.png b/AutoCoverTool/ref/pic_au_tools/picture/click_library.png
new file mode 100644
index 0000000..709519f
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/click_library.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/click_sure.jpg b/AutoCoverTool/ref/pic_au_tools/picture/click_sure.jpg
new file mode 100644
index 0000000..8f3382f
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/click_sure.jpg differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/close_all_files.png b/AutoCoverTool/ref/pic_au_tools/picture/close_all_files.png
new file mode 100644
index 0000000..6215929
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/close_all_files.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/close_time.png b/AutoCoverTool/ref/pic_au_tools/picture/close_time.png
new file mode 100644
index 0000000..3ce8362
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/close_time.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/create_vocal.png b/AutoCoverTool/ref/pic_au_tools/picture/create_vocal.png
new file mode 100644
index 0000000..c2ba81e
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/create_vocal.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/end_time.png b/AutoCoverTool/ref/pic_au_tools/picture/end_time.png
new file mode 100644
index 0000000..7128e39
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/end_time.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/get_library.png b/AutoCoverTool/ref/pic_au_tools/picture/get_library.png
new file mode 100644
index 0000000..44649dd
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/get_library.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/modify_display.png b/AutoCoverTool/ref/pic_au_tools/picture/modify_display.png
new file mode 100644
index 0000000..2cfa19b
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/modify_display.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/modify_gain.png b/AutoCoverTool/ref/pic_au_tools/picture/modify_gain.png
new file mode 100644
index 0000000..39b0ca2
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/modify_gain.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/open.png b/AutoCoverTool/ref/pic_au_tools/picture/open.png
new file mode 100644
index 0000000..f3b4683
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/open.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/open_library.png.png b/AutoCoverTool/ref/pic_au_tools/picture/open_library.png.png
new file mode 100644
index 0000000..a1c4242
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/open_library.png.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/picture_tools.py b/AutoCoverTool/ref/pic_au_tools/picture/picture_tools.py
new file mode 100644
index 0000000..d6136aa
--- /dev/null
+++ b/AutoCoverTool/ref/pic_au_tools/picture/picture_tools.py
@@ -0,0 +1,27 @@
+import time
+import pyautogui
+
+
+# Locate a UI element on screen by matching a template image; returns its center point
+def get_pic(pic_name):
+    pyautogui.screenshot('screenshot.png')
+    # pyautogui.screenshot('img12.png', region=(0, 0, 1110, 776))
+    part = pyautogui.locateOnScreen(pic_name, confidence=0.85)
+    point = pyautogui.center(part)
+    print(point)
+    return point
+
+# im = pyautogui.screenshot()
+# print((type(im), im.getdata(100, 200)))
+#
+# a = get_pic("11.png")
+# print(a)
+# pyautogui.click(a)
+# #
+# click_file = get_pic("select_files.png")
+# pyautogui.rightClick(click_file)
+#
+# # click_clear = mouse.click(button="left", coords=(128, 115))
+# time.sleep(2)
+# click_clear = get_pic("img_11.png")
+# pyautogui.click(click_clear)
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/save_as_ok.png b/AutoCoverTool/ref/pic_au_tools/picture/save_as_ok.png
new file mode 100644
index 0000000..389634a
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/save_as_ok.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/save_library.png b/AutoCoverTool/ref/pic_au_tools/picture/save_library.png
new file mode 100644
index 0000000..cef8d20
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/save_library.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/save_vocal_file.png b/AutoCoverTool/ref/pic_au_tools/picture/save_vocal_file.png
new file mode 100644
index 0000000..92c3e16
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/save_vocal_file.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/screenshot.png b/AutoCoverTool/ref/pic_au_tools/picture/screenshot.png
new file mode 100644
index 0000000..445bd26
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/screenshot.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/search_name.png b/AutoCoverTool/ref/pic_au_tools/picture/search_name.png
new file mode 100644
index 0000000..d3870f8
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/search_name.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/select_files.png b/AutoCoverTool/ref/pic_au_tools/picture/select_files.png
new file mode 100644
index 0000000..97e7d65
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/select_files.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/select_library.png b/AutoCoverTool/ref/pic_au_tools/picture/select_library.png
new file mode 100644
index 0000000..1d87bcc
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/select_library.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/picture/start_time.png b/AutoCoverTool/ref/pic_au_tools/picture/start_time.png
new file mode 100644
index 0000000..cd0f6de
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/picture/start_time.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/read_all_files.py b/AutoCoverTool/ref/pic_au_tools/read_all_files.py
new file mode 100644
index 0000000..e452a2e
--- /dev/null
+++ b/AutoCoverTool/ref/pic_au_tools/read_all_files.py
@@ -0,0 +1,65 @@
+import os
+
+
+def find_file(search_path, include_str=None, filter_strs=None):
+    if filter_strs is None:
+        filter_strs = []
+
+    files = []
+    # List every entry under the search path
+    names = os.listdir(search_path)
+    for name in names:
+        path = os.path.abspath(os.path.join(search_path, name))
+        if os.path.isfile(path):
+            # Skip files whose names do not contain the required substring
+            if include_str is not None and include_str not in name:
+                continue
+
+            # If this loop finishes without a break, the name contains none of the filter strings
+            for filter_str in filter_strs:
+                if filter_str in name:
+                    break
+            else:
+                files.append(path)
+        else:
+            files += find_file(path, include_str=include_str, filter_strs=filter_strs)
+    return files
+
+
+# List all song folders, skipping .meta entries
+def find_dos():
+    a = os.listdir("docs/Songs")
+    # Filter with a comprehension; removing items while iterating over the list would skip entries
+    a = [i for i in a if not i.endswith(".meta")]
+    return a
+
+
+if __name__ == '__main__':
+    # Get all files
+    # f = find_file("./txt")
+    # print(f)
+
+    # # Get the files whose names contain a given string
+    # f = find_file("/Users/lbj/Desktop/Beat", include_str=".txt")
+    # print(f)
+    #
+
+    # # Get the files whose names do not contain the given strings
+    f = find_file(r"../me_3_w4\me_3_w4", include_str="dv", filter_strs=[".pkf"])
+    print(f)
+    a = f[0].split('\\')
+    # Drop the file just used from the list
+    f.remove(f[0])
+    print(f)
+    # The file name itself
+    print(a[-1])
+    a.remove(a[-1])
+    address = '\\'.join(a)
+    # The directory containing the file
+    print(address)
+
+    #
+    # # Get the files that contain one string and none of certain others
+    # f = find_file(r"test", include_str="wav", filter_strs=[".meta", "__init__"])
+    # print(f)
diff --git a/AutoCoverTool/ref/pic_au_tools/screenshot.png b/AutoCoverTool/ref/pic_au_tools/screenshot.png
new file mode 100644
index 0000000..e56127b
Binary files /dev/null and b/AutoCoverTool/ref/pic_au_tools/screenshot.png differ
diff --git a/AutoCoverTool/ref/pic_au_tools/star_app.py b/AutoCoverTool/ref/pic_au_tools/star_app.py
new file mode 100644
index 0000000..47c701f
--- /dev/null
+++ b/AutoCoverTool/ref/pic_au_tools/star_app.py
@@ -0,0 +1,392 @@
+import pyautogui
+import pywinauto
+from pywinauto import application, mouse
+import time
+from pywinauto.keyboard import send_keys
+from read_all_files import find_file
+from picture.picture_tools import get_pic
+
+# song id -> start offset in seconds used when selecting the vocal segment; -1.0 appears to mean no usable offset
+gs_rate_dict = {
+    611752105020256284: 38.340000,
+    611752105020286433: 33.730000,
+    611752105020286443: 11.370000,
+    611752105020286446: 31.920000,
+    611752105020290639: 62.400000,
+    611752105020290695: 20.550000,
+    611752105020315328: 43.860000,
+    611752105020315368: 25.740000,
+    611752105020336950: 47.170000,
+    611752105020343687: 30.000000,
+    611752105020343699: 19.210000,
+    611752105020351134: 43.300000,
+    611752105020357112: 27.560000,
+    611752105020378620: 58.470000,
+    611752105020387015: 11.220000,
+    611752105020394121: 30.660000,
+    611752105020394297: 112.720000,
+    611752105020411654: 32.330000,
+    611752105020417688: 50.610000,
+    611752105020548211: 42.730000,
+    611752105020563523: -1.000000,
+    611752105021285282: -1.000000,
+    611752105021332759: 11.370000,
+    611752105022446809: 7.600000,
+    611752105022647082: 3.340000,
+    611752105022667231: 43.260000,
+    611752105022735101: 3.680000,
+    611752105022736204: 17.650000,
+    611752105022745595: 29.430000,
+    611752105022770952: 10.820000,
+    611752105022842004: 25.400000,
+    611752105022842477: 10.020000,
+    611752105023434557: 28.160000,
+    611752105023532439: 11.850000,
+    611752105023623965: 3.710000,
+    611752105024250202: 43.550000,
+    611752105024628047: 22.520000,
611752105024676794: 63.380000, + 611752105024678976: 14.350000, + 611752105024679221: 0.290000, + 611752105024953316: 10.350000, + 611752105025104181: 28.890000, + 611752105026189342: 1.380000, + 611752105026523547: 27.950000, + 611752105026707760: 0.000000, + 611752105026771723: 32.100000, + 611752105026946178: 16.860000, + 611752105027047993: 20.380000, + 611752105027188746: 23.900000, + 611752105027189453: 13.640000, + 611752105027302268: 21.030000, + 611752105027557408: 13.050000, + 611752105028650636: 31.310000, + 611752105028683824: 15.920000, + 611752105029990849: 56.810000, + 611752105029993297: 2.490000, + 611752105030077711: 28.960000, + 611752105030104548: 15.830000, + 611752105030419624: 0.790000, + 611752105030419633: 8.080000, + 611752105030419688: 5.850000, + 611752105030433779: 1.080000, + 611752105015523266: 16.160000, + 611752105017233541: 43.910000, + 611752105030414513: 16.330000, + 611752105030414549: 29.890000, + 611752105030414557: 16.210000, + 611752105030414588: 18.900000, + 611752105030414597: 16.540000, + 611752105030414613: 2.210000, + 611752105030414615: 0.320000, + 611752105030414619: 26.420000, + 611752105030414633: 17.250000, + 611752105030414638: 8.300000, + 611752105030414689: 2.600000, + 611752105030414702: 0.550000, + 611752105030414742: 28.310000, + 611752105030414763: 1.040000, + 611752105030414773: 9.100000, + 611752105030414777: 34.650000, + 611752105030414779: 22.240000, + 611752105030414784: 0.580000, + 611752105030414890: 23.920000, + 611752105030414915: 6.020000, + 611752105030414925: 2.250000, + 611752105030414929: 8.110000, + 611752105030414935: 4.750000, + 611752105030414943: 1.600000, + 611752105030414957: 18.950000, + 611752105030414962: 17.460000, + 611752105030414976: 0.690000, + 611752105030414993: 30.170000, + 611752105030414995: 8.410000, + 611752105030415003: 28.620000, + 611752105030415014: 6.500000, + 611752105030415018: 2.070000, + 611752105030415032: 5.830000, + 611752105030415056: 0.440000, + 611752105030415067: 8.300000, + 611752105030415071: 22.970000, + 611752105030415074: 0.000000, + 611752105030415083: 5.010000, + 611752105030415087: 7.950000, + 611752105030415100: 1.180000, + 611752105030415103: 35.110000 +} + + +# 程序打开 +def open_app(): + # 此处填写AU_APP的绝对路径 + app = application.Application(backend='uia').start( + r"C:\Program Files\Adobe\Adobe Audition CC 2017\Adobe Audition CC.exe") + time.sleep(4) + # 设置窗口最大化74 + click_sure = get_pic("./picture/click_sure.jpeg") + pyautogui.click(click_sure) + time.sleep(2) + app_top_window = app.top_window() + app_top_window.maximize() + + +dlg = pywinauto.Desktop() + + +# 获取所有文件 +def get_all_file(): + # files = find_file(r"test", filter_strs=[".mp3", ".pkf"]) + files = find_file(r"me_3_w4_zy", include_str="dv", filter_strs=[".pkf"]) + count_file = len(files) + return files, count_file + + +# 拿到文件地址 +def get_file(): + # all_files = get_all_file()[0] + # print(all_files) + # 切割获取 + add_file = file_name[0].split('\\') + # print(add_file) + # 列表中删除已用的文件信息 + file_name.remove(file_name[0]) + # wav文件获取 + wav_file = add_file[-1] + # print(wav_file) + add_file.remove(add_file[-1]) + address = '\\'.join(add_file) + # print(address) + # address = r"D:\project\tools\au_tools\test\611752105027601574" + + vocal = r"vocal.mp3" + return address, wav_file, vocal + + +# 打开导入文件位置空间弹窗 +def open_file(file, file_address, st_tm): + send_keys("^o") + time.sleep(2) + # 切换控件窗口 + dlg_open_file = dlg[".*Open File.*"] + # 打开的文件内容输入 + send_keys(file) + time.sleep(1) + # 获取desk实例化= + start_time_inst = None + if file == 
get_file_name[2]: + print("这是vocal") + # dlg_open_file.window(found_index=0, class_name=".*Edit.*").click() + dlg_open_file.window(found_index=0, title_re=".*地址.*").click() + send_keys(file_address) + time.sleep(1) + dlg_open_file.window(found_index=0, title_re=".*地址区段工具栏.*").click() + # dlg_open_file.window(found_index=0, title_re=".*打开.*").click() + time.sleep(1) + # open_click = get_pic("./picture/open.png") + open_click = get_pic("./picture/open.jpeg") + # print(open_click) + # mouse.click(button="left", coords=(775,519)) + pyautogui.click(open_click) + wait_dlg("Adobe Audition CC") + time.sleep(1) + start_time_inst = get_pic("./picture/start_time.jpeg") + revise_time("0:{}".format(round(st_tm, 3)), "0:{}".format(round(st_tm + 60, 3))) + time.sleep(2) + start_vocal_vts3() + else: + # 文件打开 + print("这里是wav") + # dlg_open_file.window(found_index=0, title_re=".*打开.*").click() + open_click = get_pic("./picture/open.jpeg") + pyautogui.click(open_click) + # mouse.click(button="left", coords=(775, 519)) + wait_dlg("Adobe Audition CC") + time.sleep(1) + start_time_inst = get_pic("./picture/start_time.jpeg") + star_wav_vst3(file) + pyautogui.click(start_time_inst) + send_keys("0:0.000") + close_time = get_pic("./picture/close_time.jpeg") + pyautogui.click(close_time) + time.sleep(1) + + +def revise_time(st_tm, ed_tm): + print("reverse_time={}".format(st_tm)) + # 修改开始时间 + time.sleep(1) + # time_start = mouse.click(button="left", coords=(588, 981)) + # start_time = get_pic("./picture/start_time.png") + start_time = get_pic("./picture/start_time.jpeg") + pyautogui.click(start_time) + send_keys(st_tm) + time.sleep(1) + # time_end = mouse.click(button="left", coords=(648, 981)) + # end_time = get_pic("./picture/end_time.png") + # end_time = get_pic("./picture/end_time.jpeg") + # pyautogui.click(end_time) + # send_keys(ed_tm) + # 关闭选中时间部分 + # close_time = mouse.click(button="left", coords=(800, 981)) + close_time = get_pic("./picture/close_time.jpeg") + pyautogui.click(close_time) + + +# 通过快捷键执行vocal的vts3 +def start_vocal_vts3(): + time.sleep(2) + # send_keys("^%z") + send_keys("^'") + wait_dlg("Effect - Chameleon2") + + # 恢复状态 + # restruct_vocal = get_pic("./picture/restruct.jpeg") + # pyautogui.click(restruct_vocal) + # time.sleep(1) + # pyautogui.click(restruct_vocal) + + # 点击创建按钮 + # 打开弹窗 + time.sleep(1) + # mouse.click(button="left", coords=(766, 522)) + # 创建文件 + create_vocal = get_pic("./picture/create_vocal.jpeg") + pyautogui.click(create_vocal) + # create_file = mouse.click(button="left", coords=(951, 186)) + time.sleep(2) + send_keys("{SPACE}") + time.sleep(10) + # 保存文件 + # save_file = mouse.click(button="left", coords=(844, 501)) + # save_vocal = get_pic("./picture/save_library.png") + save_vocal = get_pic("./picture/save_library.jpeg") + time.sleep(1) + pyautogui.click(save_vocal) + # save_file = mouse.click(button="left", coords=(844, 501)) + time.sleep(2) + # 保存内容 + send_keys(f"vocal{get_file_name[1]}") + time.sleep(1) + # save_click = mouse.click(button="left", coords=(757, 592)) + save_vocal_file = get_pic("./picture/save_vocal_file.jpeg") + pyautogui.click(save_vocal_file) + time.sleep(1) + send_keys('%{F4}') + + # 关闭弹窗 + # dlg_close_window = dlg["Effect - Chameleon2"] + # dlg_close_window.window(found_index=0, title_re=".*关闭.*") + # wait_dlg("Effect - Chameleon2") + + +# 执行wav的vst3 +def star_wav_vst3(file): + time.sleep(2) + send_keys("^'") + wait_dlg("Effect - Chameleon2") + # open_library = mouse.click(button="left", coords=(1010, 188)) + + # 恢复状态 + # restruct_vocal = 
get_pic("./picture/restruct.jpeg") + # pyautogui.click(restruct_vocal) + # time.sleep(1) + # pyautogui.click(restruct_vocal) + + open_library = get_pic("./picture/click_library.jpeg") + pyautogui.click(open_library) + wait_dlg("ChameleonLibrary - ") + mouse.click(button="left", coords=(387, 572)) + # search_name = get_pic("./picture/search_name.jpeg") + # pyautogui.click(search_name) + send_keys(f"vocal{get_file_name[1]}") + time.sleep(2) + # 选择搜索到的文件 + # wait_dlg("ChameleonLibrary - ") + # select_profile = mouse.double_click(button="left", coords=(978, 492)) + mouse.click(button="left", coords=(722, 297)) + # move_library = get_pic("./picture/get_library.jpeg") + # pyautogui.moveTo(move_library) + time.sleep(1) + select_library = get_pic("./picture/select_library.jpeg") + pyautogui.doubleClick(select_library) + # 关闭弹窗 + time.sleep(1) + # 关闭弹窗 + send_keys('%{F4}') + + # close_profile = mouse.double_click(button="left", coords=(1675, 297)) + # 修改显示 + wait_dlg("Effect - Chameleon2") + # modify_chameleon_display = mouse.double_click(button="left", coords=(1326, 124)) + # modify_chameleon_display = get_pic("./picture/modify_display.png") + # pyautogui.doubleClick(modify_chameleon_display) + # 修改_gain + # time.sleep(2) + mouse.click(button="left", coords=(1200, 720)) + # modify_gain = get_pic("./picture/modify_gain.jpeg") + # modify_gain.y += 50 + time.sleep(1) + send_keys("15") + + apply_file = get_pic("./picture/click_apply.jpeg") + pyautogui.click(apply_file) + time.sleep(3) + wait_dlg("Adobe Audition CC") + + time.sleep(5) + save_as(file) + clear_file() + + +# 保存 +def save_as(file): + send_keys("^+s") + time.sleep(2) + send_keys(str(file).replace("_dv_", "_dev_").replace(".mp3", "")) + # save_ok = mouse.click(button="left", coords=(1014, 647)) + save_ok = get_pic("./picture/save_as_ok.jpeg") + pyautogui.click(save_ok) + time.sleep(3) + + +# 清空内容显示 +def clear_file(): + time.sleep(2) + send_keys("^]") + + +# 等到待窗口启用 +def wait_dlg(win_name): + try: + new_dlg = dlg[win_name] + new_dlg.wait(wait_for="ready", timeout=20, retry_interval=1) + # print("等待通过,当前新建连接窗口处于可见状态") + except EnvironmentError: + print("请检查弹窗未打开") + + +# star_test +def start_test(): + import os + global get_file_name + for i in range(file_count): + get_file_name = get_file() + dst_file = os.path.join("C:/Users/xianfeng.li/Desktop/jianli/test", + str(get_file_name[1]).replace("_dv_", "_dev_")) + print(dst_file) + if os.path.exists(dst_file): + continue + print(f"本次检测内容包含{get_file_name}") + st_tm = gs_rate_dict[int(str(get_file_name[1]).split("_")[0])] + open_file(get_file_name[2], get_file_name[0], st_tm) + time.sleep(3) + print(f"结束文件{get_file_name[1]}的{get_file_name[2]}") + open_file(get_file_name[1], get_file_name[0], 0) + time.sleep(3) + print(f"结束文件{get_file_name[1]}") + + +if __name__ == '__main__': + open_app() + file_count = get_all_file()[1] + file_name = get_all_file()[0] + start_test() diff --git a/AutoCoverTool/ref/so_vits_svc/Eng_docs.md b/AutoCoverTool/ref/so_vits_svc/Eng_docs.md new file mode 100644 index 0000000..78f6db8 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/Eng_docs.md @@ -0,0 +1,83 @@ +# SoftVC VITS Singing Voice Conversion +## Updates +> According to incomplete statistics, it seems that training with multiple speakers may lead to **worsened leaking of voice timbre**. It is not recommended to train models with more than 5 speakers. The current suggestion is to try to train models with only a single speaker if you want to achieve a voice timbre that is more similar to the target. 
+> Fixed the issue with unwanted staccato, improving audio quality by a decent amount.\
+> The 2.0 version has been moved to the 2.0 branch.\
+> Version 3.0 uses the code structure of FreeVC, which isn't compatible with older versions.\
+> Compared to [DiffSVC](https://github.com/prophesier/diff-svc), DiffSVC performs much better when the training data is of extremely high quality, but this repository may perform better on lower-quality datasets. Inference is also much faster here than with DiffSVC.

+## Model Overview
+A singing voice conversion (SVC) model: the SoftVC encoder extracts speech features from the input audio, and these are fed into VITS together with the F0, replacing the original text input, to achieve voice conversion. Additionally, the vocoder is changed to [NSF HiFiGAN](https://github.com/openvpi/DiffSinger/tree/refactor/modules/nsf_hifigan) to fix the issue with unwanted staccato.
+## Notice
++ The current branch is the 32 kHz version: it requires less VRAM during inference, inference is faster, and its datasets take up less disk space, so the 32 kHz branch is recommended.
++ If you want to train 48 kHz variant models, switch to the [main branch](https://github.com/innnky/so-vits-svc/tree/main).
+## Colab notebook script for dataset creation and training
+[colab training notebook](https://colab.research.google.com/drive/1rCUOOVG7-XQlVZuWRAj5IpGrMM8t07pE?usp=sharing)
+
+## Required models
++ soft vc hubert: [hubert-soft-0d54a1f4.pt](https://github.com/bshall/hubert/releases/download/v0.1/hubert-soft-0d54a1f4.pt)
+  + Place under `hubert`.
++ Pretrained models [G_0.pth](https://huggingface.co/innnky/sovits_pretrained/resolve/main/G_0.pth) and [D_0.pth](https://huggingface.co/innnky/sovits_pretrained/resolve/main/D_0.pth)
+  + Place under `logs/32k`.
+  + The pretrained base models are required: in testing, training from scratch sometimes fails to converge, and starting from a pretrained model also greatly speeds up training.
+  + The pretrained model covers 云灏, 即霜, 辉宇·星AI, 派蒙, and 绫地宁宁, spanning the common ranges of both male and female voices, so it can be considered a fairly universal base model.
+  + The pretrained model excludes the `optimizer` and `speaker_embedding` weights, so it can only be used to initialize training and cannot be used for inference.
+```shell
+# For simple downloading.
+# hubert
+wget -P hubert/ https://github.com/bshall/hubert/releases/download/v0.1/hubert-soft-0d54a1f4.pt
+# G&D pretrained models
+wget -P logs/32k/ https://huggingface.co/innnky/sovits_pretrained/resolve/main/G_0.pth
+wget -P logs/32k/ https://huggingface.co/innnky/sovits_pretrained/resolve/main/D_0.pth
+
+```
+
+
+## Dataset preparation
+All that is required is to put the data under the `dataset_raw` folder in the structure shown below.
+```shell
+dataset_raw
+├───speaker0
+│   ├───xxx1-xxx1.wav
+│   ├───...
+│   └───Lxx-0xx8.wav
+└───speaker1
+    ├───xx2-0xxx2.wav
+    ├───...
+    └───xxx7-xxx007.wav
+```
+
+## Data pre-processing
+1. Resample to 32 kHz
+
+```shell
+python resample.py
+```
+2. Automatically split the data into training, validation, and test sets, and generate the configuration file.
+```shell
+python preprocess_flist_config.py
+# Notice.
+# The n_speakers value in the config is set automatically from the number of speakers in the dataset.
+# To reserve space for speakers added to the dataset later, n_speakers is written as twice the actual number.
+# For example, a dataset with 3 speakers is written with n_speakers = 6.
+# If you want even more room for adding data, you can edit the n_speakers value in the config after running this step.
+# It cannot be changed once training has started.
+```
+3. Generate hubert and F0 features:
+```shell
+python preprocess_hubert_f0.py
+```
+After running the step above, the `dataset` folder contains all the pre-processed data; the `dataset_raw` folder can then be deleted.
+
+## Training
+```shell
+python train.py -c configs/config.json -m 32k
+```
+
+## Inferencing
+
+Use [inference_main.py](inference_main.py):
++ Edit `model_path` to point to your newest checkpoint.
++ Place the input audio under the `raw` folder.
++ Set `clean_names` to the names of the audio files to convert.
++ Use `trans` to set the pitch shift amount (in semitones).
++ Set `spk_list` to the target speaker name.
+(An illustrative sketch of these settings appears after the LICENSE file below.)
diff --git a/AutoCoverTool/ref/so_vits_svc/LICENSE b/AutoCoverTool/ref/so_vits_svc/LICENSE
new file mode 100644
index 0000000..c7202d4
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/LICENSE
@@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2021 Jingyi Li
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
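As referenced in the inferencing section of Eng_docs.md above, here is a minimal, illustrative sketch of the variables edited at the top of `inference_main.py`. All values are placeholders; the checkpoint step, song name, and speaker label are assumptions, not taken from this repository:

```python
# Illustrative placeholder values -- edit to match your own training run.
model_path = "logs/32k/G_10000.pth"   # newest checkpoint written by train.py
config_path = "configs/config.json"   # config generated during preprocessing
clean_names = ["my_song"]             # audio under raw/ to convert
trans = [0]                           # pitch shift in semitones, one per input
spk_list = ["speaker0"]               # target speaker name from the dataset
```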
diff --git a/AutoCoverTool/ref/so_vits_svc/README.md b/AutoCoverTool/ref/so_vits_svc/README.md new file mode 100644 index 0000000..5905096 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/README.md @@ -0,0 +1,123 @@ +# SoftVC VITS Singing Voice Conversion +## English docs +[英语资料](Eng_docs.md) + + +## Update +> 据不完全统计,多说话人似乎会导致**音色泄漏加重**,不建议训练超过5人的模型,目前的建议是如果想炼出来更像目标音色,**尽可能炼单说话人的**\ +> 断音问题已解决,音质提升了不少\ +> 2.0版本已经移至 sovits_2.0分支\ +> 3.0版本使用FreeVC的代码结构,与旧版本不通用\ +> 与[DiffSVC](https://github.com/prophesier/diff-svc) 相比,在训练数据质量非常高时diffsvc有着更好的表现,对于质量差一些的数据集,本仓库可能会有更好的表现,此外,本仓库推理速度上比diffsvc快很多 + + +## 模型简介 +歌声音色转换模型,通过SoftVC内容编码器提取源音频语音特征,与F0同时输入VITS替换原本的文本输入达到歌声转换的效果。同时,更换声码器为 [NSF HiFiGAN](https://github.com/openvpi/DiffSinger/tree/refactor/modules/nsf_hifigan) 解决断音问题 + + +## 注意 ++ 当前分支是32khz版本的分支,32khz模型推理更快,显存占用大幅减小,数据集所占硬盘空间也大幅降低,推荐训练该版本模型 ++ 如果要训练48khz的模型请切换到[main分支](https://github.com/innnky/so-vits-svc/tree/main) + + +## 预先下载的模型文件 ++ soft vc hubert:[hubert-soft-0d54a1f4.pt](https://github.com/bshall/hubert/releases/download/v0.1/hubert-soft-0d54a1f4.pt) + + 放在hubert目录下 ++ 预训练底模文件 [G_0.pth](https://huggingface.co/innnky/sovits_pretrained/resolve/main/G_0.pth) 与 [D_0.pth](https://huggingface.co/innnky/sovits_pretrained/resolve/main/D_0.pth) + + 放在logs/32k 目录下 + + 预训练底模为必选项,因为据测试从零开始训练有概率不收敛,同时底模也能加快训练速度 + + 预训练底模训练数据集包含云灏 即霜 辉宇·星AI 派蒙 绫地宁宁,覆盖男女生常见音域,可以认为是相对通用的底模 + + 底模删除了optimizer speaker_embedding 等无关权重, 只可以用于初始化训练,无法用于推理 + + 该底模和48khz底模通用 +```shell +# 一键下载 +# hubert +wget -P hubert/ https://github.com/bshall/hubert/releases/download/v0.1/hubert-soft-0d54a1f4.pt +# G与D预训练模型 +wget -P logs/32k/ https://huggingface.co/innnky/sovits_pretrained/resolve/main/G_0.pth +wget -P logs/32k/ https://huggingface.co/innnky/sovits_pretrained/resolve/main/D_0.pth + +``` + + +## colab一键数据集制作、训练脚本 +[一键colab](https://colab.research.google.com/drive/1_-gh9i-wCPNlRZw6pYF-9UufetcVrGBX?usp=sharing) + + +## 数据集准备 +仅需要以以下文件结构将数据集放入dataset_raw目录即可 +```shell +dataset_raw +├───speaker0 +│ ├───xxx1-xxx1.wav +│ ├───... +│ └───Lxx-0xx8.wav +└───speaker1 + ├───xx2-0xxx2.wav + ├───... + └───xxx7-xxx007.wav +``` + + +## 数据预处理 +1. 重采样至 32khz + +```shell +python resample.py + ``` +2. 自动划分训练集 验证集 测试集 以及自动生成配置文件 +```shell +python preprocess_flist_config.py +# 注意 +# 自动生成的配置文件中,说话人数量n_speakers会自动按照数据集中的人数而定 +# 为了给之后添加说话人留下一定空间,n_speakers自动设置为 当前数据集人数乘2 +# 如果想多留一些空位可以在此步骤后 自行修改生成的config.json中n_speakers数量 +# 一旦模型开始训练后此项不可再更改 +``` +3. 生成hubert与f0 +```shell +python preprocess_hubert_f0.py +``` +执行完以上步骤后 dataset 目录便是预处理完成的数据,可以删除dataset_raw文件夹了 + + +## 训练 +```shell +python train.py -c configs/config.json -m 32k +``` + + +## 推理 + +使用 [inference_main.py](inference_main.py) ++ 更改model_path为你自己训练的最新模型记录点 ++ 将待转换的音频放在raw文件夹下 ++ clean_names 写待转换的音频名称 ++ trans 填写变调半音数量 ++ spk_list 填写合成的说话人名称 + + +## Onnx导出 +### 重要的事情说三遍:导出Onnx时,请重新克隆整个仓库!!!导出Onnx时,请重新克隆整个仓库!!!导出Onnx时,请重新克隆整个仓库!!! 
+使用 [onnx_export.py](onnx_export.py) ++ 新建文件夹:checkpoints 并打开 ++ 在checkpoints文件夹中新建一个文件夹作为项目文件夹,文件夹名为你的项目名称 ++ 将你的模型更名为model.pth,配置文件更名为config.json,并放置到刚才创建的文件夹下 ++ 将 [onnx_export.py](onnx_export.py) 中path = "NyaruTaffy" 的 "NyaruTaffy" 修改为你的项目名称 ++ 运行 [onnx_export.py](onnx_export.py) ++ 等待执行完毕,在你的项目文件夹下会生成一个model.onnx,即为导出的模型 ++ 注意:若想导出48K模型,请按照以下步骤修改文件,或者直接使用48K.py + + 请打开[model_onnx.py](model_onnx.py),将其中最后一个class的hps中32000改为48000 + + 请打开[nvSTFT](/vdecoder/hifigan/nvSTFT.py),将其中所有32000改为48000 + ### Onnx模型支持的UI + + [MoeSS](https://github.com/NaruseMioShirakana/MoeSS) ++ 我去除了所有的训练用函数和一切复杂的转置,一行都没有保留,因为我认为只有去除了这些东西,才知道你用的是Onnx + +## Gradio(WebUI) +使用 [sovits_gradio.py](sovits_gradio.py) ++ 新建文件夹:checkpoints 并打开 ++ 在checkpoints文件夹中新建一个文件夹作为项目文件夹,文件夹名为你的项目名称 ++ 将你的模型更名为model.pth,配置文件更名为config.json,并放置到刚才创建的文件夹下 ++ 运行 [sovits_gradio.py](sovits_gradio.py) + + diff --git a/AutoCoverTool/ref/so_vits_svc/add_speaker.py b/AutoCoverTool/ref/so_vits_svc/add_speaker.py new file mode 100644 index 0000000..e224f07 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/add_speaker.py @@ -0,0 +1,62 @@ +import os +import argparse +from tqdm import tqdm +from random import shuffle +import json + + +if __name__ == "__main__": + parser = argparse.ArgumentParser() + parser.add_argument("--train_list", type=str, default="./filelists/train.txt", help="path to train list") + parser.add_argument("--val_list", type=str, default="./filelists/val.txt", help="path to val list") + parser.add_argument("--test_list", type=str, default="./filelists/test.txt", help="path to test list") + parser.add_argument("--source_dir", type=str, default="./dataset/32k", help="path to source dir") + args = parser.parse_args() + + previous_config = json.load(open("configs/config.json", "rb")) + + train = [] + val = [] + test = [] + idx = 0 + spk_dict = previous_config["spk"] + spk_id = max([i for i in spk_dict.values()]) + 1 + for speaker in tqdm(os.listdir(args.source_dir)): + if speaker not in spk_dict.keys(): + spk_dict[speaker] = spk_id + spk_id += 1 + wavs = [os.path.join(args.source_dir, speaker, i)for i in os.listdir(os.path.join(args.source_dir, speaker))] + wavs = [i for i in wavs if i.endswith("wav")] + shuffle(wavs) + train += wavs[2:-10] + val += wavs[:2] + test += wavs[-10:] + + assert previous_config["model"]["n_speakers"] > len(spk_dict.keys()) + shuffle(train) + shuffle(val) + shuffle(test) + + print("Writing", args.train_list) + with open(args.train_list, "w") as f: + for fname in tqdm(train): + wavpath = fname + f.write(wavpath + "\n") + + print("Writing", args.val_list) + with open(args.val_list, "w") as f: + for fname in tqdm(val): + wavpath = fname + f.write(wavpath + "\n") + + print("Writing", args.test_list) + with open(args.test_list, "w") as f: + for fname in tqdm(test): + wavpath = fname + f.write(wavpath + "\n") + + previous_config["spk"] = spk_dict + + print("Writing configs/config.json") + with open("configs/config.json", "w") as f: + json.dump(previous_config, f, indent=2) diff --git a/AutoCoverTool/ref/so_vits_svc/attentions.py b/AutoCoverTool/ref/so_vits_svc/attentions.py new file mode 100644 index 0000000..4e0b0c1 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/attentions.py @@ -0,0 +1,303 @@ +import copy +import math +import numpy as np +import torch +from torch import nn +from torch.nn import functional as F + +import commons +import modules +from modules import LayerNorm + + +class Encoder(nn.Module): + def __init__(self, hidden_channels, filter_channels, n_heads, n_layers, kernel_size=1, p_dropout=0., 
window_size=4, **kwargs): + super().__init__() + self.hidden_channels = hidden_channels + self.filter_channels = filter_channels + self.n_heads = n_heads + self.n_layers = n_layers + self.kernel_size = kernel_size + self.p_dropout = p_dropout + self.window_size = window_size + + self.drop = nn.Dropout(p_dropout) + self.attn_layers = nn.ModuleList() + self.norm_layers_1 = nn.ModuleList() + self.ffn_layers = nn.ModuleList() + self.norm_layers_2 = nn.ModuleList() + for i in range(self.n_layers): + self.attn_layers.append(MultiHeadAttention(hidden_channels, hidden_channels, n_heads, p_dropout=p_dropout, window_size=window_size)) + self.norm_layers_1.append(LayerNorm(hidden_channels)) + self.ffn_layers.append(FFN(hidden_channels, hidden_channels, filter_channels, kernel_size, p_dropout=p_dropout)) + self.norm_layers_2.append(LayerNorm(hidden_channels)) + + def forward(self, x, x_mask): + attn_mask = x_mask.unsqueeze(2) * x_mask.unsqueeze(-1) + x = x * x_mask + for i in range(self.n_layers): + y = self.attn_layers[i](x, x, attn_mask) + y = self.drop(y) + x = self.norm_layers_1[i](x + y) + + y = self.ffn_layers[i](x, x_mask) + y = self.drop(y) + x = self.norm_layers_2[i](x + y) + x = x * x_mask + return x + + +class Decoder(nn.Module): + def __init__(self, hidden_channels, filter_channels, n_heads, n_layers, kernel_size=1, p_dropout=0., proximal_bias=False, proximal_init=True, **kwargs): + super().__init__() + self.hidden_channels = hidden_channels + self.filter_channels = filter_channels + self.n_heads = n_heads + self.n_layers = n_layers + self.kernel_size = kernel_size + self.p_dropout = p_dropout + self.proximal_bias = proximal_bias + self.proximal_init = proximal_init + + self.drop = nn.Dropout(p_dropout) + self.self_attn_layers = nn.ModuleList() + self.norm_layers_0 = nn.ModuleList() + self.encdec_attn_layers = nn.ModuleList() + self.norm_layers_1 = nn.ModuleList() + self.ffn_layers = nn.ModuleList() + self.norm_layers_2 = nn.ModuleList() + for i in range(self.n_layers): + self.self_attn_layers.append(MultiHeadAttention(hidden_channels, hidden_channels, n_heads, p_dropout=p_dropout, proximal_bias=proximal_bias, proximal_init=proximal_init)) + self.norm_layers_0.append(LayerNorm(hidden_channels)) + self.encdec_attn_layers.append(MultiHeadAttention(hidden_channels, hidden_channels, n_heads, p_dropout=p_dropout)) + self.norm_layers_1.append(LayerNorm(hidden_channels)) + self.ffn_layers.append(FFN(hidden_channels, hidden_channels, filter_channels, kernel_size, p_dropout=p_dropout, causal=True)) + self.norm_layers_2.append(LayerNorm(hidden_channels)) + + def forward(self, x, x_mask, h, h_mask): + """ + x: decoder input + h: encoder output + """ + self_attn_mask = commons.subsequent_mask(x_mask.size(2)).to(device=x.device, dtype=x.dtype) + encdec_attn_mask = h_mask.unsqueeze(2) * x_mask.unsqueeze(-1) + x = x * x_mask + for i in range(self.n_layers): + y = self.self_attn_layers[i](x, x, self_attn_mask) + y = self.drop(y) + x = self.norm_layers_0[i](x + y) + + y = self.encdec_attn_layers[i](x, h, encdec_attn_mask) + y = self.drop(y) + x = self.norm_layers_1[i](x + y) + + y = self.ffn_layers[i](x, x_mask) + y = self.drop(y) + x = self.norm_layers_2[i](x + y) + x = x * x_mask + return x + + +class MultiHeadAttention(nn.Module): + def __init__(self, channels, out_channels, n_heads, p_dropout=0., window_size=None, heads_share=True, block_length=None, proximal_bias=False, proximal_init=False): + super().__init__() + assert channels % n_heads == 0 + + self.channels = channels + self.out_channels = 
out_channels + self.n_heads = n_heads + self.p_dropout = p_dropout + self.window_size = window_size + self.heads_share = heads_share + self.block_length = block_length + self.proximal_bias = proximal_bias + self.proximal_init = proximal_init + self.attn = None + + self.k_channels = channels // n_heads + self.conv_q = nn.Conv1d(channels, channels, 1) + self.conv_k = nn.Conv1d(channels, channels, 1) + self.conv_v = nn.Conv1d(channels, channels, 1) + self.conv_o = nn.Conv1d(channels, out_channels, 1) + self.drop = nn.Dropout(p_dropout) + + if window_size is not None: + n_heads_rel = 1 if heads_share else n_heads + rel_stddev = self.k_channels**-0.5 + self.emb_rel_k = nn.Parameter(torch.randn(n_heads_rel, window_size * 2 + 1, self.k_channels) * rel_stddev) + self.emb_rel_v = nn.Parameter(torch.randn(n_heads_rel, window_size * 2 + 1, self.k_channels) * rel_stddev) + + nn.init.xavier_uniform_(self.conv_q.weight) + nn.init.xavier_uniform_(self.conv_k.weight) + nn.init.xavier_uniform_(self.conv_v.weight) + if proximal_init: + with torch.no_grad(): + self.conv_k.weight.copy_(self.conv_q.weight) + self.conv_k.bias.copy_(self.conv_q.bias) + + def forward(self, x, c, attn_mask=None): + q = self.conv_q(x) + k = self.conv_k(c) + v = self.conv_v(c) + + x, self.attn = self.attention(q, k, v, mask=attn_mask) + + x = self.conv_o(x) + return x + + def attention(self, query, key, value, mask=None): + # reshape [b, d, t] -> [b, n_h, t, d_k] + b, d, t_s, t_t = (*key.size(), query.size(2)) + query = query.view(b, self.n_heads, self.k_channels, t_t).transpose(2, 3) + key = key.view(b, self.n_heads, self.k_channels, t_s).transpose(2, 3) + value = value.view(b, self.n_heads, self.k_channels, t_s).transpose(2, 3) + + scores = torch.matmul(query / math.sqrt(self.k_channels), key.transpose(-2, -1)) + if self.window_size is not None: + assert t_s == t_t, "Relative attention is only available for self-attention." + key_relative_embeddings = self._get_relative_embeddings(self.emb_rel_k, t_s) + rel_logits = self._matmul_with_relative_keys(query /math.sqrt(self.k_channels), key_relative_embeddings) + scores_local = self._relative_position_to_absolute_position(rel_logits) + scores = scores + scores_local + if self.proximal_bias: + assert t_s == t_t, "Proximal bias is only available for self-attention." + scores = scores + self._attention_bias_proximal(t_s).to(device=scores.device, dtype=scores.dtype) + if mask is not None: + scores = scores.masked_fill(mask == 0, -1e4) + if self.block_length is not None: + assert t_s == t_t, "Local attention is only available for self-attention." 
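+            # Local attention: build a banded mask that keeps only positions within block_length of the diagonal, and mask out everything else before the softmax.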
+ block_mask = torch.ones_like(scores).triu(-self.block_length).tril(self.block_length) + scores = scores.masked_fill(block_mask == 0, -1e4) + p_attn = F.softmax(scores, dim=-1) # [b, n_h, t_t, t_s] + p_attn = self.drop(p_attn) + output = torch.matmul(p_attn, value) + if self.window_size is not None: + relative_weights = self._absolute_position_to_relative_position(p_attn) + value_relative_embeddings = self._get_relative_embeddings(self.emb_rel_v, t_s) + output = output + self._matmul_with_relative_values(relative_weights, value_relative_embeddings) + output = output.transpose(2, 3).contiguous().view(b, d, t_t) # [b, n_h, t_t, d_k] -> [b, d, t_t] + return output, p_attn + + def _matmul_with_relative_values(self, x, y): + """ + x: [b, h, l, m] + y: [h or 1, m, d] + ret: [b, h, l, d] + """ + ret = torch.matmul(x, y.unsqueeze(0)) + return ret + + def _matmul_with_relative_keys(self, x, y): + """ + x: [b, h, l, d] + y: [h or 1, m, d] + ret: [b, h, l, m] + """ + ret = torch.matmul(x, y.unsqueeze(0).transpose(-2, -1)) + return ret + + def _get_relative_embeddings(self, relative_embeddings, length): + max_relative_position = 2 * self.window_size + 1 + # Pad first before slice to avoid using cond ops. + pad_length = max(length - (self.window_size + 1), 0) + slice_start_position = max((self.window_size + 1) - length, 0) + slice_end_position = slice_start_position + 2 * length - 1 + if pad_length > 0: + padded_relative_embeddings = F.pad( + relative_embeddings, + commons.convert_pad_shape([[0, 0], [pad_length, pad_length], [0, 0]])) + else: + padded_relative_embeddings = relative_embeddings + used_relative_embeddings = padded_relative_embeddings[:,slice_start_position:slice_end_position] + return used_relative_embeddings + + def _relative_position_to_absolute_position(self, x): + """ + x: [b, h, l, 2*l-1] + ret: [b, h, l, l] + """ + batch, heads, length, _ = x.size() + # Concat columns of pad to shift from relative to absolute indexing. + x = F.pad(x, commons.convert_pad_shape([[0,0],[0,0],[0,0],[0,1]])) + + # Concat extra elements so to add up to shape (len+1, 2*len-1). + x_flat = x.view([batch, heads, length * 2 * length]) + x_flat = F.pad(x_flat, commons.convert_pad_shape([[0,0],[0,0],[0,length-1]])) + + # Reshape and slice out the padded elements. + x_final = x_flat.view([batch, heads, length+1, 2*length-1])[:, :, :length, length-1:] + return x_final + + def _absolute_position_to_relative_position(self, x): + """ + x: [b, h, l, l] + ret: [b, h, l, 2*l-1] + """ + batch, heads, length, _ = x.size() + # padd along column + x = F.pad(x, commons.convert_pad_shape([[0, 0], [0, 0], [0, 0], [0, length-1]])) + x_flat = x.view([batch, heads, length**2 + length*(length -1)]) + # add 0's in the beginning that will skew the elements after reshape + x_flat = F.pad(x_flat, commons.convert_pad_shape([[0, 0], [0, 0], [length, 0]])) + x_final = x_flat.view([batch, heads, length, 2*length])[:,:,:,1:] + return x_final + + def _attention_bias_proximal(self, length): + """Bias for self-attention to encourage attention to close positions. + Args: + length: an integer scalar. 
+ Returns: + a Tensor with shape [1, 1, length, length] + """ + r = torch.arange(length, dtype=torch.float32) + diff = torch.unsqueeze(r, 0) - torch.unsqueeze(r, 1) + return torch.unsqueeze(torch.unsqueeze(-torch.log1p(torch.abs(diff)), 0), 0) + + +class FFN(nn.Module): + def __init__(self, in_channels, out_channels, filter_channels, kernel_size, p_dropout=0., activation=None, causal=False): + super().__init__() + self.in_channels = in_channels + self.out_channels = out_channels + self.filter_channels = filter_channels + self.kernel_size = kernel_size + self.p_dropout = p_dropout + self.activation = activation + self.causal = causal + + if causal: + self.padding = self._causal_padding + else: + self.padding = self._same_padding + + self.conv_1 = nn.Conv1d(in_channels, filter_channels, kernel_size) + self.conv_2 = nn.Conv1d(filter_channels, out_channels, kernel_size) + self.drop = nn.Dropout(p_dropout) + + def forward(self, x, x_mask): + x = self.conv_1(self.padding(x * x_mask)) + if self.activation == "gelu": + x = x * torch.sigmoid(1.702 * x) + else: + x = torch.relu(x) + x = self.drop(x) + x = self.conv_2(self.padding(x * x_mask)) + return x * x_mask + + def _causal_padding(self, x): + if self.kernel_size == 1: + return x + pad_l = self.kernel_size - 1 + pad_r = 0 + padding = [[0, 0], [0, 0], [pad_l, pad_r]] + x = F.pad(x, commons.convert_pad_shape(padding)) + return x + + def _same_padding(self, x): + if self.kernel_size == 1: + return x + pad_l = (self.kernel_size - 1) // 2 + pad_r = self.kernel_size // 2 + padding = [[0, 0], [0, 0], [pad_l, pad_r]] + x = F.pad(x, commons.convert_pad_shape(padding)) + return x diff --git a/AutoCoverTool/ref/so_vits_svc/commons.py b/AutoCoverTool/ref/so_vits_svc/commons.py new file mode 100644 index 0000000..0748880 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/commons.py @@ -0,0 +1,188 @@ +import math +import numpy as np +import torch +from torch import nn +from torch.nn import functional as F + +def slice_pitch_segments(x, ids_str, segment_size=4): + ret = torch.zeros_like(x[:, :segment_size]) + for i in range(x.size(0)): + idx_str = ids_str[i] + idx_end = idx_str + segment_size + ret[i] = x[i, idx_str:idx_end] + return ret + +def rand_slice_segments_with_pitch(x, pitch, x_lengths=None, segment_size=4): + b, d, t = x.size() + if x_lengths is None: + x_lengths = t + ids_str_max = x_lengths - segment_size + 1 + ids_str = (torch.rand([b]).to(device=x.device) * ids_str_max).to(dtype=torch.long) + ret = slice_segments(x, ids_str, segment_size) + ret_pitch = slice_pitch_segments(pitch, ids_str, segment_size) + return ret, ret_pitch, ids_str + +def init_weights(m, mean=0.0, std=0.01): + classname = m.__class__.__name__ + if classname.find("Conv") != -1: + m.weight.data.normal_(mean, std) + + +def get_padding(kernel_size, dilation=1): + return int((kernel_size*dilation - dilation)/2) + + +def convert_pad_shape(pad_shape): + l = pad_shape[::-1] + pad_shape = [item for sublist in l for item in sublist] + return pad_shape + + +def intersperse(lst, item): + result = [item] * (len(lst) * 2 + 1) + result[1::2] = lst + return result + + +def kl_divergence(m_p, logs_p, m_q, logs_q): + """KL(P||Q)""" + kl = (logs_q - logs_p) - 0.5 + kl += 0.5 * (torch.exp(2. * logs_p) + ((m_p - m_q)**2)) * torch.exp(-2. 
* logs_q) + return kl + + +def rand_gumbel(shape): + """Sample from the Gumbel distribution, protect from overflows.""" + uniform_samples = torch.rand(shape) * 0.99998 + 0.00001 + return -torch.log(-torch.log(uniform_samples)) + + +def rand_gumbel_like(x): + g = rand_gumbel(x.size()).to(dtype=x.dtype, device=x.device) + return g + + +def slice_segments(x, ids_str, segment_size=4): + ret = torch.zeros_like(x[:, :, :segment_size]) + for i in range(x.size(0)): + idx_str = ids_str[i] + idx_end = idx_str + segment_size + ret[i] = x[i, :, idx_str:idx_end] + return ret + + +def rand_slice_segments(x, x_lengths=None, segment_size=4): + b, d, t = x.size() + if x_lengths is None: + x_lengths = t + ids_str_max = x_lengths - segment_size + 1 + ids_str = (torch.rand([b]).to(device=x.device) * ids_str_max).to(dtype=torch.long) + ret = slice_segments(x, ids_str, segment_size) + return ret, ids_str + + +def rand_spec_segments(x, x_lengths=None, segment_size=4): + b, d, t = x.size() + if x_lengths is None: + x_lengths = t + ids_str_max = x_lengths - segment_size + ids_str = (torch.rand([b]).to(device=x.device) * ids_str_max).to(dtype=torch.long) + ret = slice_segments(x, ids_str, segment_size) + return ret, ids_str + + +def get_timing_signal_1d( + length, channels, min_timescale=1.0, max_timescale=1.0e4): + position = torch.arange(length, dtype=torch.float) + num_timescales = channels // 2 + log_timescale_increment = ( + math.log(float(max_timescale) / float(min_timescale)) / + (num_timescales - 1)) + inv_timescales = min_timescale * torch.exp( + torch.arange(num_timescales, dtype=torch.float) * -log_timescale_increment) + scaled_time = position.unsqueeze(0) * inv_timescales.unsqueeze(1) + signal = torch.cat([torch.sin(scaled_time), torch.cos(scaled_time)], 0) + signal = F.pad(signal, [0, 0, 0, channels % 2]) + signal = signal.view(1, channels, length) + return signal + + +def add_timing_signal_1d(x, min_timescale=1.0, max_timescale=1.0e4): + b, channels, length = x.size() + signal = get_timing_signal_1d(length, channels, min_timescale, max_timescale) + return x + signal.to(dtype=x.dtype, device=x.device) + + +def cat_timing_signal_1d(x, min_timescale=1.0, max_timescale=1.0e4, axis=1): + b, channels, length = x.size() + signal = get_timing_signal_1d(length, channels, min_timescale, max_timescale) + return torch.cat([x, signal.to(dtype=x.dtype, device=x.device)], axis) + + +def subsequent_mask(length): + mask = torch.tril(torch.ones(length, length)).unsqueeze(0).unsqueeze(0) + return mask + + +@torch.jit.script +def fused_add_tanh_sigmoid_multiply(input_a, input_b, n_channels): + n_channels_int = n_channels[0] + in_act = input_a + input_b + t_act = torch.tanh(in_act[:, :n_channels_int, :]) + s_act = torch.sigmoid(in_act[:, n_channels_int:, :]) + acts = t_act * s_act + return acts + + +def convert_pad_shape(pad_shape): + l = pad_shape[::-1] + pad_shape = [item for sublist in l for item in sublist] + return pad_shape + + +def shift_1d(x): + x = F.pad(x, convert_pad_shape([[0, 0], [0, 0], [1, 0]]))[:, :, :-1] + return x + + +def sequence_mask(length, max_length=None): + if max_length is None: + max_length = length.max() + x = torch.arange(max_length, dtype=length.dtype, device=length.device) + return x.unsqueeze(0) < length.unsqueeze(1) + + +def generate_path(duration, mask): + """ + duration: [b, 1, t_x] + mask: [b, 1, t_y, t_x] + """ + device = duration.device + + b, _, t_y, t_x = mask.shape + cum_duration = torch.cumsum(duration, -1) + + cum_duration_flat = cum_duration.view(b * t_x) + path = 
sequence_mask(cum_duration_flat, t_y).to(mask.dtype) + path = path.view(b, t_x, t_y) + path = path - F.pad(path, convert_pad_shape([[0, 0], [1, 0], [0, 0]]))[:, :-1] + path = path.unsqueeze(1).transpose(2,3) * mask + return path + + +def clip_grad_value_(parameters, clip_value, norm_type=2): + if isinstance(parameters, torch.Tensor): + parameters = [parameters] + parameters = list(filter(lambda p: p.grad is not None, parameters)) + norm_type = float(norm_type) + if clip_value is not None: + clip_value = float(clip_value) + + total_norm = 0 + for p in parameters: + param_norm = p.grad.data.norm(norm_type) + total_norm += param_norm.item() ** norm_type + if clip_value is not None: + p.grad.data.clamp_(min=-clip_value, max=clip_value) + total_norm = total_norm ** (1. / norm_type) + return total_norm diff --git a/AutoCoverTool/ref/so_vits_svc/configs/config.json b/AutoCoverTool/ref/so_vits_svc/configs/config.json new file mode 100644 index 0000000..13a503c --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/configs/config.json @@ -0,0 +1 @@ +请使用生成的config文件 \ No newline at end of file diff --git a/AutoCoverTool/ref/so_vits_svc/data_utils.py b/AutoCoverTool/ref/so_vits_svc/data_utils.py new file mode 100644 index 0000000..1f5d4e2 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/data_utils.py @@ -0,0 +1,154 @@ +import time +import os +import random +import numpy as np +import torch +import torch.utils.data + +import commons +from mel_processing import spectrogram_torch, spec_to_mel_torch +from utils import load_wav_to_torch, load_filepaths_and_text, transform + +# import h5py + + +"""Multi speaker version""" + + +class TextAudioSpeakerLoader(torch.utils.data.Dataset): + """ + 1) loads audio, speaker_id, text pairs + 2) normalizes text and converts them to sequences of integers + 3) computes spectrograms from audio files. 
+ """ + + def __init__(self, audiopaths, hparams): + self.audiopaths = load_filepaths_and_text(audiopaths) + self.max_wav_value = hparams.data.max_wav_value + self.sampling_rate = hparams.data.sampling_rate + self.filter_length = hparams.data.filter_length + self.hop_length = hparams.data.hop_length + self.win_length = hparams.data.win_length + self.sampling_rate = hparams.data.sampling_rate + self.use_sr = hparams.train.use_sr + self.spec_len = hparams.train.max_speclen + self.spk_map = hparams.spk + + random.seed(1234) + random.shuffle(self.audiopaths) + + def get_audio(self, filename): + filename = filename.replace("\\", "/") + audio, sampling_rate = load_wav_to_torch(filename) + if sampling_rate != self.sampling_rate: + raise ValueError("{} SR doesn't match target {} SR".format( + sampling_rate, self.sampling_rate)) + audio_norm = audio / self.max_wav_value + audio_norm = audio_norm.unsqueeze(0) + spec_filename = filename.replace(".wav", ".spec.pt") + if os.path.exists(spec_filename): + spec = torch.load(spec_filename) + else: + spec = spectrogram_torch(audio_norm, self.filter_length, + self.sampling_rate, self.hop_length, self.win_length, + center=False) + spec = torch.squeeze(spec, 0) + torch.save(spec, spec_filename) + + spk = filename.split("/")[-2] + spk = torch.LongTensor([self.spk_map[spk]]) + + c = torch.load(filename + ".soft.pt").squeeze(0) + c = torch.repeat_interleave(c, repeats=2, dim=1) + + f0 = np.load(filename + ".f0.npy") + f0 = torch.FloatTensor(f0) + lmin = min(c.size(-1), spec.size(-1), f0.shape[0]) + assert abs(c.size(-1) - spec.size(-1)) < 4, (c.size(-1), spec.size(-1), f0.shape, filename) + assert abs(lmin - spec.size(-1)) < 4, (c.size(-1), spec.size(-1), f0.shape) + assert abs(lmin - c.size(-1)) < 4, (c.size(-1), spec.size(-1), f0.shape) + spec, c, f0 = spec[:, :lmin], c[:, :lmin], f0[:lmin] + audio_norm = audio_norm[:, :lmin * self.hop_length] + _spec, _c, _audio_norm, _f0 = spec, c, audio_norm, f0 + while spec.size(-1) < self.spec_len: + spec = torch.cat((spec, _spec), -1) + c = torch.cat((c, _c), -1) + f0 = torch.cat((f0, _f0), -1) + audio_norm = torch.cat((audio_norm, _audio_norm), -1) + start = random.randint(0, spec.size(-1) - self.spec_len) + end = start + self.spec_len + spec = spec[:, start:end] + c = c[:, start:end] + f0 = f0[start:end] + audio_norm = audio_norm[:, start * self.hop_length:end * self.hop_length] + + return c, f0, spec, audio_norm, spk + + def __getitem__(self, index): + return self.get_audio(self.audiopaths[index][0]) + + def __len__(self): + return len(self.audiopaths) + + +class EvalDataLoader(torch.utils.data.Dataset): + """ + 1) loads audio, speaker_id, text pairs + 2) normalizes text and converts them to sequences of integers + 3) computes spectrograms from audio files. 
+ """ + + def __init__(self, audiopaths, hparams): + self.audiopaths = load_filepaths_and_text(audiopaths) + self.max_wav_value = hparams.data.max_wav_value + self.sampling_rate = hparams.data.sampling_rate + self.filter_length = hparams.data.filter_length + self.hop_length = hparams.data.hop_length + self.win_length = hparams.data.win_length + self.sampling_rate = hparams.data.sampling_rate + self.use_sr = hparams.train.use_sr + self.audiopaths = self.audiopaths[:5] + self.spk_map = hparams.spk + + + def get_audio(self, filename): + filename = filename.replace("\\", "/") + audio, sampling_rate = load_wav_to_torch(filename) + if sampling_rate != self.sampling_rate: + raise ValueError("{} SR doesn't match target {} SR".format( + sampling_rate, self.sampling_rate)) + audio_norm = audio / self.max_wav_value + audio_norm = audio_norm.unsqueeze(0) + spec_filename = filename.replace(".wav", ".spec.pt") + if os.path.exists(spec_filename): + spec = torch.load(spec_filename) + else: + spec = spectrogram_torch(audio_norm, self.filter_length, + self.sampling_rate, self.hop_length, self.win_length, + center=False) + spec = torch.squeeze(spec, 0) + torch.save(spec, spec_filename) + + spk = filename.split("/")[-2] + spk = torch.LongTensor([self.spk_map[spk]]) + + c = torch.load(filename + ".soft.pt").squeeze(0) + + c = torch.repeat_interleave(c, repeats=2, dim=1) + + f0 = np.load(filename + ".f0.npy") + f0 = torch.FloatTensor(f0) + lmin = min(c.size(-1), spec.size(-1), f0.shape[0]) + assert abs(c.size(-1) - spec.size(-1)) < 4, (c.size(-1), spec.size(-1), f0.shape) + assert abs(f0.shape[0] - spec.shape[-1]) < 4, (c.size(-1), spec.size(-1), f0.shape) + spec, c, f0 = spec[:, :lmin], c[:, :lmin], f0[:lmin] + audio_norm = audio_norm[:, :lmin * self.hop_length] + + return c, f0, spec, audio_norm, spk + + def __getitem__(self, index): + return self.get_audio(self.audiopaths[index][0]) + + def __len__(self): + return len(self.audiopaths) + diff --git a/AutoCoverTool/ref/so_vits_svc/filelists/test.txt b/AutoCoverTool/ref/so_vits_svc/filelists/test.txt new file mode 100644 index 0000000..5246bc4 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/filelists/test.txt @@ -0,0 +1,7 @@ +./dataset/32k/yunhao/001829.wav +./dataset/32k/yunhao/001827.wav +./dataset/32k/jishuang/000104.wav +./dataset/32k/nen/kne110_005.wav +./dataset/32k/nen/kne110_004.wav +./dataset/32k/jishuang/000223.wav +./dataset/32k/yunhao/001828.wav diff --git a/AutoCoverTool/ref/so_vits_svc/filelists/train.txt b/AutoCoverTool/ref/so_vits_svc/filelists/train.txt new file mode 100644 index 0000000..e69de29 diff --git a/AutoCoverTool/ref/so_vits_svc/filelists/val.txt b/AutoCoverTool/ref/so_vits_svc/filelists/val.txt new file mode 100644 index 0000000..40d9d47 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/filelists/val.txt @@ -0,0 +1,6 @@ +./dataset/32k/nen/kne110_005.wav +./dataset/32k/yunhao/001827.wav +./dataset/32k/jishuang/000104.wav +./dataset/32k/jishuang/000223.wav +./dataset/32k/nen/kne110_004.wav +./dataset/32k/yunhao/001828.wav diff --git a/AutoCoverTool/ref/so_vits_svc/flask_api.py b/AutoCoverTool/ref/so_vits_svc/flask_api.py new file mode 100644 index 0000000..8cc236a --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/flask_api.py @@ -0,0 +1,56 @@ +import io +import logging + +import soundfile +import torch +import torchaudio +from flask import Flask, request, send_file +from flask_cors import CORS + +from inference.infer_tool import Svc, RealTimeVC + +app = Flask(__name__) + +CORS(app) + 
+logging.getLogger('numba').setLevel(logging.WARNING)
+
+
+@app.route("/voiceChangeModel", methods=["POST"])
+def voice_change_model():
+    request_form = request.form
+    wave_file = request.files.get("sample", None)
+    # pitch-shift amount in semitones
+    f_pitch_change = float(request_form.get("fPitchChange", 0))
+    # sample rate expected by the DAW
+    daw_sample = int(float(request_form.get("sampleRate", 0)))
+    speaker_id = int(float(request_form.get("sSpeakId", 0)))
+    # read the wav file out of the http request
+    input_wav_path = io.BytesIO(wave_file.read())
+
+    # model inference
+    if raw_infer:
+        out_audio, out_sr = svc_model.infer(speaker_id, f_pitch_change, input_wav_path)
+        tar_audio = torchaudio.functional.resample(out_audio, svc_model.target_sample, daw_sample)
+    else:
+        out_audio = svc.process(svc_model, speaker_id, f_pitch_change, input_wav_path)
+        tar_audio = torchaudio.functional.resample(torch.from_numpy(out_audio), svc_model.target_sample, daw_sample)
+    # return the audio
+    out_wav_path = io.BytesIO()
+    soundfile.write(out_wav_path, tar_audio.cpu().numpy(), daw_sample, format="wav")
+    out_wav_path.seek(0)
+    return send_file(out_wav_path, download_name="temp.wav", as_attachment=True)
+
+
+if __name__ == '__main__':
+    # True: synthesize each slice directly; False: cross-fade between slices.
+    # Setting the VST plugin slice length to 0.3-0.5s lowers latency, but direct
+    # slicing can pop at the seams, while cross-fading slightly overlaps the audio.
+    # Pick whichever trade-off is acceptable, or raise the VST max slice length to
+    # 1s and keep this set to True for higher latency but more stable quality.
+    raw_infer = True
+    # each model corresponds to exactly one config file
+    model_name = "logs/32k/G_174000-Copy1.pth"
+    config_name = "configs/config.json"
+    svc_model = Svc(model_name, config_name)
+    svc = RealTimeVC()
+    # this port matches the VST plugin; changing it is not recommended
+    app.run(port=6842, host="0.0.0.0", debug=False, threaded=False)
diff --git a/AutoCoverTool/ref/so_vits_svc/hubert/__init__.py b/AutoCoverTool/ref/so_vits_svc/hubert/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/AutoCoverTool/ref/so_vits_svc/hubert/hubert_model.py b/AutoCoverTool/ref/so_vits_svc/hubert/hubert_model.py
new file mode 100644
index 0000000..7fb642d
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/hubert/hubert_model.py
@@ -0,0 +1,222 @@
+import copy
+import random
+from typing import Optional, Tuple
+
+import torch
+import torch.nn as nn
+import torch.nn.functional as t_func
+from torch.nn.modules.utils import consume_prefix_in_state_dict_if_present
+
+
+class Hubert(nn.Module):
+    def __init__(self, num_label_embeddings: int = 100, mask: bool = True):
+        super().__init__()
+        self._mask = mask
+        self.feature_extractor = FeatureExtractor()
+        self.feature_projection = FeatureProjection()
+        self.positional_embedding = PositionalConvEmbedding()
+        self.norm = nn.LayerNorm(768)
+        self.dropout = nn.Dropout(0.1)
+        self.encoder = TransformerEncoder(
+            nn.TransformerEncoderLayer(
+                768, 12, 3072, activation="gelu", batch_first=True
+            ),
+            12,
+        )
+        self.proj = nn.Linear(768, 256)
+
+        self.masked_spec_embed = nn.Parameter(torch.FloatTensor(768).uniform_())
+        self.label_embedding = nn.Embedding(num_label_embeddings, 256)
+
+    def mask(self, x: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor]:
+        mask = None
+        if self.training and self._mask:
+            mask = _compute_mask((x.size(0), x.size(1)), 0.8, 10, x.device, 2)
+            x[mask] = self.masked_spec_embed.to(x.dtype)
+        return x, mask
+
+    def encode(
+        self, x: torch.Tensor, layer: Optional[int] = None
+    ) -> Tuple[torch.Tensor, torch.Tensor]:
+        x = self.feature_extractor(x)
+        x = self.feature_projection(x.transpose(1, 2))
+        x, mask = self.mask(x)
+        x = x + self.positional_embedding(x)
+        x = self.dropout(self.norm(x))
+        x = self.encoder(x, output_layer=layer)
+        return x, mask
+
+    def logits(self, x: torch.Tensor) -> torch.Tensor:
+        logits = torch.cosine_similarity(
x.unsqueeze(2), + self.label_embedding.weight.unsqueeze(0).unsqueeze(0), + dim=-1, + ) + return logits / 0.1 + + def forward(self, x: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor]: + x, mask = self.encode(x) + x = self.proj(x) + logits = self.logits(x) + return logits, mask + + +class HubertSoft(Hubert): + def __init__(self): + super().__init__() + + @torch.inference_mode() + def units(self, wav: torch.Tensor) -> torch.Tensor: + wav = t_func.pad(wav, ((400 - 320) // 2, (400 - 320) // 2)) + x, _ = self.encode(wav) + return self.proj(x) + + +class FeatureExtractor(nn.Module): + def __init__(self): + super().__init__() + self.conv0 = nn.Conv1d(1, 512, 10, 5, bias=False) + self.norm0 = nn.GroupNorm(512, 512) + self.conv1 = nn.Conv1d(512, 512, 3, 2, bias=False) + self.conv2 = nn.Conv1d(512, 512, 3, 2, bias=False) + self.conv3 = nn.Conv1d(512, 512, 3, 2, bias=False) + self.conv4 = nn.Conv1d(512, 512, 3, 2, bias=False) + self.conv5 = nn.Conv1d(512, 512, 2, 2, bias=False) + self.conv6 = nn.Conv1d(512, 512, 2, 2, bias=False) + + def forward(self, x: torch.Tensor) -> torch.Tensor: + x = t_func.gelu(self.norm0(self.conv0(x))) + x = t_func.gelu(self.conv1(x)) + x = t_func.gelu(self.conv2(x)) + x = t_func.gelu(self.conv3(x)) + x = t_func.gelu(self.conv4(x)) + x = t_func.gelu(self.conv5(x)) + x = t_func.gelu(self.conv6(x)) + return x + + +class FeatureProjection(nn.Module): + def __init__(self): + super().__init__() + self.norm = nn.LayerNorm(512) + self.projection = nn.Linear(512, 768) + self.dropout = nn.Dropout(0.1) + + def forward(self, x: torch.Tensor) -> torch.Tensor: + x = self.norm(x) + x = self.projection(x) + x = self.dropout(x) + return x + + +class PositionalConvEmbedding(nn.Module): + def __init__(self): + super().__init__() + self.conv = nn.Conv1d( + 768, + 768, + kernel_size=128, + padding=128 // 2, + groups=16, + ) + self.conv = nn.utils.weight_norm(self.conv, name="weight", dim=2) + + def forward(self, x: torch.Tensor) -> torch.Tensor: + x = self.conv(x.transpose(1, 2)) + x = t_func.gelu(x[:, :, :-1]) + return x.transpose(1, 2) + + +class TransformerEncoder(nn.Module): + def __init__( + self, encoder_layer: nn.TransformerEncoderLayer, num_layers: int + ) -> None: + super(TransformerEncoder, self).__init__() + self.layers = nn.ModuleList( + [copy.deepcopy(encoder_layer) for _ in range(num_layers)] + ) + self.num_layers = num_layers + + def forward( + self, + src: torch.Tensor, + mask: torch.Tensor = None, + src_key_padding_mask: torch.Tensor = None, + output_layer: Optional[int] = None, + ) -> torch.Tensor: + output = src + for layer in self.layers[:output_layer]: + output = layer( + output, src_mask=mask, src_key_padding_mask=src_key_padding_mask + ) + return output + + +def _compute_mask( + shape: Tuple[int, int], + mask_prob: float, + mask_length: int, + device: torch.device, + min_masks: int = 0, +) -> torch.Tensor: + batch_size, sequence_length = shape + + if mask_length < 1: + raise ValueError("`mask_length` has to be bigger than 0.") + + if mask_length > sequence_length: + raise ValueError( + f"`mask_length` has to be smaller than `sequence_length`, but got `mask_length`: {mask_length} and `sequence_length`: {sequence_length}`" + ) + + # compute number of masked spans in batch + num_masked_spans = int(mask_prob * sequence_length / mask_length + random.random()) + num_masked_spans = max(num_masked_spans, min_masks) + + # make sure num masked indices <= sequence_length + if num_masked_spans * mask_length > sequence_length: + num_masked_spans = sequence_length // mask_length + + 
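# Worked example (illustrative only): with mask_prob=0.8, mask_length=10 and
+    # sequence_length=400, num_masked_spans = int(0.8 * 400 / 10 + rand) = 32, so up
+    # to 32 * 10 = 320 of the 400 frames get masked (spans may overlap); the clamp
+    # above keeps the spans from running past the end of the sequence.
+    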
# SpecAugment mask to fill + mask = torch.zeros((batch_size, sequence_length), device=device, dtype=torch.bool) + + # uniform distribution to sample from, make sure that offset samples are < sequence_length + uniform_dist = torch.ones( + (batch_size, sequence_length - (mask_length - 1)), device=device + ) + + # get random indices to mask + mask_indices = torch.multinomial(uniform_dist, num_masked_spans) + + # expand masked indices to masked spans + mask_indices = ( + mask_indices.unsqueeze(dim=-1) + .expand((batch_size, num_masked_spans, mask_length)) + .reshape(batch_size, num_masked_spans * mask_length) + ) + offsets = ( + torch.arange(mask_length, device=device)[None, None, :] + .expand((batch_size, num_masked_spans, mask_length)) + .reshape(batch_size, num_masked_spans * mask_length) + ) + mask_idxs = mask_indices + offsets + + # scatter indices to mask + mask = mask.scatter(1, mask_idxs, True) + + return mask + + +def hubert_soft( + path: str, +) -> HubertSoft: + r"""HuBERT-Soft from `"A Comparison of Discrete and Soft Speech Units for Improved Voice Conversion"`. + Args: + path (str): path of a pretrained model + """ + hubert = HubertSoft() + checkpoint = torch.load(path) + consume_prefix_in_state_dict_if_present(checkpoint, "module.") + hubert.load_state_dict(checkpoint) + hubert.eval() + return hubert diff --git a/AutoCoverTool/ref/so_vits_svc/hubert/hubert_model_onnx.py b/AutoCoverTool/ref/so_vits_svc/hubert/hubert_model_onnx.py new file mode 100644 index 0000000..d18f3c2 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/hubert/hubert_model_onnx.py @@ -0,0 +1,217 @@ +import copy +import random +from typing import Optional, Tuple + +import torch +import torch.nn as nn +import torch.nn.functional as t_func +from torch.nn.modules.utils import consume_prefix_in_state_dict_if_present + + +class Hubert(nn.Module): + def __init__(self, num_label_embeddings: int = 100, mask: bool = True): + super().__init__() + self._mask = mask + self.feature_extractor = FeatureExtractor() + self.feature_projection = FeatureProjection() + self.positional_embedding = PositionalConvEmbedding() + self.norm = nn.LayerNorm(768) + self.dropout = nn.Dropout(0.1) + self.encoder = TransformerEncoder( + nn.TransformerEncoderLayer( + 768, 12, 3072, activation="gelu", batch_first=True + ), + 12, + ) + self.proj = nn.Linear(768, 256) + + self.masked_spec_embed = nn.Parameter(torch.FloatTensor(768).uniform_()) + self.label_embedding = nn.Embedding(num_label_embeddings, 256) + + def mask(self, x: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor]: + mask = None + if self.training and self._mask: + mask = _compute_mask((x.size(0), x.size(1)), 0.8, 10, x.device, 2) + x[mask] = self.masked_spec_embed.to(x.dtype) + return x, mask + + def encode( + self, x: torch.Tensor, layer: Optional[int] = None + ) -> Tuple[torch.Tensor, torch.Tensor]: + x = self.feature_extractor(x) + x = self.feature_projection(x.transpose(1, 2)) + x, mask = self.mask(x) + x = x + self.positional_embedding(x) + x = self.dropout(self.norm(x)) + x = self.encoder(x, output_layer=layer) + return x, mask + + def logits(self, x: torch.Tensor) -> torch.Tensor: + logits = torch.cosine_similarity( + x.unsqueeze(2), + self.label_embedding.weight.unsqueeze(0).unsqueeze(0), + dim=-1, + ) + return logits / 0.1 + + +class HubertSoft(Hubert): + def __init__(self): + super().__init__() + + def units(self, wav: torch.Tensor) -> torch.Tensor: + wav = t_func.pad(wav, ((400 - 320) // 2, (400 - 320) // 2)) + x, _ = self.encode(wav) + return self.proj(x) + + def 
forward(self, x): + return self.units(x) + +class FeatureExtractor(nn.Module): + def __init__(self): + super().__init__() + self.conv0 = nn.Conv1d(1, 512, 10, 5, bias=False) + self.norm0 = nn.GroupNorm(512, 512) + self.conv1 = nn.Conv1d(512, 512, 3, 2, bias=False) + self.conv2 = nn.Conv1d(512, 512, 3, 2, bias=False) + self.conv3 = nn.Conv1d(512, 512, 3, 2, bias=False) + self.conv4 = nn.Conv1d(512, 512, 3, 2, bias=False) + self.conv5 = nn.Conv1d(512, 512, 2, 2, bias=False) + self.conv6 = nn.Conv1d(512, 512, 2, 2, bias=False) + + def forward(self, x: torch.Tensor) -> torch.Tensor: + x = t_func.gelu(self.norm0(self.conv0(x))) + x = t_func.gelu(self.conv1(x)) + x = t_func.gelu(self.conv2(x)) + x = t_func.gelu(self.conv3(x)) + x = t_func.gelu(self.conv4(x)) + x = t_func.gelu(self.conv5(x)) + x = t_func.gelu(self.conv6(x)) + return x + + +class FeatureProjection(nn.Module): + def __init__(self): + super().__init__() + self.norm = nn.LayerNorm(512) + self.projection = nn.Linear(512, 768) + self.dropout = nn.Dropout(0.1) + + def forward(self, x: torch.Tensor) -> torch.Tensor: + x = self.norm(x) + x = self.projection(x) + x = self.dropout(x) + return x + + +class PositionalConvEmbedding(nn.Module): + def __init__(self): + super().__init__() + self.conv = nn.Conv1d( + 768, + 768, + kernel_size=128, + padding=128 // 2, + groups=16, + ) + self.conv = nn.utils.weight_norm(self.conv, name="weight", dim=2) + + def forward(self, x: torch.Tensor) -> torch.Tensor: + x = self.conv(x.transpose(1, 2)) + x = t_func.gelu(x[:, :, :-1]) + return x.transpose(1, 2) + + +class TransformerEncoder(nn.Module): + def __init__( + self, encoder_layer: nn.TransformerEncoderLayer, num_layers: int + ) -> None: + super(TransformerEncoder, self).__init__() + self.layers = nn.ModuleList( + [copy.deepcopy(encoder_layer) for _ in range(num_layers)] + ) + self.num_layers = num_layers + + def forward( + self, + src: torch.Tensor, + mask: torch.Tensor = None, + src_key_padding_mask: torch.Tensor = None, + output_layer: Optional[int] = None, + ) -> torch.Tensor: + output = src + for layer in self.layers[:output_layer]: + output = layer( + output, src_mask=mask, src_key_padding_mask=src_key_padding_mask + ) + return output + + +def _compute_mask( + shape: Tuple[int, int], + mask_prob: float, + mask_length: int, + device: torch.device, + min_masks: int = 0, +) -> torch.Tensor: + batch_size, sequence_length = shape + + if mask_length < 1: + raise ValueError("`mask_length` has to be bigger than 0.") + + if mask_length > sequence_length: + raise ValueError( + f"`mask_length` has to be smaller than `sequence_length`, but got `mask_length`: {mask_length} and `sequence_length`: {sequence_length}`" + ) + + # compute number of masked spans in batch + num_masked_spans = int(mask_prob * sequence_length / mask_length + random.random()) + num_masked_spans = max(num_masked_spans, min_masks) + + # make sure num masked indices <= sequence_length + if num_masked_spans * mask_length > sequence_length: + num_masked_spans = sequence_length // mask_length + + # SpecAugment mask to fill + mask = torch.zeros((batch_size, sequence_length), device=device, dtype=torch.bool) + + # uniform distribution to sample from, make sure that offset samples are < sequence_length + uniform_dist = torch.ones( + (batch_size, sequence_length - (mask_length - 1)), device=device + ) + + # get random indices to mask + mask_indices = torch.multinomial(uniform_dist, num_masked_spans) + + # expand masked indices to masked spans + mask_indices = ( + mask_indices.unsqueeze(dim=-1) + 
.expand((batch_size, num_masked_spans, mask_length))
+        .reshape(batch_size, num_masked_spans * mask_length)
+    )
+    offsets = (
+        torch.arange(mask_length, device=device)[None, None, :]
+        .expand((batch_size, num_masked_spans, mask_length))
+        .reshape(batch_size, num_masked_spans * mask_length)
+    )
+    mask_idxs = mask_indices + offsets
+
+    # scatter indices to mask
+    mask = mask.scatter(1, mask_idxs, True)
+
+    return mask
+
+
+def hubert_soft(
+    path: str,
+) -> HubertSoft:
+    r"""HuBERT-Soft from `"A Comparison of Discrete and Soft Speech Units for Improved Voice Conversion"`.
+    Args:
+        path (str): path of a pretrained model
+    """
+    hubert = HubertSoft()
+    checkpoint = torch.load(path)
+    consume_prefix_in_state_dict_if_present(checkpoint, "module.")
+    hubert.load_state_dict(checkpoint)
+    hubert.eval()
+    return hubert
diff --git a/AutoCoverTool/ref/so_vits_svc/hubert/put_hubert_ckpt_here b/AutoCoverTool/ref/so_vits_svc/hubert/put_hubert_ckpt_here
new file mode 100644
index 0000000..e69de29
diff --git a/AutoCoverTool/ref/so_vits_svc/inference/__init__.py b/AutoCoverTool/ref/so_vits_svc/inference/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/AutoCoverTool/ref/so_vits_svc/inference/infer_tool.py b/AutoCoverTool/ref/so_vits_svc/inference/infer_tool.py
new file mode 100644
index 0000000..2bfa86d
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/inference/infer_tool.py
@@ -0,0 +1,328 @@
+import hashlib
+import io
+import json
+import logging
+import os
+import time
+from pathlib import Path
+
+import librosa
+import maad
+import numpy as np
+# import onnxruntime
+import parselmouth
+import soundfile
+import torch
+import torchaudio
+
+from hubert import hubert_model
+import utils
+from models import SynthesizerTrn
+
+logging.getLogger('matplotlib').setLevel(logging.WARNING)
+
+
+def read_temp(file_name):
+    if not os.path.exists(file_name):
+        with open(file_name, "w") as f:
+            f.write(json.dumps({"info": "temp_dict"}))
+        return {}
+    else:
+        try:
+            with open(file_name, "r") as f:
+                data = f.read()
+            data_dict = json.loads(data)
+            if os.path.getsize(file_name) > 50 * 1024 * 1024:
+                f_name = file_name.replace("\\", "/").split("/")[-1]
+                print(f"clean {f_name}")
+                for wav_hash in list(data_dict.keys()):
+                    if int(time.time()) - int(data_dict[wav_hash]["time"]) > 14 * 24 * 3600:
+                        del data_dict[wav_hash]
+        except Exception as e:
+            print(e)
+            print(f"{file_name} error, auto rebuild file")
+            data_dict = {"info": "temp_dict"}
+        return data_dict
+
+
+def write_temp(file_name, data):
+    with open(file_name, "w") as f:
+        f.write(json.dumps(data))
+
+
+def timeit(func):
+    def run(*args, **kwargs):
+        t = time.time()
+        res = func(*args, **kwargs)
+        print('executing \'%s\' cost %.3fs' % (func.__name__, time.time() - t))
+        return res
+
+    return run
+
+
+def format_wav(audio_path):
+    if Path(audio_path).suffix == '.wav':
+        return
+    raw_audio, raw_sample_rate = librosa.load(audio_path, mono=True, sr=None)
+    soundfile.write(Path(audio_path).with_suffix(".wav"), raw_audio, raw_sample_rate)
+
+
+def get_end_file(dir_path, end):
+    file_lists = []
+    for root, dirs, files in os.walk(dir_path):
+        files = [f for f in files if f[0] != '.']
+        dirs[:] = [d for d in dirs if d[0] != '.']
+        for f_file in files:
+            if f_file.endswith(end):
+                file_lists.append(os.path.join(root, f_file).replace("\\", "/"))
+    return file_lists
+
+
+def get_md5(content):
+    return hashlib.new("md5", content).hexdigest()
+
+
+def resize2d_f0(x, target_len):
+    source = np.array(x)
+    source[source < 0.001] = np.nan
+    target = np.interp(np.arange(0, len(source) * target_len, len(source)) / target_len, np.arange(0, len(source)),
+                       source)
+    res = np.nan_to_num(target)
+    return res
+
+
+def get_f0(x, p_len, f0_up_key=0):
+    time_step = 160 / 16000 * 1000
+    f0_min = 50
+    f0_max = 1100
+    f0_mel_min = 1127 * np.log(1 + f0_min / 700)
+    f0_mel_max = 1127 * np.log(1 + f0_max / 700)
+
+    f0 = parselmouth.Sound(x, 16000).to_pitch_ac(
+        time_step=time_step / 1000, voicing_threshold=0.6,
+        pitch_floor=f0_min, pitch_ceiling=f0_max).selected_array['frequency']
+    if len(f0) > p_len:
+        f0 = f0[:p_len]
+    pad_size = (p_len - len(f0) + 1) // 2
+    if (pad_size > 0 or p_len - len(f0) - pad_size > 0):
+        f0 = np.pad(f0, [[pad_size, p_len - len(f0) - pad_size]], mode='constant')
+
+    f0 *= pow(2, f0_up_key / 12)
+    f0_mel = 1127 * np.log(1 + f0 / 700)
+    f0_mel[f0_mel > 0] = (f0_mel[f0_mel > 0] - f0_mel_min) * 254 / (f0_mel_max - f0_mel_min) + 1
+    f0_mel[f0_mel <= 1] = 1
+    f0_mel[f0_mel > 255] = 255
+    f0_coarse = np.rint(f0_mel).astype(int)
+    return f0_coarse, f0
+
+
+def clean_pitch(input_pitch):
+    num_nan = np.sum(input_pitch == 1)
+    if num_nan / len(input_pitch) > 0.9:
+        input_pitch[input_pitch != 1] = 1
+    return input_pitch
+
+
+def plt_pitch(input_pitch):
+    input_pitch = input_pitch.astype(float)
+    input_pitch[input_pitch == 1] = np.nan
+    return input_pitch
+
+
+def f0_to_pitch(ff):
+    f0_pitch = 69 + 12 * np.log2(ff / 440)
+    return f0_pitch
+
+
+def fill_a_to_b(a, b):
+    if len(a) < len(b):
+        for _ in range(0, len(b) - len(a)):
+            a.append(a[0])
+
+
+def mkdir(paths: list):
+    for path in paths:
+        if not os.path.exists(path):
+            os.mkdir(path)
+
+
+class Svc(object):
+    def __init__(self, net_g_path, config_path, hubert_path="data/models/hubert-soft-0d54a1f4.pt",
+                 onnx=False):
+        self.onnx = onnx
+        self.net_g_path = net_g_path
+        self.hubert_path = hubert_path
+        self.dev = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        self.net_g_ms = None
+        self.hps_ms = utils.get_hparams_from_file(config_path)
+        self.target_sample = self.hps_ms.data.sampling_rate
+        self.hop_size = self.hps_ms.data.hop_length
+        self.speakers = {}
+        for spk, sid in self.hps_ms.spk.items():
+            self.speakers[sid] = spk
+        self.spk2id = self.hps_ms.spk
+        # load the hubert model
+        self.hubert_soft = hubert_model.hubert_soft(hubert_path)
+        if torch.cuda.is_available():
+            self.hubert_soft = self.hubert_soft.cuda()
+        self.load_model()
+
+    def load_model(self):
+        # load the model config
+        if self.onnx:
+            raise NotImplementedError
+            # self.net_g_ms = SynthesizerTrnForONNX(
+            #     178,
+            #     self.hps_ms.data.filter_length // 2 + 1,
+            #     self.hps_ms.train.segment_size // self.hps_ms.data.hop_length,
+            #     n_speakers=self.hps_ms.data.n_speakers,
+            #     **self.hps_ms.model)
+            # _ = utils.load_checkpoint(self.net_g_path, self.net_g_ms, None)
+        else:
+            self.net_g_ms = SynthesizerTrn(
+                self.hps_ms.data.filter_length // 2 + 1,
+                self.hps_ms.train.segment_size // self.hps_ms.data.hop_length,
+                **self.hps_ms.model)
+            _ = utils.load_checkpoint(self.net_g_path, self.net_g_ms, None)
+        if "half" in self.net_g_path and torch.cuda.is_available():
+            _ = self.net_g_ms.half().eval().to(self.dev)
+        else:
+            _ = self.net_g_ms.eval().to(self.dev)
+
+    def get_units(self, source, sr):
+
+        source = source.unsqueeze(0).to(self.dev)
+        with torch.inference_mode():
+            start = time.time()
+            units = self.hubert_soft.units(source)
+            use_time = time.time() - start
+            print("hubert use time:{}".format(use_time))
+            return units
+
+    def get_unit_pitch(self, in_path, tran):
+        source, sr = torchaudio.load(in_path)
+        source = torchaudio.functional.resample(source, sr, 16000)
+        if len(source.shape) == 2 and source.shape[1] >= 2:
+            source = torch.mean(source, dim=0).unsqueeze(0)
+        soft = self.get_units(source, sr).squeeze(0).cpu().numpy()
+        f0_coarse, f0 = get_f0(source.cpu().numpy()[0], soft.shape[0] * 2, tran)
+        return soft, f0
+
+    def infer(self, speaker_id, tran, raw_path, dev=False):
+        if type(speaker_id) == str:
+            speaker_id = self.spk2id[speaker_id]
+        sid = torch.LongTensor([int(speaker_id)]).to(self.dev).unsqueeze(0)
+        soft, pitch = self.get_unit_pitch(raw_path, tran)
+        f0 = torch.FloatTensor(clean_pitch(pitch)).unsqueeze(0).to(self.dev)
+        if "half" in self.net_g_path and torch.cuda.is_available():
+            stn_tst = torch.HalfTensor(soft)
+        else:
+            stn_tst = torch.FloatTensor(soft)
+        with torch.no_grad():
+            x_tst = stn_tst.unsqueeze(0).to(self.dev)
+            start = time.time()
+            x_tst = torch.repeat_interleave(x_tst, repeats=2, dim=1).transpose(1, 2)
+            audio = self.net_g_ms.infer(x_tst, f0=f0, g=sid)[0, 0].data.float()
+            use_time = time.time() - start
+            print("vits use time:{}".format(use_time))
+        return audio, audio.shape[-1]
+
+
+# class SvcONNXInferModel(object):
+#     def __init__(self, hubert_onnx, vits_onnx, config_path):
+#         self.config_path = config_path
+#         self.vits_onnx = vits_onnx
+#         self.hubert_onnx = hubert_onnx
+#         self.hubert_onnx_session = onnxruntime.InferenceSession(hubert_onnx, providers=['CUDAExecutionProvider', ])
+#         self.inspect_onnx(self.hubert_onnx_session)
+#         self.vits_onnx_session = onnxruntime.InferenceSession(vits_onnx, providers=['CUDAExecutionProvider', ])
+#         self.inspect_onnx(self.vits_onnx_session)
+#         self.hps_ms = utils.get_hparams_from_file(self.config_path)
+#         self.target_sample = self.hps_ms.data.sampling_rate
+#         self.feature_input = FeatureInput(self.hps_ms.data.sampling_rate, self.hps_ms.data.hop_length)
+#
+#     @staticmethod
+#     def inspect_onnx(session):
+#         for i in session.get_inputs():
+#             print("name:{}\tshape:{}\tdtype:{}".format(i.name, i.shape, i.type))
+#         for i in session.get_outputs():
+#             print("name:{}\tshape:{}\tdtype:{}".format(i.name, i.shape, i.type))
+#
+#     def infer(self, speaker_id, tran, raw_path):
+#         sid = np.array([int(speaker_id)], dtype=np.int64)
+#         soft, pitch = self.get_unit_pitch(raw_path, tran)
+#         pitch = np.expand_dims(pitch, axis=0).astype(np.int64)
+#         stn_tst = soft
+#         x_tst = np.expand_dims(stn_tst, axis=0)
+#         x_tst_lengths = np.array([stn_tst.shape[0]], dtype=np.int64)
+#         # run inference with ONNX Runtime
+#         start = time.time()
+#         audio = self.vits_onnx_session.run(output_names=["audio"],
+#                                            input_feed={
+#                                                "hidden_unit": x_tst,
+#                                                "lengths": x_tst_lengths,
+#                                                "pitch": pitch,
+#                                                "sid": sid,
+#                                            })[0][0, 0]
+#         use_time = time.time() - start
+#         print("vits_onnx_session.run time:{}".format(use_time))
+#         audio = torch.from_numpy(audio)
+#         return audio, audio.shape[-1]
+#
+#     def get_units(self, source, sr):
+#         source = torchaudio.functional.resample(source, sr, 16000)
+#         if len(source.shape) == 2 and source.shape[1] >= 2:
+#             source = torch.mean(source, dim=0).unsqueeze(0)
+#         source = source.unsqueeze(0)
+#         # run inference with ONNX Runtime
+#         start = time.time()
+#         units = self.hubert_onnx_session.run(output_names=["embed"],
+#                                              input_feed={"source": source.numpy()})[0]
+#         use_time = time.time() - start
+#         print("hubert_onnx_session.run time:{}".format(use_time))
+#         return units
+#
+#     def transcribe(self, source, sr, length, transform):
+#         feature_pit = self.feature_input.compute_f0(source, sr)
+#         feature_pit = feature_pit * 2 ** (transform / 12)
+#         feature_pit = resize2d_f0(feature_pit, length)
+#         coarse_pit = self.feature_input.coarse_f0(feature_pit)
+#         return coarse_pit
+#
+#     def get_unit_pitch(self, in_path, tran):
+#         source, sr = torchaudio.load(in_path)
+#         soft = self.get_units(source, sr).squeeze(0)
+#         input_pitch = self.transcribe(source.numpy()[0], sr, soft.shape[0], tran)
+#         return soft, input_pitch
+
+
+class RealTimeVC:
+    def __init__(self):
+        self.last_chunk = None
+        self.last_o = None
+        self.chunk_len = 16000  # chunk length
+        self.pre_len = 3840  # cross-fade length, a multiple of 640
+
+    """Both input and output are 1-D numpy waveform arrays"""
+
+    def process(self, svc_model, speaker_id, f_pitch_change, input_wav_path):
+        audio, sr = torchaudio.load(input_wav_path)
+        audio = audio.cpu().numpy()[0]
+        temp_wav = io.BytesIO()
+        if self.last_chunk is None:
+            input_wav_path.seek(0)
+            audio, sr = svc_model.infer(speaker_id, f_pitch_change, input_wav_path)
+            audio = audio.cpu().numpy()
+            self.last_chunk = audio[-self.pre_len:]
+            self.last_o = audio
+            return audio[-self.chunk_len:]
+        else:
+            audio = np.concatenate([self.last_chunk, audio])
+            soundfile.write(temp_wav, audio, sr, format="wav")
+            temp_wav.seek(0)
+            audio, sr = svc_model.infer(speaker_id, f_pitch_change, temp_wav)
+            audio = audio.cpu().numpy()
+            ret = maad.util.crossfade(self.last_o, audio, self.pre_len)
+            self.last_chunk = audio[-self.pre_len:]
+            self.last_o = audio
+            return ret[self.chunk_len:2 * self.chunk_len]
diff --git a/AutoCoverTool/ref/so_vits_svc/inference/infer_tool_grad.py b/AutoCoverTool/ref/so_vits_svc/inference/infer_tool_grad.py
new file mode 100644
index 0000000..39359a8
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/inference/infer_tool_grad.py
@@ -0,0 +1,160 @@
+import hashlib
+import json
+import logging
+import os
+import time
+from pathlib import Path
+import io
+import librosa
+import maad
+import numpy as np
+from inference import slicer
+import parselmouth
+import soundfile
+import torch
+import torchaudio
+
+from hubert import hubert_model
+import utils
+from models import SynthesizerTrn
+logging.getLogger('numba').setLevel(logging.WARNING)
+logging.getLogger('matplotlib').setLevel(logging.WARNING)
+
+def resize2d_f0(x, target_len):
+    source = np.array(x)
+    source[source < 0.001] = np.nan
+    target = np.interp(np.arange(0, len(source) * target_len, len(source)) / target_len, np.arange(0, len(source)),
+                       source)
+    res = np.nan_to_num(target)
+    return res
+
+def get_f0(x, p_len,f0_up_key=0):
+
+    time_step = 160 / 16000 * 1000
+    f0_min = 50
+    f0_max = 1100
+    f0_mel_min = 1127 * np.log(1 + f0_min / 700)
+    f0_mel_max = 1127 * np.log(1 + f0_max / 700)
+
+    f0 = parselmouth.Sound(x, 16000).to_pitch_ac(
+        time_step=time_step / 1000, voicing_threshold=0.6,
+        pitch_floor=f0_min, pitch_ceiling=f0_max).selected_array['frequency']
+
+    pad_size=(p_len - len(f0) + 1) // 2
+    if(pad_size>0 or p_len - len(f0) - pad_size>0):
+        f0 = np.pad(f0,[[pad_size,p_len - len(f0) - pad_size]], mode='constant')
+
+    f0 *= pow(2, f0_up_key / 12)
+    f0_mel = 1127 * np.log(1 + f0 / 700)
+    f0_mel[f0_mel > 0] = (f0_mel[f0_mel > 0] - f0_mel_min) * 254 / (f0_mel_max - f0_mel_min) + 1
+    f0_mel[f0_mel <= 1] = 1
+    f0_mel[f0_mel > 255] = 255
+    f0_coarse = np.rint(f0_mel).astype(int)
+    return f0_coarse, f0
+
+def clean_pitch(input_pitch):
+    num_nan = np.sum(input_pitch == 1)
+    if num_nan / len(input_pitch) > 0.9:
+        input_pitch[input_pitch != 1] = 1
+    return input_pitch
+
+
+def plt_pitch(input_pitch):
+    input_pitch = input_pitch.astype(float)
+    input_pitch[input_pitch == 1] = np.nan
+    return input_pitch
+
+
+def f0_to_pitch(ff):
+    f0_pitch = 69 + 12 * np.log2(ff / 440)
+    return 
f0_pitch + + +def fill_a_to_b(a, b): + if len(a) < len(b): + for _ in range(0, len(b) - len(a)): + a.append(a[0]) + + +def mkdir(paths: list): + for path in paths: + if not os.path.exists(path): + os.mkdir(path) + + +class VitsSvc(object): + def __init__(self): + self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu") + self.SVCVITS = None + self.hps = None + self.speakers = None + self.hubert_soft = hubert_model.hubert_soft("hubert/model.pt") + + def set_device(self, device): + self.device = torch.device(device) + self.hubert_soft.to(self.device) + if self.SVCVITS != None: + self.SVCVITS.to(self.device) + + def loadCheckpoint(self, path): + self.hps = utils.get_hparams_from_file(f"checkpoints/{path}/config.json") + self.SVCVITS = SynthesizerTrn( + self.hps.data.filter_length // 2 + 1, + self.hps.train.segment_size // self.hps.data.hop_length, + **self.hps.model) + _ = utils.load_checkpoint(f"checkpoints/{path}/model.pth", self.SVCVITS, None) + _ = self.SVCVITS.eval().to(self.device) + self.speakers = self.hps.spk + + def get_units(self, source, sr): + source = source.unsqueeze(0).to(self.device) + with torch.inference_mode(): + units = self.hubert_soft.units(source) + return units + + + def get_unit_pitch(self, in_path, tran): + source, sr = torchaudio.load(in_path) + source = torchaudio.functional.resample(source, sr, 16000) + if len(source.shape) == 2 and source.shape[1] >= 2: + source = torch.mean(source, dim=0).unsqueeze(0) + soft = self.get_units(source, sr).squeeze(0).cpu().numpy() + f0_coarse, f0 = get_f0(source.cpu().numpy()[0], soft.shape[0]*2, tran) + return soft, f0 + + def infer(self, speaker_id, tran, raw_path): + speaker_id = self.speakers[speaker_id] + sid = torch.LongTensor([int(speaker_id)]).to(self.device).unsqueeze(0) + soft, pitch = self.get_unit_pitch(raw_path, tran) + f0 = torch.FloatTensor(clean_pitch(pitch)).unsqueeze(0).to(self.device) + stn_tst = torch.FloatTensor(soft) + with torch.no_grad(): + x_tst = stn_tst.unsqueeze(0).to(self.device) + x_tst = torch.repeat_interleave(x_tst, repeats=2, dim=1).transpose(1, 2) + audio = self.SVCVITS.infer(x_tst, f0=f0, g=sid)[0,0].data.float() + return audio, audio.shape[-1] + + def inference(self,srcaudio,chara,tran,slice_db): + sampling_rate, audio = srcaudio + audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32) + if len(audio.shape) > 1: + audio = librosa.to_mono(audio.transpose(1, 0)) + if sampling_rate != 16000: + audio = librosa.resample(audio, orig_sr=sampling_rate, target_sr=16000) + soundfile.write("tmpwav.wav", audio, 16000, format="wav") + chunks = slicer.cut("tmpwav.wav", db_thresh=slice_db) + audio_data, audio_sr = slicer.chunks2audio("tmpwav.wav", chunks) + audio = [] + for (slice_tag, data) in audio_data: + length = int(np.ceil(len(data) / audio_sr * self.hps.data.sampling_rate)) + raw_path = io.BytesIO() + soundfile.write(raw_path, data, audio_sr, format="wav") + raw_path.seek(0) + if slice_tag: + _audio = np.zeros(length) + else: + out_audio, out_sr = self.infer(chara, tran, raw_path) + _audio = out_audio.cpu().numpy() + audio.extend(list(_audio)) + audio = (np.array(audio) * 32768.0).astype('int16') + return (self.hps.data.sampling_rate,audio) diff --git a/AutoCoverTool/ref/so_vits_svc/inference/slicer.py b/AutoCoverTool/ref/so_vits_svc/inference/slicer.py new file mode 100644 index 0000000..b05840b --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/inference/slicer.py @@ -0,0 +1,142 @@ +import librosa +import torch +import torchaudio + + +class Slicer: + def __init__(self, + sr: 
int, + threshold: float = -40., + min_length: int = 5000, + min_interval: int = 300, + hop_size: int = 20, + max_sil_kept: int = 5000): + if not min_length >= min_interval >= hop_size: + raise ValueError('The following condition must be satisfied: min_length >= min_interval >= hop_size') + if not max_sil_kept >= hop_size: + raise ValueError('The following condition must be satisfied: max_sil_kept >= hop_size') + min_interval = sr * min_interval / 1000 + self.threshold = 10 ** (threshold / 20.) + self.hop_size = round(sr * hop_size / 1000) + self.win_size = min(round(min_interval), 4 * self.hop_size) + self.min_length = round(sr * min_length / 1000 / self.hop_size) + self.min_interval = round(min_interval / self.hop_size) + self.max_sil_kept = round(sr * max_sil_kept / 1000 / self.hop_size) + + def _apply_slice(self, waveform, begin, end): + if len(waveform.shape) > 1: + return waveform[:, begin * self.hop_size: min(waveform.shape[1], end * self.hop_size)] + else: + return waveform[begin * self.hop_size: min(waveform.shape[0], end * self.hop_size)] + + # @timeit + def slice(self, waveform): + if len(waveform.shape) > 1: + samples = librosa.to_mono(waveform) + else: + samples = waveform + if samples.shape[0] <= self.min_length: + return {"0": {"slice": False, "split_time": f"0,{len(waveform)}"}} + rms_list = librosa.feature.rms(y=samples, frame_length=self.win_size, hop_length=self.hop_size).squeeze(0) + sil_tags = [] + silence_start = None + clip_start = 0 + for i, rms in enumerate(rms_list): + # Keep looping while frame is silent. + if rms < self.threshold: + # Record start of silent frames. + if silence_start is None: + silence_start = i + continue + # Keep looping while frame is not silent and silence start has not been recorded. + if silence_start is None: + continue + # Clear recorded silence start if interval is not enough or clip is too short + is_leading_silence = silence_start == 0 and i > self.max_sil_kept + need_slice_middle = i - silence_start >= self.min_interval and i - clip_start >= self.min_length + if not is_leading_silence and not need_slice_middle: + silence_start = None + continue + # Need slicing. Record the range of silent frames to be removed. + if i - silence_start <= self.max_sil_kept: + pos = rms_list[silence_start: i + 1].argmin() + silence_start + if silence_start == 0: + sil_tags.append((0, pos)) + else: + sil_tags.append((pos, pos)) + clip_start = pos + elif i - silence_start <= self.max_sil_kept * 2: + pos = rms_list[i - self.max_sil_kept: silence_start + self.max_sil_kept + 1].argmin() + pos += i - self.max_sil_kept + pos_l = rms_list[silence_start: silence_start + self.max_sil_kept + 1].argmin() + silence_start + pos_r = rms_list[i - self.max_sil_kept: i + 1].argmin() + i - self.max_sil_kept + if silence_start == 0: + sil_tags.append((0, pos_r)) + clip_start = pos_r + else: + sil_tags.append((min(pos_l, pos), max(pos_r, pos))) + clip_start = max(pos_r, pos) + else: + pos_l = rms_list[silence_start: silence_start + self.max_sil_kept + 1].argmin() + silence_start + pos_r = rms_list[i - self.max_sil_kept: i + 1].argmin() + i - self.max_sil_kept + if silence_start == 0: + sil_tags.append((0, pos_r)) + else: + sil_tags.append((pos_l, pos_r)) + clip_start = pos_r + silence_start = None + # Deal with trailing silence. 
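+        # (If silence_start is still open here, the clip ended while silent: keep at
+        # most max_sil_kept frames of that tail and mark the rest for removal.)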
+        total_frames = rms_list.shape[0]
+        if silence_start is not None and total_frames - silence_start >= self.min_interval:
+            silence_end = min(total_frames, silence_start + self.max_sil_kept)
+            pos = rms_list[silence_start: silence_end + 1].argmin() + silence_start
+            sil_tags.append((pos, total_frames + 1))
+        # Apply and return slices.
+        if len(sil_tags) == 0:
+            return {"0": {"slice": False, "split_time": f"0,{len(waveform)}"}}
+        else:
+            chunks = []
+            # the first silence does not start at 0, so prepend the leading voiced chunk
+            if sil_tags[0][0]:
+                chunks.append(
+                    {"slice": False, "split_time": f"0,{min(waveform.shape[0], sil_tags[0][0] * self.hop_size)}"})
+            for i in range(0, len(sil_tags)):
+                # mark the voiced chunks (skipping the first one)
+                if i:
+                    chunks.append({"slice": False,
+                                   "split_time": f"{sil_tags[i - 1][1] * self.hop_size},{min(waveform.shape[0], sil_tags[i][0] * self.hop_size)}"})
+                # mark every silent chunk
+                chunks.append({"slice": True,
+                               "split_time": f"{sil_tags[i][0] * self.hop_size},{min(waveform.shape[0], sil_tags[i][1] * self.hop_size)}"})
+            # the last silence does not reach the end, so append the trailing chunk
+            if sil_tags[-1][1] * self.hop_size < len(waveform):
+                chunks.append({"slice": False, "split_time": f"{sil_tags[-1][1] * self.hop_size},{len(waveform)}"})
+            chunk_dict = {}
+            for i in range(len(chunks)):
+                chunk_dict[str(i)] = chunks[i]
+            return chunk_dict
+
+
+def cut(audio_path, db_thresh=-30, min_len=5000):
+    audio, sr = librosa.load(audio_path, sr=None)
+    slicer = Slicer(
+        sr=sr,
+        threshold=db_thresh,
+        min_length=min_len
+    )
+    chunks = slicer.slice(audio)
+    return chunks
+
+
+def chunks2audio(audio_path, chunks):
+    chunks = dict(chunks)
+    audio, sr = torchaudio.load(audio_path)
+    if len(audio.shape) == 2 and audio.shape[1] >= 2:
+        audio = torch.mean(audio, dim=0).unsqueeze(0)
+    audio = audio.cpu().numpy()[0]
+    result = []
+    for k, v in chunks.items():
+        tag = v["split_time"].split(",")
+        if tag[0] != tag[1]:
+            result.append((v["slice"], audio[int(tag[0]):int(tag[1])]))
+    return result, sr
diff --git a/AutoCoverTool/ref/so_vits_svc/inference_main.py b/AutoCoverTool/ref/so_vits_svc/inference_main.py
new file mode 100644
index 0000000..20a9439
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/inference_main.py
@@ -0,0 +1,83 @@
+import io
+import os
+import sys
+import logging
+import time
+from pathlib import Path
+
+import librosa
+import numpy as np
+import soundfile
+
+from inference import infer_tool
+from inference import slicer
+from inference.infer_tool import Svc
+
+logging.getLogger('numba').setLevel(logging.WARNING)
+chunks_dict = infer_tool.read_temp("ref/so-vits-svc/inference/chunks_temp.json")
+
+
+def inf(model_path, config_path, raw_audio_path, dst_path, dev):
+    # model_path = "logs/32k/G_174000-Copy1.pth"
+    # config_path = "configs/config.json"
+    svc_model = Svc(model_path, config_path)
+    out_dir = os.path.dirname(dst_path)
+    print(dst_path)
+    os.makedirs(out_dir, exist_ok=True)
+    # multiple wav files are supported; put them in the raw folder
+    tran = 0
+    spk_list = ['speaker0']  # speakers to synthesize in the same run
+    slice_db = -40  # default -40; -30 for noisy audio, -50 to keep breaths in dry vocals
+    wav_format = 'wav'  # audio output format
+
+    # infer_tool.fill_a_to_b(trans, clean_names)
+    # for clean_name, tran in zip(clean_names, trans):
+    #     raw_audio_path = f"raw/{clean_name}"
+    #     if "." not in raw_audio_path:
+    #         raw_audio_path += ".wav"
+    infer_tool.format_wav(raw_audio_path)
+    wav_path = Path(raw_audio_path).with_suffix('.wav')
+    chunks = slicer.cut(wav_path, db_thresh=slice_db)
+    audio_data, audio_sr = slicer.chunks2audio(wav_path, chunks)
+
+    for spk in spk_list:
+        audio = []
+        for (slice_tag, data) in audio_data:
+            print(f'#=====segment start, {round(len(data) / audio_sr, 3)}s======')
+            length = int(np.ceil(len(data) / audio_sr * svc_model.target_sample))
+            raw_path = io.BytesIO()
+            soundfile.write(raw_path, data, audio_sr, format="wav")
+            raw_path.seek(0)
+            if slice_tag:
+                print('jump empty segment')
+                _audio = np.zeros(length)
+            else:
+                out_audio, out_sr = svc_model.infer(spk, tran, raw_path, dev == "test")
+                _audio = out_audio.cpu().numpy()
+            audio.extend(list(_audio))
+        soundfile.write(dst_path, audio, svc_model.target_sample, format=wav_format)
+
+
+if __name__ == '__main__':
+    g_model = sys.argv[1]  # model path
+    g_config = sys.argv[2]  # config file path
+    g_audio_path = sys.argv[3]  # input audio file path (wav)
+    g_dst_path = sys.argv[4]  # output audio file path
+    if os.path.exists(g_dst_path):
+        print("{} success ...".format(g_dst_path))
+        exit(0)
+
+    g_dev = "prod"
+    if len(sys.argv) > 5:
+        g_dev = sys.argv[5]
+
+    g_aa, g_sr = librosa.load(g_audio_path)
+    d = librosa.get_duration(y=g_aa, sr=g_sr)
+    # if g_dev != "test":
+    #     if d > 250:
+    #         print("{} too long".format(g_audio_path))
+    #         exit(0)
+
+    st = time.time()
+    inf(g_model, g_config, g_audio_path, g_dst_path, g_dev)
+    print("{}, inference sp={}".format(g_audio_path, time.time() - st))
diff --git a/AutoCoverTool/ref/so_vits_svc/logs/32k/put_pretrained_model_here b/AutoCoverTool/ref/so_vits_svc/logs/32k/put_pretrained_model_here
new file mode 100644
index 0000000..e69de29
diff --git a/AutoCoverTool/ref/so_vits_svc/losses.py b/AutoCoverTool/ref/so_vits_svc/losses.py
new file mode 100644
index 0000000..41f9be6
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/losses.py
@@ -0,0 +1,61 @@
+import torch
+from torch.nn import functional as F
+
+import commons
+
+
+def feature_loss(fmap_r, fmap_g):
+    loss = 0
+    for dr, dg in zip(fmap_r, fmap_g):
+        for rl, gl in zip(dr, dg):
+            rl = rl.float().detach()
+            gl = gl.float()
+            loss += torch.mean(torch.abs(rl - gl))
+
+    return loss * 2
+
+
+def discriminator_loss(disc_real_outputs, disc_generated_outputs):
+    loss = 0
+    r_losses = []
+    g_losses = []
+    for dr, dg in zip(disc_real_outputs, disc_generated_outputs):
+        dr = dr.float()
+        dg = dg.float()
+        r_loss = torch.mean((1-dr)**2)
+        g_loss = torch.mean(dg**2)
+        loss += (r_loss + g_loss)
+        r_losses.append(r_loss.item())
+        g_losses.append(g_loss.item())
+
+    return loss, r_losses, g_losses
+
+
+def generator_loss(disc_outputs):
+    loss = 0
+    gen_losses = []
+    for dg in disc_outputs:
+        dg = dg.float()
+        l = torch.mean((1-dg)**2)
+        gen_losses.append(l)
+        loss += l
+
+    return loss, gen_losses
+
+
+def kl_loss(z_p, logs_q, m_p, logs_p, z_mask):
+    """
+    z_p, logs_q: [b, h, t_t]
+    m_p, logs_p: [b, h, t_t]
+    """
+    z_p = z_p.float()
+    logs_q = logs_q.float()
+    m_p = m_p.float()
+    logs_p = logs_p.float()
+    z_mask = z_mask.float()
+    #print(logs_p)
+    kl = logs_p - logs_q - 0.5
+    kl += 0.5 * ((z_p - m_p)**2) * torch.exp(-2. 
* logs_p) + kl = torch.sum(kl * z_mask) + l = kl / torch.sum(z_mask) + return l diff --git a/AutoCoverTool/ref/so_vits_svc/mel_processing.py b/AutoCoverTool/ref/so_vits_svc/mel_processing.py new file mode 100644 index 0000000..99c5b35 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/mel_processing.py @@ -0,0 +1,112 @@ +import math +import os +import random +import torch +from torch import nn +import torch.nn.functional as F +import torch.utils.data +import numpy as np +import librosa +import librosa.util as librosa_util +from librosa.util import normalize, pad_center, tiny +from scipy.signal import get_window +from scipy.io.wavfile import read +from librosa.filters import mel as librosa_mel_fn + +MAX_WAV_VALUE = 32768.0 + + +def dynamic_range_compression_torch(x, C=1, clip_val=1e-5): + """ + PARAMS + ------ + C: compression factor + """ + return torch.log(torch.clamp(x, min=clip_val) * C) + + +def dynamic_range_decompression_torch(x, C=1): + """ + PARAMS + ------ + C: compression factor used to compress + """ + return torch.exp(x) / C + + +def spectral_normalize_torch(magnitudes): + output = dynamic_range_compression_torch(magnitudes) + return output + + +def spectral_de_normalize_torch(magnitudes): + output = dynamic_range_decompression_torch(magnitudes) + return output + + +mel_basis = {} +hann_window = {} + + +def spectrogram_torch(y, n_fft, sampling_rate, hop_size, win_size, center=False): + if torch.min(y) < -1.: + print('min value is ', torch.min(y)) + if torch.max(y) > 1.: + print('max value is ', torch.max(y)) + + global hann_window + dtype_device = str(y.dtype) + '_' + str(y.device) + wnsize_dtype_device = str(win_size) + '_' + dtype_device + if wnsize_dtype_device not in hann_window: + hann_window[wnsize_dtype_device] = torch.hann_window(win_size).to(dtype=y.dtype, device=y.device) + + y = torch.nn.functional.pad(y.unsqueeze(1), (int((n_fft-hop_size)/2), int((n_fft-hop_size)/2)), mode='reflect') + y = y.squeeze(1) + + spec = torch.stft(y, n_fft, hop_length=hop_size, win_length=win_size, window=hann_window[wnsize_dtype_device], + center=center, pad_mode='reflect', normalized=False, onesided=True, return_complex=False) + + spec = torch.sqrt(spec.pow(2).sum(-1) + 1e-6) + return spec + + +def spec_to_mel_torch(spec, n_fft, num_mels, sampling_rate, fmin, fmax): + global mel_basis + dtype_device = str(spec.dtype) + '_' + str(spec.device) + fmax_dtype_device = str(fmax) + '_' + dtype_device + if fmax_dtype_device not in mel_basis: + mel = librosa_mel_fn(sr=sampling_rate, n_fft=n_fft, n_mels=num_mels, fmin=fmin, fmax=fmax) + mel_basis[fmax_dtype_device] = torch.from_numpy(mel).to(dtype=spec.dtype, device=spec.device) + spec = torch.matmul(mel_basis[fmax_dtype_device], spec) + spec = spectral_normalize_torch(spec) + return spec + + +def mel_spectrogram_torch(y, n_fft, num_mels, sampling_rate, hop_size, win_size, fmin, fmax, center=False): + if torch.min(y) < -1.: + print('min value is ', torch.min(y)) + if torch.max(y) > 1.: + print('max value is ', torch.max(y)) + + global mel_basis, hann_window + dtype_device = str(y.dtype) + '_' + str(y.device) + fmax_dtype_device = str(fmax) + '_' + dtype_device + wnsize_dtype_device = str(win_size) + '_' + dtype_device + if fmax_dtype_device not in mel_basis: + mel = librosa_mel_fn(sr=sampling_rate, n_fft=n_fft, n_mels=num_mels, fmin=fmin, fmax=fmax) + mel_basis[fmax_dtype_device] = torch.from_numpy(mel).to(dtype=y.dtype, device=y.device) + if wnsize_dtype_device not in hann_window: + hann_window[wnsize_dtype_device] = 
torch.hann_window(win_size).to(dtype=y.dtype, device=y.device) + + y = torch.nn.functional.pad(y.unsqueeze(1), (int((n_fft-hop_size)/2), int((n_fft-hop_size)/2)), mode='reflect') + y = y.squeeze(1) + + spec = torch.stft(y, n_fft, hop_length=hop_size, win_length=win_size, window=hann_window[wnsize_dtype_device], + center=center, pad_mode='reflect', normalized=False, onesided=True, return_complex=False) + + spec = torch.sqrt(spec.pow(2).sum(-1) + 1e-6) + + spec = torch.matmul(mel_basis[fmax_dtype_device], spec) + spec = spectral_normalize_torch(spec) + + return spec diff --git a/AutoCoverTool/ref/so_vits_svc/model_onnx.py b/AutoCoverTool/ref/so_vits_svc/model_onnx.py new file mode 100644 index 0000000..eaae733 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/model_onnx.py @@ -0,0 +1,328 @@ +import copy +import math +import torch +from torch import nn +from torch.nn import functional as F + +import attentions +import commons +import modules + +from torch.nn import Conv1d, ConvTranspose1d, AvgPool1d, Conv2d +from torch.nn.utils import weight_norm, remove_weight_norm, spectral_norm +from commons import init_weights, get_padding +from vdecoder.hifigan.models import Generator +from utils import f0_to_coarse + +class ResidualCouplingBlock(nn.Module): + def __init__(self, + channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + n_flows=4, + gin_channels=0): + super().__init__() + self.channels = channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.n_flows = n_flows + self.gin_channels = gin_channels + + self.flows = nn.ModuleList() + for i in range(n_flows): + self.flows.append(modules.ResidualCouplingLayer(channels, hidden_channels, kernel_size, dilation_rate, n_layers, gin_channels=gin_channels, mean_only=True)) + self.flows.append(modules.Flip()) + + def forward(self, x, x_mask, g=None, reverse=False): + if not reverse: + for flow in self.flows: + x, _ = flow(x, x_mask, g=g, reverse=reverse) + else: + for flow in reversed(self.flows): + x = flow(x, x_mask, g=g, reverse=reverse) + return x + + +class Encoder(nn.Module): + def __init__(self, + in_channels, + out_channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + gin_channels=0): + super().__init__() + self.in_channels = in_channels + self.out_channels = out_channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.gin_channels = gin_channels + + self.pre = nn.Conv1d(in_channels, hidden_channels, 1) + self.enc = modules.WN(hidden_channels, kernel_size, dilation_rate, n_layers, gin_channels=gin_channels) + self.proj = nn.Conv1d(hidden_channels, out_channels * 2, 1) + + def forward(self, x, x_lengths, g=None): + # print(x.shape,x_lengths.shape) + x_mask = torch.unsqueeze(commons.sequence_mask(x_lengths, x.size(2)), 1).to(x.dtype) + x = self.pre(x) * x_mask + x = self.enc(x, x_mask, g=g) + stats = self.proj(x) * x_mask + m, logs = torch.split(stats, self.out_channels, dim=1) + z = (m + torch.randn_like(m) * torch.exp(logs)) * x_mask + return z, m, logs, x_mask + + +class TextEncoder(nn.Module): + def __init__(self, + in_channels, + out_channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + gin_channels=0, + filter_channels=None, + n_heads=None, + p_dropout=None): + super().__init__() + self.in_channels = in_channels + self.out_channels = out_channels + self.hidden_channels = hidden_channels + 
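# note: constructor hyperparameters are kept as plain attributes; the 256-entry
+        # f0_emb defined below matches the coarse-f0 quantization (values 1-255) used
+        # by utils.f0_to_coarse elsewhere in this repo (descriptive comment only)
+        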
self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.gin_channels = gin_channels + self.pre = nn.Conv1d(in_channels, hidden_channels, 1) + self.proj = nn.Conv1d(hidden_channels, out_channels * 2, 1) + self.f0_emb = nn.Embedding(256, hidden_channels) + + self.enc_ = attentions.Encoder( + hidden_channels, + filter_channels, + n_heads, + n_layers, + kernel_size, + p_dropout) + + def forward(self, x, x_lengths, f0=None): + x_mask = torch.unsqueeze(commons.sequence_mask(x_lengths, x.size(2)), 1).to(x.dtype) + x = self.pre(x) * x_mask + x = x + self.f0_emb(f0.long()).transpose(1,2) + x = self.enc_(x * x_mask, x_mask) + stats = self.proj(x) * x_mask + m, logs = torch.split(stats, self.out_channels, dim=1) + z = (m + torch.randn_like(m) * torch.exp(logs)) * x_mask + + return z, m, logs, x_mask + + + +class DiscriminatorP(torch.nn.Module): + def __init__(self, period, kernel_size=5, stride=3, use_spectral_norm=False): + super(DiscriminatorP, self).__init__() + self.period = period + self.use_spectral_norm = use_spectral_norm + norm_f = weight_norm if use_spectral_norm == False else spectral_norm + self.convs = nn.ModuleList([ + norm_f(Conv2d(1, 32, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(32, 128, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(128, 512, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(512, 1024, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(1024, 1024, (kernel_size, 1), 1, padding=(get_padding(kernel_size, 1), 0))), + ]) + self.conv_post = norm_f(Conv2d(1024, 1, (3, 1), 1, padding=(1, 0))) + + def forward(self, x): + fmap = [] + + # 1d to 2d + b, c, t = x.shape + if t % self.period != 0: # pad first + n_pad = self.period - (t % self.period) + x = F.pad(x, (0, n_pad), "reflect") + t = t + n_pad + x = x.view(b, c, t // self.period, self.period) + + for l in self.convs: + x = l(x) + x = F.leaky_relu(x, modules.LRELU_SLOPE) + fmap.append(x) + x = self.conv_post(x) + fmap.append(x) + x = torch.flatten(x, 1, -1) + + return x, fmap + + +class DiscriminatorS(torch.nn.Module): + def __init__(self, use_spectral_norm=False): + super(DiscriminatorS, self).__init__() + norm_f = weight_norm if use_spectral_norm == False else spectral_norm + self.convs = nn.ModuleList([ + norm_f(Conv1d(1, 16, 15, 1, padding=7)), + norm_f(Conv1d(16, 64, 41, 4, groups=4, padding=20)), + norm_f(Conv1d(64, 256, 41, 4, groups=16, padding=20)), + norm_f(Conv1d(256, 1024, 41, 4, groups=64, padding=20)), + norm_f(Conv1d(1024, 1024, 41, 4, groups=256, padding=20)), + norm_f(Conv1d(1024, 1024, 5, 1, padding=2)), + ]) + self.conv_post = norm_f(Conv1d(1024, 1, 3, 1, padding=1)) + + def forward(self, x): + fmap = [] + + for l in self.convs: + x = l(x) + x = F.leaky_relu(x, modules.LRELU_SLOPE) + fmap.append(x) + x = self.conv_post(x) + fmap.append(x) + x = torch.flatten(x, 1, -1) + + return x, fmap + + +class MultiPeriodDiscriminator(torch.nn.Module): + def __init__(self, use_spectral_norm=False): + super(MultiPeriodDiscriminator, self).__init__() + periods = [2,3,5,7,11] + + discs = [DiscriminatorS(use_spectral_norm=use_spectral_norm)] + discs = discs + [DiscriminatorP(i, use_spectral_norm=use_spectral_norm) for i in periods] + self.discriminators = nn.ModuleList(discs) + + def forward(self, y, y_hat): + y_d_rs = [] + y_d_gs = [] + fmap_rs = [] + fmap_gs = [] + for i, d in 
enumerate(self.discriminators): + y_d_r, fmap_r = d(y) + y_d_g, fmap_g = d(y_hat) + y_d_rs.append(y_d_r) + y_d_gs.append(y_d_g) + fmap_rs.append(fmap_r) + fmap_gs.append(fmap_g) + + return y_d_rs, y_d_gs, fmap_rs, fmap_gs + + +class SpeakerEncoder(torch.nn.Module): + def __init__(self, mel_n_channels=80, model_num_layers=3, model_hidden_size=256, model_embedding_size=256): + super(SpeakerEncoder, self).__init__() + self.lstm = nn.LSTM(mel_n_channels, model_hidden_size, model_num_layers, batch_first=True) + self.linear = nn.Linear(model_hidden_size, model_embedding_size) + self.relu = nn.ReLU() + + def forward(self, mels): + self.lstm.flatten_parameters() + _, (hidden, _) = self.lstm(mels) + embeds_raw = self.relu(self.linear(hidden[-1])) + return embeds_raw / torch.norm(embeds_raw, dim=1, keepdim=True) + + def compute_partial_slices(self, total_frames, partial_frames, partial_hop): + mel_slices = [] + for i in range(0, total_frames-partial_frames, partial_hop): + mel_range = torch.arange(i, i+partial_frames) + mel_slices.append(mel_range) + + return mel_slices + + def embed_utterance(self, mel, partial_frames=128, partial_hop=64): + mel_len = mel.size(1) + last_mel = mel[:,-partial_frames:] + + if mel_len > partial_frames: + mel_slices = self.compute_partial_slices(mel_len, partial_frames, partial_hop) + mels = list(mel[:,s] for s in mel_slices) + mels.append(last_mel) + mels = torch.stack(tuple(mels), 0).squeeze(1) + + with torch.no_grad(): + partial_embeds = self(mels) + embed = torch.mean(partial_embeds, axis=0).unsqueeze(0) + #embed = embed / torch.linalg.norm(embed, 2) + else: + with torch.no_grad(): + embed = self(last_mel) + + return embed + + +class SynthesizerTrn(nn.Module): + """ + Synthesizer for Training + """ + + def __init__(self, + spec_channels, + segment_size, + inter_channels, + hidden_channels, + filter_channels, + n_heads, + n_layers, + kernel_size, + p_dropout, + resblock, + resblock_kernel_sizes, + resblock_dilation_sizes, + upsample_rates, + upsample_initial_channel, + upsample_kernel_sizes, + gin_channels, + ssl_dim, + n_speakers, + **kwargs): + + super().__init__() + self.spec_channels = spec_channels + self.inter_channels = inter_channels + self.hidden_channels = hidden_channels + self.filter_channels = filter_channels + self.n_heads = n_heads + self.n_layers = n_layers + self.kernel_size = kernel_size + self.p_dropout = p_dropout + self.resblock = resblock + self.resblock_kernel_sizes = resblock_kernel_sizes + self.resblock_dilation_sizes = resblock_dilation_sizes + self.upsample_rates = upsample_rates + self.upsample_initial_channel = upsample_initial_channel + self.upsample_kernel_sizes = upsample_kernel_sizes + self.segment_size = segment_size + self.gin_channels = gin_channels + self.ssl_dim = ssl_dim + self.emb_g = nn.Embedding(n_speakers, gin_channels) + + self.enc_p_ = TextEncoder(ssl_dim, inter_channels, hidden_channels, 5, 1, 16,0, filter_channels, n_heads, p_dropout) + hps = { + "sampling_rate": 32000, + "inter_channels": 192, + "resblock": "1", + "resblock_kernel_sizes": [3, 7, 11], + "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]], + "upsample_rates": [10, 8, 2, 2], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [16, 16, 4, 4], + "gin_channels": 256, + } + self.dec = Generator(h=hps) + self.enc_q = Encoder(spec_channels, inter_channels, hidden_channels, 5, 1, 16, gin_channels=gin_channels) + self.flow = ResidualCouplingBlock(inter_channels, hidden_channels, 5, 1, 4, gin_channels=gin_channels) + + def forward(self, c, 
c_lengths, f0, g=None): + g = self.emb_g(g.unsqueeze(0)).transpose(1,2) + z_p, m_p, logs_p, c_mask = self.enc_p_(c.transpose(1,2), c_lengths, f0=f0_to_coarse(f0)) + z = self.flow(z_p, c_mask, g=g, reverse=True) + o = self.dec(z * c_mask, g=g, f0=f0.float()) + return o + diff --git a/AutoCoverTool/ref/so_vits_svc/model_onnx_48k.py b/AutoCoverTool/ref/so_vits_svc/model_onnx_48k.py new file mode 100644 index 0000000..6d9955b --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/model_onnx_48k.py @@ -0,0 +1,328 @@ +import copy +import math +import torch +from torch import nn +from torch.nn import functional as F + +import attentions +import commons +import modules + +from torch.nn import Conv1d, ConvTranspose1d, AvgPool1d, Conv2d +from torch.nn.utils import weight_norm, remove_weight_norm, spectral_norm +from commons import init_weights, get_padding +from vdecoder.hifigan.models import Generator +from utils import f0_to_coarse + +class ResidualCouplingBlock(nn.Module): + def __init__(self, + channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + n_flows=4, + gin_channels=0): + super().__init__() + self.channels = channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.n_flows = n_flows + self.gin_channels = gin_channels + + self.flows = nn.ModuleList() + for i in range(n_flows): + self.flows.append(modules.ResidualCouplingLayer(channels, hidden_channels, kernel_size, dilation_rate, n_layers, gin_channels=gin_channels, mean_only=True)) + self.flows.append(modules.Flip()) + + def forward(self, x, x_mask, g=None, reverse=False): + if not reverse: + for flow in self.flows: + x, _ = flow(x, x_mask, g=g, reverse=reverse) + else: + for flow in reversed(self.flows): + x = flow(x, x_mask, g=g, reverse=reverse) + return x + + +class Encoder(nn.Module): + def __init__(self, + in_channels, + out_channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + gin_channels=0): + super().__init__() + self.in_channels = in_channels + self.out_channels = out_channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.gin_channels = gin_channels + + self.pre = nn.Conv1d(in_channels, hidden_channels, 1) + self.enc = modules.WN(hidden_channels, kernel_size, dilation_rate, n_layers, gin_channels=gin_channels) + self.proj = nn.Conv1d(hidden_channels, out_channels * 2, 1) + + def forward(self, x, x_lengths, g=None): + # print(x.shape,x_lengths.shape) + x_mask = torch.unsqueeze(commons.sequence_mask(x_lengths, x.size(2)), 1).to(x.dtype) + x = self.pre(x) * x_mask + x = self.enc(x, x_mask, g=g) + stats = self.proj(x) * x_mask + m, logs = torch.split(stats, self.out_channels, dim=1) + z = (m + torch.randn_like(m) * torch.exp(logs)) * x_mask + return z, m, logs, x_mask + + +class TextEncoder(nn.Module): + def __init__(self, + in_channels, + out_channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + gin_channels=0, + filter_channels=None, + n_heads=None, + p_dropout=None): + super().__init__() + self.in_channels = in_channels + self.out_channels = out_channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.gin_channels = gin_channels + self.pre = nn.Conv1d(in_channels, hidden_channels, 1) + self.proj = nn.Conv1d(hidden_channels, out_channels * 2, 1) + self.f0_emb = nn.Embedding(256, 
hidden_channels) + + self.enc_ = attentions.Encoder( + hidden_channels, + filter_channels, + n_heads, + n_layers, + kernel_size, + p_dropout) + + def forward(self, x, x_lengths, f0=None): + x_mask = torch.unsqueeze(commons.sequence_mask(x_lengths, x.size(2)), 1).to(x.dtype) + x = self.pre(x) * x_mask + x = x + self.f0_emb(f0.long()).transpose(1,2) + x = self.enc_(x * x_mask, x_mask) + stats = self.proj(x) * x_mask + m, logs = torch.split(stats, self.out_channels, dim=1) + z = (m + torch.randn_like(m) * torch.exp(logs)) * x_mask + + return z, m, logs, x_mask + + + +class DiscriminatorP(torch.nn.Module): + def __init__(self, period, kernel_size=5, stride=3, use_spectral_norm=False): + super(DiscriminatorP, self).__init__() + self.period = period + self.use_spectral_norm = use_spectral_norm + norm_f = weight_norm if use_spectral_norm == False else spectral_norm + self.convs = nn.ModuleList([ + norm_f(Conv2d(1, 32, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(32, 128, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(128, 512, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(512, 1024, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(1024, 1024, (kernel_size, 1), 1, padding=(get_padding(kernel_size, 1), 0))), + ]) + self.conv_post = norm_f(Conv2d(1024, 1, (3, 1), 1, padding=(1, 0))) + + def forward(self, x): + fmap = [] + + # 1d to 2d + b, c, t = x.shape + if t % self.period != 0: # pad first + n_pad = self.period - (t % self.period) + x = F.pad(x, (0, n_pad), "reflect") + t = t + n_pad + x = x.view(b, c, t // self.period, self.period) + + for l in self.convs: + x = l(x) + x = F.leaky_relu(x, modules.LRELU_SLOPE) + fmap.append(x) + x = self.conv_post(x) + fmap.append(x) + x = torch.flatten(x, 1, -1) + + return x, fmap + + +class DiscriminatorS(torch.nn.Module): + def __init__(self, use_spectral_norm=False): + super(DiscriminatorS, self).__init__() + norm_f = weight_norm if use_spectral_norm == False else spectral_norm + self.convs = nn.ModuleList([ + norm_f(Conv1d(1, 16, 15, 1, padding=7)), + norm_f(Conv1d(16, 64, 41, 4, groups=4, padding=20)), + norm_f(Conv1d(64, 256, 41, 4, groups=16, padding=20)), + norm_f(Conv1d(256, 1024, 41, 4, groups=64, padding=20)), + norm_f(Conv1d(1024, 1024, 41, 4, groups=256, padding=20)), + norm_f(Conv1d(1024, 1024, 5, 1, padding=2)), + ]) + self.conv_post = norm_f(Conv1d(1024, 1, 3, 1, padding=1)) + + def forward(self, x): + fmap = [] + + for l in self.convs: + x = l(x) + x = F.leaky_relu(x, modules.LRELU_SLOPE) + fmap.append(x) + x = self.conv_post(x) + fmap.append(x) + x = torch.flatten(x, 1, -1) + + return x, fmap + + +class MultiPeriodDiscriminator(torch.nn.Module): + def __init__(self, use_spectral_norm=False): + super(MultiPeriodDiscriminator, self).__init__() + periods = [2,3,5,7,11] + + discs = [DiscriminatorS(use_spectral_norm=use_spectral_norm)] + discs = discs + [DiscriminatorP(i, use_spectral_norm=use_spectral_norm) for i in periods] + self.discriminators = nn.ModuleList(discs) + + def forward(self, y, y_hat): + y_d_rs = [] + y_d_gs = [] + fmap_rs = [] + fmap_gs = [] + for i, d in enumerate(self.discriminators): + y_d_r, fmap_r = d(y) + y_d_g, fmap_g = d(y_hat) + y_d_rs.append(y_d_r) + y_d_gs.append(y_d_g) + fmap_rs.append(fmap_r) + fmap_gs.append(fmap_g) + + return y_d_rs, y_d_gs, fmap_rs, fmap_gs + + +class SpeakerEncoder(torch.nn.Module): + def __init__(self, mel_n_channels=80, 
model_num_layers=3, model_hidden_size=256, model_embedding_size=256): + super(SpeakerEncoder, self).__init__() + self.lstm = nn.LSTM(mel_n_channels, model_hidden_size, model_num_layers, batch_first=True) + self.linear = nn.Linear(model_hidden_size, model_embedding_size) + self.relu = nn.ReLU() + + def forward(self, mels): + self.lstm.flatten_parameters() + _, (hidden, _) = self.lstm(mels) + embeds_raw = self.relu(self.linear(hidden[-1])) + return embeds_raw / torch.norm(embeds_raw, dim=1, keepdim=True) + + def compute_partial_slices(self, total_frames, partial_frames, partial_hop): + mel_slices = [] + for i in range(0, total_frames-partial_frames, partial_hop): + mel_range = torch.arange(i, i+partial_frames) + mel_slices.append(mel_range) + + return mel_slices + + def embed_utterance(self, mel, partial_frames=128, partial_hop=64): + mel_len = mel.size(1) + last_mel = mel[:,-partial_frames:] + + if mel_len > partial_frames: + mel_slices = self.compute_partial_slices(mel_len, partial_frames, partial_hop) + mels = list(mel[:,s] for s in mel_slices) + mels.append(last_mel) + mels = torch.stack(tuple(mels), 0).squeeze(1) + + with torch.no_grad(): + partial_embeds = self(mels) + embed = torch.mean(partial_embeds, axis=0).unsqueeze(0) + #embed = embed / torch.linalg.norm(embed, 2) + else: + with torch.no_grad(): + embed = self(last_mel) + + return embed + + +class SynthesizerTrn(nn.Module): + """ + Synthesizer for Training + """ + + def __init__(self, + spec_channels, + segment_size, + inter_channels, + hidden_channels, + filter_channels, + n_heads, + n_layers, + kernel_size, + p_dropout, + resblock, + resblock_kernel_sizes, + resblock_dilation_sizes, + upsample_rates, + upsample_initial_channel, + upsample_kernel_sizes, + gin_channels, + ssl_dim, + n_speakers, + **kwargs): + + super().__init__() + self.spec_channels = spec_channels + self.inter_channels = inter_channels + self.hidden_channels = hidden_channels + self.filter_channels = filter_channels + self.n_heads = n_heads + self.n_layers = n_layers + self.kernel_size = kernel_size + self.p_dropout = p_dropout + self.resblock = resblock + self.resblock_kernel_sizes = resblock_kernel_sizes + self.resblock_dilation_sizes = resblock_dilation_sizes + self.upsample_rates = upsample_rates + self.upsample_initial_channel = upsample_initial_channel + self.upsample_kernel_sizes = upsample_kernel_sizes + self.segment_size = segment_size + self.gin_channels = gin_channels + self.ssl_dim = ssl_dim + self.emb_g = nn.Embedding(n_speakers, gin_channels) + + self.enc_p_ = TextEncoder(ssl_dim, inter_channels, hidden_channels, 5, 1, 16,0, filter_channels, n_heads, p_dropout) + hps = { + "sampling_rate": 48000, + "inter_channels": 192, + "resblock": "1", + "resblock_kernel_sizes": [3, 7, 11], + "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]], + "upsample_rates": [10, 8, 2, 2], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [16, 16, 4, 4], + "gin_channels": 256, + } + self.dec = Generator(h=hps) + self.enc_q = Encoder(spec_channels, inter_channels, hidden_channels, 5, 1, 16, gin_channels=gin_channels) + self.flow = ResidualCouplingBlock(inter_channels, hidden_channels, 5, 1, 4, gin_channels=gin_channels) + + def forward(self, c, c_lengths, f0, g=None): + g = self.emb_g(g.unsqueeze(0)).transpose(1,2) + z_p, m_p, logs_p, c_mask = self.enc_p_(c.transpose(1,2), c_lengths, f0=f0_to_coarse(f0)) + z = self.flow(z_p, c_mask, g=g, reverse=True) + o = self.dec(z * c_mask, g=g, f0=f0.float()) + return o + diff --git 
a/AutoCoverTool/ref/so_vits_svc/models.py b/AutoCoverTool/ref/so_vits_svc/models.py new file mode 100644 index 0000000..bdbce84 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/models.py @@ -0,0 +1,351 @@ +import copy +import math +import torch +from torch import nn +from torch.nn import functional as F + +import attentions +import commons +import modules + +from torch.nn import Conv1d, ConvTranspose1d, AvgPool1d, Conv2d +from torch.nn.utils import weight_norm, remove_weight_norm, spectral_norm +from commons import init_weights, get_padding +from vdecoder.hifigan.models import Generator +from utils import f0_to_coarse + +class ResidualCouplingBlock(nn.Module): + def __init__(self, + channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + n_flows=4, + gin_channels=0): + super().__init__() + self.channels = channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.n_flows = n_flows + self.gin_channels = gin_channels + + self.flows = nn.ModuleList() + for i in range(n_flows): + self.flows.append(modules.ResidualCouplingLayer(channels, hidden_channels, kernel_size, dilation_rate, n_layers, gin_channels=gin_channels, mean_only=True)) + self.flows.append(modules.Flip()) + + def forward(self, x, x_mask, g=None, reverse=False): + if not reverse: + for flow in self.flows: + x, _ = flow(x, x_mask, g=g, reverse=reverse) + else: + for flow in reversed(self.flows): + x = flow(x, x_mask, g=g, reverse=reverse) + return x + + +class Encoder(nn.Module): + def __init__(self, + in_channels, + out_channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + gin_channels=0): + super().__init__() + self.in_channels = in_channels + self.out_channels = out_channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.gin_channels = gin_channels + + self.pre = nn.Conv1d(in_channels, hidden_channels, 1) + self.enc = modules.WN(hidden_channels, kernel_size, dilation_rate, n_layers, gin_channels=gin_channels) + self.proj = nn.Conv1d(hidden_channels, out_channels * 2, 1) + + def forward(self, x, x_lengths, g=None): + # print(x.shape,x_lengths.shape) + x_mask = torch.unsqueeze(commons.sequence_mask(x_lengths, x.size(2)), 1).to(x.dtype) + x = self.pre(x) * x_mask + x = self.enc(x, x_mask, g=g) + stats = self.proj(x) * x_mask + m, logs = torch.split(stats, self.out_channels, dim=1) + z = (m + torch.randn_like(m) * torch.exp(logs)) * x_mask + return z, m, logs, x_mask + + +class TextEncoder(nn.Module): + def __init__(self, + in_channels, + out_channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + gin_channels=0, + filter_channels=None, + n_heads=None, + p_dropout=None): + super().__init__() + self.in_channels = in_channels + self.out_channels = out_channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.gin_channels = gin_channels + self.pre = nn.Conv1d(in_channels, hidden_channels, 1) + self.proj = nn.Conv1d(hidden_channels, out_channels * 2, 1) + self.f0_emb = nn.Embedding(256, hidden_channels) + + self.enc_ = attentions.Encoder( + hidden_channels, + filter_channels, + n_heads, + n_layers, + kernel_size, + p_dropout) + + def forward(self, x, x_lengths, f0=None): + x_mask = torch.unsqueeze(commons.sequence_mask(x_lengths, x.size(2)), 1).to(x.dtype) + x = self.pre(x) * x_mask + x = x + 
self.f0_emb(f0).transpose(1,2) + x = self.enc_(x * x_mask, x_mask) + stats = self.proj(x) * x_mask + m, logs = torch.split(stats, self.out_channels, dim=1) + z = (m + torch.randn_like(m) * torch.exp(logs)) * x_mask + + return z, m, logs, x_mask + + + +class DiscriminatorP(torch.nn.Module): + def __init__(self, period, kernel_size=5, stride=3, use_spectral_norm=False): + super(DiscriminatorP, self).__init__() + self.period = period + self.use_spectral_norm = use_spectral_norm + norm_f = weight_norm if use_spectral_norm == False else spectral_norm + self.convs = nn.ModuleList([ + norm_f(Conv2d(1, 32, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(32, 128, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(128, 512, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(512, 1024, (kernel_size, 1), (stride, 1), padding=(get_padding(kernel_size, 1), 0))), + norm_f(Conv2d(1024, 1024, (kernel_size, 1), 1, padding=(get_padding(kernel_size, 1), 0))), + ]) + self.conv_post = norm_f(Conv2d(1024, 1, (3, 1), 1, padding=(1, 0))) + + def forward(self, x): + fmap = [] + + # 1d to 2d + b, c, t = x.shape + if t % self.period != 0: # pad first + n_pad = self.period - (t % self.period) + x = F.pad(x, (0, n_pad), "reflect") + t = t + n_pad + x = x.view(b, c, t // self.period, self.period) + + for l in self.convs: + x = l(x) + x = F.leaky_relu(x, modules.LRELU_SLOPE) + fmap.append(x) + x = self.conv_post(x) + fmap.append(x) + x = torch.flatten(x, 1, -1) + + return x, fmap + + +class DiscriminatorS(torch.nn.Module): + def __init__(self, use_spectral_norm=False): + super(DiscriminatorS, self).__init__() + norm_f = weight_norm if use_spectral_norm == False else spectral_norm + self.convs = nn.ModuleList([ + norm_f(Conv1d(1, 16, 15, 1, padding=7)), + norm_f(Conv1d(16, 64, 41, 4, groups=4, padding=20)), + norm_f(Conv1d(64, 256, 41, 4, groups=16, padding=20)), + norm_f(Conv1d(256, 1024, 41, 4, groups=64, padding=20)), + norm_f(Conv1d(1024, 1024, 41, 4, groups=256, padding=20)), + norm_f(Conv1d(1024, 1024, 5, 1, padding=2)), + ]) + self.conv_post = norm_f(Conv1d(1024, 1, 3, 1, padding=1)) + + def forward(self, x): + fmap = [] + + for l in self.convs: + x = l(x) + x = F.leaky_relu(x, modules.LRELU_SLOPE) + fmap.append(x) + x = self.conv_post(x) + fmap.append(x) + x = torch.flatten(x, 1, -1) + + return x, fmap + + +class MultiPeriodDiscriminator(torch.nn.Module): + def __init__(self, use_spectral_norm=False): + super(MultiPeriodDiscriminator, self).__init__() + periods = [2,3,5,7,11] + + discs = [DiscriminatorS(use_spectral_norm=use_spectral_norm)] + discs = discs + [DiscriminatorP(i, use_spectral_norm=use_spectral_norm) for i in periods] + self.discriminators = nn.ModuleList(discs) + + def forward(self, y, y_hat): + y_d_rs = [] + y_d_gs = [] + fmap_rs = [] + fmap_gs = [] + for i, d in enumerate(self.discriminators): + y_d_r, fmap_r = d(y) + y_d_g, fmap_g = d(y_hat) + y_d_rs.append(y_d_r) + y_d_gs.append(y_d_g) + fmap_rs.append(fmap_r) + fmap_gs.append(fmap_g) + + return y_d_rs, y_d_gs, fmap_rs, fmap_gs + + +class SpeakerEncoder(torch.nn.Module): + def __init__(self, mel_n_channels=80, model_num_layers=3, model_hidden_size=256, model_embedding_size=256): + super(SpeakerEncoder, self).__init__() + self.lstm = nn.LSTM(mel_n_channels, model_hidden_size, model_num_layers, batch_first=True) + self.linear = nn.Linear(model_hidden_size, model_embedding_size) + self.relu = nn.ReLU() + + def forward(self, 
mels): + self.lstm.flatten_parameters() + _, (hidden, _) = self.lstm(mels) + embeds_raw = self.relu(self.linear(hidden[-1])) + return embeds_raw / torch.norm(embeds_raw, dim=1, keepdim=True) + + def compute_partial_slices(self, total_frames, partial_frames, partial_hop): + mel_slices = [] + for i in range(0, total_frames-partial_frames, partial_hop): + mel_range = torch.arange(i, i+partial_frames) + mel_slices.append(mel_range) + + return mel_slices + + def embed_utterance(self, mel, partial_frames=128, partial_hop=64): + mel_len = mel.size(1) + last_mel = mel[:,-partial_frames:] + + if mel_len > partial_frames: + mel_slices = self.compute_partial_slices(mel_len, partial_frames, partial_hop) + mels = list(mel[:,s] for s in mel_slices) + mels.append(last_mel) + mels = torch.stack(tuple(mels), 0).squeeze(1) + + with torch.no_grad(): + partial_embeds = self(mels) + embed = torch.mean(partial_embeds, axis=0).unsqueeze(0) + #embed = embed / torch.linalg.norm(embed, 2) + else: + with torch.no_grad(): + embed = self(last_mel) + + return embed + + +class SynthesizerTrn(nn.Module): + """ + Synthesizer for Training + """ + + def __init__(self, + spec_channels, + segment_size, + inter_channels, + hidden_channels, + filter_channels, + n_heads, + n_layers, + kernel_size, + p_dropout, + resblock, + resblock_kernel_sizes, + resblock_dilation_sizes, + upsample_rates, + upsample_initial_channel, + upsample_kernel_sizes, + gin_channels, + ssl_dim, + n_speakers, + **kwargs): + + super().__init__() + self.spec_channels = spec_channels + self.inter_channels = inter_channels + self.hidden_channels = hidden_channels + self.filter_channels = filter_channels + self.n_heads = n_heads + self.n_layers = n_layers + self.kernel_size = kernel_size + self.p_dropout = p_dropout + self.resblock = resblock + self.resblock_kernel_sizes = resblock_kernel_sizes + self.resblock_dilation_sizes = resblock_dilation_sizes + self.upsample_rates = upsample_rates + self.upsample_initial_channel = upsample_initial_channel + self.upsample_kernel_sizes = upsample_kernel_sizes + self.segment_size = segment_size + self.gin_channels = gin_channels + self.ssl_dim = ssl_dim + self.emb_g = nn.Embedding(n_speakers, gin_channels) + + self.enc_p_ = TextEncoder(ssl_dim, inter_channels, hidden_channels, 5, 1, 16,0, filter_channels, n_heads, p_dropout) + hps = { + "sampling_rate": 32000, + "inter_channels": 192, + "resblock": "1", + "resblock_kernel_sizes": [3, 7, 11], + "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]], + "upsample_rates": [10, 8, 2, 2], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [16, 16, 4, 4], + "gin_channels": 256, + } + self.dec = Generator(h=hps) + self.enc_q = Encoder(spec_channels, inter_channels, hidden_channels, 5, 1, 16, gin_channels=gin_channels) + self.flow = ResidualCouplingBlock(inter_channels, hidden_channels, 5, 1, 4, gin_channels=gin_channels) + + def forward(self, c, f0, spec, g=None, mel=None, c_lengths=None, spec_lengths=None): + if c_lengths == None: + c_lengths = (torch.ones(c.size(0)) * c.size(-1)).to(c.device) + if spec_lengths == None: + spec_lengths = (torch.ones(spec.size(0)) * spec.size(-1)).to(spec.device) + + g = self.emb_g(g).transpose(1,2) + + z_ptemp, m_p, logs_p, _ = self.enc_p_(c, c_lengths, f0=f0_to_coarse(f0)) + z, m_q, logs_q, spec_mask = self.enc_q(spec, spec_lengths, g=g) + + z_p = self.flow(z, spec_mask, g=g) + z_slice, pitch_slice, ids_slice = commons.rand_slice_segments_with_pitch(z, f0, spec_lengths, self.segment_size) + + # o = self.dec(z_slice, g=g) + o = 
self.dec(z_slice, g=g, f0=pitch_slice) + + return o, ids_slice, spec_mask, (z, z_p, m_p, logs_p, m_q, logs_q) + + def infer(self, c, f0, g=None, mel=None, c_lengths=None): + if c_lengths == None: + c_lengths = (torch.ones(c.size(0)) * c.size(-1)).to(c.device) + g = self.emb_g(g).transpose(1,2) + + z_p, m_p, logs_p, c_mask = self.enc_p_(c, c_lengths, f0=f0_to_coarse(f0)) + z = self.flow(z_p, c_mask, g=g, reverse=True) + + o = self.dec(z * c_mask, g=g, f0=f0) + + return o diff --git a/AutoCoverTool/ref/so_vits_svc/modules.py b/AutoCoverTool/ref/so_vits_svc/modules.py new file mode 100644 index 0000000..52ee14e --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/modules.py @@ -0,0 +1,342 @@ +import copy +import math +import numpy as np +import scipy +import torch +from torch import nn +from torch.nn import functional as F + +from torch.nn import Conv1d, ConvTranspose1d, AvgPool1d, Conv2d +from torch.nn.utils import weight_norm, remove_weight_norm + +import commons +from commons import init_weights, get_padding + + +LRELU_SLOPE = 0.1 + + +class LayerNorm(nn.Module): + def __init__(self, channels, eps=1e-5): + super().__init__() + self.channels = channels + self.eps = eps + + self.gamma = nn.Parameter(torch.ones(channels)) + self.beta = nn.Parameter(torch.zeros(channels)) + + def forward(self, x): + x = x.transpose(1, -1) + x = F.layer_norm(x, (self.channels,), self.gamma, self.beta, self.eps) + return x.transpose(1, -1) + + +class ConvReluNorm(nn.Module): + def __init__(self, in_channels, hidden_channels, out_channels, kernel_size, n_layers, p_dropout): + super().__init__() + self.in_channels = in_channels + self.hidden_channels = hidden_channels + self.out_channels = out_channels + self.kernel_size = kernel_size + self.n_layers = n_layers + self.p_dropout = p_dropout + assert n_layers > 1, "Number of layers should be larger than 0." 
+
+    self.conv_layers = nn.ModuleList()
+    self.norm_layers = nn.ModuleList()
+    self.conv_layers.append(nn.Conv1d(in_channels, hidden_channels, kernel_size, padding=kernel_size//2))
+    self.norm_layers.append(LayerNorm(hidden_channels))
+    self.relu_drop = nn.Sequential(
+        nn.ReLU(),
+        nn.Dropout(p_dropout))
+    for _ in range(n_layers-1):
+      self.conv_layers.append(nn.Conv1d(hidden_channels, hidden_channels, kernel_size, padding=kernel_size//2))
+      self.norm_layers.append(LayerNorm(hidden_channels))
+    self.proj = nn.Conv1d(hidden_channels, out_channels, 1)
+    self.proj.weight.data.zero_()
+    self.proj.bias.data.zero_()
+
+  def forward(self, x, x_mask):
+    x_org = x
+    for i in range(self.n_layers):
+      x = self.conv_layers[i](x * x_mask)
+      x = self.norm_layers[i](x)
+      x = self.relu_drop(x)
+    x = x_org + self.proj(x)
+    return x * x_mask
+
+
+class DDSConv(nn.Module):
+  """
+  Dilated and Depth-Separable Convolution
+  """
+  def __init__(self, channels, kernel_size, n_layers, p_dropout=0.):
+    super().__init__()
+    self.channels = channels
+    self.kernel_size = kernel_size
+    self.n_layers = n_layers
+    self.p_dropout = p_dropout
+
+    self.drop = nn.Dropout(p_dropout)
+    self.convs_sep = nn.ModuleList()
+    self.convs_1x1 = nn.ModuleList()
+    self.norms_1 = nn.ModuleList()
+    self.norms_2 = nn.ModuleList()
+    for i in range(n_layers):
+      dilation = kernel_size ** i
+      padding = (kernel_size * dilation - dilation) // 2
+      self.convs_sep.append(nn.Conv1d(channels, channels, kernel_size,
+          groups=channels, dilation=dilation, padding=padding
+      ))
+      self.convs_1x1.append(nn.Conv1d(channels, channels, 1))
+      self.norms_1.append(LayerNorm(channels))
+      self.norms_2.append(LayerNorm(channels))
+
+  def forward(self, x, x_mask, g=None):
+    if g is not None:
+      x = x + g
+    for i in range(self.n_layers):
+      y = self.convs_sep[i](x * x_mask)
+      y = self.norms_1[i](y)
+      y = F.gelu(y)
+      y = self.convs_1x1[i](y)
+      y = self.norms_2[i](y)
+      y = F.gelu(y)
+      y = self.drop(y)
+      x = x + y
+    return x * x_mask
+
+
+class WN(torch.nn.Module):
+  def __init__(self, hidden_channels, kernel_size, dilation_rate, n_layers, gin_channels=0, p_dropout=0):
+    super(WN, self).__init__()
+    assert(kernel_size % 2 == 1)
+    self.hidden_channels = hidden_channels
+    self.kernel_size = kernel_size
+    self.dilation_rate = dilation_rate
+    self.n_layers = n_layers
+    self.gin_channels = gin_channels
+    self.p_dropout = p_dropout
+
+    self.in_layers = torch.nn.ModuleList()
+    self.res_skip_layers = torch.nn.ModuleList()
+    self.drop = nn.Dropout(p_dropout)
+
+    if gin_channels != 0:
+      cond_layer = torch.nn.Conv1d(gin_channels, 2*hidden_channels*n_layers, 1)
+      self.cond_layer = torch.nn.utils.weight_norm(cond_layer, name='weight')
+
+    for i in range(n_layers):
+      dilation = dilation_rate ** i
+      padding = int((kernel_size * dilation - dilation) / 2)
+      in_layer = torch.nn.Conv1d(hidden_channels, 2*hidden_channels, kernel_size,
+                                 dilation=dilation, padding=padding)
+      in_layer = torch.nn.utils.weight_norm(in_layer, name='weight')
+      self.in_layers.append(in_layer)
+
+      # last one is not necessary
+      if i < n_layers - 1:
+        res_skip_channels = 2 * hidden_channels
+      else:
+        res_skip_channels = hidden_channels
+
+      res_skip_layer = torch.nn.Conv1d(hidden_channels, res_skip_channels, 1)
+      res_skip_layer = torch.nn.utils.weight_norm(res_skip_layer, name='weight')
+      self.res_skip_layers.append(res_skip_layer)
+
+  def forward(self, x, x_mask, g=None, **kwargs):
+    output = torch.zeros_like(x)
+    n_channels_tensor = torch.IntTensor([self.hidden_channels])
+
+    if g is not None:
+      g = self.cond_layer(g)
+ + for i in range(self.n_layers): + x_in = self.in_layers[i](x) + if g is not None: + cond_offset = i * 2 * self.hidden_channels + g_l = g[:,cond_offset:cond_offset+2*self.hidden_channels,:] + else: + g_l = torch.zeros_like(x_in) + + acts = commons.fused_add_tanh_sigmoid_multiply( + x_in, + g_l, + n_channels_tensor) + acts = self.drop(acts) + + res_skip_acts = self.res_skip_layers[i](acts) + if i < self.n_layers - 1: + res_acts = res_skip_acts[:,:self.hidden_channels,:] + x = (x + res_acts) * x_mask + output = output + res_skip_acts[:,self.hidden_channels:,:] + else: + output = output + res_skip_acts + return output * x_mask + + def remove_weight_norm(self): + if self.gin_channels != 0: + torch.nn.utils.remove_weight_norm(self.cond_layer) + for l in self.in_layers: + torch.nn.utils.remove_weight_norm(l) + for l in self.res_skip_layers: + torch.nn.utils.remove_weight_norm(l) + + +class ResBlock1(torch.nn.Module): + def __init__(self, channels, kernel_size=3, dilation=(1, 3, 5)): + super(ResBlock1, self).__init__() + self.convs1 = nn.ModuleList([ + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[0], + padding=get_padding(kernel_size, dilation[0]))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[1], + padding=get_padding(kernel_size, dilation[1]))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[2], + padding=get_padding(kernel_size, dilation[2]))) + ]) + self.convs1.apply(init_weights) + + self.convs2 = nn.ModuleList([ + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=1, + padding=get_padding(kernel_size, 1))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=1, + padding=get_padding(kernel_size, 1))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=1, + padding=get_padding(kernel_size, 1))) + ]) + self.convs2.apply(init_weights) + + def forward(self, x, x_mask=None): + for c1, c2 in zip(self.convs1, self.convs2): + xt = F.leaky_relu(x, LRELU_SLOPE) + if x_mask is not None: + xt = xt * x_mask + xt = c1(xt) + xt = F.leaky_relu(xt, LRELU_SLOPE) + if x_mask is not None: + xt = xt * x_mask + xt = c2(xt) + x = xt + x + if x_mask is not None: + x = x * x_mask + return x + + def remove_weight_norm(self): + for l in self.convs1: + remove_weight_norm(l) + for l in self.convs2: + remove_weight_norm(l) + + +class ResBlock2(torch.nn.Module): + def __init__(self, channels, kernel_size=3, dilation=(1, 3)): + super(ResBlock2, self).__init__() + self.convs = nn.ModuleList([ + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[0], + padding=get_padding(kernel_size, dilation[0]))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[1], + padding=get_padding(kernel_size, dilation[1]))) + ]) + self.convs.apply(init_weights) + + def forward(self, x, x_mask=None): + for c in self.convs: + xt = F.leaky_relu(x, LRELU_SLOPE) + if x_mask is not None: + xt = xt * x_mask + xt = c(xt) + x = xt + x + if x_mask is not None: + x = x * x_mask + return x + + def remove_weight_norm(self): + for l in self.convs: + remove_weight_norm(l) + + +class Log(nn.Module): + def forward(self, x, x_mask, reverse=False, **kwargs): + if not reverse: + y = torch.log(torch.clamp_min(x, 1e-5)) * x_mask + logdet = torch.sum(-y, [1, 2]) + return y, logdet + else: + x = torch.exp(x) * x_mask + return x + + +class Flip(nn.Module): + def forward(self, x, *args, reverse=False, **kwargs): + x = torch.flip(x, [1]) + if not reverse: + logdet = 
torch.zeros(x.size(0)).to(dtype=x.dtype, device=x.device) + return x, logdet + else: + return x + + +class ElementwiseAffine(nn.Module): + def __init__(self, channels): + super().__init__() + self.channels = channels + self.m = nn.Parameter(torch.zeros(channels,1)) + self.logs = nn.Parameter(torch.zeros(channels,1)) + + def forward(self, x, x_mask, reverse=False, **kwargs): + if not reverse: + y = self.m + torch.exp(self.logs) * x + y = y * x_mask + logdet = torch.sum(self.logs * x_mask, [1,2]) + return y, logdet + else: + x = (x - self.m) * torch.exp(-self.logs) * x_mask + return x + + +class ResidualCouplingLayer(nn.Module): + def __init__(self, + channels, + hidden_channels, + kernel_size, + dilation_rate, + n_layers, + p_dropout=0, + gin_channels=0, + mean_only=False): + assert channels % 2 == 0, "channels should be divisible by 2" + super().__init__() + self.channels = channels + self.hidden_channels = hidden_channels + self.kernel_size = kernel_size + self.dilation_rate = dilation_rate + self.n_layers = n_layers + self.half_channels = channels // 2 + self.mean_only = mean_only + + self.pre = nn.Conv1d(self.half_channels, hidden_channels, 1) + self.enc = WN(hidden_channels, kernel_size, dilation_rate, n_layers, p_dropout=p_dropout, gin_channels=gin_channels) + self.post = nn.Conv1d(hidden_channels, self.half_channels * (2 - mean_only), 1) + self.post.weight.data.zero_() + self.post.bias.data.zero_() + + def forward(self, x, x_mask, g=None, reverse=False): + x0, x1 = torch.split(x, [self.half_channels]*2, 1) + h = self.pre(x0) * x_mask + h = self.enc(h, x_mask, g=g) + stats = self.post(h) * x_mask + if not self.mean_only: + m, logs = torch.split(stats, [self.half_channels]*2, 1) + else: + m = stats + logs = torch.zeros_like(m) + + if not reverse: + x1 = m + x1 * torch.exp(logs) * x_mask + x = torch.cat([x0, x1], 1) + logdet = torch.sum(logs, [1,2]) + return x, logdet + else: + x1 = (x1 - m) * torch.exp(-logs) * x_mask + x = torch.cat([x0, x1], 1) + return x diff --git a/AutoCoverTool/ref/so_vits_svc/onnx_export.py b/AutoCoverTool/ref/so_vits_svc/onnx_export.py new file mode 100644 index 0000000..a762b23 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/onnx_export.py @@ -0,0 +1,73 @@ +import argparse +import time +import numpy as np +import onnx +from onnxsim import simplify +import onnxruntime as ort +import onnxoptimizer +import torch +from model_onnx import SynthesizerTrn +import utils +from hubert import hubert_model_onnx + +def main(HubertExport,NetExport): + + path = "NyaruTaffy" + + if(HubertExport): + device = torch.device("cuda") + hubert_soft = hubert_model_onnx.hubert_soft("hubert/model.pt") + test_input = torch.rand(1, 1, 16000) + input_names = ["source"] + output_names = ["embed"] + torch.onnx.export(hubert_soft.to(device), + test_input.to(device), + "hubert3.0.onnx", + dynamic_axes={ + "source": { + 2: "sample_length" + } + }, + verbose=False, + opset_version=13, + input_names=input_names, + output_names=output_names) + if(NetExport): + device = torch.device("cuda") + hps = utils.get_hparams_from_file(f"checkpoints/{path}/config.json") + SVCVITS = SynthesizerTrn( + hps.data.filter_length // 2 + 1, + hps.train.segment_size // hps.data.hop_length, + **hps.model) + _ = utils.load_checkpoint(f"checkpoints/{path}/model.pth", SVCVITS, None) + _ = SVCVITS.eval().to(device) + for i in SVCVITS.parameters(): + i.requires_grad = False + test_hidden_unit = torch.rand(1, 50, 256) + test_lengths = torch.LongTensor([50]) + test_pitch = torch.rand(1, 50) + test_sid = 
torch.LongTensor([0]) + input_names = ["hidden_unit", "lengths", "pitch", "sid"] + output_names = ["audio", ] + SVCVITS.eval() + torch.onnx.export(SVCVITS, + ( + test_hidden_unit.to(device), + test_lengths.to(device), + test_pitch.to(device), + test_sid.to(device) + ), + f"checkpoints/{path}/model.onnx", + dynamic_axes={ + "hidden_unit": [0, 1], + "pitch": [1] + }, + do_constant_folding=False, + opset_version=16, + verbose=False, + input_names=input_names, + output_names=output_names) + + +if __name__ == '__main__': + main(False,True) diff --git a/AutoCoverTool/ref/so_vits_svc/onnx_export_48k.py b/AutoCoverTool/ref/so_vits_svc/onnx_export_48k.py new file mode 100644 index 0000000..9a04635 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/onnx_export_48k.py @@ -0,0 +1,73 @@ +import argparse +import time +import numpy as np +import onnx +from onnxsim import simplify +import onnxruntime as ort +import onnxoptimizer +import torch +from model_onnx_48k import SynthesizerTrn +import utils +from hubert import hubert_model_onnx + +def main(HubertExport,NetExport): + + path = "NyaruTaffy" + + if(HubertExport): + device = torch.device("cuda") + hubert_soft = hubert_model_onnx.hubert_soft("hubert/model.pt") + test_input = torch.rand(1, 1, 16000) + input_names = ["source"] + output_names = ["embed"] + torch.onnx.export(hubert_soft.to(device), + test_input.to(device), + "hubert3.0.onnx", + dynamic_axes={ + "source": { + 2: "sample_length" + } + }, + verbose=False, + opset_version=13, + input_names=input_names, + output_names=output_names) + if(NetExport): + device = torch.device("cuda") + hps = utils.get_hparams_from_file(f"checkpoints/{path}/config.json") + SVCVITS = SynthesizerTrn( + hps.data.filter_length // 2 + 1, + hps.train.segment_size // hps.data.hop_length, + **hps.model) + _ = utils.load_checkpoint(f"checkpoints/{path}/model.pth", SVCVITS, None) + _ = SVCVITS.eval().to(device) + for i in SVCVITS.parameters(): + i.requires_grad = False + test_hidden_unit = torch.rand(1, 50, 256) + test_lengths = torch.LongTensor([50]) + test_pitch = torch.rand(1, 50) + test_sid = torch.LongTensor([0]) + input_names = ["hidden_unit", "lengths", "pitch", "sid"] + output_names = ["audio", ] + SVCVITS.eval() + torch.onnx.export(SVCVITS, + ( + test_hidden_unit.to(device), + test_lengths.to(device), + test_pitch.to(device), + test_sid.to(device) + ), + f"checkpoints/{path}/model.onnx", + dynamic_axes={ + "hidden_unit": [0, 1], + "pitch": [1] + }, + do_constant_folding=False, + opset_version=16, + verbose=False, + input_names=input_names, + output_names=output_names) + + +if __name__ == '__main__': + main(False,True) diff --git a/AutoCoverTool/ref/so_vits_svc/preprocess_flist_config.py b/AutoCoverTool/ref/so_vits_svc/preprocess_flist_config.py new file mode 100644 index 0000000..5b7e80a --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/preprocess_flist_config.py @@ -0,0 +1,132 @@ +import os +import argparse +import re + +from tqdm import tqdm +from random import shuffle +import json + +config_template = { + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 400, # 由10000->400 + "learning_rate": 1e-4, + "betas": [0.8, 0.99], + "eps": 1e-9, + "batch_size": 12, + "fp16_run": False, + "lr_decay": 0.999875, + "segment_size": 17920, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0, + "use_sr": True, + "max_speclen": 384, + "port": "8001" + }, + "data": { + "training_files": "filelists/train.txt", + "validation_files": "filelists/val.txt", + "max_wav_value": 
32768.0,
+        "sampling_rate": 32000,
+        "filter_length": 1280,
+        "hop_length": 320,
+        "win_length": 1280,
+        "n_mel_channels": 80,
+        "mel_fmin": 0.0,
+        "mel_fmax": None
+    },
+    "model": {
+        "inter_channels": 192,
+        "hidden_channels": 192,
+        "filter_channels": 768,
+        "n_heads": 2,
+        "n_layers": 6,
+        "kernel_size": 3,
+        "p_dropout": 0.1,
+        "resblock": "1",
+        "resblock_kernel_sizes": [3, 7, 11],
+        "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]],
+        "upsample_rates": [10, 8, 2, 2],
+        "upsample_initial_channel": 512,
+        "upsample_kernel_sizes": [16, 16, 4, 4],
+        "n_layers_q": 3,
+        "use_spectral_norm": False,
+        "gin_channels": 256,
+        "ssl_dim": 256,
+        "n_speakers": 0,
+    },
+    "spk": {
+        "nen": 0,
+        "paimon": 1,
+        "yunhao": 2
+    }
+}
+
+pattern = re.compile(r'^[\.a-zA-Z0-9_\/]+$')
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--train_list", type=str, default="./filelists/train.txt", help="path to train list")
+    parser.add_argument("--val_list", type=str, default="./filelists/val.txt", help="path to val list")
+    parser.add_argument("--test_list", type=str, default="./filelists/test.txt", help="path to test list")
+    parser.add_argument("--source_dir", type=str, default="./dataset/32k", help="path to source dir")
+    parser.add_argument("--config_path", type=str, default="./config/config.json", help="path to output config file")
+    args = parser.parse_args()
+
+    train = []
+    val = []
+    test = []
+    idx = 0
+    spk_dict = {}
+    spk_id = 0
+    for speaker in tqdm(os.listdir(args.source_dir)):
+        spk_dict[speaker] = spk_id
+        spk_id += 1
+        wavs = ["/".join([args.source_dir, speaker, i]) for i in os.listdir(os.path.join(args.source_dir, speaker))]
+        for wavpath in wavs:
+            if not pattern.match(wavpath):
+                print(f"warning: filename {wavpath} contains characters other than letters, digits, '_', '.' and '/', which may cause errors (or may not)")
+        if len(wavs) < 10:
+            print(f"warning: speaker {speaker} has fewer than 10 clips, please add more data")
+        wavs = [i for i in wavs if i.endswith("wav")]
+        shuffle(wavs)
+        train += wavs[2:-2]
+        val += wavs[:2]
+        test += wavs[-2:]
+    n_speakers = len(spk_dict.keys()) * 2
+    shuffle(train)
+    shuffle(val)
+    shuffle(test)
+
+    print("Writing", args.train_list)
+    with open(args.train_list, "w") as f:
+        for fname in tqdm(train):
+            wavpath = fname
+            f.write(wavpath + "\n")
+
+    print("Writing", args.val_list)
+    with open(args.val_list, "w") as f:
+        for fname in tqdm(val):
+            wavpath = fname
+            f.write(wavpath + "\n")
+
+    print("Writing", args.test_list)
+    with open(args.test_list, "w") as f:
+        for fname in tqdm(test):
+            wavpath = fname
+            f.write(wavpath + "\n")
+
+    config_template["model"]["n_speakers"] = n_speakers
+    config_template["spk"] = spk_dict
+    print("Writing", args.config_path)
+
+    # point the config at the generated file lists
+    config_template["data"]["training_files"] = args.train_list
+    config_template["data"]["validation_files"] = args.val_list
+
+    with open(args.config_path, "w") as f:
+        json.dump(config_template, f, indent=2)
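As a quick sanity check after this script runs, the generated config can be inspected directly. A minimal sketch; the path below follows the zjl training example earlier in this readme and is an assumption, not something the script prints:

import json

# Hypothetical path from the zjl training steps above.
with open("data/train_users/zjl/config/config.json") as f:
    cfg = json.load(f)

print(cfg["spk"])                    # speaker name -> id map written by the script
print(cfg["model"]["n_speakers"])    # set to 2 * len(spk_dict) above
with open(cfg["data"]["training_files"]) as f:
    print(sum(1 for _ in f), "training wavs")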
diff --git a/AutoCoverTool/ref/so_vits_svc/preprocess_hubert_f0.py b/AutoCoverTool/ref/so_vits_svc/preprocess_hubert_f0.py
new file mode 100644
index 0000000..4fe7f21
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/preprocess_hubert_f0.py
@@ -0,0 +1,106 @@
+import os
+import argparse
+
+import torch
+import json
+from glob import glob
+
+from pyworld import pyworld
+from tqdm import tqdm
+from scipy.io import wavfile
+
+import utils
+from mel_processing import mel_spectrogram_torch
+#import h5py
+import logging
+logging.getLogger('numba').setLevel(logging.WARNING)
+
+import parselmouth
+import librosa
+import numpy as np
+
+
+def get_f0(path, p_len=None, f0_up_key=0):
+    x, _ = librosa.load(path, sr=32000)
+    if p_len is None:
+        p_len = x.shape[0]//320
+    else:
+        assert abs(p_len-x.shape[0]//320) < 3, (path, p_len, x.shape)
+    time_step = 320 / 32000 * 1000
+    f0_min = 50
+    f0_max = 1100
+    f0_mel_min = 1127 * np.log(1 + f0_min / 700)
+    f0_mel_max = 1127 * np.log(1 + f0_max / 700)
+
+    f0 = parselmouth.Sound(x, 32000).to_pitch_ac(
+        time_step=time_step / 1000, voicing_threshold=0.6,
+        pitch_floor=f0_min, pitch_ceiling=f0_max).selected_array['frequency']
+
+    pad_size = (p_len - len(f0) + 1) // 2
+    if pad_size > 0 or p_len - len(f0) - pad_size > 0:
+        f0 = np.pad(f0, [[pad_size, p_len - len(f0) - pad_size]], mode='constant')
+
+    f0bak = f0.copy()
+    f0 *= pow(2, f0_up_key / 12)
+    f0_mel = 1127 * np.log(1 + f0 / 700)
+    f0_mel[f0_mel > 0] = (f0_mel[f0_mel > 0] - f0_mel_min) * 254 / (f0_mel_max - f0_mel_min) + 1
+    f0_mel[f0_mel <= 1] = 1
+    f0_mel[f0_mel > 255] = 255
+    f0_coarse = np.rint(f0_mel).astype(int)
+    return f0_coarse, f0bak
+
+def resize2d(x, target_len):
+    source = np.array(x)
+    source[source < 0.001] = np.nan
+    target = np.interp(np.arange(0, len(source)*target_len, len(source)) / target_len, np.arange(0, len(source)), source)
+    res = np.nan_to_num(target)
+    return res
+
+def compute_f0(path, c_len):
+    x, sr = librosa.load(path, sr=32000)
+    f0, t = pyworld.dio(
+        x.astype(np.double),
+        fs=sr,
+        f0_ceil=800,
+        frame_period=1000 * 320 / sr,
+    )
+    f0 = pyworld.stonemask(x.astype(np.double), f0, t, 32000)
+    for index, pitch in enumerate(f0):
+        f0[index] = round(pitch, 1)
+    assert abs(c_len - x.shape[0]//320) < 3, (c_len, f0.shape)
+
+    return None, resize2d(f0, c_len)
+
+
+def process(filename):
+    print(filename)
+    save_name = filename + ".soft.pt"
+    if not os.path.exists(save_name):
+        device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        wav, _ = librosa.load(filename, sr=16000)
+        wav = torch.from_numpy(wav).unsqueeze(0).to(device)
+        c = utils.get_hubert_content(hmodel, wav)
+        torch.save(c.cpu(), save_name)
+    else:
+        c = torch.load(save_name)
+    f0path = filename + ".f0.npy"
+    if not os.path.exists(f0path):
+        cf0, f0 = compute_f0(filename, c.shape[-1] * 2)
+        np.save(f0path, f0)
+
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--in_dir", type=str, default="dataset/32k", help="path to input dir")
+    args = parser.parse_args()
+
+    print("Loading hubert for content...")
+    hmodel = utils.get_hubert_model(0 if torch.cuda.is_available() else None)
+    print("Loaded hubert.")
+
+    filenames = glob(f'{args.in_dir}/*/*.wav', recursive=True)#[:10]
+
+    for filename in tqdm(filenames):
+        process(filename)
\ No newline at end of file
diff --git a/AutoCoverTool/ref/so_vits_svc/requirements.txt b/AutoCoverTool/ref/so_vits_svc/requirements.txt
new file mode 100644
index 0000000..2f40497
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/requirements.txt
@@ -0,0 +1,19 @@
+Flask==2.1.2
+Flask_Cors==3.0.10
+gradio==3.4.1
+numpy==1.19.2
+playsound==1.3.0
+PyAudio==0.2.12
+pydub==0.25.1
+pyworld==0.3.0
+requests==2.28.1
+scipy==1.7.3
+sounddevice==0.4.5
+SoundFile==0.10.3.post1
+starlette==0.19.1
+tqdm==4.63.0
+scikit-maad
+praat-parselmouth
+onnx
+onnxsim
+onnxoptimizer
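preprocess_hubert_f0.py caches two files next to each training wav: <name>.wav.soft.pt (the HuBERT content tensor) and <name>.wav.f0.npy (the f0 track resized to twice the content length, matching the compute_f0(filename, c.shape[-1] * 2) call above). A minimal sketch for checking that alignment; the wav path is hypothetical:

import numpy as np
import torch

wav = "dataset/32k/speaker0/example.wav"  # hypothetical training clip
c = torch.load(wav + ".soft.pt")          # HuBERT content, last dim = frames
f0 = np.load(wav + ".f0.npy")
assert f0.shape[0] == c.shape[-1] * 2     # the invariant the preprocessing enforces
print(c.shape, f0.shape)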
diff --git a/AutoCoverTool/ref/so_vits_svc/resample.py b/AutoCoverTool/ref/so_vits_svc/resample.py
new file mode 100644
index 0000000..b9b6a4f
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/resample.py
@@ -0,0 +1,50 @@
+import os
+import argparse
+import librosa
+import numpy as np
+from multiprocessing import Pool, cpu_count
+from scipy.io import wavfile
+from tqdm import tqdm
+
+
+def process(item):
+    spkdir, wav_name, args = item
+    # speaker 's5', 'p280', 'p315' are excluded,
+    speaker = spkdir.replace("\\", "/").split("/")[-1]
+    wav_path = os.path.join(args.in_dir, speaker, wav_name)
+    print(wav_path)
+    if os.path.exists(wav_path) and '.wav' in wav_path:
+        os.makedirs(os.path.join(args.out_dir2, speaker), exist_ok=True)
+        wav, sr = librosa.load(wav_path, sr=None)
+        wav, _ = librosa.effects.trim(wav, top_db=20)
+        peak = np.abs(wav).max()
+        if peak > 1.0:
+            wav = 0.98 * wav / peak
+        wav2 = librosa.resample(wav, orig_sr=sr, target_sr=args.sr2)
+        wav2 /= max(wav2.max(), -wav2.min())
+        save_name = wav_name
+        save_path2 = os.path.join(args.out_dir2, speaker, save_name)
+        wavfile.write(
+            save_path2,
+            args.sr2,
+            (wav2 * np.iinfo(np.int16).max).astype(np.int16)
+        )
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--sr2", type=int, default=32000, help="sampling rate")
+    parser.add_argument("--in_dir", type=str, default="./dataset_raw", help="path to source dir")
+    parser.add_argument("--out_dir2", type=str, default="./dataset/32k", help="path to target dir")
+    args = parser.parse_args()
+    processes = cpu_count() - 2 if cpu_count() > 4 else 1
+    pool = Pool(processes=processes)
+    speaker = "speaker0"
+    spk_dir = os.path.join(args.in_dir, speaker)
+    # for speaker in os.listdir(args.in_dir):
+    #     spk_dir = os.path.join(args.in_dir, speaker)
+    if os.path.isdir(spk_dir):
+        print(spk_dir)
+        for _ in tqdm(pool.imap_unordered(process,
+                                          [(spk_dir, i, args) for i in os.listdir(spk_dir) if i.endswith("wav")])):
+            pass
diff --git a/AutoCoverTool/ref/so_vits_svc/sovits_gradio.py b/AutoCoverTool/ref/so_vits_svc/sovits_gradio.py
new file mode 100644
index 0000000..9a59e88
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/sovits_gradio.py
@@ -0,0 +1,47 @@
+from inference.infer_tool_grad import VitsSvc
+import gradio as gr
+import os
+
+class VitsGradio:
+    def __init__(self):
+        self.so = VitsSvc()
+        self.lspk = []
+        self.modelPaths = []
+        for root, dirs, files in os.walk("checkpoints"):
+            for dir in dirs:
+                self.modelPaths.append(dir)
+        with gr.Blocks() as self.Vits:
+            with gr.Tab("VoiceConversion"):
+                with gr.Row(visible=False) as self.VoiceConversion:
+                    with gr.Column():
+                        with gr.Row():
+                            with gr.Column():
+                                self.srcaudio = gr.Audio(label="input audio")
+                                self.btnVC = gr.Button("convert speaker")
+                            with gr.Column():
+                                self.dsid = gr.Dropdown(label="target speaker", choices=self.lspk)
+                                self.tran = gr.Slider(label="pitch shift (semitones)", maximum=60, minimum=-60, step=1, value=0)
+                                self.th = gr.Slider(label="slice threshold", maximum=32767, minimum=-32768, step=0.1, value=-40)
+                        with gr.Row():
+                            self.VCOutputs = gr.Audio()
+                    self.btnVC.click(self.so.inference, inputs=[self.srcaudio, self.dsid, self.tran, self.th], outputs=[self.VCOutputs])
+            with gr.Tab("SelectModel"):
+                with gr.Column():
+                    modelstrs = gr.Dropdown(label="model", choices=self.modelPaths, value=self.modelPaths[0], type="value")
+                    devicestrs = gr.Dropdown(label="device", choices=["cpu", "cuda"], value="cpu", type="value")
+                    btnMod = gr.Button("load model")
+                    btnMod.click(self.loadModel, inputs=[modelstrs, devicestrs], outputs=[self.dsid, self.VoiceConversion])
+
+    def loadModel(self, path, device):
+        self.lspk = []
+        self.so.set_device(device)
+        self.so.loadCheckpoint(path)
+        for spk, sid in self.so.hps.spk.items():
+            self.lspk.append(spk)
+        VChange = gr.update(visible=True)
+        SDChange = gr.update(choices=self.lspk, value=self.lspk[0])
+        return [SDChange, VChange]
+
+grVits = VitsGradio()
+
+grVits.Vits.launch()
\ No newline at end of file
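sovits_gradio.py only lists subdirectory names under a local checkpoints/ folder; judging from the checkpoints/{path}/config.json and checkpoints/{path}/model.pth paths used by onnx_export.py above, each model directory is assumed to hold those two files (this is an inference about what VitsSvc.loadCheckpoint reads, not confirmed here). A hedged sketch for checking the layout before launching the app:

import os

for name in sorted(os.listdir("checkpoints")):
    path = os.path.join("checkpoints", name)
    if not os.path.isdir(path):
        continue
    files = set(os.listdir(path))
    # assumed required files per model folder: config.json and model.pth
    print(name, "ok" if {"config.json", "model.pth"} <= files else files)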
diff --git a/AutoCoverTool/ref/so_vits_svc/spec_gen.py b/AutoCoverTool/ref/so_vits_svc/spec_gen.py
new file mode 100644
index 0000000..85ad318
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/spec_gen.py
@@ -0,0 +1,22 @@
+from data_utils import TextAudioSpeakerLoader, EvalDataLoader
+import json
+from tqdm import tqdm
+
+from utils import HParams
+
+config_path = 'configs/config.json'
+with open(config_path, "r") as f:
+    data = f.read()
+config = json.loads(data)
+hps = HParams(**config)
+
+train_dataset = TextAudioSpeakerLoader("filelists/train.txt", hps)
+test_dataset = TextAudioSpeakerLoader("filelists/test.txt", hps)
+eval_dataset = TextAudioSpeakerLoader("filelists/val.txt", hps)
+
+# iterate each split once so the loaders pre-generate their spectrogram caches
+for _ in tqdm(train_dataset):
+    pass
+for _ in tqdm(eval_dataset):
+    pass
+for _ in tqdm(test_dataset):
+    pass
\ No newline at end of file
diff --git a/AutoCoverTool/ref/so_vits_svc/train.py b/AutoCoverTool/ref/so_vits_svc/train.py
new file mode 100644
index 0000000..152bb59
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/train.py
@@ -0,0 +1,283 @@
+import logging
+
+logging.getLogger('matplotlib').setLevel(logging.WARNING)
+import os
+import json
+import argparse
+import itertools
+import math
+import torch
+from torch import nn, optim
+from torch.nn import functional as F
+from torch.utils.data import DataLoader
+from torch.utils.tensorboard import SummaryWriter
+import torch.multiprocessing as mp
+import torch.distributed as dist
+from torch.nn.parallel import DistributedDataParallel as DDP
+from torch.cuda.amp import autocast, GradScaler
+
+import commons
+import utils
+from data_utils import TextAudioSpeakerLoader, EvalDataLoader
+from models import (
+    SynthesizerTrn,
+    MultiPeriodDiscriminator,
+)
+from losses import (
+    kl_loss,
+    generator_loss, discriminator_loss, feature_loss
+)
+
+from mel_processing import mel_spectrogram_torch, spec_to_mel_torch
+
+torch.backends.cudnn.benchmark = True
+global_step = 0
+
+
+# os.environ['TORCH_DISTRIBUTED_DEBUG'] = 'INFO'
+
+
+def main():
+    """Assume Single Node Multi GPUs Training Only"""
+    assert torch.cuda.is_available(), "CPU training is not allowed."
+ hps = utils.get_hparams() + + n_gpus = torch.cuda.device_count() + os.environ['MASTER_ADDR'] = 'localhost' + os.environ['MASTER_PORT'] = hps.train.port + + mp.spawn(run, nprocs=n_gpus, args=(n_gpus, hps,)) + + +def run(rank, n_gpus, hps): + global global_step + if rank == 0: + logger = utils.get_logger(hps.model_dir) + logger.info(hps) + utils.check_git_hash(hps.model_dir) + writer = SummaryWriter(log_dir=hps.model_dir) + writer_eval = SummaryWriter(log_dir=os.path.join(hps.model_dir, "eval")) + + dist.init_process_group(backend='nccl', init_method='env://', world_size=n_gpus, rank=rank) + torch.manual_seed(hps.train.seed) + torch.cuda.set_device(rank) + + train_dataset = TextAudioSpeakerLoader(hps.data.training_files, hps) + train_loader = DataLoader(train_dataset, num_workers=8, shuffle=False, pin_memory=True, + batch_size=hps.train.batch_size) + if rank == 0: + eval_dataset = EvalDataLoader(hps.data.validation_files, hps) + eval_loader = DataLoader(eval_dataset, num_workers=1, shuffle=False, + batch_size=1, pin_memory=False, + drop_last=False) + + net_g = SynthesizerTrn( + hps.data.filter_length // 2 + 1, + hps.train.segment_size // hps.data.hop_length, + **hps.model).cuda(rank) + net_d = MultiPeriodDiscriminator(hps.model.use_spectral_norm).cuda(rank) + optim_g = torch.optim.AdamW( + net_g.parameters(), + hps.train.learning_rate, + betas=hps.train.betas, + eps=hps.train.eps) + optim_d = torch.optim.AdamW( + net_d.parameters(), + hps.train.learning_rate, + betas=hps.train.betas, + eps=hps.train.eps) + net_g = DDP(net_g, device_ids=[rank]) # , find_unused_parameters=True) + net_d = DDP(net_d, device_ids=[rank]) + + try: + _, _, _, epoch_str = utils.load_checkpoint(utils.latest_checkpoint_path(hps.model_dir, "G_*.pth"), net_g, + optim_g) + _, _, _, epoch_str = utils.load_checkpoint(utils.latest_checkpoint_path(hps.model_dir, "D_*.pth"), net_d, + optim_d) + global_step = (epoch_str - 1) * len(train_loader) + print("load checkpoint ok !") + except: + epoch_str = 1 + global_step = 0 + + scheduler_g = torch.optim.lr_scheduler.ExponentialLR(optim_g, gamma=hps.train.lr_decay, last_epoch=epoch_str - 2) + scheduler_d = torch.optim.lr_scheduler.ExponentialLR(optim_d, gamma=hps.train.lr_decay, last_epoch=epoch_str - 2) + + scaler = GradScaler(enabled=hps.train.fp16_run) + + for epoch in range(epoch_str, hps.train.epochs + 1): + if rank == 0: + train_and_evaluate(rank, epoch, hps, [net_g, net_d], [optim_g, optim_d], [scheduler_g, scheduler_d], scaler, + [train_loader, eval_loader], logger, [writer, writer_eval]) + else: + train_and_evaluate(rank, epoch, hps, [net_g, net_d], [optim_g, optim_d], [scheduler_g, scheduler_d], scaler, + [train_loader, None], None, None) + scheduler_g.step() + scheduler_d.step() + + +def train_and_evaluate(rank, epoch, hps, nets, optims, schedulers, scaler, loaders, logger, writers): + net_g, net_d = nets + optim_g, optim_d = optims + scheduler_g, scheduler_d = schedulers + train_loader, eval_loader = loaders + if writers is not None: + writer, writer_eval = writers + + # train_loader.batch_sampler.set_epoch(epoch) + global global_step + + net_g.train() + net_d.train() + for batch_idx, items in enumerate(train_loader): + c, f0, spec, y, spk = items + g = spk.cuda(rank, non_blocking=True) + spec, y = spec.cuda(rank, non_blocking=True), y.cuda(rank, non_blocking=True) + c = c.cuda(rank, non_blocking=True) + f0 = f0.cuda(rank, non_blocking=True) + mel = spec_to_mel_torch( + spec, + hps.data.filter_length, + hps.data.n_mel_channels, + hps.data.sampling_rate, + 
hps.data.mel_fmin, + hps.data.mel_fmax) + + with autocast(enabled=hps.train.fp16_run): + y_hat, ids_slice, z_mask, \ + (z, z_p, m_p, logs_p, m_q, logs_q) = net_g(c, f0, spec, g=g, mel=mel) + + y_mel = commons.slice_segments(mel, ids_slice, hps.train.segment_size // hps.data.hop_length) + y_hat_mel = mel_spectrogram_torch( + y_hat.squeeze(1), + hps.data.filter_length, + hps.data.n_mel_channels, + hps.data.sampling_rate, + hps.data.hop_length, + hps.data.win_length, + hps.data.mel_fmin, + hps.data.mel_fmax + ) + y = commons.slice_segments(y, ids_slice * hps.data.hop_length, hps.train.segment_size) # slice + + # Discriminator + y_d_hat_r, y_d_hat_g, _, _ = net_d(y, y_hat.detach()) + + with autocast(enabled=False): + loss_disc, losses_disc_r, losses_disc_g = discriminator_loss(y_d_hat_r, y_d_hat_g) + loss_disc_all = loss_disc + + optim_d.zero_grad() + scaler.scale(loss_disc_all).backward() + scaler.unscale_(optim_d) + grad_norm_d = commons.clip_grad_value_(net_d.parameters(), None) + scaler.step(optim_d) + + with autocast(enabled=hps.train.fp16_run): + # Generator + y_d_hat_r, y_d_hat_g, fmap_r, fmap_g = net_d(y, y_hat) + with autocast(enabled=False): + loss_mel = F.l1_loss(y_mel, y_hat_mel) * hps.train.c_mel + loss_kl = kl_loss(z_p, logs_q, m_p, logs_p, z_mask) * hps.train.c_kl + loss_fm = feature_loss(fmap_r, fmap_g) + loss_gen, losses_gen = generator_loss(y_d_hat_g) + loss_gen_all = loss_gen + loss_fm + loss_mel + loss_kl + optim_g.zero_grad() + scaler.scale(loss_gen_all).backward() + scaler.unscale_(optim_g) + grad_norm_g = commons.clip_grad_value_(net_g.parameters(), None) + scaler.step(optim_g) + scaler.update() + + if rank == 0: + if global_step % hps.train.log_interval == 0: + lr = optim_g.param_groups[0]['lr'] + losses = [loss_disc, loss_gen, loss_fm, loss_mel, loss_kl] + logger.info('Train Epoch: {} [{:.0f}%]'.format( + epoch, + 100. 
* batch_idx / len(train_loader))) + logger.info([x.item() for x in losses] + [global_step, lr]) + + scalar_dict = {"loss/g/total": loss_gen_all, "loss/d/total": loss_disc_all, "learning_rate": lr, + "grad_norm_d": grad_norm_d, "grad_norm_g": grad_norm_g} + scalar_dict.update({"loss/g/fm": loss_fm, "loss/g/mel": loss_mel, "loss/g/kl": loss_kl}) + + scalar_dict.update({"loss/g/{}".format(i): v for i, v in enumerate(losses_gen)}) + scalar_dict.update({"loss/d_r/{}".format(i): v for i, v in enumerate(losses_disc_r)}) + scalar_dict.update({"loss/d_g/{}".format(i): v for i, v in enumerate(losses_disc_g)}) + image_dict = { + "slice/mel_org": utils.plot_spectrogram_to_numpy(y_mel[0].data.cpu().numpy()), + "slice/mel_gen": utils.plot_spectrogram_to_numpy(y_hat_mel[0].data.cpu().numpy()), + "all/mel": utils.plot_spectrogram_to_numpy(mel[0].data.cpu().numpy()), + } + + utils.summarize( + writer=writer, + global_step=global_step, + images=image_dict, + scalars=scalar_dict + ) + + if global_step % hps.train.eval_interval == 0: + evaluate(hps, net_g, eval_loader, writer_eval) + utils.save_checkpoint(net_g, optim_g, hps.train.learning_rate, epoch, + os.path.join(hps.model_dir, "G_{}.pth".format(global_step))) + utils.save_checkpoint(net_d, optim_d, hps.train.learning_rate, epoch, + os.path.join(hps.model_dir, "D_{}.pth".format(global_step))) + global_step += 1 + + if rank == 0: + logger.info('====> Epoch: {},{}'.format(epoch, global_step)) + + +def evaluate(hps, generator, eval_loader, writer_eval): + generator.eval() + image_dict = {} + audio_dict = {} + with torch.no_grad(): + for batch_idx, items in enumerate(eval_loader): + c, f0, spec, y, spk = items + g = spk[:1].cuda(0) + spec, y = spec[:1].cuda(0), y[:1].cuda(0) + c = c[:1].cuda(0) + f0 = f0[:1].cuda(0) + mel = spec_to_mel_torch( + spec, + hps.data.filter_length, + hps.data.n_mel_channels, + hps.data.sampling_rate, + hps.data.mel_fmin, + hps.data.mel_fmax) + y_hat = generator.module.infer(c, f0, g=g, mel=mel) + + y_hat_mel = mel_spectrogram_torch( + y_hat.squeeze(1).float(), + hps.data.filter_length, + hps.data.n_mel_channels, + hps.data.sampling_rate, + hps.data.hop_length, + hps.data.win_length, + hps.data.mel_fmin, + hps.data.mel_fmax + ) + + audio_dict.update({ + f"gen/audio_{batch_idx}": y_hat[0], + f"gt/audio_{batch_idx}": y[0] + }) + image_dict.update({ + f"gen/mel": utils.plot_spectrogram_to_numpy(y_hat_mel[0].cpu().numpy()), + "gt/mel": utils.plot_spectrogram_to_numpy(mel[0].cpu().numpy()) + }) + utils.summarize( + writer=writer_eval, + global_step=global_step, + images=image_dict, + audios=audio_dict, + audio_sampling_rate=hps.data.sampling_rate + ) + generator.train() + + +if __name__ == "__main__": + main() diff --git a/AutoCoverTool/ref/so_vits_svc/utils.py b/AutoCoverTool/ref/so_vits_svc/utils.py new file mode 100644 index 0000000..9eb9679 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/utils.py @@ -0,0 +1,360 @@ +import os +import glob +import re +import sys +import argparse +import logging +import json +import subprocess + +import librosa +import numpy as np +import torchaudio +from scipy.io.wavfile import read +import torch +import torchvision +from torch.nn import functional as F +from commons import sequence_mask +from hubert import hubert_model + +MATPLOTLIB_FLAG = False + +logging.basicConfig(stream=sys.stdout, level=logging.DEBUG) +logger = logging + +f0_bin = 256 +f0_max = 1100.0 +f0_min = 50.0 +f0_mel_min = 1127 * np.log(1 + f0_min / 700) +f0_mel_max = 1127 * np.log(1 + f0_max / 700) + + +def f0_to_coarse(f0): + is_torch 
= isinstance(f0, torch.Tensor)
+    f0_mel = 1127 * (1 + f0 / 700).log() if is_torch else 1127 * np.log(1 + f0 / 700)
+    f0_mel[f0_mel > 0] = (f0_mel[f0_mel > 0] - f0_mel_min) * (f0_bin - 2) / (f0_mel_max - f0_mel_min) + 1
+
+    f0_mel[f0_mel <= 1] = 1
+    f0_mel[f0_mel > f0_bin - 1] = f0_bin - 1
+    f0_coarse = (f0_mel + 0.5).long() if is_torch else np.rint(f0_mel).astype(int)
+    assert f0_coarse.max() <= 255 and f0_coarse.min() >= 1, (f0_coarse.max(), f0_coarse.min())
+    return f0_coarse
+
+
+def get_hubert_model(rank=None):
+    hubert_soft = hubert_model.hubert_soft("data/models/hubert-soft-0d54a1f4.pt")
+    if rank is not None:
+        hubert_soft = hubert_soft.cuda(rank)
+    return hubert_soft
+
+
+def get_hubert_content(hmodel, y=None, path=None):
+    if path is not None:
+        source, sr = torchaudio.load(path)
+        source = torchaudio.functional.resample(source, sr, 16000)
+        if len(source.shape) == 2 and source.shape[1] >= 2:
+            source = torch.mean(source, dim=0).unsqueeze(0)
+    else:
+        source = y
+    source = source.unsqueeze(0)
+    with torch.inference_mode():
+        units = hmodel.units(source)
+        return units.transpose(1, 2)
+
+
+def get_content(cmodel, y):
+    with torch.no_grad():
+        c = cmodel.extract_features(y.squeeze(1))[0]
+    c = c.transpose(1, 2)
+    return c
+
+
+def transform(mel, height):  # 68-92
+    # r = np.random.random()
+    # rate = r * 0.3 + 0.85  # 0.85-1.15
+    # height = int(mel.size(-2) * rate)
+    tgt = torchvision.transforms.functional.resize(mel, (height, mel.size(-1)))
+    if height >= mel.size(-2):
+        return tgt[:, :mel.size(-2), :]
+    else:
+        silence = tgt[:, -1:, :].repeat(1, mel.size(-2) - height, 1)
+        silence += torch.randn_like(silence) / 10
+        return torch.cat((tgt, silence), 1)
+
+
+def stretch(mel, width):  # 0.5-2
+    return torchvision.transforms.functional.resize(mel, (mel.size(-2), width))
+
+
+def load_checkpoint(checkpoint_path, model, optimizer=None):
+    assert os.path.isfile(checkpoint_path)
+    checkpoint_dict = torch.load(checkpoint_path, map_location='cpu')
+    iteration = checkpoint_dict['iteration']
+    learning_rate = checkpoint_dict['learning_rate']
+    if iteration is None:
+        iteration = 1
+    if learning_rate is None:
+        learning_rate = 0.0002
+    if optimizer is not None and checkpoint_dict['optimizer'] is not None:
+        optimizer.load_state_dict(checkpoint_dict['optimizer'])
+    saved_state_dict = checkpoint_dict['model']
+    if hasattr(model, 'module'):
+        state_dict = model.module.state_dict()
+    else:
+        state_dict = model.state_dict()
+    new_state_dict = {}
+    for k, v in state_dict.items():
+        try:
+            new_state_dict[k] = saved_state_dict[k]
+        except KeyError:
+            logger.info("%s is not in the checkpoint" % k)
+            new_state_dict[k] = v
+    if hasattr(model, 'module'):
+        model.module.load_state_dict(new_state_dict)
+    else:
+        model.load_state_dict(new_state_dict)
+    logger.info("Loaded checkpoint '{}' (iteration {})".format(
+        checkpoint_path, iteration))
+    return model, optimizer, learning_rate, iteration
+
+
+def save_checkpoint(model, optimizer, learning_rate, iteration, checkpoint_path):
+    logger.info("Saving model and optimizer state at iteration {} to {}".format(
+        iteration, checkpoint_path))
+    if hasattr(model, 'module'):
+        state_dict = model.module.state_dict()
+    else:
+        state_dict = model.state_dict()
+    torch.save({'model': state_dict,
+                'iteration': iteration,
+                'optimizer': optimizer.state_dict(),
+                'learning_rate': learning_rate}, checkpoint_path)
+    clean_ckpt = False
+    if clean_ckpt:
+        clean_checkpoints(path_to_models='logs/32k/', n_ckpts_to_keep=3, sort_by_time=True)
+
+
+def clean_checkpoints(path_to_models='logs/48k/', n_ckpts_to_keep=2, sort_by_time=True):
+    """Free up space by deleting saved checkpoints.
+
+    Arguments:
+    path_to_models    --  Path to the model directory
+    n_ckpts_to_keep   --  Number of ckpts to keep, excluding G_0.pth and D_0.pth
+    sort_by_time      --  True -> chronologically delete ckpts
+                          False -> lexicographically delete ckpts
+    """
+    ckpts_files = [f for f in os.listdir(path_to_models) if os.path.isfile(os.path.join(path_to_models, f))]
+    name_key = (lambda _f: int(re.compile(r'._(\d+)\.pth').match(_f).group(1)))
+    time_key = (lambda _f: os.path.getmtime(os.path.join(path_to_models, _f)))
+    sort_key = time_key if sort_by_time else name_key
+    x_sorted = lambda _x: sorted([f for f in ckpts_files if f.startswith(_x) and not f.endswith('_0.pth')],
+                                 key=sort_key)
+    to_del = [os.path.join(path_to_models, fn) for fn in
+              (x_sorted('G')[:-n_ckpts_to_keep] + x_sorted('D')[:-n_ckpts_to_keep])]
+    del_info = lambda fn: logger.info(f".. Free up space by deleting ckpt {fn}")
+    del_routine = lambda x: [os.remove(x), del_info(x)]
+    rs = [del_routine(fn) for fn in to_del]
+
+
+def summarize(writer, global_step, scalars={}, histograms={}, images={}, audios={}, audio_sampling_rate=22050):
+    for k, v in scalars.items():
+        writer.add_scalar(k, v, global_step)
+    for k, v in histograms.items():
+        writer.add_histogram(k, v, global_step)
+    for k, v in images.items():
+        writer.add_image(k, v, global_step, dataformats='HWC')
+    for k, v in audios.items():
+        writer.add_audio(k, v, global_step, audio_sampling_rate)
+
+
+def latest_checkpoint_path(dir_path, regex="G_*.pth"):
+    f_list = glob.glob(os.path.join(dir_path, regex))
+    f_list.sort(key=lambda f: int("".join(filter(str.isdigit, f))))
+    x = f_list[-1]
+    print(x)
+    return x
+
+
+def plot_spectrogram_to_numpy(spectrogram):
+    global MATPLOTLIB_FLAG
+    if not MATPLOTLIB_FLAG:
+        import matplotlib
+        matplotlib.use("Agg")
+        MATPLOTLIB_FLAG = True
+        mpl_logger = logging.getLogger('matplotlib')
+        mpl_logger.setLevel(logging.WARNING)
+    import matplotlib.pylab as plt
+    import numpy as np
+
+    fig, ax = plt.subplots(figsize=(10, 2))
+    im = ax.imshow(spectrogram, aspect="auto", origin="lower",
+                   interpolation='none')
+    plt.colorbar(im, ax=ax)
+    plt.xlabel("Frames")
+    plt.ylabel("Channels")
+    plt.tight_layout()
+
+    fig.canvas.draw()
+    data = np.frombuffer(fig.canvas.tostring_rgb(), dtype=np.uint8)
+    data = data.reshape(fig.canvas.get_width_height()[::-1] + (3,))
+    plt.close()
+    return data
+
+
+def plot_alignment_to_numpy(alignment, info=None):
+    global MATPLOTLIB_FLAG
+    if not MATPLOTLIB_FLAG:
+        import matplotlib
+        matplotlib.use("Agg")
+        MATPLOTLIB_FLAG = True
+        mpl_logger = logging.getLogger('matplotlib')
+        mpl_logger.setLevel(logging.WARNING)
+    import matplotlib.pylab as plt
+    import numpy as np
+
+    fig, ax = plt.subplots(figsize=(6, 4))
+    im = ax.imshow(alignment.transpose(), aspect='auto', origin='lower',
+                   interpolation='none')
+    fig.colorbar(im, ax=ax)
+    xlabel = 'Decoder timestep'
+    if info is not None:
+        xlabel += '\n\n' + info
+    plt.xlabel(xlabel)
+    plt.ylabel('Encoder timestep')
+    plt.tight_layout()
+
+    fig.canvas.draw()
+    data = np.frombuffer(fig.canvas.tostring_rgb(), dtype=np.uint8)
+    data = data.reshape(fig.canvas.get_width_height()[::-1] + (3,))
+    plt.close()
+    return data
+
+
+def load_wav_to_torch(full_path):
+    sampling_rate, data = read(full_path)
+    return torch.FloatTensor(data.astype(np.float32)), sampling_rate
+
+
+def load_filepaths_and_text(filename, split="|"):
+    with open(filename, encoding='utf-8')
as f: + filepaths_and_text = [line.strip().split(split) for line in f] + return filepaths_and_text + + +def get_hparams(init=True): + parser = argparse.ArgumentParser() + parser.add_argument('-c', '--config', type=str, default="./configs/base.json", + help='JSON file for configuration') + parser.add_argument('-m', '--model', type=str, required=True, + help='Model name') + parser.add_argument('-l', '--logs', type=str, required=True, + help='log Name') + + args = parser.parse_args() + model_dir = os.path.join(args.logs, args.model) + + if not os.path.exists(model_dir): + os.makedirs(model_dir) + + config_path = args.config + config_save_path = os.path.join(model_dir, "config.json") + if init: + with open(config_path, "r") as f: + data = f.read() + with open(config_save_path, "w") as f: + f.write(data) + else: + with open(config_save_path, "r") as f: + data = f.read() + config = json.loads(data) + + hparams = HParams(**config) + hparams.model_dir = model_dir + return hparams + + +def get_hparams_from_dir(model_dir): + config_save_path = os.path.join(model_dir, "config.json") + with open(config_save_path, "r") as f: + data = f.read() + config = json.loads(data) + + hparams = HParams(**config) + hparams.model_dir = model_dir + return hparams + + +def get_hparams_from_file(config_path): + with open(config_path, "r") as f: + data = f.read() + config = json.loads(data) + + hparams = HParams(**config) + return hparams + + +def check_git_hash(model_dir): + source_dir = os.path.dirname(os.path.realpath(__file__)) + if not os.path.exists(os.path.join(source_dir, ".git")): + logger.warn("{} is not a git repository, therefore hash value comparison will be ignored.".format( + source_dir + )) + return + + cur_hash = subprocess.getoutput("git rev-parse HEAD") + + path = os.path.join(model_dir, "githash") + if os.path.exists(path): + saved_hash = open(path).read() + if saved_hash != cur_hash: + logger.warn("git hash values are different. 
{}(saved) != {}(current)".format( + saved_hash[:8], cur_hash[:8])) + else: + open(path, "w").write(cur_hash) + + +def get_logger(model_dir, filename="train.log"): + global logger + logger = logging.getLogger(os.path.basename(model_dir)) + logger.setLevel(logging.DEBUG) + + formatter = logging.Formatter("%(asctime)s\t%(name)s\t%(levelname)s\t%(message)s") + if not os.path.exists(model_dir): + os.makedirs(model_dir) + h = logging.FileHandler(os.path.join(model_dir, filename)) + h.setLevel(logging.DEBUG) + h.setFormatter(formatter) + logger.addHandler(h) + return logger + + +class HParams(): + def __init__(self, **kwargs): + for k, v in kwargs.items(): + if type(v) == dict: + v = HParams(**v) + self[k] = v + + def keys(self): + return self.__dict__.keys() + + def items(self): + return self.__dict__.items() + + def values(self): + return self.__dict__.values() + + def __len__(self): + return len(self.__dict__) + + def __getitem__(self, key): + return getattr(self, key) + + def __setitem__(self, key, value): + return setattr(self, key, value) + + def __contains__(self, key): + return key in self.__dict__ + + def __repr__(self): + return self.__dict__.__repr__() diff --git a/AutoCoverTool/ref/so_vits_svc/vdecoder/__init__.py b/AutoCoverTool/ref/so_vits_svc/vdecoder/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/env.py b/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/env.py new file mode 100644 index 0000000..2bdbc95 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/env.py @@ -0,0 +1,15 @@ +import os +import shutil + + +class AttrDict(dict): + def __init__(self, *args, **kwargs): + super(AttrDict, self).__init__(*args, **kwargs) + self.__dict__ = self + + +def build_env(config, config_name, path): + t_path = os.path.join(path, config_name) + if config != t_path: + os.makedirs(path, exist_ok=True) + shutil.copyfile(config, os.path.join(path, config_name)) diff --git a/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/models.py b/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/models.py new file mode 100644 index 0000000..9747301 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/models.py @@ -0,0 +1,503 @@ +import os +import json +from .env import AttrDict +import numpy as np +import torch +import torch.nn.functional as F +import torch.nn as nn +from torch.nn import Conv1d, ConvTranspose1d, AvgPool1d, Conv2d +from torch.nn.utils import weight_norm, remove_weight_norm, spectral_norm +from .utils import init_weights, get_padding + +LRELU_SLOPE = 0.1 + + +def load_model(model_path, device='cuda'): + config_file = os.path.join(os.path.split(model_path)[0], 'config.json') + with open(config_file) as f: + data = f.read() + + global h + json_config = json.loads(data) + h = AttrDict(json_config) + + generator = Generator(h).to(device) + + cp_dict = torch.load(model_path) + generator.load_state_dict(cp_dict['generator']) + generator.eval() + generator.remove_weight_norm() + del cp_dict + return generator, h + + +class ResBlock1(torch.nn.Module): + def __init__(self, h, channels, kernel_size=3, dilation=(1, 3, 5)): + super(ResBlock1, self).__init__() + self.h = h + self.convs1 = nn.ModuleList([ + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[0], + padding=get_padding(kernel_size, dilation[0]))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[1], + padding=get_padding(kernel_size, dilation[1]))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, 
dilation=dilation[2], + padding=get_padding(kernel_size, dilation[2]))) + ]) + self.convs1.apply(init_weights) + + self.convs2 = nn.ModuleList([ + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=1, + padding=get_padding(kernel_size, 1))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=1, + padding=get_padding(kernel_size, 1))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=1, + padding=get_padding(kernel_size, 1))) + ]) + self.convs2.apply(init_weights) + + def forward(self, x): + for c1, c2 in zip(self.convs1, self.convs2): + xt = F.leaky_relu(x, LRELU_SLOPE) + xt = c1(xt) + xt = F.leaky_relu(xt, LRELU_SLOPE) + xt = c2(xt) + x = xt + x + return x + + def remove_weight_norm(self): + for l in self.convs1: + remove_weight_norm(l) + for l in self.convs2: + remove_weight_norm(l) + + +class ResBlock2(torch.nn.Module): + def __init__(self, h, channels, kernel_size=3, dilation=(1, 3)): + super(ResBlock2, self).__init__() + self.h = h + self.convs = nn.ModuleList([ + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[0], + padding=get_padding(kernel_size, dilation[0]))), + weight_norm(Conv1d(channels, channels, kernel_size, 1, dilation=dilation[1], + padding=get_padding(kernel_size, dilation[1]))) + ]) + self.convs.apply(init_weights) + + def forward(self, x): + for c in self.convs: + xt = F.leaky_relu(x, LRELU_SLOPE) + xt = c(xt) + x = xt + x + return x + + def remove_weight_norm(self): + for l in self.convs: + remove_weight_norm(l) + + +def padDiff(x): + return F.pad(F.pad(x, (0,0,-1,1), 'constant', 0) - x, (0,0,0,-1), 'constant', 0) + +class SineGen(torch.nn.Module): + """ Definition of sine generator + SineGen(samp_rate, harmonic_num = 0, + sine_amp = 0.1, noise_std = 0.003, + voiced_threshold = 0, + flag_for_pulse=False) + samp_rate: sampling rate in Hz + harmonic_num: number of harmonic overtones (default 0) + sine_amp: amplitude of sine-wavefrom (default 0.1) + noise_std: std of Gaussian noise (default 0.003) + voiced_thoreshold: F0 threshold for U/V classification (default 0) + flag_for_pulse: this SinGen is used inside PulseGen (default False) + Note: when flag_for_pulse is True, the first time step of a voiced + segment is always sin(np.pi) or cos(0) + """ + + def __init__(self, samp_rate, harmonic_num=0, + sine_amp=0.1, noise_std=0.003, + voiced_threshold=0, + flag_for_pulse=False): + super(SineGen, self).__init__() + self.sine_amp = sine_amp + self.noise_std = noise_std + self.harmonic_num = harmonic_num + self.dim = self.harmonic_num + 1 + self.sampling_rate = samp_rate + self.voiced_threshold = voiced_threshold + self.flag_for_pulse = flag_for_pulse + + def _f02uv(self, f0): + # generate uv signal + uv = (f0 > self.voiced_threshold).type(torch.float32) + return uv + + def _f02sine(self, f0_values): + """ f0_values: (batchsize, length, dim) + where dim indicates fundamental tone and overtones + """ + # convert to F0 in rad. The interger part n can be ignored + # because 2 * np.pi * n doesn't affect phase + rad_values = (f0_values / self.sampling_rate) % 1 + + # initial phase noise (no noise for fundamental component) + rand_ini = torch.rand(f0_values.shape[0], f0_values.shape[2], \ + device=f0_values.device) + rand_ini[:, 0] = 0 + rad_values[:, 0, :] = rad_values[:, 0, :] + rand_ini + + # instantanouse phase sine[t] = sin(2*pi \sum_i=1 ^{t} rad) + if not self.flag_for_pulse: + # for normal case + + # To prevent torch.cumsum numerical overflow, + # it is necessary to add -1 whenever \sum_k=1^n rad_value_k > 1. 
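+            # Worked example of the wrap-around trick (illustrative values only):
+            # rad_values = [0.4, 0.4, 0.4] gives cumsum % 1 = [0.4, 0.8, 0.2];
+            # the drop from 0.8 to 0.2 flags an overflow, so cumsum_shift places
+            # a -1 at that step, and subtracting a whole period leaves
+            # sin(2*pi*x) below unchanged.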
+ # Buffer tmp_over_one_idx indicates the time step to add -1. + # This will not change F0 of sine because (x-1) * 2*pi = x * 2*pi + tmp_over_one = torch.cumsum(rad_values, 1) % 1 + tmp_over_one_idx = (padDiff(tmp_over_one)) < 0 + cumsum_shift = torch.zeros_like(rad_values) + cumsum_shift[:, 1:, :] = tmp_over_one_idx * -1.0 + + sines = torch.sin(torch.cumsum(rad_values + cumsum_shift, dim=1) + * 2 * np.pi) + else: + # If necessary, make sure that the first time step of every + # voiced segments is sin(pi) or cos(0) + # This is used for pulse-train generation + + # identify the last time step in unvoiced segments + uv = self._f02uv(f0_values) + uv_1 = torch.roll(uv, shifts=-1, dims=1) + uv_1[:, -1, :] = 1 + u_loc = (uv < 1) * (uv_1 > 0) + + # get the instantanouse phase + tmp_cumsum = torch.cumsum(rad_values, dim=1) + # different batch needs to be processed differently + for idx in range(f0_values.shape[0]): + temp_sum = tmp_cumsum[idx, u_loc[idx, :, 0], :] + temp_sum[1:, :] = temp_sum[1:, :] - temp_sum[0:-1, :] + # stores the accumulation of i.phase within + # each voiced segments + tmp_cumsum[idx, :, :] = 0 + tmp_cumsum[idx, u_loc[idx, :, 0], :] = temp_sum + + # rad_values - tmp_cumsum: remove the accumulation of i.phase + # within the previous voiced segment. + i_phase = torch.cumsum(rad_values - tmp_cumsum, dim=1) + + # get the sines + sines = torch.cos(i_phase * 2 * np.pi) + return sines + + def forward(self, f0): + """ sine_tensor, uv = forward(f0) + input F0: tensor(batchsize=1, length, dim=1) + f0 for unvoiced steps should be 0 + output sine_tensor: tensor(batchsize=1, length, dim) + output uv: tensor(batchsize=1, length, 1) + """ + with torch.no_grad(): + f0_buf = torch.zeros(f0.shape[0], f0.shape[1], self.dim, + device=f0.device) + # fundamental component + fn = torch.multiply(f0, torch.FloatTensor([[range(1, self.harmonic_num + 2)]]).to(f0.device)) + + # generate sine waveforms + sine_waves = self._f02sine(fn) * self.sine_amp + + # generate uv signal + # uv = torch.ones(f0.shape) + # uv = uv * (f0 > self.voiced_threshold) + uv = self._f02uv(f0) + + # noise: for unvoiced should be similar to sine_amp + # std = self.sine_amp/3 -> max value ~ self.sine_amp + # . 
for voiced regions is self.noise_std + noise_amp = uv * self.noise_std + (1 - uv) * self.sine_amp / 3 + noise = noise_amp * torch.randn_like(sine_waves) + + # first: set the unvoiced part to 0 by uv + # then: additive noise + sine_waves = sine_waves * uv + noise + return sine_waves, uv, noise + + +class SourceModuleHnNSF(torch.nn.Module): + """ SourceModule for hn-nsf + SourceModule(sampling_rate, harmonic_num=0, sine_amp=0.1, + add_noise_std=0.003, voiced_threshod=0) + sampling_rate: sampling_rate in Hz + harmonic_num: number of harmonic above F0 (default: 0) + sine_amp: amplitude of sine source signal (default: 0.1) + add_noise_std: std of additive Gaussian noise (default: 0.003) + note that amplitude of noise in unvoiced is decided + by sine_amp + voiced_threshold: threhold to set U/V given F0 (default: 0) + Sine_source, noise_source = SourceModuleHnNSF(F0_sampled) + F0_sampled (batchsize, length, 1) + Sine_source (batchsize, length, 1) + noise_source (batchsize, length 1) + uv (batchsize, length, 1) + """ + + def __init__(self, sampling_rate, harmonic_num=0, sine_amp=0.1, + add_noise_std=0.003, voiced_threshod=0): + super(SourceModuleHnNSF, self).__init__() + + self.sine_amp = sine_amp + self.noise_std = add_noise_std + + # to produce sine waveforms + self.l_sin_gen = SineGen(sampling_rate, harmonic_num, + sine_amp, add_noise_std, voiced_threshod) + + # to merge source harmonics into a single excitation + self.l_linear = torch.nn.Linear(harmonic_num + 1, 1) + self.l_tanh = torch.nn.Tanh() + + def forward(self, x): + """ + Sine_source, noise_source = SourceModuleHnNSF(F0_sampled) + F0_sampled (batchsize, length, 1) + Sine_source (batchsize, length, 1) + noise_source (batchsize, length 1) + """ + # source for harmonic branch + sine_wavs, uv, _ = self.l_sin_gen(x) + sine_merge = self.l_tanh(self.l_linear(sine_wavs)) + + # source for noise branch, in the same shape as uv + noise = torch.randn_like(uv) * self.sine_amp / 3 + return sine_merge, noise, uv + + +class Generator(torch.nn.Module): + def __init__(self, h): + super(Generator, self).__init__() + self.h = h + + self.num_kernels = len(h["resblock_kernel_sizes"]) + self.num_upsamples = len(h["upsample_rates"]) + self.f0_upsamp = torch.nn.Upsample(scale_factor=np.prod(h["upsample_rates"])) + self.m_source = SourceModuleHnNSF( + sampling_rate=h["sampling_rate"], + harmonic_num=8) + self.noise_convs = nn.ModuleList() + self.conv_pre = weight_norm(Conv1d(h["inter_channels"], h["upsample_initial_channel"], 7, 1, padding=3)) + resblock = ResBlock1 if h["resblock"] == '1' else ResBlock2 + self.ups = nn.ModuleList() + for i, (u, k) in enumerate(zip(h["upsample_rates"], h["upsample_kernel_sizes"])): + c_cur = h["upsample_initial_channel"] // (2 ** (i + 1)) + self.ups.append(weight_norm( + ConvTranspose1d(h["upsample_initial_channel"] // (2 ** i), h["upsample_initial_channel"] // (2 ** (i + 1)), + k, u, padding=(k - u) // 2))) + if i + 1 < len(h["upsample_rates"]): # + stride_f0 = np.prod(h["upsample_rates"][i + 1:]) + self.noise_convs.append(Conv1d( + 1, c_cur, kernel_size=stride_f0 * 2, stride=stride_f0, padding=stride_f0 // 2)) + else: + self.noise_convs.append(Conv1d(1, c_cur, kernel_size=1)) + self.resblocks = nn.ModuleList() + for i in range(len(self.ups)): + ch = h["upsample_initial_channel"] // (2 ** (i + 1)) + for j, (k, d) in enumerate(zip(h["resblock_kernel_sizes"], h["resblock_dilation_sizes"])): + self.resblocks.append(resblock(h, ch, k, d)) + + self.conv_post = weight_norm(Conv1d(ch, 1, 7, 1, padding=3)) + 
self.ups.apply(init_weights) + self.conv_post.apply(init_weights) + self.cond = nn.Conv1d(h['gin_channels'], h['upsample_initial_channel'], 1) + + def forward(self, x, f0, g=None): + # print(1,x.shape,f0.shape,f0[:, None].shape) + f0 = self.f0_upsamp(f0[:, None]).transpose(1, 2) # bs,n,t + # print(2,f0.shape) + har_source, noi_source, uv = self.m_source(f0) + har_source = har_source.transpose(1, 2) + x = self.conv_pre(x) + x = x + self.cond(g) + # print(124,x.shape,har_source.shape) + for i in range(self.num_upsamples): + x = F.leaky_relu(x, LRELU_SLOPE) + # print(3,x.shape) + x = self.ups[i](x) + x_source = self.noise_convs[i](har_source) + # print(4,x_source.shape,har_source.shape,x.shape) + x = x + x_source + xs = None + for j in range(self.num_kernels): + if xs is None: + xs = self.resblocks[i * self.num_kernels + j](x) + else: + xs += self.resblocks[i * self.num_kernels + j](x) + x = xs / self.num_kernels + x = F.leaky_relu(x) + x = self.conv_post(x) + x = torch.tanh(x) + + return x + + def remove_weight_norm(self): + print('Removing weight norm...') + for l in self.ups: + remove_weight_norm(l) + for l in self.resblocks: + l.remove_weight_norm() + remove_weight_norm(self.conv_pre) + remove_weight_norm(self.conv_post) + + +class DiscriminatorP(torch.nn.Module): + def __init__(self, period, kernel_size=5, stride=3, use_spectral_norm=False): + super(DiscriminatorP, self).__init__() + self.period = period + norm_f = weight_norm if use_spectral_norm == False else spectral_norm + self.convs = nn.ModuleList([ + norm_f(Conv2d(1, 32, (kernel_size, 1), (stride, 1), padding=(get_padding(5, 1), 0))), + norm_f(Conv2d(32, 128, (kernel_size, 1), (stride, 1), padding=(get_padding(5, 1), 0))), + norm_f(Conv2d(128, 512, (kernel_size, 1), (stride, 1), padding=(get_padding(5, 1), 0))), + norm_f(Conv2d(512, 1024, (kernel_size, 1), (stride, 1), padding=(get_padding(5, 1), 0))), + norm_f(Conv2d(1024, 1024, (kernel_size, 1), 1, padding=(2, 0))), + ]) + self.conv_post = norm_f(Conv2d(1024, 1, (3, 1), 1, padding=(1, 0))) + + def forward(self, x): + fmap = [] + + # 1d to 2d + b, c, t = x.shape + if t % self.period != 0: # pad first + n_pad = self.period - (t % self.period) + x = F.pad(x, (0, n_pad), "reflect") + t = t + n_pad + x = x.view(b, c, t // self.period, self.period) + + for l in self.convs: + x = l(x) + x = F.leaky_relu(x, LRELU_SLOPE) + fmap.append(x) + x = self.conv_post(x) + fmap.append(x) + x = torch.flatten(x, 1, -1) + + return x, fmap + + +class MultiPeriodDiscriminator(torch.nn.Module): + def __init__(self, periods=None): + super(MultiPeriodDiscriminator, self).__init__() + self.periods = periods if periods is not None else [2, 3, 5, 7, 11] + self.discriminators = nn.ModuleList() + for period in self.periods: + self.discriminators.append(DiscriminatorP(period)) + + def forward(self, y, y_hat): + y_d_rs = [] + y_d_gs = [] + fmap_rs = [] + fmap_gs = [] + for i, d in enumerate(self.discriminators): + y_d_r, fmap_r = d(y) + y_d_g, fmap_g = d(y_hat) + y_d_rs.append(y_d_r) + fmap_rs.append(fmap_r) + y_d_gs.append(y_d_g) + fmap_gs.append(fmap_g) + + return y_d_rs, y_d_gs, fmap_rs, fmap_gs + + +class DiscriminatorS(torch.nn.Module): + def __init__(self, use_spectral_norm=False): + super(DiscriminatorS, self).__init__() + norm_f = weight_norm if use_spectral_norm == False else spectral_norm + self.convs = nn.ModuleList([ + norm_f(Conv1d(1, 128, 15, 1, padding=7)), + norm_f(Conv1d(128, 128, 41, 2, groups=4, padding=20)), + norm_f(Conv1d(128, 256, 41, 2, groups=16, padding=20)), + norm_f(Conv1d(256, 512, 
41, 4, groups=16, padding=20)), + norm_f(Conv1d(512, 1024, 41, 4, groups=16, padding=20)), + norm_f(Conv1d(1024, 1024, 41, 1, groups=16, padding=20)), + norm_f(Conv1d(1024, 1024, 5, 1, padding=2)), + ]) + self.conv_post = norm_f(Conv1d(1024, 1, 3, 1, padding=1)) + + def forward(self, x): + fmap = [] + for l in self.convs: + x = l(x) + x = F.leaky_relu(x, LRELU_SLOPE) + fmap.append(x) + x = self.conv_post(x) + fmap.append(x) + x = torch.flatten(x, 1, -1) + + return x, fmap + + +class MultiScaleDiscriminator(torch.nn.Module): + def __init__(self): + super(MultiScaleDiscriminator, self).__init__() + self.discriminators = nn.ModuleList([ + DiscriminatorS(use_spectral_norm=True), + DiscriminatorS(), + DiscriminatorS(), + ]) + self.meanpools = nn.ModuleList([ + AvgPool1d(4, 2, padding=2), + AvgPool1d(4, 2, padding=2) + ]) + + def forward(self, y, y_hat): + y_d_rs = [] + y_d_gs = [] + fmap_rs = [] + fmap_gs = [] + for i, d in enumerate(self.discriminators): + if i != 0: + y = self.meanpools[i - 1](y) + y_hat = self.meanpools[i - 1](y_hat) + y_d_r, fmap_r = d(y) + y_d_g, fmap_g = d(y_hat) + y_d_rs.append(y_d_r) + fmap_rs.append(fmap_r) + y_d_gs.append(y_d_g) + fmap_gs.append(fmap_g) + + return y_d_rs, y_d_gs, fmap_rs, fmap_gs + + +def feature_loss(fmap_r, fmap_g): + loss = 0 + for dr, dg in zip(fmap_r, fmap_g): + for rl, gl in zip(dr, dg): + loss += torch.mean(torch.abs(rl - gl)) + + return loss * 2 + + +def discriminator_loss(disc_real_outputs, disc_generated_outputs): + loss = 0 + r_losses = [] + g_losses = [] + for dr, dg in zip(disc_real_outputs, disc_generated_outputs): + r_loss = torch.mean((1 - dr) ** 2) + g_loss = torch.mean(dg ** 2) + loss += (r_loss + g_loss) + r_losses.append(r_loss.item()) + g_losses.append(g_loss.item()) + + return loss, r_losses, g_losses + + +def generator_loss(disc_outputs): + loss = 0 + gen_losses = [] + for dg in disc_outputs: + l = torch.mean((1 - dg) ** 2) + gen_losses.append(l) + loss += l + + return loss, gen_losses diff --git a/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/nvSTFT.py b/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/nvSTFT.py new file mode 100644 index 0000000..88597d6 --- /dev/null +++ b/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/nvSTFT.py @@ -0,0 +1,111 @@ +import math +import os +os.environ["LRU_CACHE_CAPACITY"] = "3" +import random +import torch +import torch.utils.data +import numpy as np +import librosa +from librosa.util import normalize +from librosa.filters import mel as librosa_mel_fn +from scipy.io.wavfile import read +import soundfile as sf + +def load_wav_to_torch(full_path, target_sr=None, return_empty_on_exception=False): + sampling_rate = None + try: + data, sampling_rate = sf.read(full_path, always_2d=True)# than soundfile. 
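+        # sf.read(always_2d=True) returns (n_samples, n_channels); the code below
+        # keeps only the first channel and uses max_mag to rescale 16-bit int,
+        # 32-bit int or float input into the [-1, 1] float32 range.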
+ except Exception as ex: + print(f"'{full_path}' failed to load.\nException:") + print(ex) + if return_empty_on_exception: + return [], sampling_rate or target_sr or 32000 + else: + raise Exception(ex) + + if len(data.shape) > 1: + data = data[:, 0] + assert len(data) > 2# check duration of audio file is > 2 samples (because otherwise the slice operation was on the wrong dimension) + + if np.issubdtype(data.dtype, np.integer): # if audio data is type int + max_mag = -np.iinfo(data.dtype).min # maximum magnitude = min possible value of intXX + else: # if audio data is type fp32 + max_mag = max(np.amax(data), -np.amin(data)) + max_mag = (2**31)+1 if max_mag > (2**15) else ((2**15)+1 if max_mag > 1.01 else 1.0) # data should be either 16-bit INT, 32-bit INT or [-1 to 1] float32 + + data = torch.FloatTensor(data.astype(np.float32))/max_mag + + if (torch.isinf(data) | torch.isnan(data)).any() and return_empty_on_exception:# resample will crash with inf/NaN inputs. return_empty_on_exception will return empty arr instead of except + return [], sampling_rate or target_sr or 32000 + if target_sr is not None and sampling_rate != target_sr: + data = torch.from_numpy(librosa.core.resample(data.numpy(), orig_sr=sampling_rate, target_sr=target_sr)) + sampling_rate = target_sr + + return data, sampling_rate + +def dynamic_range_compression(x, C=1, clip_val=1e-5): + return np.log(np.clip(x, a_min=clip_val, a_max=None) * C) + +def dynamic_range_decompression(x, C=1): + return np.exp(x) / C + +def dynamic_range_compression_torch(x, C=1, clip_val=1e-5): + return torch.log(torch.clamp(x, min=clip_val) * C) + +def dynamic_range_decompression_torch(x, C=1): + return torch.exp(x) / C + +class STFT(): + def __init__(self, sr=22050, n_mels=80, n_fft=1024, win_size=1024, hop_length=256, fmin=20, fmax=11025, clip_val=1e-5): + self.target_sr = sr + + self.n_mels = n_mels + self.n_fft = n_fft + self.win_size = win_size + self.hop_length = hop_length + self.fmin = fmin + self.fmax = fmax + self.clip_val = clip_val + self.mel_basis = {} + self.hann_window = {} + + def get_mel(self, y, center=False): + sampling_rate = self.target_sr + n_mels = self.n_mels + n_fft = self.n_fft + win_size = self.win_size + hop_length = self.hop_length + fmin = self.fmin + fmax = self.fmax + clip_val = self.clip_val + + if torch.min(y) < -1.: + print('min value is ', torch.min(y)) + if torch.max(y) > 1.: + print('max value is ', torch.max(y)) + + if fmax not in self.mel_basis: + mel = librosa_mel_fn(sr=sampling_rate, n_fft=n_fft, n_mels=n_mels, fmin=fmin, fmax=fmax) + self.mel_basis[str(fmax)+'_'+str(y.device)] = torch.from_numpy(mel).float().to(y.device) + self.hann_window[str(y.device)] = torch.hann_window(self.win_size).to(y.device) + + y = torch.nn.functional.pad(y.unsqueeze(1), (int((n_fft-hop_length)/2), int((n_fft-hop_length)/2)), mode='reflect') + y = y.squeeze(1) + + spec = torch.stft(y, n_fft, hop_length=hop_length, win_length=win_size, window=self.hann_window[str(y.device)], + center=center, pad_mode='reflect', normalized=False, onesided=True) + # print(111,spec) + spec = torch.sqrt(spec.pow(2).sum(-1)+(1e-9)) + # print(222,spec) + spec = torch.matmul(self.mel_basis[str(fmax)+'_'+str(y.device)], spec) + # print(333,spec) + spec = dynamic_range_compression_torch(spec, clip_val=clip_val) + # print(444,spec) + return spec + + def __call__(self, audiopath): + audio, sr = load_wav_to_torch(audiopath, target_sr=self.target_sr) + spect = self.get_mel(audio.unsqueeze(0)).squeeze(0) + return spect + +stft = STFT() diff --git 
a/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/utils.py b/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/utils.py
new file mode 100644
index 0000000..84bff02
--- /dev/null
+++ b/AutoCoverTool/ref/so_vits_svc/vdecoder/hifigan/utils.py
@@ -0,0 +1,68 @@
+import glob
+import os
+import matplotlib
+import torch
+from torch.nn.utils import weight_norm
+matplotlib.use("Agg")
+import matplotlib.pylab as plt
+
+
+def plot_spectrogram(spectrogram):
+    fig, ax = plt.subplots(figsize=(10, 2))
+    im = ax.imshow(spectrogram, aspect="auto", origin="lower",
+                   interpolation='none')
+    plt.colorbar(im, ax=ax)
+
+    fig.canvas.draw()
+    plt.close()
+
+    return fig
+
+
+def init_weights(m, mean=0.0, std=0.01):
+    classname = m.__class__.__name__
+    if classname.find("Conv") != -1:
+        m.weight.data.normal_(mean, std)
+
+
+def apply_weight_norm(m):
+    classname = m.__class__.__name__
+    if classname.find("Conv") != -1:
+        weight_norm(m)
+
+
+def get_padding(kernel_size, dilation=1):
+    return int((kernel_size*dilation - dilation)/2)
+
+
+def load_checkpoint(filepath, device):
+    assert os.path.isfile(filepath)
+    print("Loading '{}'".format(filepath))
+    checkpoint_dict = torch.load(filepath, map_location=device)
+    print("Complete.")
+    return checkpoint_dict
+
+
+def save_checkpoint(filepath, obj):
+    print("Saving checkpoint to {}".format(filepath))
+    torch.save(obj, filepath)
+    print("Complete.")
+
+
+def del_old_checkpoints(cp_dir, prefix, n_models=2):
+    pattern = os.path.join(cp_dir, prefix + '????????')
+    cp_list = glob.glob(pattern)  # get checkpoint paths
+    cp_list = sorted(cp_list)  # sort by iteration number
+    if len(cp_list) > n_models:  # if more than n_models models are found
+        for cp in cp_list[:-n_models]:  # delete the oldest models other than the latest n_models
+            open(cp, 'w').close()  # empty file contents
+            os.unlink(cp)  # delete file (move to trash when using Colab)
+
+
+def scan_checkpoint(cp_dir, prefix):
+    pattern = os.path.join(cp_dir, prefix + '????????')
+    cp_list = glob.glob(pattern)
+    if len(cp_list) == 0:
+        return None
+    return sorted(cp_list)[-1]
+
diff --git a/AutoCoverTool/ref/split_dirty_frame/custom_models/mobilenet_v2_custom.py b/AutoCoverTool/ref/split_dirty_frame/custom_models/mobilenet_v2_custom.py
new file mode 100644
index 0000000..57b1227
--- /dev/null
+++ b/AutoCoverTool/ref/split_dirty_frame/custom_models/mobilenet_v2_custom.py
@@ -0,0 +1,142 @@
+"""
+Code copied directly from the library source.
+Reason: mobilenet_v2 only accepts 3-channel image input, which does not meet our
+requirements, so it was copied out here and modified.
+"""
+
+from torch import nn
+
+
+def _make_divisible(v, divisor, min_value=None):
+    """
+    This function is taken from the original tf repo.
+    It ensures that all layers have a channel number that is divisible by 8
+    It can be seen here:
+    https://github.com/tensorflow/models/blob/master/research/slim/nets/mobilenet/mobilenet.py
+    :param v:
+    :param divisor:
+    :param min_value:
+    :return:
+    """
+    if min_value is None:
+        min_value = divisor
+    new_v = max(min_value, int(v + divisor / 2) // divisor * divisor)
+    # Make sure that round down does not go down by more than 10%.
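+    # e.g. _make_divisible(19, 16) == 32: plain rounding would give 16, which is
+    # more than 10% below 19, so the guard below adds one extra divisor step;
+    # _make_divisible(30, 8) rounds straight to 32 and the guard is skipped.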
+    if new_v < 0.9 * v:
+        new_v += divisor
+    return new_v
+
+
+class ConvBNReLU(nn.Sequential):
+    def __init__(self, in_planes, out_planes, kernel_size=3, stride=1, groups=1):
+        padding = (kernel_size - 1) // 2
+        super(ConvBNReLU, self).__init__(
+            nn.Conv2d(in_planes, out_planes, kernel_size, stride, padding, groups=groups, bias=False),
+            nn.BatchNorm2d(out_planes),
+            nn.ReLU6(inplace=True)
+        )
+
+
+class InvertedResidual(nn.Module):
+    def __init__(self, inp, oup, stride, expand_ratio):
+        super(InvertedResidual, self).__init__()
+        self.stride = stride
+        assert stride in [1, 2]
+
+        hidden_dim = int(round(inp * expand_ratio))
+        self.use_res_connect = self.stride == 1 and inp == oup
+
+        layers = []
+        if expand_ratio != 1:
+            # pw
+            layers.append(ConvBNReLU(inp, hidden_dim, kernel_size=1))
+        layers.extend([
+            # dw
+            ConvBNReLU(hidden_dim, hidden_dim, stride=stride, groups=hidden_dim),
+            # pw-linear
+            nn.Conv2d(hidden_dim, oup, 1, 1, 0, bias=False),
+            nn.BatchNorm2d(oup),
+        ])
+        self.conv = nn.Sequential(*layers)
+
+    def forward(self, x):
+        if self.use_res_connect:
+            return x + self.conv(x)
+        else:
+            return self.conv(x)
+
+
+class MobileNetV2Custom(nn.Module):
+    def __init__(self, num_classes=2, in_channel=1, width_mult=1.0, inverted_residual_setting=None, round_nearest=8):
+        """
+        MobileNet V2 main class
+
+        Args:
+            num_classes (int): Number of classes
+            width_mult (float): Width multiplier - adjusts number of channels in each layer by this amount
+            inverted_residual_setting: Network structure
+            round_nearest (int): Round the number of channels in each layer to be a multiple of this number
+            Set to 1 to turn off rounding
+        """
+        super(MobileNetV2Custom, self).__init__()
+        block = InvertedResidual
+        input_channel = 32
+        last_channel = 1280
+
+        if inverted_residual_setting is None:
+            inverted_residual_setting = [
+                # t, c, n, s
+                [1, 16, 1, 1],
+                [6, 24, 2, 2],
+                [6, 32, 3, 2],
+                [6, 64, 4, 2],
+                [6, 96, 3, 1],
+                [6, 160, 3, 2],
+                [6, 320, 1, 1],
+            ]
+
+        # only check the first element, assuming user knows t,c,n,s are required
+        if len(inverted_residual_setting) == 0 or len(inverted_residual_setting[0]) != 4:
+            raise ValueError("inverted_residual_setting should be non-empty "
+                             "or a 4-element list, got {}".format(inverted_residual_setting))
+
+        # building first layer
+        input_channel = _make_divisible(input_channel * width_mult, round_nearest)
+        self.last_channel = _make_divisible(last_channel * max(1.0, width_mult), round_nearest)
+        # modified here: the upstream version hard-codes in_channel=3
+        features = [ConvBNReLU(in_channel, input_channel, stride=2)]
+        # building inverted residual blocks
+        for t, c, n, s in inverted_residual_setting:
+            output_channel = _make_divisible(c * width_mult, round_nearest)
+            for i in range(n):
+                stride = s if i == 0 else 1
+                features.append(block(input_channel, output_channel, stride, expand_ratio=t))
+                input_channel = output_channel
+        # building last several layers
+        features.append(ConvBNReLU(input_channel, self.last_channel, kernel_size=1))
+        # make it nn.Sequential
+        self.features = nn.Sequential(*features)
+
+        # building classifier
+        self.classifier = nn.Sequential(
+            nn.Dropout(0.2),
+            nn.Linear(self.last_channel, num_classes),
+        )
+
+        # weight initialization
+        for m in self.modules():
+            if isinstance(m, nn.Conv2d):
+                nn.init.kaiming_normal_(m.weight, mode='fan_out')
+                if m.bias is not None:
+                    nn.init.zeros_(m.bias)
+            elif isinstance(m, nn.BatchNorm2d):
+                nn.init.ones_(m.weight)
+                nn.init.zeros_(m.bias)
+            elif isinstance(m, nn.Linear):
+                nn.init.normal_(m.weight, 0, 0.01)
+                nn.init.zeros_(m.bias)
+
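+    # Shape sketch (hypothetical call): with the default in_channel=1, the
+    # dirty-frame models feed 32x80 single-channel MFCC patches, i.e. x of shape
+    # (N, 1, 32, 80); forward() below pools the feature map with mean([2, 3])
+    # and returns (N, num_classes) logits.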
+    def forward(self, x):
+        x = self.features(x)
+        x = x.mean([2, 3])
+        x = self.classifier(x)
+        return x
diff --git a/AutoCoverTool/ref/split_dirty_frame/custom_models/model.py b/AutoCoverTool/ref/split_dirty_frame/custom_models/model.py
new file mode 100644
index 0000000..e2f21d4
--- /dev/null
+++ b/AutoCoverTool/ref/split_dirty_frame/custom_models/model.py
@@ -0,0 +1,80 @@
+from custom_models.mobilenet_v2_custom import MobileNetV2Custom
+import torch
+import torch.nn as nn
+from torchstat import stat
+
+MFCC_LEN = 80
+FRAME_LEN = 32
+
+
+class MobileNetV2Dirty(MobileNetV2Custom):
+
+    def forward(self, x):
+        x = x.view([-1, 1, FRAME_LEN, MFCC_LEN])
+        return super(MobileNetV2Dirty, self).forward(x)
+
+
+class ModelV1(nn.Module):
+    def __init__(self):
+        super(ModelV1, self).__init__()
+        # input shape: 32 * 80
+        self.model = nn.Sequential(
+            nn.Conv2d(in_channels=1, out_channels=16, kernel_size=3, stride=2, padding=1),
+            nn.BatchNorm2d(16),
+            nn.ReLU(),
+
+            nn.Conv2d(in_channels=16, out_channels=8, kernel_size=3, stride=2, padding=1),
+            nn.BatchNorm2d(8),
+            nn.ReLU(),
+        )
+
+        self.fc = nn.Sequential(
+            nn.Linear(1280, 256),
+            nn.ReLU(),
+            nn.Linear(256, 16),
+            nn.ReLU(),
+            nn.Linear(16, 2)
+        )
+
+    def forward(self, x):
+        x = x.view([-1, 1, FRAME_LEN, MFCC_LEN])
+        x = self.model(x)
+        x = x.view(-1, 1280)
+        return self.fc(x)
+
+
+class ModelV2(nn.Module):
+    def __init__(self):
+        super(ModelV2, self).__init__()
+        # input shape: 11 * 80
+        # convolve along the length-11 time axis, treating the 80 bins as channels
+        self.model = nn.Sequential(
+            nn.Conv1d(in_channels=80, out_channels=8, kernel_size=3, stride=2, padding=1),
+            nn.BatchNorm1d(8),
+            nn.ReLU(),
+        )
+
+        self.fc = nn.Sequential(
+            nn.Linear(48, 16),
+            nn.ReLU(),
+            nn.Linear(16, 2)
+        )
+
+    def forward(self, x):
+        x = x.view([-1, FRAME_LEN, MFCC_LEN])
+        x = x.permute(0, 2, 1)
+        x = self.model(x)
+        x = x.view(-1, 48)
+        return self.fc(x)
+
+
+def get_cur_model():
+    return ModelV1()
+
+
+if __name__ == '__main__':
+    mv = ModelV1()
+    data = torch.rand(32, 80)
+    stat(mv, (1, 32, 80))
+    out = mv.forward(data)
+    print(out.shape)
diff --git a/AutoCoverTool/ref/split_dirty_frame/dataset/dataset.py b/AutoCoverTool/ref/split_dirty_frame/dataset/dataset.py
new file mode 100644
index 0000000..db9fcfd
--- /dev/null
+++ b/AutoCoverTool/ref/split_dirty_frame/dataset/dataset.py
@@ -0,0 +1,220 @@
+"""
+Dataset layout:
+---dataset
+    ---data
+        xxx.wav
+    ---train.txt
+    ---test.txt
+"""
+
+import os
+import glob
+import librosa
+import numpy as np
+import torch.utils.data as data
+
+gs_frame_num = 32
+
+
+def load_file(filename):
+    target_msg = []
+    other_msg = []
+    other_st = 0
+    with open(filename, "r") as f:
+        while True:
+            line = f.readline()
+            if not line:
+                break
+            line_arr = line.strip().split(",")
+            filename = line_arr[0]
+            tp = int(line_arr[1])
+            st = float(line_arr[2])
+            ed = float(line_arr[3])
+            # format: filename, type, start time, end time
+            target_msg.append([filename, tp, st, ed])
+            if st - other_st > 0.3:
+                other_msg.append([filename, 0, other_st, st])
+            other_st = ed
+    target_frames = get_feature_idx(target_msg)
+    other_frames = get_feature_idx(other_msg)
+    return target_frames, other_frames
+
+
+def load_file_v1(filename, feature_dir, predict=False):
+    """
+    32 frames, corresponding to 512 ms.
+    Problem frames:
+    1. the flagged span covers more than 20% of the window
+    2. the flagged span covers less than 20% of the window, but lies entirely inside it
+    Clean frames:
+    1. contain no flagged span at all
+    :return:
+    """
+    target_msg = {}
+    with open(filename, "r") as f:
+        while True:
+            line = f.readline()
+            if not line:
+                break
+            line_arr = line.strip().split(",")
+            filename = line_arr[0]
+            tp = int(line_arr[1])
+            st = float(line_arr[2])
+            ed = float(line_arr[3])
+            # format: filename, type, start time, end time
+            if filename not in target_msg.keys():
+                target_msg[filename] = []
+            target_msg[filename].append([filename, tp, st, ed])
+    # only type-1 data is used; type-2 data is not
+    target_frame_idx = []
+    other_frame_idx = []
+    frame_ms = 0.016
+    for filename, arr in target_msg.items():
+        file_msg = target_msg[filename]
+        abs_filename = os.path.join(feature_dir, filename + ".npy")
+        data = np.load(abs_filename)
+        for i in range(0, len(data) - gs_frame_num):
+            st_tm = i * frame_ms
+            ed_tm = st_tm + gs_frame_num * frame_ms
+            flag = False
+            for msg in file_msg:
+                _, tp, st, ed = msg
+                # the annotation ends before this window starts, keep scanning forward
+                if ed < st_tm:
+                    continue
+                # the annotation starts after this window ends; later ones start even later, stop
+                if st > ed_tm:
+                    break
+                # reaching here means the annotation overlaps the window
+                flag = True
+                # type >= 2 means the annotators were unsure, so skip it
+                if int(tp) >= 2:
+                    continue
+                if ed - st <= 0:
+                    print("{}, params err!\n".format(msg[0]))
+                    exit(-1)
+
+                # there is definitely overlap now, of length min(ed_tm, ed) - max(st_tm, st);
+                # overlap above the rate, or an annotation fully inside the window, marks a problem window
+                inter = min(ed_tm, ed) - max(st_tm, st)
+                rate = 0.2
+                if predict:
+                    rate = 0.5
+                if (inter / (gs_frame_num * frame_ms)) > rate or (st_tm < st < ed_tm and st_tm < ed < ed_tm):
+                    target_frame_idx.append([filename, tp, int(st_tm / frame_ms), int(ed_tm / frame_ms)])
+            # only a window overlapping none of the annotated spans counts as normal
+            if not flag:
+                other_frame_idx.append([filename, 0, int(st_tm / frame_ms), int(ed_tm / frame_ms)])
+    return target_frame_idx, other_frame_idx
+
+
+def file2mfcc(in_file):
+    mfcc, sr = librosa.load(in_file, sr=16000, mono=True)
+    if len(mfcc) < 512:
+        return []
+    # 32 ms window, one frame every 16 ms
+    mfcc = librosa.feature.mfcc(y=mfcc, sr=sr, n_fft=512, hop_length=256, n_mfcc=80)
+    return mfcc.transpose()
+
+
+def file2stft(in_file):
+    audio, sr = librosa.load(in_file, sr=16000, mono=True)
+    if len(audio) < 512:
+        return []
+    mfcc = np.abs(librosa.stft(audio, n_fft=512, hop_length=256))
+    return mfcc.transpose()
+
+
+def dir2mfcc(wav_dir):
+    files = glob.glob(os.path.join(wav_dir, "*wav"))
+    for file in files:
+        mfcc_file = file.replace(".wav", "")
+        mfcc = file2mfcc(file)
+        # mfcc = file2stft(file)
+        # only usable when longer than 1.6 s
+        if len(mfcc) > 100:
+            np.save(mfcc_file, mfcc)
+
+
+def get_feature_idx(target_msg):
+    feature_idx = []
+    frame_ms = 256 / 16000
+    for idx, msg in enumerate(target_msg):
+        # each entry holds: filename, tp, st, ed
+        # convert st and ed to frame numbers
+        st_frame = int(msg[2] / frame_ms)
+        ed_frame = int(msg[3] / frame_ms)
+        # drop type 2 and above
+        if int(msg[1]) >= 2:
+            continue
+        # include both ends, so windows more than half covered are also flagged
+        for frame_idx in range(st_frame, ed_frame):
+            if frame_idx - 5 < 0:
+                continue
+            feature_idx.append([msg[0], msg[1], frame_idx - 5, frame_idx + 6])  # left-inclusive, right-exclusive
+    return feature_idx
+
+
+def construct(msg):
+    frames = []
+    label = []
+    for line in msg:
+        frames.append([line[0], line[2], line[3]])
+        label.append(line[1])
+    return frames, label
+
+
+class CustomDataset(data.Dataset):
+    def __init__(self, root, label_set='train', predict=False):
+        self.work_dir = root
+        self.feature_dir = os.path.join(root, "data")
+        self.predict = predict
+        filename = os.path.join(root, '{}.txt'.format(label_set))
+
+        # target_frames, other_frames = load_file(filename)
+        target_frames, other_frames = load_file_v1(filename, self.feature_dir)
+        print("before, len: {}, {}".format(len(target_frames), len(other_frames)))
+        if len(other_frames) > 3 *
len(target_frames) and not self.predict:
+            np.random.shuffle(other_frames)
+            other_frames = other_frames[:3 * len(target_frames)]
+        print("after, len: {}, {}".format(len(target_frames), len(other_frames)))
+        # build the final sample set
+        target_frames.extend(other_frames)
+        np.random.shuffle(target_frames)
+        self.frames, self.label = construct(target_frames)
+
+    def __len__(self):
+        return len(self.label)
+
+    def __getitem__(self, idx):
+        msg = self.frames[idx]
+        filename = os.path.join(self.feature_dir, str(msg[0]) + ".npy")
+        mfcc = np.load(filename)
+        st_frame = msg[1]
+        ed_frame = msg[2]
+        if len(mfcc[st_frame:ed_frame]) != 32:
+            # print("err: idx={},{},{},{},{}".format(idx, filename, st_frame, ed_frame, len(mfcc)))
+            idx = np.random.randint(0, self.__len__())
+            return self.__getitem__(idx)
+        item = mfcc[st_frame:ed_frame]
+        label = int(self.label[idx] != 0)
+        if self.predict:
+            return item, label, filename, st_frame, ed_frame
+        return item, label
+
+
+if __name__ == '__main__':
+    file2mfcc("")
+    # out = file2stft("/data/rsync/jiang.yang/dataset/dataset_dev/data_wav/4_5629499489839033.wav")
+    # print(out.shape)
+    # dir2mfcc("/data/rsync/jiang.yang/dataset/dataset_dev/data_wav")
+    # load_file_v1("/data/rsync/jianli.yang/AutoCoverTool/ref/split_dirty_frame/tmp/11.txt",
+    #              "/data/rsync/jianli.yang/AutoCoverTool/data/dataset_dev/data")
+
+    # dir2mfcc(
+    #     "/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/AutoCoverTool/resource/dataset_dev/4_wav")
+    # root = "/data/rsync/jianli.yang/AutoCoverTool/data/dataset_dev"
+    # dat = CustomDataset(root)
+    # it, lb = dat.__getitem__(0)
+    # print(it.shape)
+    # print(lb.shape)
diff --git a/AutoCoverTool/ref/split_dirty_frame/readme.txt b/AutoCoverTool/ref/split_dirty_frame/readme.txt
new file mode 100644
index 0000000..c4a56c8
--- /dev/null
+++ b/AutoCoverTool/ref/split_dirty_frame/readme.txt
@@ -0,0 +1,76 @@
+Current dataset: 46 songs for training, 10 for testing
+base_line:
+v1 results:
+    t_loss:0.350482 t_acc:84.79 v_loss:0.520381 v_acc:76.58 time:145.974121 epoch:2
+Experiment: treat label-2 segments as not abnormal:
+    t_loss:0.285704 t_acc:87.83 v_loss:0.662188 v_acc:73.78 time:114.760812 epoch:4
+
+Experiment 3:
+Hypothesis: the model is too complex; on top of experiment 2, reduce complexity to a 2-D conv plus two FC layers
+t_loss:0.352131 t_acc:84.88 v_loss:0.542022 v_acc:78.05 time:86.826910 epoch:5
+Conclusion: improvement; validation accuracy up nearly 4.27%
+
+Experiment 4:
+Hypothesis: the model is too complex; on top of experiment 2, reduce complexity to a 1-D conv plus two FC layers
+t_loss:0.352438 t_acc:84.72 v_loss:0.567134 v_acc:75.52 time:86.549661 epoch:19
+Conclusion: slightly worse than experiment 3, possibly because capacity is now too low
+
+Experiment 5: on top of experiment 3, add 9 more audio files to the training set
+t_loss:0.410002 t_acc:80.69 v_loss:0.584062 v_acc:74.71 time:164.807675 epoch:5
+
+Experiment 5_1: on top of 5, increase model complexity
+t_loss:0.396976 t_acc:81.49 v_loss:0.585027 v_acc:74.58 time:164.734624 epoch:2
+Conclusion: no value
+
+Experiment 5_2: on top of 5, change the data format and modify the model structure
+t_loss:0.357168 t_acc:85.44 v_loss:0.723428 v_acc:64.19 epoch:16
+Conclusion: very poor
+--------------------------------------------------->>>>>>
+Plan: analyse the misclassified data first; fix two bugs in the data
+Experiment 5_2: after the bug fixes
+t_loss:0.335836 t_acc:85.05 v_loss:0.438867 v_acc:83.24 time:176.928082 epoch:1
+Conclusion: clear improvement; keep analysing the data
+Fix obvious problems in the dataset:
+1. rows whose time span is <= 0
+Data fixed in this round:
+19_10414574138721494.wav
+47_1688849864840588.wav
+54_3634463651.wav
+8_10414574140317353.wav
+Experiment 5_3: after an initial pass of dataset fixes
+t_loss:0.245894 t_acc:89.91 v_loss:0.390855 v_acc:85.28 time:155.996837 epoch:3
+
+Experiment 5_3_1: fine-tune the model
+1. switch to the 1-D CNN model
+2. increase the complexity of the 2-D CNN
+
+Experiment 5_3_2: after fixing the 88_ data
+88_10414574138721494
+t_loss:0.297692 t_acc:87.22 v_loss:0.400453 v_acc:85.44 time:148.522071 epoch:1
+Conclusion: no obvious effect; keep fixing
+21_10414574140317353
+t_loss:0.315018 t_acc:86.42 v_loss:0.364222 v_acc:85.79 time:146.168289 epoch:1
+3_6755399374234747
+15_8162774327817435
+t_loss:0.209222 t_acc:91.69 v_loss:0.376367 v_acc:85.87 time:143.195726 epoch:3
+Conclusion: slight gain, in line with expectations
+On the validation set, at whole-song level with every segment participating:
+acc:0.3458628198149156, recall:0.8955528930861936
+
+Experiment 5_3_3: flag a segment as abnormal at 50% overlap instead
+t_loss:0.291052 t_acc:87.80 v_loss:0.360148 v_acc:86.08 time:116.858534 epoch:9
+Conclusion: slight gain, not significant
+Experiment 5_3_4: on top of 2, raise the number of normal samples to 3x the problem samples
+t_loss:0.257707 t_acc:89.17 v_loss:0.309852 v_acc:87.43 time:282.694043 epoch:5
+On the validation set, at whole-song level with every segment participating:
+acc:0.5000699398517275, recall:0.7557074408117249
+
+
+
+
+
+Experiment 5:
+Hypothesis: the current total window is too short; re-partition as follows
+    1. if an annotated span is fully contained by the 500 ms slice, the slice is considered problematic
+    2. if abnormal data covers more than 1/5 of the 500 ms slice, it is also considered abnormal
+    3. only slices containing no abnormal data at all are considered normal
\ No newline at end of file
diff --git a/AutoCoverTool/ref/split_dirty_frame/script/ana_err_log.py b/AutoCoverTool/ref/split_dirty_frame/script/ana_err_log.py
new file mode 100644
index 0000000..33efef1
--- /dev/null
+++ b/AutoCoverTool/ref/split_dirty_frame/script/ana_err_log.py
@@ -0,0 +1,85 @@
+"""
+Inspect the misclassified cases on the validation set
+"""
+import os
+import torch
+import numpy as np
+from tqdm import tqdm
+from torch.utils.data import DataLoader
+
+from models.model import get_cur_model
+from dataset.dataset import load_file_v1, construct, CustomDataset
+
+
+def get_frames_and_labels(root):
+    feature_dir = os.path.join(root, "data")
+    filename = os.path.join(root, 'train.txt')
+    target_frames, other_frames = load_file_v1(filename, feature_dir)
+    print("before, len: {}, {}".format(len(target_frames), len(other_frames)))
+    if len(other_frames) > len(target_frames):
+        np.random.shuffle(other_frames)
+        other_frames = other_frames[:len(target_frames)]
+    print("after, len: {}, {}".format(len(target_frames), len(other_frames)))
+    # build the final sample set
+    target_frames.extend(other_frames)
+    np.random.shuffle(target_frames)
+    return construct(target_frames)
+
+
+def get_one_frame(filename, st_frame, ed_frame, label):
+    mfcc = np.load(filename)
+    if len(mfcc[st_frame:ed_frame]) != 32:
+        return None, None
+    item = torch.tensor([mfcc[st_frame:ed_frame]]).to('cuda')
+    label = int(label != 0)
+    return item, label
+
+
+def val():
+    device = "cuda"
+    model = get_cur_model()
+    # model_path = "output_v5_2/epoch_1_0.8324131096481914.pth"
+    # model_path = "output_v5_2/epoch_10_0.808451900615842.pth"
+    # model_path = "output_v5_3/epoch_3_0.8527927799886299.pth"
+    model_path = "output_v5_3_4/epoch_5_0.874253837407618.pth"
+    params = torch.load(model_path, map_location=torch.device(device))
+    model.load_state_dict(state_dict=params)
+    model.eval()
+    model.to('cuda')
+    out_dict = {
+        0: {
+            0: 0,  # key is the ground-truth label, val is the prediction
+            1: 0
+        },
+        1: {
+            0: 0,
+            1: 0
+        }
+    }
+    predict = CustomDataset("/data/rsync/jianli.yang/AutoCoverTool/data/dataset_dev", "val", True)
+    predict_loader = DataLoader(predict, batch_size=32, shuffle=True, num_workers=8)
+    for images, labels, filename, st_frame, ed_frame in predict_loader:
+        # batch_size = images.size(0)
+        images = images.to(device)
+        labels = labels.to(device)
+        predicts = model(images)
+
+        _, predicts = predicts.max(dim=1)
+        for lb, pe, f, s, e in zip(labels.cpu().numpy(), predicts.cpu().numpy(), filename, st_frame, ed_frame):
+            out_dict[int(lb)][int(pe)] += 1
+            # filename, label, st_frame, ed_frame, true/false - true when label == prediction
+            print(
+                "{},{},{},{},{}".format(f, int(lb), round(int(s) * 0.016, 3),
round(int(e) * 0.016, 3), int(lb == pe))) + + print("---------------->>") + tt = out_dict[1][1] + tf = out_dict[1][0] + ft = out_dict[0][1] + ff = out_dict[0][0] + print("{},{}".format(tt, tf)) + print("{},{}".format(ft, ff)) + print("acc:{}, recall:{}".format(tt / (tt + ft), tt / (tt + tf))) + + +if __name__ == '__main__': + val() diff --git a/AutoCoverTool/ref/split_dirty_frame/script/get_durations.py b/AutoCoverTool/ref/split_dirty_frame/script/get_durations.py new file mode 100644 index 0000000..d570fcb --- /dev/null +++ b/AutoCoverTool/ref/split_dirty_frame/script/get_durations.py @@ -0,0 +1,36 @@ +import os +import glob +import time +import json +import librosa + + +def exec_cmd(cmd): + r = os.popen(cmd) + text = r.read() + r.close() + return text + + +def get_d(audio_path): + cmd = "/usr/local/bin/ffprobe -v quiet -print_format json -show_format -show_streams {}".format(audio_path) + data = exec_cmd(cmd) + data = json.loads(data) + return float(data["format"]["duration"]) + + +def get_duration(): + dirs = glob.glob("/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/me_top500/jianli/*") + for dir in dirs: + st = time.time() + wavs = glob.glob(os.path.join(dir, "*wav")) + a_duration = get_d(wavs[0]) + acc_duration = get_d(os.path.join(dir, "acc.mp3")) + vocal_duration = get_d(os.path.join(dir, "vocal.mp3")) + if a_duration > acc_duration + 5 or a_duration > vocal_duration + 5: + print("ERROR: {}".format(dir)) + print("dir={},sp={}".format(dir, time.time() - st)) + + +if __name__ == '__main__': + get_duration() diff --git a/AutoCoverTool/ref/split_dirty_frame/script/label_format.py b/AutoCoverTool/ref/split_dirty_frame/script/label_format.py new file mode 100644 index 0000000..34ccac8 --- /dev/null +++ b/AutoCoverTool/ref/split_dirty_frame/script/label_format.py @@ -0,0 +1,168 @@ +""" +格式转换 +""" +import os + + +def tm2sec(tm): + """ + 分:秒.xxx 转为 tm + :param tm: + :return: + """ + tm_arr = str(tm).split(":") + return int(int(tm_arr[0]) * 60) + float(tm_arr[1]) + + +def sec2tm(sec): + sec = float(sec) + m = sec // 60 + s = sec - m * 60 + return "{}:{}".format(int(m), round(s, 3)) + + +def custom_label2au_format(in_file): + """ + Name Start Duration Time Format Type Description + 1 0:56.429 0:04.824 decimal Cue + :param in_file: + :return: + """ + + lines = [] + header = False + with open(in_file, "r") as f: + while True: + line = f.readline() + if not line: + break + if header: + header = False + continue + line = line.strip().split(",") + tp = line[1] + st_tm = tm2sec(line[2]) + ed_tm = st_tm + tm2sec(line[3]) + lines.append([tp, sec2tm(st_tm), sec2tm(ed_tm - st_tm)]) + + with open(in_file + "_out.csv", "w") as f: + f.write("Name\tStart\tDuration\tTime Format\tType\n") + for line in lines: + strr = "{}\t{}\t{}\t{}\n".format(line[0], line[1], line[2], "decimal\tCue\t") + f.write(strr) + # f.write("{}\t{}".format("\t".join(line), "decimal\tCue\t\t\n")) + # print("{}\t{}".format("\t".join(line), "decimal Cue\n")) + + +def label2txt(in_file): + lines = [] + header = True + filename = os.path.basename(in_file).replace(".csv", "") + with open(in_file, "r") as f: + while True: + line = f.readline() + if not line: + break + if header: + header = False + continue + line = line.split("\t") + tp = line[0] + st_tm = tm2sec(line[1]) + ed_tm = st_tm + tm2sec(line[2]) + lines.append([filename, tp, str(round(st_tm, 3)), str(round(ed_tm, 3))]) + with open(in_file + "_out.csv", "w") as f: + for line in lines: + print(line) + f.write("{}\n".format(",".join(line))) + + +def 
label12txt(in_file): + lines = [] + with open(in_file, "r") as f: + while True: + line = f.readline() + if not line: + break + line = line.split(",") + if len(line) < 4: + continue + tp = line[1] + st_tm = tm2sec(line[2]) + ed_tm = tm2sec(line[3]) + lines.append([line[0], tp, str(round(st_tm, 3)), str(round(ed_tm, 3))]) + with open(in_file + "_out.csv", "w") as f: + for line in lines: + print(line) + f.write("{}\n".format(",".join(line))) + + +if __name__ == '__main__': + # custom_label2au_format( + # "/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/AutoCoverTool/resource/dataset_dev/4/8/8_10414574140317353.txt") + label2txt( + "/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/AutoCoverTool/resource/dataset_dev/data/out1/15_8162774327817435.csv") + # label12txt( + # "/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/AutoCoverTool/resource/dataset_dev/4/all.csv") + + # arr = [ + # "10_5629499489839033.csv", + # "11_10414574140317353.csv", + # "13_1688849864840588.csv", + # "14_8162774327817435.csv", + # "15_8162774327817435.csv", + # "16_8162774327817435.csv", + # "21_10414574140317353.csv", + # "24_6755399374234747.csv", + # "25_8162774327817435.csv", + # "26_6755399374234747.csv", + # "28_8162774327817435.csv", + # "29_3634463651.csv", + # "2_8162774329368194.csv", + # "30_5910973794723621.csv", + # "31_10414574140317353.csv", + # "32_10414574140317353.csv", + # "33_3634463651.csv", + # "35_3634463651.csv", + # "36_5910973794723621.csv", + # "38_8162774329368194.csv", + # "40_6755399374234747.csv", + # "41_5629499489839033.csv", + # "42_10414574138721494.csv", + # "44_3634463651.csv", + # "48_5629499489839033.csv", + # "49_5910973794723621.csv", + # "4_5629499489839033.csv", + # "50_3634463651.csv", + # "51_1688849864840588.csv", + # "52_6755399374234747.csv", + # "53_10414574140317353.csv", + # "55_10414574138721494.csv", + # "56_1688849864840588.csv", + # "57_5629499489839033.csv", + # "59_3634463651.csv", + # "5_10414574138721494.csv", + # "60_5910973794723621.csv", + # "7_10414574140317353.csv", + # "82_8162774329368194.csv", + # "83_10414574138721494.csv", + # "84_8162774329368194.csv", + # "85_1688849864840588.csv", + # "86_8162774329368194.csv", + # "87_6755399374234747.csv", + # "89_10414574138721494.csv", + # "90_8162774327817435.csv", + # "91_8162774327817435.csv", + # "92_10414574138721494.csv", + # "93_1688849864840588.csv", + # "94_3634463651.csv", + # "96_5629499489839033.csv", + # "97_5910973794723621.csv", + # "99_5910973794723621.csv", + # "9_10414574138721494.csv" + # ] + # # ii = "/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/AutoCoverTool/resource/dataset_dev/11.txt" + # base = "/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/AutoCoverTool/resource/dataset_dev/data" + # for file in arr: + # out_file = os.path.join(base, file) + # label2txt(out_file) diff --git a/AutoCoverTool/ref/split_dirty_frame/script/preprocess.py b/AutoCoverTool/ref/split_dirty_frame/script/preprocess.py new file mode 100644 index 0000000..c6fb08c --- /dev/null +++ b/AutoCoverTool/ref/split_dirty_frame/script/preprocess.py @@ -0,0 +1,418 @@ +""" +1. 降噪 +2. 
拉伸 +""" +import os +import time + +gs_denoise_exe = "/opt/soft/bin/denoise_exe" +gs_draw_volume_exe = "/opt/soft/bin/draw_volume" + + +def process(): + # input_wavs = [ + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105027601574/611752105027601574_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105029951597/611752105029951597_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105029951624/611752105029951624_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105029951624/611752105029951624_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105029951624/611752105029951624_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248982/611752105030248982_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248982/611752105030248982_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248982/611752105030248982_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248988/611752105030248988_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248988/611752105030248988_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248988/611752105030248988_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248992/611752105030248992_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248992/611752105030248992_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248992/611752105030248992_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248994/611752105030248994_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248994/611752105030248994_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248994/611752105030248994_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248995/611752105030248995_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248995/611752105030248995_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248995/611752105030248995_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249000/611752105030249000_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249000/611752105030249000_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249000/611752105030249000_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249001/611752105030249001_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249010/611752105030249010_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249010/611752105030249010_1688849864840588.wav", + # 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249011/611752105030249011_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249011/611752105030249011_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249011/611752105030249011_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249016/611752105030249016_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249016/611752105030249016_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249019/611752105030249019_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249022/611752105030249022_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249022/611752105030249022_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249022/611752105030249022_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249030/611752105030249030_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249031/611752105030249031_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249031/611752105030249031_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249031/611752105030249031_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249032/611752105030249032_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249032/611752105030249032_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249034/611752105030249034_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249034/611752105030249034_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249034/611752105030249034_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249035/611752105030249035_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249035/611752105030249035_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249036/611752105030249036_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249036/611752105030249036_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249036/611752105030249036_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249037/611752105030249037_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249037/611752105030249037_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249037/611752105030249037_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249038/611752105030249038_6755399374234747.wav", + # 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249040/611752105030249040_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249040/611752105030249040_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249041/611752105030249041_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249041/611752105030249041_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249048/611752105030249048_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249049/611752105030249049_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249049/611752105030249049_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249052/611752105030249052_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249052/611752105030249052_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249053/611752105030249053_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249053/611752105030249053_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249053/611752105030249053_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249055/611752105030249055_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249055/611752105030249055_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249055/611752105030249055_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249067/611752105030249067_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249067/611752105030249067_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249067/611752105030249067_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249070/611752105030249070_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249071/611752105030249071_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249073/611752105030249073_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249073/611752105030249073_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249074/611752105030249074_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249074/611752105030249074_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249074/611752105030249074_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249091/611752105030249091_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249091/611752105030249091_8162774327817435.wav", + # 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249091/611752105030249091_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249104/611752105030249104_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249104/611752105030249104_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249105/611752105030249105_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249112/611752105030249112_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249112/611752105030249112_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249112/611752105030249112_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249113/611752105030249113_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249113/611752105030249113_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249118/611752105030249118_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249118/611752105030249118_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249127/611752105030249127_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249127/611752105030249127_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249128/611752105030249128_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249134/611752105030249134_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249134/611752105030249134_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249134/611752105030249134_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249136/611752105030249136_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249136/611752105030249136_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249136/611752105030249136_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249160/611752105030249160_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249173/611752105030249173_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249173/611752105030249173_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249173/611752105030249173_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249174/611752105030249174_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249174/611752105030249174_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249174/611752105030249174_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249175/611752105030249175_3634463651.wav", 
+ # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249175/611752105030249175_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249176/611752105030249176_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249176/611752105030249176_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249176/611752105030249176_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249177/611752105030249177_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249177/611752105030249177_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249177/611752105030249177_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249195/611752105030249195_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249195/611752105030249195_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249206/611752105030249206_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249206/611752105030249206_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249206/611752105030249206_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249213/611752105030249213_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249213/611752105030249213_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249216/611752105030249216_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249216/611752105030249216_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249216/611752105030249216_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249227/611752105030249227_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249227/611752105030249227_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249233/611752105030249233_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249233/611752105030249233_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249233/611752105030249233_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249240/611752105030249240_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249240/611752105030249240_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249243/611752105030249243_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249243/611752105030249243_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249250/611752105030249250_10414574138721494.wav", + # 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249250/611752105030249250_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249250/611752105030249250_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249258/611752105030249258_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249264/611752105030249264_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249267/611752105030249267_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249273/611752105030249273_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249273/611752105030249273_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249273/611752105030249273_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249275/611752105030249275_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249275/611752105030249275_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249278/611752105030249278_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249278/611752105030249278_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249278/611752105030249278_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249280/611752105030249280_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249280/611752105030249280_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249280/611752105030249280_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249281/611752105030249281_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249281/611752105030249281_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249281/611752105030249281_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249282/611752105030249282_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249282/611752105030249282_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249283/611752105030249283_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249284/611752105030249284_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249284/611752105030249284_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249287/611752105030249287_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249287/611752105030249287_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249289/611752105030249289_3634463651.wav", + # 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249289/611752105030249289_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249289/611752105030249289_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249292/611752105030249292_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249292/611752105030249292_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249292/611752105030249292_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249293/611752105030249293_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249293/611752105030249293_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249293/611752105030249293_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249295/611752105030249295_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249295/611752105030249295_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249295/611752105030249295_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249296/611752105030249296_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249302/611752105030249302_5910973794723621.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249302/611752105030249302_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249302/611752105030249302_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250690/611752105030250690_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250690/611752105030250690_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250690/611752105030250690_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250691/611752105030250691_10414574140317353.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250691/611752105030250691_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250691/611752105030250691_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250695/611752105030250695_3634463651.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250695/611752105030250695_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250695/611752105030250695_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250699/611752105030250699_5629499489839033.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250699/611752105030250699_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250699/611752105030250699_8162774329368194.wav", + # 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250702/611752105030250702_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250702/611752105030250702_6755399374234747.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250704/611752105030250704_1688849864840588.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250704/611752105030250704_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250704/611752105030250704_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250711/611752105030250711_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250711/611752105030250711_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250715/611752105030250715_10414574138721494.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250715/611752105030250715_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250715/611752105030250715_8162774329368194.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250717/611752105030250717_8162774327817435.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250717/611752105030250717_8162774329368194.wav" + # ] + + input_wavs = [ + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105028480653/611752105028480653_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105028480653/611752105028480653_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105028480653/611752105028480653_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248965/611752105030248965_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248972/611752105030248972_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248973/611752105030248973_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248973/611752105030248973_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030248974/611752105030248974_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249319/611752105030249319_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249322/611752105030249322_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249322/611752105030249322_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249324/611752105030249324_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249324/611752105030249324_5629499489839033.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249324/611752105030249324_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249330/611752105030249330_5910973794723621.wav", + 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249333/611752105030249333_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249333/611752105030249333_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249334/611752105030249334_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249336/611752105030249336_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249337/611752105030249337_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249338/611752105030249338_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249338/611752105030249338_5629499489839033.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249338/611752105030249338_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249340/611752105030249340_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249340/611752105030249340_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249342/611752105030249342_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249342/611752105030249342_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249342/611752105030249342_5629499489839033.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249347/611752105030249347_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249347/611752105030249347_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249347/611752105030249347_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249348/611752105030249348_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249352/611752105030249352_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249353/611752105030249353_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249353/611752105030249353_5629499489839033.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249353/611752105030249353_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249354/611752105030249354_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249354/611752105030249354_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249355/611752105030249355_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249355/611752105030249355_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249355/611752105030249355_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249356/611752105030249356_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249359/611752105030249359_5910973794723621.wav", + 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249361/611752105030249361_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249361/611752105030249361_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249364/611752105030249364_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249364/611752105030249364_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249364/611752105030249364_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249365/611752105030249365_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249365/611752105030249365_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249365/611752105030249365_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249366/611752105030249366_5629499489839033.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249366/611752105030249366_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249366/611752105030249366_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249368/611752105030249368_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249368/611752105030249368_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249370/611752105030249370_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249370/611752105030249370_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249371/611752105030249371_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249371/611752105030249371_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249371/611752105030249371_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249372/611752105030249372_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249372/611752105030249372_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249374/611752105030249374_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249374/611752105030249374_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249375/611752105030249375_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249375/611752105030249375_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249377/611752105030249377_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249377/611752105030249377_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249383/611752105030249383_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249383/611752105030249383_6755399374234747.wav", + 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249383/611752105030249383_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249384/611752105030249384_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249385/611752105030249385_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249385/611752105030249385_5629499489839033.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249386/611752105030249386_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249387/611752105030249387_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249387/611752105030249387_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249388/611752105030249388_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249388/611752105030249388_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249388/611752105030249388_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249391/611752105030249391_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249391/611752105030249391_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249393/611752105030249393_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249393/611752105030249393_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249394/611752105030249394_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249394/611752105030249394_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249395/611752105030249395_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249395/611752105030249395_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249397/611752105030249397_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249397/611752105030249397_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249398/611752105030249398_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249398/611752105030249398_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249401/611752105030249401_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249401/611752105030249401_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249401/611752105030249401_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249402/611752105030249402_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249402/611752105030249402_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249403/611752105030249403_10414574138721494.wav", + 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249403/611752105030249403_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249405/611752105030249405_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249406/611752105030249406_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249406/611752105030249406_5629499489839033.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249409/611752105030249409_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249409/611752105030249409_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249410/611752105030249410_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249414/611752105030249414_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249414/611752105030249414_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249414/611752105030249414_5629499489839033.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249417/611752105030249417_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249417/611752105030249417_6755399374234747.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249417/611752105030249417_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249431/611752105030249431_10414574140317353.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249431/611752105030249431_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030249431/611752105030249431_3634463651.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250728/611752105030250728_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250728/611752105030250728_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250730/611752105030250730_5910973794723621.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250730/611752105030250730_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250733/611752105030250733_8162774327817435.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250733/611752105030250733_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250735/611752105030250735_10414574138721494.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250735/611752105030250735_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250735/611752105030250735_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250739/611752105030250739_1688849864840588.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250741/611752105030250741_8162774329368194.wav", + "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250743/611752105030250743_5629499489839033.wav", + 
"/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500/611752105030250743/611752105030250743_5910973794723621.wav" + ] + dst_base_dir = "/data/rsync/jianli.yang/AutoCoverTool/data/user_out_data/me_top500/step2" + for i in range(len(input_wavs)): + # input_wavs[i] = os.path.join("/data/rsync/jianli.yang/AutoCoverTool", input_wavs[i]) + in_f = input_wavs[i] + in_v_f = input_wavs[i] + v_f = "/".join(input_wavs[i].replace("out_data", "inf_users").split("/")[:-1]) + "/vocal.wav" + + st = time.time() + # 降噪 + denoise_path = in_f.replace(".wav", "_d.wav") + cmd = "{} {} {}".format(gs_denoise_exe, in_f, denoise_path) + os.system(cmd) + if not os.path.exists(denoise_path): + print("{} sp={} err 1".format(in_f, time.time() - st)) + continue + # 拉伸 + out_path = in_f.replace(".wav", "_dv.wav") + cmd = "{} {} {} {}".format(gs_draw_volume_exe, denoise_path, v_f, out_path) + os.system(cmd) + if not os.path.exists(out_path): + print("{} sp={} err 2".format(in_f, time.time() - st)) + continue + + # 重采样到44k单声道 + out441_path = in_f.replace(".wav", "_dv441.wav") + cmd = "ffmpeg -i {} -ar 44100 -ac 1 {}".format(out_path, out441_path) + os.system(cmd) + if not os.path.exists(out441_path): + print("{} sp={} err 7".format(in_f, time.time() - st)) + os.unlink(out_path) + continue + + # 拷贝数据到目标位置 + song_id = in_f.split("/")[-2] + dst_dir = os.path.join(dst_base_dir, song_id) + if not os.path.exists(dst_dir): + os.makedirs(dst_dir) + # 拷贝人声和伴奏 + dst_vocal_path = os.path.join(dst_dir, "vocal.mp3") + dst_acc_path = os.path.join(dst_dir, "acc.mp3") + dst_mp3_path = os.path.join(dst_dir, "src.mp3") + if not os.path.exists(dst_vocal_path): + cmd = "ffmpeg -i {} -ab 320k {}".format(v_f, dst_vocal_path) + os.system(cmd) + if not os.path.exists(dst_vocal_path): + print("{} sp={} err 3".format(in_f, time.time() - st)) + continue + + if not os.path.exists(dst_acc_path): + cmd = "ffmpeg -i {} -ab 320k {}".format(v_f.replace("vocal.wav", "acc.wav"), dst_acc_path) + os.system(cmd) + if not os.path.exists(dst_acc_path): + print("{} sp={} err 4".format(in_f, time.time() - st)) + continue + if not os.path.exists(dst_mp3_path): + cmd = "cp {} {}".format(v_f.replace("vocal.wav", "src.mp3"), dst_mp3_path) + os.system(cmd) + if not os.path.exists(dst_mp3_path): + print("{} sp={} err 5".format(in_f, time.time() - st)) + continue + name = out_path.split("/")[-1] + dst_path = os.path.join(dst_dir, name) + cmd = "cp {} {}".format(out_path, dst_path) + os.system(cmd) + if not os.path.exists(dst_path): + print("{} sp={} err 6".format(in_f, time.time() - st)) + continue + print("{} sp={} finish".format(in_f, time.time() - st)) + + +if __name__ == '__main__': + process() diff --git a/AutoCoverTool/ref/split_dirty_frame/script/process_one.py b/AutoCoverTool/ref/split_dirty_frame/script/process_one.py new file mode 100644 index 0000000..5754df4 --- /dev/null +++ b/AutoCoverTool/ref/split_dirty_frame/script/process_one.py @@ -0,0 +1,1842 @@ +""" +处理单个音频文件的操作 +1. 查找到异常的位置 +2. 统计异常的位置 并确定出要替换的位置 +3. 使用原唱进行替换 +""" +import os +import time +import glob +import torch +import madmom +import librosa +import soundfile +import numpy as np + +from custom_models.model import get_cur_model +from dataset.dataset import file2mfcc, gs_frame_num + +gs_err_code_success = 0 +gs_err_code_no_file = 1 +gs_err_code_file_too_short = 2 + + +def construct_power_fragment(points): + fragments = [] + st_frame = -1 + tot_rate = [] + for idx, cur_tp_rate in enumerate(points): + """ + 1. 当前tp==1: + 前面也是1,意味着继续 + 前面不是1,意味着从当前开始 + 2. 
+
+
+def construct_power_fragment(points):
+    fragments = []
+    st_frame = -1
+    tot_rate = []
+    for idx, cur_tp_rate in enumerate(points):
+        """
+        1. current tp == 1:
+            previous frame was 1 too -> the segment continues
+            previous frame was not 1 -> a segment starts here
+        2. current tp == 0:
+            previous frame was 0 -> continue
+            previous frame was not 0 -> the segment can be cut here
+        """
+        tp = int(cur_tp_rate < 0.01)
+        if int(tp) == 1:
+            tot_rate.append(cur_tp_rate)
+
+        # segment starts here
+        if st_frame == -1 and int(tp) == 1:
+            st_frame = idx
+            continue
+        # segment ends here
+        if st_frame != -1 and int(tp) == 0:
+            fragments.append([st_frame, idx - st_frame, sum(tot_rate) / len(tot_rate)])
+            st_frame = -1
+            tot_rate = []
+
+    # merge pass: if the gap between two adjacent segments is under 100 ms (10 frames)
+    # and the mean amplitude inside the gap is below 0.015, merge the two segments
+    idx = 1
+    while idx < len(fragments):
+        last_fragment = fragments[idx - 1]
+        cur_fragment = fragments[idx]
+        cur_duration = cur_fragment[0] - (last_fragment[0] + last_fragment[1])
+        if 10 > cur_duration > 0 and \
+                np.mean(points[last_fragment[0] + last_fragment[1]:last_fragment[0] + last_fragment[
+                    1] + cur_duration]) < 0.015:
+            fragments[idx - 1][1] = cur_fragment[0] + cur_fragment[1] - fragments[idx - 1][0]
+            del fragments[idx]
+            idx -= 1
+        idx += 1
+    return fragments
+
+
+# energy-based segmentation
+def split_vocal2fragment(in_file):
+    """
+    Normalize first, then pick suitable split points by energy
+    :param in_file:
+    :return:
+    """
+    audio, sr = librosa.load(in_file, sr=16000, mono=True)
+    audio = librosa.util.normalize(audio)
+    # 10 ms frames (160 samples at 16 kHz), 10 ms hop: mean absolute amplitude per frame
+    power_arr = []
+    for i in range(0, len(audio) - 1600, 160):
+        power_arr.append(np.sum(np.abs(audio[i:i + 160])) / 160)
+
+    # turn stretches whose frame energy is below 0.01 into silence segments
+    power_arr = construct_power_fragment(power_arr)
+    fragments = []
+    out_file = in_file + "_power.csv"
+    with open(out_file, "w") as f:
+        f.write("Name\tStart\tDuration\tTime Format\tType\n")
+        for idx, line in enumerate(power_arr):
+            start = round(float(line[0]) * 0.01, 3)
+            duration = round(float(line[1]) * 0.01, 3)
+            fragments.append([start, duration])
+            strr = "{}\t{}\t{}\t{}\n".format(str(round(line[2] * 1000, 2)), start, duration, "decimal\tCue\t")
+            f.write(strr)
+    return fragments
+
+
+def get_onsets(in_file):
+    """
+    Get the onset times
+    :param in_file:
+    :return:
+    """
+    proc = madmom.features.OnsetPeakPickingProcessor(fps=100)
+    act = madmom.features.RNNOnsetProcessor()(in_file)
+    times = proc(act)
+    return times
+
+
+def get_downbeats(in_file):
+    """
+    Get the downbeat times
+    :param in_file:
+    :return:
+    """
+    proc = madmom.features.DBNDownBeatTrackingProcessor(beats_per_bar=[3, 4], fps=100)
+    act = madmom.features.RNNDownBeatProcessor()(in_file)
+    res = proc(act)
+    # times = np.array(res[:, 0])
+    # keep only the time points whose beat index == 1 (bar starts)
+    downbeats = []
+    for i in range(0, len(res)):
+        if res[i][1] == 1:
+            downbeats.append(res[i][0])
+    downbeats = np.array(downbeats)
+    bpm = 60 / (np.mean(np.diff(downbeats)) / 4)
+    return downbeats, bpm
+
+
+def split_vocal2fragment_v1(in_file):
+    onsets_times_s = get_onsets(in_file)
+    print("len={}".format(len(onsets_times_s)))
+    with open(in_file + "_onsets.csv", "w") as f:
+        f.write("Name\tStart\tDuration\tTime Format\tType\n")
+        for idx, line in enumerate(onsets_times_s):
+            start = round(float(onsets_times_s[idx]), 3)
+            duration = 0.01
+            strr = "{}\t{}\t{}\t{}\n".format("bb", start, duration, "decimal\tCue\t")
+            f.write(strr)
+
+
+class ReplaceVocalFrame:
+    def __init__(self, model_path):
+        st = time.time()
+        model = get_cur_model()
+        device = 'cuda' if torch.cuda.is_available() else 'cpu'
+        params = torch.load(model_path, map_location=torch.device(device))
+        model.load_state_dict(state_dict=params)
+        model.eval()
+        model.to(device)
+        self.model = model
+        self.device = device
+        print("load model sp={}".format(time.time() - st))
+
+    def get_batch_frames(self, mfcc):
+        # slice into windows of 32 frames
+        predict_mfcc = []
+        for i in range(0, len(mfcc) - gs_frame_num):
+            predict_mfcc.append(mfcc[i:i + gs_frame_num])
+        # batched inference
+        batch_num = 32
+        real_predict_mfcc = []
+        i = 0
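+        # Group the overlapping windows (stride 1 frame) into mini-batches of
+        # batch_num so a full song can be scored without exhausting GPU memory;
+        # the final group may be shorter than batch_num.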
while i < len(predict_mfcc): + real_predict_mfcc.append(predict_mfcc[i:i + batch_num]) + i += batch_num + return real_predict_mfcc + + def construct_fragment(self, vocal_result, slience_fragment): + """ + 构造出连续的段 + :param vocal_result: + :return: + """ + # 静音段不会是异常段 + vocal_result = np.array(vocal_result) + for fragment in slience_fragment: + st_s = int(fragment[0] / 0.016) + ed_s = int((fragment[0] + fragment[1]) / 0.016) + vocal_result[st_s:ed_s] = 0 + + fragments = [] + st_frame = -1 + tot_rate = [] + for idx, cur_tp_rate in enumerate(vocal_result): + """ + 1. 当前tp==1: + 前面也是1,意味着继续 + 前面不是1,意味着从当前开始 + 2. 当前tp==0: + 前面是0,继续 + 前面不是0,意味着可以截断 + """ + tp = int(cur_tp_rate > 0.5) + if int(tp) == 1: + tot_rate.append(cur_tp_rate) + + # 从此处开始 + if st_frame == -1 and int(tp) == 1: + st_frame = idx + continue + # 到此处截断 + if st_frame != -1 and int(tp) == 0: + fragments.append( + [float(st_frame) * 0.016, float(idx - st_frame) * 0.016, sum(tot_rate) / len(tot_rate)]) + st_frame = -1 + tot_rate = [] + + return fragments + + def fragment_filter(self, fragments): + """ + 1. 过滤掉不符合常理的段 + 2. 合并相近的段 + 如果当前段小于64ms,并且,前后相近的64ms内均没有段,则不用该段 + :return: + """ + idx = 0 + while idx < len(fragments): + fragment = fragments[idx] + st_idx = fragment[0] + duration = fragment[1] + ed_idx = fragment[0] + fragment[1] + if duration < 0.064: + # 前面有,则向前面探查 + # 后面有,则向后面探查 + # 两者都有,选择距离最近的 + before_idx = 10000 + after_idx = 10000 + if idx > 0: + before_idx = st_idx - (fragments[idx - 1][0] + fragments[idx - 1][1]) + if idx + 1 < len(fragments): + after_idx = fragments[idx + 1][0] - ed_idx + + # 如果前面比后面小,并且前面相距小于64ms + if before_idx < after_idx and before_idx < 0.064: + fragments[idx - 1][1] = ed_idx - fragments[idx - 1][0] + + # 归属到后面 + if before_idx > after_idx and after_idx < 0.064: + fragments[idx + 1][0] = st_idx + fragments[idx + 1][1] += after_idx + duration + del fragments[idx] + idx -= 1 + idx += 1 + return fragments + + def fragment_filter_by_power(self, fragments, in_file): + """ + 使用能量卡一下分段,从而保证不会带有平滑段 + :param fragments: + :return: + """ + audio, sr = librosa.load(in_file, sr=16000, mono=True) + hop_len = 160 + win_len = 160 * 5 + threshold = 0.015 + i = 0 + while i < len(fragments): + st_s = fragments[i][0] + ed_s = fragments[i][0] + fragments[i][1] + st_pos = int(st_s * sr + 0.5) + ed_pos = int(ed_s * sr + 0.5) + # 对于每个分段从两段向中间卡,10ms帧移,50ms帧长,均值小于15就卡掉 + # 如果本段不够50ms,则评估能量,均值小于15就直接干掉 + # 如果整体能量太低,也会被卡掉 + + if ed_pos - st_pos < win_len: + if np.mean(np.abs(audio[st_pos:ed_pos])) < threshold: + print("Remove:{},{}".format(st_s, ed_s, )) + del fragments[i] + i -= 1 + else: + # 从左边向右边卡 + left_pos = st_pos + for idx in range(st_pos, ed_pos - win_len, hop_len): + cur_win_len = win_len + if idx + win_len > ed_pos: + cur_win_len = ed_pos - idx + if np.mean(np.abs(audio[idx:idx + cur_win_len])) < threshold: + left_pos = idx + continue + break + + right_pos = ed_pos + for idx in range(ed_pos - win_len, st_pos - 1, -hop_len): + cur_win_len = win_len + if idx + win_len > ed_pos: + cur_win_len = ed_pos - idx + if np.mean(np.abs(audio[idx:idx + cur_win_len])) < threshold: + right_pos = idx + continue + break + # 左右的探寻方式不同,如果两者交叉,说明本段能量较小,得干掉 + if right_pos < left_pos: + print("RemoveM:{},{}".format(st_s, ed_s)) + del fragments[i] + i -= 1 + else: + fragments[i][0] = left_pos / sr + fragments[i][1] = (right_pos - left_pos) / sr + i += 1 + + # 检查一遍,是否有重合项 + for i in range(1, len(fragments)): + if fragments[i][1] < 0: + print("ERROR, {} < 0!".format(fragments[i][1])) + exit(-1) + if fragments[i][0] < (fragments[i - 1][0] + 
+    def fragment_filter_by_power(self, fragments, in_file):
+        """
+        Trim the segments by energy so that no smoothed/faded audio is kept.
+        :param fragments:
+        :return:
+        """
+        audio, sr = librosa.load(in_file, sr=16000, mono=True)
+        hop_len = 160
+        win_len = 160 * 5
+        threshold = 0.015
+        i = 0
+        while i < len(fragments):
+            st_s = fragments[i][0]
+            ed_s = fragments[i][0] + fragments[i][1]
+            st_pos = int(st_s * sr + 0.5)
+            ed_pos = int(ed_s * sr + 0.5)
+            # Trim each segment from both ends towards the middle with a 10 ms
+            # hop and a 50 ms window; windows whose mean amplitude falls below
+            # the threshold are cut away.
+            # If the segment is shorter than 50 ms, evaluate its energy and
+            # drop it outright when the mean falls below the threshold.
+            # A segment whose overall energy is too low is dropped as well.
+            if ed_pos - st_pos < win_len:
+                if np.mean(np.abs(audio[st_pos:ed_pos])) < threshold:
+                    print("Remove:{},{}".format(st_s, ed_s))
+                    del fragments[i]
+                    i -= 1
+            else:
+                # Trim from the left towards the right.
+                left_pos = st_pos
+                for idx in range(st_pos, ed_pos - win_len, hop_len):
+                    cur_win_len = win_len
+                    if idx + win_len > ed_pos:
+                        cur_win_len = ed_pos - idx
+                    if np.mean(np.abs(audio[idx:idx + cur_win_len])) < threshold:
+                        left_pos = idx
+                        continue
+                    break
+
+                # Trim from the right towards the left.
+                right_pos = ed_pos
+                for idx in range(ed_pos - win_len, st_pos - 1, -hop_len):
+                    cur_win_len = win_len
+                    if idx + win_len > ed_pos:
+                        cur_win_len = ed_pos - idx
+                    if np.mean(np.abs(audio[idx:idx + cur_win_len])) < threshold:
+                        right_pos = idx
+                        continue
+                    break
+                # The two scans probe differently; if they cross, the whole
+                # segment is low-energy and has to go.
+                if right_pos < left_pos:
+                    print("RemoveM:{},{}".format(st_s, ed_s))
+                    del fragments[i]
+                    i -= 1
+                else:
+                    fragments[i][0] = left_pos / sr
+                    fragments[i][1] = (right_pos - left_pos) / sr
+            i += 1
+
+        # Sanity check: no negative durations and no overlapping segments.
+        for i in range(1, len(fragments)):
+            if fragments[i][1] < 0:
+                print("ERROR, {} < 0!".format(fragments[i][1]))
+                exit(-1)
+            if fragments[i][0] < (fragments[i - 1][0] + fragments[i - 1][1]):
+                print("ERROR!, {} < {}!".format(fragments[i][0], fragments[i - 1][0] + fragments[i - 1][1]))
+                exit(-1)
+        return fragments
+
+    def write_fragments2file(self, fragments, out_file):
+        with open(out_file + "_out.csv", "w") as f:
+            f.write("Name\tStart\tDuration\tTime Format\tType\n")
+            for line in fragments:
+                start = str(round(float(line[0]), 3))
+                duration = str(round(float(line[1]), 3))
+                strr = "{}\t{}\t{}\t{}\n".format(str(round(line[2], 2)), start, duration, "decimal\tCue\t")
+                f.write(strr)
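+    # The file written above is a tab-separated marker list, one "Cue" row per
+    # fragment named with its rate (the layout appears to match an Adobe
+    # Audition marker export, though that is an inference). A single fragment
+    # [1.2, 0.8, 0.91] would come out as:
+    #   Name    Start   Duration    Time Format    Type
+    #   0.91    1.2     0.8         decimal        Cue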
+
+    def get_vocal_frames(self, in_file, silence_fragment):
+        if not os.path.exists(in_file):
+            return gs_err_code_no_file, []
+        st = time.time()
+        mfcc = file2mfcc(in_file)
+        print("{} file2mfcc sp={}".format(in_file, time.time() - st))
+        if len(mfcc) < gs_frame_num:
+            return gs_err_code_file_too_short, []
+
+        st = time.time()
+        real_predict_mfcc = self.get_batch_frames(mfcc)
+        print("{} get_batch_frames sp={}".format(in_file, time.time() - st))
+
+        # Inference
+        st = time.time()
+        vocal_result = []
+        with torch.no_grad():
+            for batch in real_predict_mfcc:
+                result = self.model(torch.tensor(batch).to(self.device))
+                result = result.softmax(dim=1)[:, 1]  # only keep the probability of class 1
+                # _, result = result.max(dim=1)  # 0 means normal, 1 means abnormal
+                vocal_result.extend(list(result.cpu().numpy()))
+        print("{} model sp={}".format(in_file, time.time() - st))
+        # Build continuous segments.
+        st = time.time()
+        fragments = self.construct_fragment(vocal_result, silence_fragment)
+        fragments = self.fragment_filter_by_power(fragments, in_file)
+        fragments = self.fragment_filter(fragments)
+        self.write_fragments2file(fragments, in_file + "_label.csv")
+        print("{} write_fragments2file sp={}".format(in_file, time.time() - st))
+        return gs_err_code_success, fragments
+
+    def replace_logic_rate(self, in_file, frames, fragments):
+        replace_fragment = []
+        for idx, frame in enumerate(frames):
+            start_s = frame[0]
+            duration_s = frame[1]
+            ed_s = start_s + duration_s
+            rate = frame[2]
+            if rate < 0.85:
+                continue
+            # Find the segment that can contain this time span.
+            # "Segment" here means: starting from this span, expand to both
+            # sides until a silence boundary is reached.
+            left_start_s = -1
+            left_start_idx = -1
+            for ii, fragment in enumerate(fragments):
+                f_start_s = fragment[0]
+                if f_start_s > start_s:
+                    left_start_s = fragments[ii - 1][0]
+                    left_start_idx = ii - 1
+                    break
+
+            right_ed_s = -1
+            right_ed_idx = -1
+            for ii in range(len(fragments) - 1, -1, -1):
+                f_ed_s = fragments[ii][0] + fragments[ii][1]
+                if f_ed_s < ed_s and ii + 1 < len(fragments):
+                    right_ed_s = fragments[ii + 1][0] + fragments[ii + 1][1]
+                    right_ed_idx = ii + 1
+                    break
+            max_sec = 3
+            if left_start_s != -1 and right_ed_s != -1:
+                # Repair logic: probe up to 3 s away from the current segment
+                # on each side and pick the longest split segment found.
+                # Probe to the left.
+                left_max_sed_idx = left_start_idx
+                for ii in range(left_start_idx, -1, -1):
+                    if fragments[ii][1] > fragments[left_max_sed_idx][1]:
+                        left_max_sed_idx = ii
+                    if fragments[left_start_idx][0] - fragments[ii][0] >= max_sec:
+                        break
+                # Probe to the right.
+                right_max_sed_idx = right_ed_idx
+                for ii in range(right_ed_idx, len(fragments), 1):
+                    if fragments[ii][1] > fragments[right_max_sed_idx][1]:
+                        right_max_sed_idx = ii
+                    if fragments[ii][0] - fragments[right_ed_idx][0] >= max_sec:
+                        break
+                left_start_s = fragments[left_max_sed_idx][0]
+                right_ed_s = fragments[right_max_sed_idx][0] + fragments[right_max_sed_idx][1]
+                # Store start time, duration, rate, and the lengths of the
+                # silence segments at the left and right ends.
+                replace_fragment.append([left_start_s, right_ed_s - left_start_s, rate,
+                                         fragments[left_max_sed_idx][1],
+                                         fragments[right_max_sed_idx][1]])
+
+        # Merge segments. Two adjacent segments may overlap; in that case merge
+        # them directly. Since the same segment information is used throughout,
+        # two segments can never end up merely close without overlapping.
+        idx = 1
+        while idx < len(replace_fragment):
+            last_fragment = replace_fragment[idx - 1]
+            if last_fragment[0] + last_fragment[1] > replace_fragment[idx][0]:
+                replace_fragment[idx - 1][1] = replace_fragment[idx][0] + replace_fragment[idx][1] - \
+                                               replace_fragment[idx - 1][0]
+                del replace_fragment[idx]
+                idx -= 1
+            idx += 1
+
+        # Drop segments that are too short: less than 1 s once the flanking
+        # silence segments are excluded.
+        audio, sr = librosa.load(in_file, sr=44100, mono=True)
+        replace_tot_sec = 0
+        idx = 0
+        while idx < len(replace_fragment):
+            fragment = replace_fragment[idx]
+            if fragment[1] - (fragment[3] + fragment[4]) < 1:
+                print("TooShort: {},{}".format(fragment[0], fragment[1]))
+                del replace_fragment[idx]
+                continue
+            replace_tot_sec += fragment[1] - (fragment[3] + fragment[4])
+            idx += 1
+        print("{}, final: len={}, tot_sec={}, replace={}, rate={}".format(
+            in_file, len(replace_fragment), len(audio) / sr, replace_tot_sec,
+            replace_tot_sec / (len(audio) / sr)))
+        rate = replace_tot_sec / (len(audio) / sr)
+        return replace_fragment, rate
+
+    def replace_logic(self, in_file, vocal_file, frames, fragments):
+        """
+        Replace the abnormal segments.
+        :param in_file:
+        :param vocal_file:
+        :param frames:
+        :param fragments:
+        :return:
+        """
+        audio, sr = librosa.load(in_file, sr=44100, mono=True)
+        replace_fragment, rate = self.replace_logic_rate(in_file, frames, fragments)
+        # Write the markers to a file.
+        with open(in_file + "_replace.csv", "w") as f:
+            f.write("Name\tStart\tDuration\tTime Format\tType\n")
+            for idx, line in enumerate(replace_fragment):
+                start = str(round(line[0], 3))
+                duration = str(round(line[1], 3))
+                strr = "{}\t{}\t{}\t{}\n".format(str(round(line[2], 3)), start, duration, "decimal\tCue\t")
+                f.write(strr)
+            for idx, line in enumerate(frames):
+                start = str(round(line[0], 3))
+                duration = str(round(line[1], 3))
+                if line[2] < 0.85:
+                    continue
+                strr = "ll_{}\t{}\t{}\t{}\n".format(str(round(line[2], 3)), start, duration, "decimal\tCue\t")
+                f.write(strr)
+
+        # Splice the matching sentences in from the vocal track.
+        vocal, sr = librosa.load(vocal_file, sr=44100, mono=True)
+        fade_len = int(sr * 0.05)
+        for idx, fragment in enumerate(replace_fragment):
+            st_pos = int(fragment[0] * sr + 0.5)
+            ed_pos = st_pos + int(fragment[1] * sr + 0.5)
+            # Replacement uses a linear fade-in/fade-out at the boundaries.
+            for kk in range(0, fade_len):
+                audio[st_pos + kk] = vocal[st_pos + kk] * (kk / fade_len) + audio[st_pos + kk] * (1 - kk / fade_len)
+                audio[ed_pos - kk] = vocal[ed_pos - kk] * (kk / fade_len) + audio[ed_pos - kk] * (1 - kk / fade_len)
+
+            audio[st_pos + fade_len:ed_pos - fade_len] = vocal[st_pos + fade_len:ed_pos - fade_len]
+        soundfile.write(in_file + "_replace.wav", audio, 44100, format="wav")
+
+    def process(self, in_file, in_volume_file, vocal_file):
+        # Get the split segments, in seconds:
+        # [[start, duration], ..., [start, duration]]
+        fragments = split_vocal2fragment(in_file)
+
+        # [[start, duration, rate]], in seconds
+        err, frames = self.get_vocal_frames(in_file, fragments)
+        if err != gs_err_code_success:
+            return err
+
+        # Replacement logic
+        self.replace_logic(in_volume_file, vocal_file, frames, fragments)
+        print("replace ....")
+
+    def get_rate(self, in_file):
+        # Get the split segments, in seconds:
+        # [[start, duration], ..., [start, duration]]
+        fragments = split_vocal2fragment(in_file)
+        # [[start, duration, rate]], in seconds
+        err, frames = self.get_vocal_frames(in_file, fragments)
+        if err != gs_err_code_success:
+            return err
+        replace_fragments, rate = self.replace_logic_rate(in_file, frames, fragments)
+        return rate
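+
+# Minimal usage sketch (illustrative paths, not files shipped with this repo):
+#   re = ReplaceVocalFrame("output_v5_3/epoch_3_0.8527927799886299.pth")
+#   rate = re.get_rate("song_dv.wav")   # fraction of the audio that would be replaced
+#   re.process("song_dv.wav", "song_dv.wav", "vocal.wav")
+# process() writes song_dv.wav_replace.wav next to the input, plus the CSV
+# marker files described above.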
"611752105030249034", + "611752105030249035" + ] + m_path = "output_v5_3/epoch_3_0.8527927799886299.pth" + simple_mixer_path = "/opt/soft/bin/simple_mixer" + input_wavs_base = "/data/rsync/jianli.yang/AutoCoverTool/data/user_out_data/me_top500/out_test/v0" + # for input_wav in input_wavs: + # input_wav = os.path.join(input_wavs_base, input_wav) + # print("cp -r {} ./ \n".format(input_wav)) + # exit(-1) + + re = ReplaceVocalFrame(m_path) + for i in range(0, len(input_wavs)): + wavs = glob.glob(os.path.join(os.path.join(input_wavs_base, input_wavs[i]), "*dv.wav")) + for wav in wavs: + i_v = wav + e_v = wav + v_v = os.path.join( + os.path.join(os.path.join("/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/me_top500", + input_wavs[i])), "vocal.wav") + st = time.time() + re.process(i_v, e_v, v_v) + + dst_path = e_v + "_replace.wav" + if not os.path.exists(dst_path): + print("ERROR:={}, replace sp={}".format(i_v, time.time() - st)) + continue + + # 先转码 + dst_path_442 = dst_path.replace("_replace.wav", "_replace442.wav") + if not os.path.exists(dst_path_442): + cmd = "ffmpeg -i {} -ar 44100 -ac 2 {}".format(dst_path, dst_path_442) + os.system(cmd) + if not os.path.exists(dst_path_442): + print("ERROR:={}, resample sp={}".format(i_v, time.time() - st)) + continue + mix_path = dst_path_442.replace("_replace442.wav", "_replace442_mix.wav") + cmd = "{} {} {} {}".format(simple_mixer_path, dst_path_442, v_v.replace("vocal.wav", "acc.wav"), mix_path) + print("{}".format(cmd)) + os.system(cmd) + if not os.path.exists(mix_path): + print("ERROR:={}, mix sp={}".format(i_v, time.time() - st)) + continue + print("sp={}".format(time.time() - st)) + + +def real_process(): + input_wavs_base = "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500" + input_wavs = [ + "611752105030249022/611752105030249022_3634463651.wav", + "611752105030249038/611752105030249038_6755399374234747.wav", + "611752105030249067/611752105030249067_5910973794723621.wav", + "611752105030249112/611752105030249112_5910973794723621.wav", + "611752105030249173/611752105030249173_3634463651.wav", + "611752105030249216/611752105030249216_1688849864840588.wav", + "611752105030249267/611752105030249267_10414574138721494.wav", + "611752105030249284/611752105030249284_1688849864840588.wav", + "611752105030250690/611752105030250690_5629499489839033.wav" + ] + + effect_wavs_base = "/data/rsync/jianli.yang/AutoCoverTool/data/user_effect_out_data/step1/cyl" + effect_wavs = [ + "611752105030249022_3634463651_human.wav", + "611752105030249038_6755399374234747_human.wav", + "611752105030249067_5910973794723621_human.wav", + "611752105030249112_5910973794723621_human.wav", + "611752105030249173_3634463651_human.wav", + "611752105030249216_1688849864840588_human.wav", + "611752105030249267_10414574138721494_human.wav", + "611752105030249284_1688849864840588_human.wav", + "611752105030250690_5629499489839033_human.wav" + ] + + vocal_base_path = "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/me_top500" + vocal_wavs = [ + "611752105030249022/vocal.wav", + "611752105030249038/vocal.wav", + "611752105030249067/vocal.wav", + "611752105030249112/vocal.wav", + "611752105030249173/vocal.wav", + "611752105030249216/vocal.wav", + "611752105030249267/vocal.wav", + "611752105030249284/vocal.wav", + "611752105030250690/vocal.wav" + ] + + m_path = "output_v5_3/epoch_3_0.8527927799886299.pth" + simple_mixer_path = "/opt/soft/bin/simple_mixer" + re = ReplaceVocalFrame(m_path) + for i_v, e_v, v_v in zip(input_wavs, effect_wavs, vocal_wavs): + i_v = 
+
+
+def real_process():
+    input_wavs_base = "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/me_top500"
+    input_wavs = [
+        "611752105030249022/611752105030249022_3634463651.wav",
+        "611752105030249038/611752105030249038_6755399374234747.wav",
+        "611752105030249067/611752105030249067_5910973794723621.wav",
+        "611752105030249112/611752105030249112_5910973794723621.wav",
+        "611752105030249173/611752105030249173_3634463651.wav",
+        "611752105030249216/611752105030249216_1688849864840588.wav",
+        "611752105030249267/611752105030249267_10414574138721494.wav",
+        "611752105030249284/611752105030249284_1688849864840588.wav",
+        "611752105030250690/611752105030250690_5629499489839033.wav"
+    ]
+
+    effect_wavs_base = "/data/rsync/jianli.yang/AutoCoverTool/data/user_effect_out_data/step1/cyl"
+    effect_wavs = [
+        "611752105030249022_3634463651_human.wav",
+        "611752105030249038_6755399374234747_human.wav",
+        "611752105030249067_5910973794723621_human.wav",
+        "611752105030249112_5910973794723621_human.wav",
+        "611752105030249173_3634463651_human.wav",
+        "611752105030249216_1688849864840588_human.wav",
+        "611752105030249267_10414574138721494_human.wav",
+        "611752105030249284_1688849864840588_human.wav",
+        "611752105030250690_5629499489839033_human.wav"
+    ]
+
+    vocal_base_path = "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/me_top500"
+    vocal_wavs = [
+        "611752105030249022/vocal.wav",
+        "611752105030249038/vocal.wav",
+        "611752105030249067/vocal.wav",
+        "611752105030249112/vocal.wav",
+        "611752105030249173/vocal.wav",
+        "611752105030249216/vocal.wav",
+        "611752105030249267/vocal.wav",
+        "611752105030249284/vocal.wav",
+        "611752105030250690/vocal.wav"
+    ]
+
+    m_path = "output_v5_3/epoch_3_0.8527927799886299.pth"
+    simple_mixer_path = "/opt/soft/bin/simple_mixer"
+    re = ReplaceVocalFrame(m_path)
+    for i_v, e_v, v_v in zip(input_wavs, effect_wavs, vocal_wavs):
+        i_v = os.path.join(input_wavs_base, i_v)
+        e_v = os.path.join(effect_wavs_base, e_v)
+        v_v = os.path.join(vocal_base_path, v_v)
+        st = time.time()
+        re.process(i_v, e_v, v_v)
+
+        dst_path = e_v + "_replace.wav"
+        if not os.path.exists(dst_path):
+            print("ERROR:={}, replace sp={}".format(i_v, time.time() - st))
+            continue
+
+        # Transcode first.
+        dst_path_442 = dst_path.replace("_replace.wav", "_replace442.wav")
+        if not os.path.exists(dst_path_442):
+            cmd = "ffmpeg -i {} -ar 44100 -ac 2 {}".format(dst_path, dst_path_442)
+            os.system(cmd)
+        if not os.path.exists(dst_path_442):
+            print("ERROR:={}, resample sp={}".format(i_v, time.time() - st))
+            continue
+        mix_path = dst_path_442.replace("_replace442.wav", "_replace442_mix.wav")
+        cmd = "{} {} {} {}".format(simple_mixer_path, dst_path_442, v_v.replace("vocal.wav", "acc.wav"), mix_path)
+        os.system(cmd)
+        if not os.path.exists(mix_path):
+            print("ERROR:={}, mix sp={}".format(i_v, time.time() - st))
+            continue
+        print("sp={}".format(time.time() - st))
+
+
+if __name__ == '__main__':
+    real_process()
+    # process_v0()
+    # test()
+    # split_vocal2fragment_v1("/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/9/9_10414574138721494.wav")
+    # exit(-1)
+    # m_path = "output_v5_3/epoch_3_0.8527927799886299.pth"
+    # re = ReplaceVocalFrame(m_path)
"data/out_data/me_top500/611752105030248988/611752105030248988_10414574138721494.wav", + # "data/out_data/me_top500/611752105030248988/611752105030248988_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248988/611752105030248988_8162774329368194.wav", + # "data/out_data/me_top500/611752105030248992/611752105030248992_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248992/611752105030248992_6755399374234747.wav", + # "data/out_data/me_top500/611752105030248992/611752105030248992_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248994/611752105030248994_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248994/611752105030248994_3634463651.wav", + # "data/out_data/me_top500/611752105030248994/611752105030248994_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248995/611752105030248995_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248995/611752105030248995_6755399374234747.wav", + # "data/out_data/me_top500/611752105030248995/611752105030248995_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249000/611752105030249000_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249000/611752105030249000_3634463651.wav", + # "data/out_data/me_top500/611752105030249000/611752105030249000_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249001/611752105030249001_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249001/611752105030249001_3634463651.wav", + # "data/out_data/me_top500/611752105030249001/611752105030249001_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249007/611752105030249007_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249007/611752105030249007_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249007/611752105030249007_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249009/611752105030249009_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249009/611752105030249009_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249009/611752105030249009_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249010/611752105030249010_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249010/611752105030249010_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249010/611752105030249010_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249011/611752105030249011_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249011/611752105030249011_3634463651.wav", + # "data/out_data/me_top500/611752105030249011/611752105030249011_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249016/611752105030249016_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249016/611752105030249016_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249016/611752105030249016_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249018/611752105030249018_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249018/611752105030249018_3634463651.wav", + # "data/out_data/me_top500/611752105030249018/611752105030249018_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249019/611752105030249019_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249019/611752105030249019_3634463651.wav", + # "data/out_data/me_top500/611752105030249019/611752105030249019_5910973794723621.wav", + # 
"data/out_data/me_top500/611752105030249020/611752105030249020_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249020/611752105030249020_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249020/611752105030249020_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249022/611752105030249022_3634463651.wav", + # "data/out_data/me_top500/611752105030249022/611752105030249022_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249022/611752105030249022_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249025/611752105030249025_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249025/611752105030249025_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249025/611752105030249025_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249030/611752105030249030_3634463651.wav", + # "data/out_data/me_top500/611752105030249030/611752105030249030_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249030/611752105030249030_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249031/611752105030249031_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249031/611752105030249031_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249031/611752105030249031_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249032/611752105030249032_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249032/611752105030249032_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249032/611752105030249032_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249034/611752105030249034_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249034/611752105030249034_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249034/611752105030249034_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249035/611752105030249035_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249035/611752105030249035_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249035/611752105030249035_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249036/611752105030249036_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249036/611752105030249036_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249036/611752105030249036_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249037/611752105030249037_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249037/611752105030249037_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249037/611752105030249037_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249038/611752105030249038_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249038/611752105030249038_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249038/611752105030249038_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249040/611752105030249040_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249040/611752105030249040_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249040/611752105030249040_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249041/611752105030249041_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249041/611752105030249041_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249041/611752105030249041_5910973794723621.wav", + # 
"data/out_data/me_top500/611752105030249048/611752105030249048_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249048/611752105030249048_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249048/611752105030249048_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249049/611752105030249049_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249049/611752105030249049_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249049/611752105030249049_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249052/611752105030249052_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249052/611752105030249052_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249052/611752105030249052_3634463651.wav", + # "data/out_data/me_top500/611752105030249053/611752105030249053_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249053/611752105030249053_3634463651.wav", + # "data/out_data/me_top500/611752105030249053/611752105030249053_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249055/611752105030249055_3634463651.wav", + # "data/out_data/me_top500/611752105030249055/611752105030249055_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249055/611752105030249055_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249057/611752105030249057_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249057/611752105030249057_3634463651.wav", + # "data/out_data/me_top500/611752105030249057/611752105030249057_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249058/611752105030249058_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249058/611752105030249058_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249058/611752105030249058_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249065/611752105030249065_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249065/611752105030249065_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249065/611752105030249065_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249067/611752105030249067_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249067/611752105030249067_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249067/611752105030249067_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249070/611752105030249070_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249070/611752105030249070_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249070/611752105030249070_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249071/611752105030249071_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249071/611752105030249071_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249071/611752105030249071_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249073/611752105030249073_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249073/611752105030249073_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249073/611752105030249073_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249074/611752105030249074_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249074/611752105030249074_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249074/611752105030249074_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249077/611752105030249077_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249077/611752105030249077_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249077/611752105030249077_3634463651.wav", + # "data/out_data/me_top500/611752105030249079/611752105030249079_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249079/611752105030249079_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249079/611752105030249079_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249082/611752105030249082_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249082/611752105030249082_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249082/611752105030249082_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249091/611752105030249091_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249091/611752105030249091_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249091/611752105030249091_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249094/611752105030249094_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249094/611752105030249094_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249094/611752105030249094_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249099/611752105030249099_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249099/611752105030249099_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249099/611752105030249099_3634463651.wav", + # "data/out_data/me_top500/611752105030249104/611752105030249104_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249104/611752105030249104_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249104/611752105030249104_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249105/611752105030249105_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249105/611752105030249105_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249105/611752105030249105_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249111/611752105030249111_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249111/611752105030249111_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249111/611752105030249111_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249112/611752105030249112_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249112/611752105030249112_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249112/611752105030249112_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249113/611752105030249113_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249113/611752105030249113_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249113/611752105030249113_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249118/611752105030249118_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249118/611752105030249118_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249118/611752105030249118_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249121/611752105030249121_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249121/611752105030249121_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249121/611752105030249121_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249127/611752105030249127_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249127/611752105030249127_3634463651.wav", + # "data/out_data/me_top500/611752105030249127/611752105030249127_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249128/611752105030249128_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249128/611752105030249128_3634463651.wav", + # "data/out_data/me_top500/611752105030249128/611752105030249128_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249133/611752105030249133_3634463651.wav", + # "data/out_data/me_top500/611752105030249133/611752105030249133_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249133/611752105030249133_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249134/611752105030249134_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249134/611752105030249134_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249134/611752105030249134_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249136/611752105030249136_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249136/611752105030249136_3634463651.wav", + # "data/out_data/me_top500/611752105030249136/611752105030249136_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249143/611752105030249143_3634463651.wav", + # "data/out_data/me_top500/611752105030249143/611752105030249143_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249143/611752105030249143_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249148/611752105030249148_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249148/611752105030249148_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249148/611752105030249148_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249153/611752105030249153_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249153/611752105030249153_3634463651.wav", + # "data/out_data/me_top500/611752105030249153/611752105030249153_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249157/611752105030249157_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249157/611752105030249157_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249157/611752105030249157_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249160/611752105030249160_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249160/611752105030249160_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249160/611752105030249160_3634463651.wav", + # "data/out_data/me_top500/611752105030249161/611752105030249161_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249161/611752105030249161_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249161/611752105030249161_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249162/611752105030249162_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249162/611752105030249162_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249162/611752105030249162_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249163/611752105030249163_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249163/611752105030249163_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249163/611752105030249163_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249171/611752105030249171_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249171/611752105030249171_3634463651.wav", + # "data/out_data/me_top500/611752105030249171/611752105030249171_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249173/611752105030249173_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249173/611752105030249173_3634463651.wav", + # "data/out_data/me_top500/611752105030249173/611752105030249173_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249174/611752105030249174_3634463651.wav", + # "data/out_data/me_top500/611752105030249174/611752105030249174_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249174/611752105030249174_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249175/611752105030249175_3634463651.wav", + # "data/out_data/me_top500/611752105030249175/611752105030249175_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249175/611752105030249175_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249176/611752105030249176_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249176/611752105030249176_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249176/611752105030249176_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249177/611752105030249177_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249177/611752105030249177_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249177/611752105030249177_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249178/611752105030249178_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249178/611752105030249178_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249178/611752105030249178_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249181/611752105030249181_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249181/611752105030249181_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249181/611752105030249181_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249191/611752105030249191_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249191/611752105030249191_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249191/611752105030249191_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249195/611752105030249195_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249195/611752105030249195_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249195/611752105030249195_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249200/611752105030249200_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249200/611752105030249200_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249200/611752105030249200_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249201/611752105030249201_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249201/611752105030249201_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249201/611752105030249201_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249206/611752105030249206_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249206/611752105030249206_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249206/611752105030249206_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249209/611752105030249209_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249209/611752105030249209_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249209/611752105030249209_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249211/611752105030249211_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249211/611752105030249211_3634463651.wav", + # "data/out_data/me_top500/611752105030249211/611752105030249211_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249213/611752105030249213_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249213/611752105030249213_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249213/611752105030249213_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249216/611752105030249216_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249216/611752105030249216_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249216/611752105030249216_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249218/611752105030249218_3634463651.wav", + # "data/out_data/me_top500/611752105030249218/611752105030249218_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249218/611752105030249218_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249224/611752105030249224_3634463651.wav", + # "data/out_data/me_top500/611752105030249224/611752105030249224_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249224/611752105030249224_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249227/611752105030249227_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249227/611752105030249227_3634463651.wav", + # "data/out_data/me_top500/611752105030249227/611752105030249227_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249233/611752105030249233_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249233/611752105030249233_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249233/611752105030249233_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249237/611752105030249237_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249237/611752105030249237_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249237/611752105030249237_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249240/611752105030249240_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249240/611752105030249240_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249240/611752105030249240_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249243/611752105030249243_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249243/611752105030249243_3634463651.wav", + # "data/out_data/me_top500/611752105030249243/611752105030249243_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249244/611752105030249244_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249244/611752105030249244_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249244/611752105030249244_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249245/611752105030249245_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249245/611752105030249245_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249245/611752105030249245_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249250/611752105030249250_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249250/611752105030249250_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249250/611752105030249250_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249255/611752105030249255_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249255/611752105030249255_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249255/611752105030249255_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249258/611752105030249258_3634463651.wav", + # "data/out_data/me_top500/611752105030249258/611752105030249258_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249258/611752105030249258_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249264/611752105030249264_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249264/611752105030249264_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249264/611752105030249264_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249267/611752105030249267_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249267/611752105030249267_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249267/611752105030249267_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249273/611752105030249273_3634463651.wav", + # "data/out_data/me_top500/611752105030249273/611752105030249273_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249273/611752105030249273_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249275/611752105030249275_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249275/611752105030249275_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249275/611752105030249275_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249278/611752105030249278_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249278/611752105030249278_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249278/611752105030249278_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249280/611752105030249280_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249280/611752105030249280_3634463651.wav", + # "data/out_data/me_top500/611752105030249280/611752105030249280_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249281/611752105030249281_3634463651.wav", + # "data/out_data/me_top500/611752105030249281/611752105030249281_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249281/611752105030249281_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249282/611752105030249282_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249282/611752105030249282_3634463651.wav", + # "data/out_data/me_top500/611752105030249282/611752105030249282_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249283/611752105030249283_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249283/611752105030249283_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249283/611752105030249283_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249284/611752105030249284_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249284/611752105030249284_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249284/611752105030249284_6755399374234747.wav", + # 
"data/out_data/me_top500/611752105030249287/611752105030249287_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249287/611752105030249287_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249287/611752105030249287_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249288/611752105030249288_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249288/611752105030249288_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249288/611752105030249288_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249289/611752105030249289_3634463651.wav", + # "data/out_data/me_top500/611752105030249289/611752105030249289_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249289/611752105030249289_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249292/611752105030249292_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249292/611752105030249292_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249292/611752105030249292_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249293/611752105030249293_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249293/611752105030249293_3634463651.wav", + # "data/out_data/me_top500/611752105030249293/611752105030249293_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249295/611752105030249295_3634463651.wav", + # "data/out_data/me_top500/611752105030249295/611752105030249295_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249295/611752105030249295_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249296/611752105030249296_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249296/611752105030249296_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249296/611752105030249296_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249299/611752105030249299_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249299/611752105030249299_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249299/611752105030249299_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249302/611752105030249302_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249302/611752105030249302_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249302/611752105030249302_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249307/611752105030249307_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249307/611752105030249307_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249307/611752105030249307_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249309/611752105030249309_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249309/611752105030249309_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249309/611752105030249309_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250690/611752105030250690_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250690/611752105030250690_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250690/611752105030250690_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250691/611752105030250691_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250691/611752105030250691_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250691/611752105030250691_5629499489839033.wav", + # 
"data/out_data/me_top500/611752105030250695/611752105030250695_3634463651.wav", + # "data/out_data/me_top500/611752105030250695/611752105030250695_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250695/611752105030250695_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250698/611752105030250698_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250698/611752105030250698_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250698/611752105030250698_5910973794723621.wav", + # "data/out_data/me_top500/611752105030250699/611752105030250699_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250699/611752105030250699_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250699/611752105030250699_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250701/611752105030250701_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250701/611752105030250701_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250701/611752105030250701_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250702/611752105030250702_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250702/611752105030250702_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250702/611752105030250702_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250704/611752105030250704_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250704/611752105030250704_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250704/611752105030250704_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250711/611752105030250711_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250711/611752105030250711_3634463651.wav", + # "data/out_data/me_top500/611752105030250711/611752105030250711_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250715/611752105030250715_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250715/611752105030250715_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250715/611752105030250715_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250716/611752105030250716_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250716/611752105030250716_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250716/611752105030250716_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250717/611752105030250717_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250717/611752105030250717_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250717/611752105030250717_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250718/611752105030250718_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250718/611752105030250718_3634463651.wav", + # "data/out_data/me_top500/611752105030250718/611752105030250718_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250720/611752105030250720_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250720/611752105030250720_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250720/611752105030250720_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250721/611752105030250721_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250721/611752105030250721_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250721/611752105030250721_6755399374234747.wav", + # 
"data/out_data/me_top500/611752105030250725/611752105030250725_5910973794723621.wav", + # "data/out_data/me_top500/611752105030250725/611752105030250725_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250725/611752105030250725_8162774327817435.wav" + # ] + # + # input_wavs = [ + # "data/out_data/me_top500/611752105027601574/611752105027601574_10414574138721494.wav", + # "data/out_data/me_top500/611752105027601574/611752105027601574_10414574140317353.wav", + # "data/out_data/me_top500/611752105027601574/611752105027601574_1688849864840588.wav", + # "data/out_data/me_top500/611752105028392007/611752105028392007_10414574138721494.wav", + # "data/out_data/me_top500/611752105028392007/611752105028392007_10414574140317353.wav", + # "data/out_data/me_top500/611752105028392007/611752105028392007_5910973794723621.wav", + # "data/out_data/me_top500/611752105028480056/611752105028480056_3634463651.wav", + # "data/out_data/me_top500/611752105028480056/611752105028480056_6755399374234747.wav", + # "data/out_data/me_top500/611752105028480056/611752105028480056_8162774327817435.wav", + # "data/out_data/me_top500/611752105028480653/611752105028480653_5910973794723621.wav", + # "data/out_data/me_top500/611752105028480653/611752105028480653_6755399374234747.wav", + # "data/out_data/me_top500/611752105028480653/611752105028480653_8162774329368194.wav", + # "data/out_data/me_top500/611752105029951597/611752105029951597_1688849864840588.wav", + # "data/out_data/me_top500/611752105029951597/611752105029951597_5629499489839033.wav", + # "data/out_data/me_top500/611752105029951597/611752105029951597_8162774329368194.wav", + # "data/out_data/me_top500/611752105029951624/611752105029951624_10414574138721494.wav", + # "data/out_data/me_top500/611752105029951624/611752105029951624_6755399374234747.wav", + # "data/out_data/me_top500/611752105029951624/611752105029951624_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248965/611752105030248965_10414574140317353.wav", + # "data/out_data/me_top500/611752105030248965/611752105030248965_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248965/611752105030248965_5910973794723621.wav", + # "data/out_data/me_top500/611752105030248971/611752105030248971_10414574138721494.wav", + # "data/out_data/me_top500/611752105030248971/611752105030248971_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248971/611752105030248971_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248972/611752105030248972_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248972/611752105030248972_3634463651.wav", + # "data/out_data/me_top500/611752105030248972/611752105030248972_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248973/611752105030248973_10414574138721494.wav", + # "data/out_data/me_top500/611752105030248973/611752105030248973_10414574140317353.wav", + # "data/out_data/me_top500/611752105030248973/611752105030248973_5910973794723621.wav", + # "data/out_data/me_top500/611752105030248974/611752105030248974_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248974/611752105030248974_3634463651.wav", + # "data/out_data/me_top500/611752105030248974/611752105030248974_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248977/611752105030248977_10414574138721494.wav", + # "data/out_data/me_top500/611752105030248977/611752105030248977_3634463651.wav", + # "data/out_data/me_top500/611752105030248977/611752105030248977_6755399374234747.wav", + # 
"data/out_data/me_top500/611752105030248981/611752105030248981_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248981/611752105030248981_5910973794723621.wav", + # "data/out_data/me_top500/611752105030248981/611752105030248981_8162774329368194.wav", + # "data/out_data/me_top500/611752105030248982/611752105030248982_10414574138721494.wav", + # "data/out_data/me_top500/611752105030248982/611752105030248982_10414574140317353.wav", + # "data/out_data/me_top500/611752105030248982/611752105030248982_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248988/611752105030248988_10414574138721494.wav", + # "data/out_data/me_top500/611752105030248988/611752105030248988_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248988/611752105030248988_8162774329368194.wav", + # "data/out_data/me_top500/611752105030248992/611752105030248992_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248992/611752105030248992_6755399374234747.wav", + # "data/out_data/me_top500/611752105030248992/611752105030248992_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248994/611752105030248994_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248994/611752105030248994_3634463651.wav", + # "data/out_data/me_top500/611752105030248994/611752105030248994_8162774327817435.wav", + # "data/out_data/me_top500/611752105030248995/611752105030248995_1688849864840588.wav", + # "data/out_data/me_top500/611752105030248995/611752105030248995_6755399374234747.wav", + # "data/out_data/me_top500/611752105030248995/611752105030248995_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249000/611752105030249000_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249000/611752105030249000_3634463651.wav", + # "data/out_data/me_top500/611752105030249000/611752105030249000_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249001/611752105030249001_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249001/611752105030249001_3634463651.wav", + # "data/out_data/me_top500/611752105030249001/611752105030249001_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249007/611752105030249007_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249007/611752105030249007_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249007/611752105030249007_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249009/611752105030249009_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249009/611752105030249009_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249009/611752105030249009_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249010/611752105030249010_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249010/611752105030249010_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249010/611752105030249010_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249011/611752105030249011_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249011/611752105030249011_3634463651.wav", + # "data/out_data/me_top500/611752105030249011/611752105030249011_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249016/611752105030249016_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249016/611752105030249016_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249016/611752105030249016_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249018/611752105030249018_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249018/611752105030249018_3634463651.wav", + # "data/out_data/me_top500/611752105030249018/611752105030249018_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249019/611752105030249019_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249019/611752105030249019_3634463651.wav", + # "data/out_data/me_top500/611752105030249019/611752105030249019_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249020/611752105030249020_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249020/611752105030249020_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249020/611752105030249020_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249022/611752105030249022_3634463651.wav", + # "data/out_data/me_top500/611752105030249022/611752105030249022_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249022/611752105030249022_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249025/611752105030249025_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249025/611752105030249025_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249025/611752105030249025_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249030/611752105030249030_3634463651.wav", + # "data/out_data/me_top500/611752105030249030/611752105030249030_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249030/611752105030249030_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249031/611752105030249031_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249031/611752105030249031_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249031/611752105030249031_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249032/611752105030249032_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249032/611752105030249032_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249032/611752105030249032_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249034/611752105030249034_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249034/611752105030249034_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249034/611752105030249034_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249035/611752105030249035_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249035/611752105030249035_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249035/611752105030249035_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249036/611752105030249036_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249036/611752105030249036_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249036/611752105030249036_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249037/611752105030249037_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249037/611752105030249037_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249037/611752105030249037_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249038/611752105030249038_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249038/611752105030249038_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249038/611752105030249038_6755399374234747.wav", + # 
"data/out_data/me_top500/611752105030249040/611752105030249040_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249040/611752105030249040_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249040/611752105030249040_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249041/611752105030249041_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249041/611752105030249041_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249041/611752105030249041_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249048/611752105030249048_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249048/611752105030249048_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249048/611752105030249048_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249049/611752105030249049_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249049/611752105030249049_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249049/611752105030249049_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249052/611752105030249052_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249052/611752105030249052_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249052/611752105030249052_3634463651.wav", + # "data/out_data/me_top500/611752105030249053/611752105030249053_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249053/611752105030249053_3634463651.wav", + # "data/out_data/me_top500/611752105030249053/611752105030249053_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249055/611752105030249055_3634463651.wav", + # "data/out_data/me_top500/611752105030249055/611752105030249055_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249055/611752105030249055_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249057/611752105030249057_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249057/611752105030249057_3634463651.wav", + # "data/out_data/me_top500/611752105030249057/611752105030249057_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249058/611752105030249058_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249058/611752105030249058_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249058/611752105030249058_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249065/611752105030249065_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249065/611752105030249065_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249065/611752105030249065_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249067/611752105030249067_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249067/611752105030249067_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249067/611752105030249067_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249070/611752105030249070_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249070/611752105030249070_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249070/611752105030249070_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249071/611752105030249071_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249071/611752105030249071_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249071/611752105030249071_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249073/611752105030249073_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249073/611752105030249073_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249073/611752105030249073_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249074/611752105030249074_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249074/611752105030249074_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249074/611752105030249074_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249077/611752105030249077_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249077/611752105030249077_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249077/611752105030249077_3634463651.wav", + # "data/out_data/me_top500/611752105030249079/611752105030249079_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249079/611752105030249079_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249079/611752105030249079_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249082/611752105030249082_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249082/611752105030249082_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249082/611752105030249082_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249091/611752105030249091_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249091/611752105030249091_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249091/611752105030249091_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249094/611752105030249094_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249094/611752105030249094_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249094/611752105030249094_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249099/611752105030249099_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249099/611752105030249099_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249099/611752105030249099_3634463651.wav", + # "data/out_data/me_top500/611752105030249104/611752105030249104_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249104/611752105030249104_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249104/611752105030249104_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249105/611752105030249105_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249105/611752105030249105_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249105/611752105030249105_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249111/611752105030249111_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249111/611752105030249111_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249111/611752105030249111_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249112/611752105030249112_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249112/611752105030249112_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249112/611752105030249112_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249113/611752105030249113_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249113/611752105030249113_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249113/611752105030249113_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249118/611752105030249118_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249118/611752105030249118_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249118/611752105030249118_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249121/611752105030249121_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249121/611752105030249121_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249121/611752105030249121_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249127/611752105030249127_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249127/611752105030249127_3634463651.wav", + # "data/out_data/me_top500/611752105030249127/611752105030249127_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249128/611752105030249128_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249128/611752105030249128_3634463651.wav", + # "data/out_data/me_top500/611752105030249128/611752105030249128_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249133/611752105030249133_3634463651.wav", + # "data/out_data/me_top500/611752105030249133/611752105030249133_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249133/611752105030249133_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249134/611752105030249134_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249134/611752105030249134_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249134/611752105030249134_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249136/611752105030249136_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249136/611752105030249136_3634463651.wav", + # "data/out_data/me_top500/611752105030249136/611752105030249136_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249143/611752105030249143_3634463651.wav", + # "data/out_data/me_top500/611752105030249143/611752105030249143_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249143/611752105030249143_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249148/611752105030249148_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249148/611752105030249148_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249148/611752105030249148_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249153/611752105030249153_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249153/611752105030249153_3634463651.wav", + # "data/out_data/me_top500/611752105030249153/611752105030249153_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249157/611752105030249157_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249157/611752105030249157_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249157/611752105030249157_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249160/611752105030249160_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249160/611752105030249160_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249160/611752105030249160_3634463651.wav", + # "data/out_data/me_top500/611752105030249161/611752105030249161_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249161/611752105030249161_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249161/611752105030249161_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249162/611752105030249162_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249162/611752105030249162_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249162/611752105030249162_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249163/611752105030249163_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249163/611752105030249163_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249163/611752105030249163_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249171/611752105030249171_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249171/611752105030249171_3634463651.wav", + # "data/out_data/me_top500/611752105030249171/611752105030249171_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249173/611752105030249173_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249173/611752105030249173_3634463651.wav", + # "data/out_data/me_top500/611752105030249173/611752105030249173_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249174/611752105030249174_3634463651.wav", + # "data/out_data/me_top500/611752105030249174/611752105030249174_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249174/611752105030249174_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249175/611752105030249175_3634463651.wav", + # "data/out_data/me_top500/611752105030249175/611752105030249175_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249175/611752105030249175_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249176/611752105030249176_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249176/611752105030249176_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249176/611752105030249176_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249177/611752105030249177_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249177/611752105030249177_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249177/611752105030249177_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249178/611752105030249178_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249178/611752105030249178_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249178/611752105030249178_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249181/611752105030249181_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249181/611752105030249181_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249181/611752105030249181_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249191/611752105030249191_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249191/611752105030249191_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249191/611752105030249191_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249195/611752105030249195_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249195/611752105030249195_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249195/611752105030249195_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249200/611752105030249200_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249200/611752105030249200_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249200/611752105030249200_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249201/611752105030249201_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249201/611752105030249201_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249201/611752105030249201_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249206/611752105030249206_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249206/611752105030249206_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249206/611752105030249206_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249209/611752105030249209_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249209/611752105030249209_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249209/611752105030249209_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249211/611752105030249211_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249211/611752105030249211_3634463651.wav", + # "data/out_data/me_top500/611752105030249211/611752105030249211_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249213/611752105030249213_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249213/611752105030249213_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249213/611752105030249213_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249216/611752105030249216_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249216/611752105030249216_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249216/611752105030249216_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249218/611752105030249218_3634463651.wav", + # "data/out_data/me_top500/611752105030249218/611752105030249218_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249218/611752105030249218_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249224/611752105030249224_3634463651.wav", + # "data/out_data/me_top500/611752105030249224/611752105030249224_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249224/611752105030249224_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249227/611752105030249227_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249227/611752105030249227_3634463651.wav", + # "data/out_data/me_top500/611752105030249227/611752105030249227_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249233/611752105030249233_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249233/611752105030249233_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249233/611752105030249233_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249237/611752105030249237_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249237/611752105030249237_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249237/611752105030249237_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249240/611752105030249240_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249240/611752105030249240_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249240/611752105030249240_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249243/611752105030249243_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249243/611752105030249243_3634463651.wav", + # "data/out_data/me_top500/611752105030249243/611752105030249243_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249244/611752105030249244_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249244/611752105030249244_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249244/611752105030249244_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249245/611752105030249245_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249245/611752105030249245_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249245/611752105030249245_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249250/611752105030249250_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249250/611752105030249250_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249250/611752105030249250_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249255/611752105030249255_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249255/611752105030249255_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249255/611752105030249255_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249258/611752105030249258_3634463651.wav", + # "data/out_data/me_top500/611752105030249258/611752105030249258_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249258/611752105030249258_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249264/611752105030249264_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249264/611752105030249264_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249264/611752105030249264_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249267/611752105030249267_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249267/611752105030249267_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249267/611752105030249267_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249273/611752105030249273_3634463651.wav", + # "data/out_data/me_top500/611752105030249273/611752105030249273_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249273/611752105030249273_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249275/611752105030249275_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249275/611752105030249275_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249275/611752105030249275_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249278/611752105030249278_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249278/611752105030249278_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249278/611752105030249278_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249280/611752105030249280_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249280/611752105030249280_3634463651.wav", + # "data/out_data/me_top500/611752105030249280/611752105030249280_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249281/611752105030249281_3634463651.wav", + # "data/out_data/me_top500/611752105030249281/611752105030249281_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249281/611752105030249281_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249282/611752105030249282_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249282/611752105030249282_3634463651.wav", + # "data/out_data/me_top500/611752105030249282/611752105030249282_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249283/611752105030249283_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249283/611752105030249283_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249283/611752105030249283_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249284/611752105030249284_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249284/611752105030249284_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249284/611752105030249284_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249287/611752105030249287_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249287/611752105030249287_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249287/611752105030249287_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249288/611752105030249288_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249288/611752105030249288_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249288/611752105030249288_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249289/611752105030249289_3634463651.wav", + # "data/out_data/me_top500/611752105030249289/611752105030249289_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249289/611752105030249289_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249292/611752105030249292_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249292/611752105030249292_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249292/611752105030249292_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249293/611752105030249293_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249293/611752105030249293_3634463651.wav", + # "data/out_data/me_top500/611752105030249293/611752105030249293_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249295/611752105030249295_3634463651.wav", + # "data/out_data/me_top500/611752105030249295/611752105030249295_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249295/611752105030249295_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249296/611752105030249296_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249296/611752105030249296_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249296/611752105030249296_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249299/611752105030249299_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249299/611752105030249299_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249299/611752105030249299_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249302/611752105030249302_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249302/611752105030249302_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249302/611752105030249302_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249307/611752105030249307_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249307/611752105030249307_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249307/611752105030249307_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249309/611752105030249309_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249309/611752105030249309_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249309/611752105030249309_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249318/611752105030249318_3634463651.wav", + # "data/out_data/me_top500/611752105030249318/611752105030249318_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249318/611752105030249318_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249319/611752105030249319_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249319/611752105030249319_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249319/611752105030249319_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249320/611752105030249320_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249320/611752105030249320_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249320/611752105030249320_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249321/611752105030249321_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249321/611752105030249321_3634463651.wav", + # "data/out_data/me_top500/611752105030249321/611752105030249321_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249322/611752105030249322_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249322/611752105030249322_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249322/611752105030249322_3634463651.wav", + # "data/out_data/me_top500/611752105030249323/611752105030249323_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249323/611752105030249323_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249323/611752105030249323_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249324/611752105030249324_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249324/611752105030249324_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249324/611752105030249324_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249325/611752105030249325_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249325/611752105030249325_3634463651.wav", + # "data/out_data/me_top500/611752105030249325/611752105030249325_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249327/611752105030249327_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249327/611752105030249327_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249327/611752105030249327_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249329/611752105030249329_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249329/611752105030249329_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249329/611752105030249329_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249330/611752105030249330_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249330/611752105030249330_3634463651.wav", + # "data/out_data/me_top500/611752105030249330/611752105030249330_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249332/611752105030249332_3634463651.wav", + # "data/out_data/me_top500/611752105030249332/611752105030249332_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249332/611752105030249332_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249333/611752105030249333_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249333/611752105030249333_3634463651.wav", + # "data/out_data/me_top500/611752105030249333/611752105030249333_5910973794723621.wav", + # 
"data/out_data/me_top500/611752105030249334/611752105030249334_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249334/611752105030249334_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249334/611752105030249334_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249336/611752105030249336_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249336/611752105030249336_3634463651.wav", + # "data/out_data/me_top500/611752105030249336/611752105030249336_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249337/611752105030249337_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249337/611752105030249337_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249337/611752105030249337_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249338/611752105030249338_3634463651.wav", + # "data/out_data/me_top500/611752105030249338/611752105030249338_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249338/611752105030249338_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249339/611752105030249339_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249339/611752105030249339_3634463651.wav", + # "data/out_data/me_top500/611752105030249339/611752105030249339_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249340/611752105030249340_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249340/611752105030249340_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249340/611752105030249340_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249341/611752105030249341_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249341/611752105030249341_3634463651.wav", + # "data/out_data/me_top500/611752105030249341/611752105030249341_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249342/611752105030249342_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249342/611752105030249342_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249342/611752105030249342_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249343/611752105030249343_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249343/611752105030249343_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249343/611752105030249343_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249345/611752105030249345_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249345/611752105030249345_3634463651.wav", + # "data/out_data/me_top500/611752105030249345/611752105030249345_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249346/611752105030249346_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249346/611752105030249346_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249346/611752105030249346_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249347/611752105030249347_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249347/611752105030249347_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249347/611752105030249347_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249348/611752105030249348_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249348/611752105030249348_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249348/611752105030249348_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249349/611752105030249349_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249349/611752105030249349_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249349/611752105030249349_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249350/611752105030249350_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249350/611752105030249350_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249350/611752105030249350_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249352/611752105030249352_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249352/611752105030249352_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249352/611752105030249352_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249353/611752105030249353_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249353/611752105030249353_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249353/611752105030249353_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249354/611752105030249354_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249354/611752105030249354_3634463651.wav", + # "data/out_data/me_top500/611752105030249354/611752105030249354_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249355/611752105030249355_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249355/611752105030249355_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249355/611752105030249355_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249356/611752105030249356_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249356/611752105030249356_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249356/611752105030249356_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249357/611752105030249357_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249357/611752105030249357_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249357/611752105030249357_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249358/611752105030249358_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249358/611752105030249358_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249358/611752105030249358_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249359/611752105030249359_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249359/611752105030249359_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249359/611752105030249359_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249361/611752105030249361_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249361/611752105030249361_3634463651.wav", + # "data/out_data/me_top500/611752105030249361/611752105030249361_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249362/611752105030249362_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249362/611752105030249362_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249362/611752105030249362_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249363/611752105030249363_3634463651.wav", + # "data/out_data/me_top500/611752105030249363/611752105030249363_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249363/611752105030249363_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249364/611752105030249364_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249364/611752105030249364_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249364/611752105030249364_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249365/611752105030249365_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249365/611752105030249365_3634463651.wav", + # "data/out_data/me_top500/611752105030249365/611752105030249365_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249366/611752105030249366_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249366/611752105030249366_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249366/611752105030249366_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249367/611752105030249367_3634463651.wav", + # "data/out_data/me_top500/611752105030249367/611752105030249367_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249367/611752105030249367_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249368/611752105030249368_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249368/611752105030249368_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249368/611752105030249368_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249369/611752105030249369_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249369/611752105030249369_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249369/611752105030249369_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249370/611752105030249370_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249370/611752105030249370_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249370/611752105030249370_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249371/611752105030249371_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249371/611752105030249371_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249371/611752105030249371_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249372/611752105030249372_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249372/611752105030249372_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249372/611752105030249372_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249373/611752105030249373_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249373/611752105030249373_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249373/611752105030249373_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249374/611752105030249374_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249374/611752105030249374_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249374/611752105030249374_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249375/611752105030249375_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249375/611752105030249375_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249375/611752105030249375_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249377/611752105030249377_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249377/611752105030249377_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249377/611752105030249377_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030249378/611752105030249378_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249378/611752105030249378_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249378/611752105030249378_3634463651.wav", + # "data/out_data/me_top500/611752105030249379/611752105030249379_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249379/611752105030249379_3634463651.wav", + # "data/out_data/me_top500/611752105030249379/611752105030249379_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249381/611752105030249381_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249381/611752105030249381_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249381/611752105030249381_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249383/611752105030249383_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249383/611752105030249383_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249383/611752105030249383_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249384/611752105030249384_3634463651.wav", + # "data/out_data/me_top500/611752105030249384/611752105030249384_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249384/611752105030249384_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249385/611752105030249385_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249385/611752105030249385_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249385/611752105030249385_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249386/611752105030249386_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249386/611752105030249386_3634463651.wav", + # "data/out_data/me_top500/611752105030249386/611752105030249386_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249387/611752105030249387_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249387/611752105030249387_3634463651.wav", + # "data/out_data/me_top500/611752105030249387/611752105030249387_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249388/611752105030249388_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249388/611752105030249388_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249388/611752105030249388_3634463651.wav", + # "data/out_data/me_top500/611752105030249390/611752105030249390_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249390/611752105030249390_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249390/611752105030249390_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249391/611752105030249391_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249391/611752105030249391_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249391/611752105030249391_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249392/611752105030249392_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249392/611752105030249392_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249392/611752105030249392_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249393/611752105030249393_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249393/611752105030249393_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249393/611752105030249393_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249394/611752105030249394_3634463651.wav", + # "data/out_data/me_top500/611752105030249394/611752105030249394_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249394/611752105030249394_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249395/611752105030249395_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249395/611752105030249395_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249395/611752105030249395_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249396/611752105030249396_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249396/611752105030249396_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249396/611752105030249396_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249397/611752105030249397_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249397/611752105030249397_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249397/611752105030249397_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249398/611752105030249398_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249398/611752105030249398_3634463651.wav", + # "data/out_data/me_top500/611752105030249398/611752105030249398_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249399/611752105030249399_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249399/611752105030249399_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249399/611752105030249399_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249401/611752105030249401_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249401/611752105030249401_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249401/611752105030249401_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249402/611752105030249402_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249402/611752105030249402_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249402/611752105030249402_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249403/611752105030249403_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249403/611752105030249403_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249403/611752105030249403_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249404/611752105030249404_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249404/611752105030249404_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249404/611752105030249404_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249405/611752105030249405_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249405/611752105030249405_3634463651.wav", + # "data/out_data/me_top500/611752105030249405/611752105030249405_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249406/611752105030249406_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249406/611752105030249406_3634463651.wav", + # "data/out_data/me_top500/611752105030249406/611752105030249406_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249407/611752105030249407_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249407/611752105030249407_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249407/611752105030249407_8162774327817435.wav", + # 
"data/out_data/me_top500/611752105030249408/611752105030249408_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249408/611752105030249408_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249408/611752105030249408_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249409/611752105030249409_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249409/611752105030249409_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249409/611752105030249409_8162774327817435.wav", + # "data/out_data/me_top500/611752105030249410/611752105030249410_3634463651.wav", + # "data/out_data/me_top500/611752105030249410/611752105030249410_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249410/611752105030249410_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249412/611752105030249412_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249412/611752105030249412_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249412/611752105030249412_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249413/611752105030249413_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249413/611752105030249413_3634463651.wav", + # "data/out_data/me_top500/611752105030249413/611752105030249413_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249414/611752105030249414_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249414/611752105030249414_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249414/611752105030249414_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249415/611752105030249415_3634463651.wav", + # "data/out_data/me_top500/611752105030249415/611752105030249415_5910973794723621.wav", + # "data/out_data/me_top500/611752105030249415/611752105030249415_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249416/611752105030249416_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249416/611752105030249416_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249416/611752105030249416_3634463651.wav", + # "data/out_data/me_top500/611752105030249417/611752105030249417_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249417/611752105030249417_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249417/611752105030249417_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249418/611752105030249418_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249418/611752105030249418_3634463651.wav", + # "data/out_data/me_top500/611752105030249418/611752105030249418_8162774329368194.wav", + # "data/out_data/me_top500/611752105030249419/611752105030249419_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249419/611752105030249419_3634463651.wav", + # "data/out_data/me_top500/611752105030249419/611752105030249419_5629499489839033.wav", + # "data/out_data/me_top500/611752105030249420/611752105030249420_10414574138721494.wav", + # "data/out_data/me_top500/611752105030249420/611752105030249420_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249420/611752105030249420_6755399374234747.wav", + # "data/out_data/me_top500/611752105030249431/611752105030249431_10414574140317353.wav", + # "data/out_data/me_top500/611752105030249431/611752105030249431_1688849864840588.wav", + # "data/out_data/me_top500/611752105030249431/611752105030249431_3634463651.wav", + # 
"data/out_data/me_top500/611752105030250690/611752105030250690_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250690/611752105030250690_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250690/611752105030250690_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250691/611752105030250691_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250691/611752105030250691_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250691/611752105030250691_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250695/611752105030250695_3634463651.wav", + # "data/out_data/me_top500/611752105030250695/611752105030250695_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250695/611752105030250695_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250698/611752105030250698_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250698/611752105030250698_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250698/611752105030250698_5910973794723621.wav", + # "data/out_data/me_top500/611752105030250699/611752105030250699_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250699/611752105030250699_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250699/611752105030250699_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250701/611752105030250701_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250701/611752105030250701_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250701/611752105030250701_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250702/611752105030250702_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250702/611752105030250702_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250702/611752105030250702_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250704/611752105030250704_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250704/611752105030250704_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250704/611752105030250704_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250711/611752105030250711_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250711/611752105030250711_3634463651.wav", + # "data/out_data/me_top500/611752105030250711/611752105030250711_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250715/611752105030250715_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250715/611752105030250715_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250715/611752105030250715_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250716/611752105030250716_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250716/611752105030250716_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250716/611752105030250716_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250717/611752105030250717_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250717/611752105030250717_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250717/611752105030250717_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250718/611752105030250718_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250718/611752105030250718_3634463651.wav", + # "data/out_data/me_top500/611752105030250718/611752105030250718_5629499489839033.wav", + # 
"data/out_data/me_top500/611752105030250720/611752105030250720_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250720/611752105030250720_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250720/611752105030250720_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250721/611752105030250721_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250721/611752105030250721_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250721/611752105030250721_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250725/611752105030250725_5910973794723621.wav", + # "data/out_data/me_top500/611752105030250725/611752105030250725_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250725/611752105030250725_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250726/611752105030250726_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250726/611752105030250726_3634463651.wav", + # "data/out_data/me_top500/611752105030250726/611752105030250726_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250728/611752105030250728_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250728/611752105030250728_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250728/611752105030250728_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250729/611752105030250729_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250729/611752105030250729_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250729/611752105030250729_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250730/611752105030250730_3634463651.wav", + # "data/out_data/me_top500/611752105030250730/611752105030250730_5910973794723621.wav", + # "data/out_data/me_top500/611752105030250730/611752105030250730_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250732/611752105030250732_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250732/611752105030250732_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250732/611752105030250732_3634463651.wav", + # "data/out_data/me_top500/611752105030250733/611752105030250733_3634463651.wav", + # "data/out_data/me_top500/611752105030250733/611752105030250733_8162774327817435.wav", + # "data/out_data/me_top500/611752105030250733/611752105030250733_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250735/611752105030250735_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250735/611752105030250735_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250735/611752105030250735_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250736/611752105030250736_10414574140317353.wav", + # "data/out_data/me_top500/611752105030250736/611752105030250736_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250736/611752105030250736_8162774329368194.wav", + # "data/out_data/me_top500/611752105030250739/611752105030250739_10414574138721494.wav", + # "data/out_data/me_top500/611752105030250739/611752105030250739_1688849864840588.wav", + # "data/out_data/me_top500/611752105030250739/611752105030250739_5910973794723621.wav", + # "data/out_data/me_top500/611752105030250741/611752105030250741_3634463651.wav", + # "data/out_data/me_top500/611752105030250741/611752105030250741_6755399374234747.wav", + # "data/out_data/me_top500/611752105030250741/611752105030250741_8162774329368194.wav", + # 
"data/out_data/me_top500/611752105030250743/611752105030250743_3634463651.wav", + # "data/out_data/me_top500/611752105030250743/611752105030250743_5629499489839033.wav", + # "data/out_data/me_top500/611752105030250743/611752105030250743_5910973794723621.wav" + # ] + # input_wavs_volume = [ + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/90/90_dev.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/91/91_dev.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/92/92_dev.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/93/93_dev.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/94/94_dev.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/96/96_dev.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/97/97_dev.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/99/99_dev.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/9/9_dev.wav", + # ] + # + # vocals = [ + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/90/vocal.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/91/vocal.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/92/vocal.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/93/vocal.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/94/vocal.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/96/vocal.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/97/vocal.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/99/vocal.wav", + # "/data/rsync/jianli.yang/AutoCoverTool/data/inf_users/youtube_me_100/9/vocal.wav" + # ] + + # for in_f, in_v_f, v_f in zip(input_wavs, input_wavs_volume, vocals): + # for i in range(len(input_wavs)): + # if input_wavs[i] in old_input_wavs: + # continue + # input_wavs[i] = os.path.join("/data/rsync/jianli.yang/AutoCoverTool", input_wavs[i]) + # in_f = input_wavs[i] + # in_v_f = input_wavs[i] + # v_f = "/".join(input_wavs[i].replace("out_data", "inf_users").split("/")[:-1]) + "/vocal.wav" + # st = time.time() + # re.process(in_f, in_v_f, v_f) + # print("sp={}".format(time.time() - st)) + # split_vocal2fragment("/data/rsync/jianli.yang/AutoCoverTool/data/out_data/youtube_me_100/94/94_3634463651.wav") diff --git a/AutoCoverTool/ref/split_dirty_frame/split_dirty_frame.py b/AutoCoverTool/ref/split_dirty_frame/split_dirty_frame.py new file mode 100644 index 0000000..4ab89f4 --- /dev/null +++ b/AutoCoverTool/ref/split_dirty_frame/split_dirty_frame.py @@ -0,0 +1,87 @@ +""" +切割出有问题的段 +1. 载入音频 +2. 分帧,采样率44100,帧长2048,帧移1024, 23ms一帧 +3. 
Aggregate statistics over every 11 frames as the result for the middle frame, and print each frame's mean and standard deviation
+"""
+import librosa
+import numpy as np
+import matplotlib.pyplot as plt
+
+
+def tm2sec(tm):
+    """
+    Convert "min:sec.xxx" to seconds
+    :param tm:
+    :return:
+    """
+    tm_arr = str(tm).split(":")
+    return int(int(tm_arr[0]) * 60) + float(tm_arr[1])
+
+
+def load_data():
+    label_txt = "/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/AutoCoverTool/resource/test1/test6/top_100/example/example.txt"
+    # filename => [[st, end, label]]
+    msg_dict = {}
+    with open(label_txt) as f:
+        lines = f.readlines()
+        for line in lines:
+            line = line.strip().split(",")
+            if len(line) != 4:
+                continue
+            filename = line[0]
+            tp = line[1]
+            st = tm2sec(line[2])
+            ed = tm2sec(line[3])
+            if filename not in msg_dict.keys():
+                msg_dict[filename] = []
+            msg_dict[filename].append([st, ed, tp])
+    return msg_dict
+
+
+def get_feature(path):
+    data, sr = librosa.load(path, sr=44100, mono=True)
+    stft_data = np.abs(librosa.stft(data, win_length=2048, hop_length=1024))
+    return stft_data.transpose()
+
+
+def process(path):
+    msg_dict = load_data()
+    msg = msg_dict["611752105020942848_10414574140317353"]
+    data = get_feature(path)
+    frame_ms = 1024 / 44100  # hop duration in seconds, despite the *_ms name
+    st_ms = frame_ms * 5
+
+    normal_data = []
+    color_data = []
+    for i in range(5, len(data) - 6):
+        cur_data = data[i - 5:i + 6]
+        tm = round(st_ms, 2)
+        mean = round(np.mean(np.mean(cur_data, axis=1)), 4)
+        std = round(np.mean(np.std(cur_data, axis=1)), 4)
+        power = np.sum(cur_data)
+        st_ms += frame_ms
+        color = 'black'
+        for idx in range(len(msg)):
+            st = msg[idx][0]
+            ed = msg[idx][1]
+            # inside a labeled interval
+            if st <= st_ms <= ed:
+                color = "red"
+                break
+            # intervals are sorted: once an interval starts after the current time, searching further is pointless
+            if st > st_ms:
+                break
+
+        normal_data.append([float(tm), float(mean), float(std), float(power)])
+        color_data.append(color)
+    normal_data = np.array(normal_data)
+    color_data = np.array(color_data)
+    print(normal_data.shape)
+    plt.scatter(normal_data[::2, 0], normal_data[::2, 3], c=color_data[::2])
+    plt.show()
+
+
+if __name__ == '__main__':
+    pp = "/Users/yangjianli/starmaker-work/research/tmp_code/SVC方案调研/prod/AutoCoverTool/resource/test1/test6/top_100/example/611752105020942848/611752105020942848_10414574140317353.wav"
+    process(pp)
diff --git a/AutoCoverTool/ref/split_dirty_frame/train.py b/AutoCoverTool/ref/split_dirty_frame/train.py
new file mode 100644
index 0000000..582ae81
--- /dev/null
+++ b/AutoCoverTool/ref/split_dirty_frame/train.py
@@ -0,0 +1,142 @@
+from dataset.dataset import *
+from models.model import *
+
+import torch.nn as nn
+import torch
+import torch.nn.functional as functional
+from tqdm import tqdm
+import os
+import sys
+from torch.optim.lr_scheduler import MultiStepLR
+import time
+from torch.utils.data import DataLoader
+import torch.utils.data as data
+
+# Common configuration
+BatchSize = 32
+ThreadNum = 8
+# Training hyperparameters
+MaxEpoch = 200
+LR = 1e-3
+Momentum = 0
+WeightDecay = 0
+
+Milestones = [20, 30, 50, 100]
+Gamma = 0.1
+
+
+def get_dataloader(root):
+    train_set = CustomDataset(root, "train")
+    train_loader = DataLoader(train_set, batch_size=BatchSize, shuffle=True, num_workers=ThreadNum)
+
+    val_set = CustomDataset(root, "val")
+    val_loader = DataLoader(val_set, batch_size=BatchSize, shuffle=False, num_workers=ThreadNum)
+
+    return train_loader, val_loader
+
+
+def train_one_epoch(model, device, loader, optimizer, criterion):
+    model.train()
+
+    total_num = 0
+    total_loss = 0
+    correct = 0
+
+    for images, labels in tqdm(loader):
+        batch_size = images.size(0)
+        images = images.to(device)
+        labels = labels.to(device)
+
+        predicts = model(images)
+
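+        # Standard supervised step: the forward pass above produced the logits;
+        # zero the stale gradients, compute the loss, backpropagate, and update.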
+        optimizer.zero_grad()
+        loss = criterion(predicts, labels)
+        loss.backward()
+        optimizer.step()
+
+        total_num += batch_size
+        total_loss += loss.item() * batch_size
+
+        _, predicts = predicts.max(dim=1)
+        correct += predicts.eq(labels).sum().item()
+
+    if total_num != 0:
+        total_loss = total_loss / total_num
+        correct = correct / total_num
+
+    return total_loss, correct
+
+
+def val_one_epoch(model, device, loader, criterion):
+    model.eval()
+
+    total_num = 0
+    total_loss = 0
+    correct = 0
+
+    with torch.no_grad():
+        for images, labels in loader:
+            batch_size = images.size(0)
+            images = images.to(device)
+            labels = labels.to(device)
+            predicts = model(images)
+
+            loss = criterion(predicts, labels)
+
+            total_num += batch_size
+            total_loss += loss.item() * batch_size
+
+            _, predicts = predicts.max(dim=1)
+            correct += predicts.eq(labels).sum().item()
+
+    if total_num != 0:
+        total_loss = total_loss / total_num
+        correct = correct / total_num
+
+    return total_loss, correct
+
+
+def train():
+    set_dir = "/data/rsync/jianli.yang/AutoCoverTool/data/dataset_dev"
+    device = 'cuda' if torch.cuda.is_available() else 'cpu'
+    model = get_cur_model()
+    model.to(device)
+
+    # Checkpoint directory
+    save_directory = "output_v5_3_4"
+    if not os.path.exists(save_directory):
+        os.makedirs(save_directory)
+
+    optimizer = torch.optim.SGD(model.parameters(), lr=LR, momentum=Momentum, weight_decay=WeightDecay)
+    # optimizer = torch.optim.Adam(model.parameters(), lr=LR)
+    criterion = nn.CrossEntropyLoss()
+    scheduler = MultiStepLR(optimizer, Milestones, Gamma)
+
+    # Data loaders
+    train_loader, val_loader = get_dataloader(set_dir)
+
+    max_acc = 0
+    for i in range(MaxEpoch):
+        start = time.time()
+        t_loss, t_acc = train_one_epoch(model, device, train_loader, optimizer, criterion)
+        v_loss, v_acc = val_one_epoch(model, device, val_loader, criterion)
+        end = time.time()
+
+        scheduler.step(i)
+
+        msg = 't_loss:%f\tt_acc:%.2f' % (t_loss, t_acc * 100)
+        msg += '\tv_loss:%f\tv_acc:%.2f' % (v_loss, v_acc * 100)
+        msg += '\ttime:%f\tepoch:%d' % (end - start, i)
+        print(msg)
+
+        params = model.state_dict()
+        save_path = os.path.join(save_directory, 'epoch_' + str(i) + '_' + str(v_acc) + '.pth')
+        torch.save(params, save_path)
+
+        max_acc = max(max_acc, v_acc)
+
+    print('best val acc:', max_acc)
+
+
+if __name__ == '__main__':
+    train()
diff --git a/AutoCoverTool/ref/tools/mixer/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/CMakeLists.txt
new file mode 100644
index 0000000..1be8553
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/CMakeLists.txt
@@ -0,0 +1,116 @@
+cmake_minimum_required(VERSION 2.8)
+project(mixer)
+
+set(LIBRARY_OUTPUT_PATH ${PROJECT_SOURCE_DIR}/lib) # directory the built libs are written to
+set(CMAKE_CXX_STANDARD 11)
+
+include_directories(alimter/inc)
+include_directories(waves/inc)
+include_directories(ebur128/inc)
+include_directories(audio_mixer/inc)
+include_directories(audio_effects_lib/inc audio_effects_lib/example)
+include_directories(denoise/webrtc/include)
+add_subdirectory(denoise)
+
+# Pull in audio_effects_lib
+include_directories(audio_effects_lib)
+include_directories(audio_effects_lib/src)
+include_directories(audio_effects_lib/inc)
+include_directories(audio_effects_lib/common)
+include_directories(audio_effects_lib/ref)
+include_directories(audio_effects_lib/ref/al_reverb/inc)
+include_directories(audio_effects_lib/ref/al_reverb/src)
+include_directories(audio_effects_lib/ref/autotune/inc)
+include_directories(audio_effects_lib/ref/autotune/src)
+include_directories(audio_effects_lib/ref/iir_eq/inc)
+include_directories(audio_effects_lib/ref/iir_eq/src) +include_directories(audio_effects_lib/ref/phonograph/inc) +include_directories(audio_effects_lib/ref/phonograph/src) +include_directories(audio_effects_lib/ref/reverb/inc) +include_directories(audio_effects_lib/ref/reverb/src) +include_directories(audio_effects_lib/ref/saudio_effects/inc) +include_directories(audio_effects_lib/ref/saudio_effects/src) +include_directories(audio_effects_lib/ref/slow_flanging/inc) +include_directories(audio_effects_lib/ref/slow_flanging/src) +include_directories(audio_effects_lib/ref/tone_shift/inc) +include_directories(audio_effects_lib/ref/tone_shift/src) +include_directories(audio_effects_lib/ref/common) + +include_directories(audio_effects_lib/ref/al_reverb/src/biquad_filters) +include_directories(audio_effects_lib/ref/al_reverb/src/fast_delay) +include_directories(audio_effects_lib/ref/al_reverb/src/filter) +include_directories(audio_effects_lib/ref/al_reverb/src/AlReverbApi.cpp) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb_biquad) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb_common) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb_early_reflection) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb_echo) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb_late_allpass) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb_late_lowpass) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb_late_reverb) +include_directories(audio_effects_lib/ref/al_reverb/src/al_reverb_modulation) +include_directories(audio_effects_lib/ref/iir_eq/src/audacious_arma) +include_directories(audio_effects_lib/ref/iir_eq/src/audacious_eq) +include_directories(audio_effects_lib/ref/saudio_effects/src/all_plat audio_effects_lib/ref/saudio_effects/src/audio_effect audio_effects_lib/ref/saudio_effects/src/biquad + audio_effects_lib/ref/saudio_effects/src/buffer audio_effects_lib/ref/saudio_effects/src/damper audio_effects_lib/ref/saudio_effects/src/delay audio_effects_lib/ref/saudio_effects/src/delayi audio_effects_lib/ref/saudio_effects/src/envelope_follower + audio_effects_lib/ref/saudio_effects/src/equalizer audio_effects_lib/ref/saudio_effects/src/reverb audio_effects_lib/ref/saudio_effects/src/simple_delay_effect audio_effects_lib/ref/saudio_effects/src/simple_reverb_effect) +include_directories(audio_effects_lib/ref/tone_shift/src/aa_filter) +include_directories(audio_effects_lib/ref/tone_shift/src/bpm_detect) +include_directories(audio_effects_lib/ref/tone_shift/src/cpu_detect) +include_directories(audio_effects_lib/ref/tone_shift/src/fifo_sample_buffer) +include_directories(audio_effects_lib/ref/tone_shift/src/fir_filter) +include_directories(audio_effects_lib/ref/tone_shift/src/peak_finder) +include_directories(audio_effects_lib/ref/tone_shift/src/rate_transposer) +include_directories(audio_effects_lib/ref/tone_shift/src/sound_touch) +include_directories(audio_effects_lib/ref/tone_shift/src/td_stretch) +include_directories(audio_effects_lib/ref/supersound/inc) +include_directories(audio_effects_lib/ref/supersound/src) +include_directories(audio_effects_lib/ref/supersound/src/common) +include_directories(audio_effects_lib/ref/supersound/src/impulse) +include_directories(audio_effects_lib/ref/supersound/ref) +include_directories(audio_effects_lib/ref/supersound/ref/kiss_fft) + +AUX_SOURCE_DIRECTORY(audio_effects_lib/common 
AE_SRC_COMMON_DIR)
+file(GLOB_RECURSE AE_CPP_SRC_DIR audio_effects_lib/src/*cpp)
+file(GLOB_RECURSE AE_CPP_REF_DIR audio_effects_lib/ref/*cpp)
+file(GLOB_RECURSE AE_C_REF_DIR audio_effects_lib/ref/*c)
+
+include_directories(audio_effects_lib/ref/waves/inc)
+list(REMOVE_ITEM AE_CPP_REF_DIR "${CMAKE_CURRENT_SOURCE_DIR}/audio_effects_lib/ref/audio_resample/src/FfmpegResampler.cpp")
+
+
+AUX_SOURCE_DIRECTORY(alimter/src DIR_ALIMTER_SRCS)
+AUX_SOURCE_DIRECTORY(waves/src DIR_WAVES_SRCS)
+AUX_SOURCE_DIRECTORY(ebur128/src DIR_EBUR128_SRCS)
+AUX_SOURCE_DIRECTORY(audio_mixer/src DIR_AUDIO_MIXER_SRCS)
+
+#add_executable(mixer main.cpp ${DIR_ALIMTER_SRCS} ${DIR_WAVES_SRCS} ${DIR_EBUR128_SRCS} ${DIR_AUDIO_MIXER_SRCS}
+#        ${AE_CPP_SRC_DIR} ${AE_CPP_REF_DIR} ${AE_C_REF_DIR} ${AE_SRC_COMMON_DIR}
+#        audio_effects_lib/example/ae_server/CAeServer.cpp)
+#target_link_libraries(mixer ${LIBRARY_OUTPUT_PATH}/libwebrtc.a -lpthread)
+
+
+# Volume stretching
+add_executable(draw_volume draw_volume.cpp ${DIR_ALIMTER_SRCS} ${DIR_WAVES_SRCS} ${DIR_EBUR128_SRCS} ${DIR_AUDIO_MIXER_SRCS}
+        ${AE_CPP_SRC_DIR} ${AE_CPP_REF_DIR} ${AE_C_REF_DIR} ${AE_SRC_COMMON_DIR}
+        audio_effects_lib/example/ae_server/CAeServer.cpp)
+target_link_libraries(draw_volume ${LIBRARY_OUTPUT_PATH}/libwebrtc.a -lpthread)
+
+# Denoising
+add_executable(denoise_exe denoise.cpp ${DIR_ALIMTER_SRCS} ${DIR_WAVES_SRCS} ${DIR_EBUR128_SRCS} ${DIR_AUDIO_MIXER_SRCS}
+        ${AE_CPP_SRC_DIR} ${AE_CPP_REF_DIR} ${AE_C_REF_DIR} ${AE_SRC_COMMON_DIR}
+        audio_effects_lib/example/ae_server/CAeServer.cpp)
+target_link_libraries(denoise_exe ${LIBRARY_OUTPUT_PATH}/libwebrtc.a -lpthread)
+
+
+# Simple mixing
+add_executable(simple_mixer simple_mixer.cpp ${DIR_ALIMTER_SRCS} ${DIR_WAVES_SRCS} ${DIR_EBUR128_SRCS} ${DIR_AUDIO_MIXER_SRCS}
+        ${AE_CPP_SRC_DIR} ${AE_CPP_REF_DIR} ${AE_C_REF_DIR} ${AE_SRC_COMMON_DIR}
+        audio_effects_lib/example/ae_server/CAeServer.cpp)
+target_link_libraries(simple_mixer ${LIBRARY_OUTPUT_PATH}/libwebrtc.a -lpthread)
+
+# Effects
+add_executable(im_effect_exe im_effect.cpp ${DIR_ALIMTER_SRCS} ${DIR_WAVES_SRCS} ${DIR_EBUR128_SRCS} ${DIR_AUDIO_MIXER_SRCS}
+        ${AE_CPP_SRC_DIR} ${AE_CPP_REF_DIR} ${AE_C_REF_DIR} ${AE_SRC_COMMON_DIR}
+        audio_effects_lib/example/ae_server/CAeServer.cpp)
+target_link_libraries(im_effect_exe ${LIBRARY_OUTPUT_PATH}/libwebrtc.a -lpthread)
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/alimter/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/alimter/CMakeLists.txt
new file mode 100644
index 0000000..9748c4d
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/alimter/CMakeLists.txt
@@ -0,0 +1,3 @@
+include_directories(inc)
+AUX_SOURCE_DIRECTORY(src DIR_ALIMTER_SRCS)
+add_library(alimiter ${DIR_ALIMTER_SRCS})
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/alimter/inc/alimiter.h b/AutoCoverTool/ref/tools/mixer/alimter/inc/alimiter.h
new file mode 100755
index 0000000..8022d39
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/alimter/inc/alimiter.h
@@ -0,0 +1,99 @@
+
+/***************************************************************************
+* email : yijiangyang@tencent.com *
+***************************************************************************/
+
+//+ ----------------------------------------------------+
+//+                    _oo0oo_                          +
+//+                   o8888888o                         +
+//+                   88" . "88                         +
+//+                   (| -_- |)                         +
+//+                   0\  =  /0                         +
+//+                 ___/`---'\___                       +
+//+               .' \\|     |// '.                     +
+//+              / \\|||  :  |||// \                    +
+//+             / _||||| -:- |||||- \                   +
+//+            |   | \\\  -  /// |   |                  +
+//+            | \_|  ''\---/''  |_/ |                  +
+//+            \  .-\__  '-'  ___/-. /                  +
+//+          ___'. .'  /--.--\  `. .'___                +
+//+       ."" '<  `.___\_<|>_/___.' >' "".             +
+//+      | | :  `- \`.;`\ _ /`;.`/ - ` : | |           +
+//+      \  \ `_.   \_ __\ /__ _/   .-` /  /           +
+//+  =====`-.____`.___ \_____/___.-`___.-'=====        +
+//+                    `=---='                         +
+//+                                                    +
+//+                                                    +
+//+      ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~   +
+//+                                                    +
+//+          Buddha bless us: no bugs, ever            +
+//+ ----------------------------------------------------+
+
+// Port of the FFmpeg limiter; it is friendly to the spectrum but limits quite aggressively
+
+#ifndef __ALIMITER_H__
+#define __ALIMITER_H__
+
+#include <stdint.h>
+#define ERROR_SUPERSOUND_SUCCESS 0
+#define ERROR_SUPERSOUND_PARAM -1
+#define ERROR_SUPERSOUND_MEMORY -2
+typedef struct AudioLimiterContext
+{
+    float limit;
+    float attack;
+    float release;
+    float att;
+    float level_in;
+    float level_out;
+    int32_t auto_release;
+    int32_t auto_level;
+    float asc;
+    int32_t asc_c;
+    int32_t asc_pos;
+    float asc_coeff;
+
+    float *buffer;
+    int32_t buffer_size;
+    int32_t buffer_max_size;
+    int32_t pos;
+    int32_t *nextpos;
+    float *nextdelta;
+
+    float delta;
+    int32_t nextiter;
+    int32_t nextlen;
+    int32_t asc_changed;
+}AudioLimiterContext;
+
+namespace SUPERSOUND
+{
+
+
+class Alimiter
+{
+public:
+    Alimiter();
+    ~Alimiter();
+
+public:
+    void Flush();
+    int32_t GetLatecy();
+    int32_t SetParam(int32_t fs, int32_t channels);
+    void Filter(float * input, float * output, int32_t num);
+
+private:
+    void Uninit();
+    int32_t config_input();
+    float get_rdelta(AudioLimiterContext *s, float release, int sample_rate, float peak, float limit, float patt, int asc);
+
+private:
+    AudioLimiterContext m_alimiterCtx;
+    int m_nChannels;
+    int m_nFs;
+};
+
+
+}
+
+#endif /* __ALIMITER_H__ */
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/alimter/src/alimiter.cpp b/AutoCoverTool/ref/tools/mixer/alimter/src/alimiter.cpp
new file mode 100755
index 0000000..abbd622
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/alimter/src/alimiter.cpp
@@ -0,0 +1,306 @@
+
+#include "alimiter.h"
+#include <math.h>
+#include <string.h>
+#include <stdlib.h>
+#include <new>
+
+#define MAX(a,b) (((a) > (b)) ? (a) : (b))
+#define MIN(a,b) (((a) < (b)) ?
(a) : (b)) +#define MIDDLE(x, y, z) ((x)<(y)?((y)<(z)?(y):(x)<(z)?(z):(x)):((y)>(z)?(y):(x)>(z)?(z):(x))) +#define SAFE_DELETE_PTR(ptr) \ +{ \ + if(ptr) \ + { \ + delete [] ptr; \ + ptr = NULL; \ + } \ +} + +namespace SUPERSOUND +{ + + +Alimiter::Alimiter() +{ + memset(&m_alimiterCtx, 0, sizeof(m_alimiterCtx)); + + m_nChannels = 0; + m_nFs = 0; + + Flush(); +} + +Alimiter::~Alimiter() +{ + Uninit(); +} + +void Alimiter::Flush() +{ + float * buffer = m_alimiterCtx.buffer; + float * nextdelta = m_alimiterCtx.nextdelta; + int32_t * nextpos = m_alimiterCtx.nextpos; + int32_t buffer_max_size = m_alimiterCtx.buffer_max_size; + int32_t buffer_size = m_alimiterCtx.buffer_size; + + if(buffer) + memset(buffer, 0, sizeof(float) * buffer_max_size); + if(nextdelta) + memset(nextdelta, 0, sizeof(float) * buffer_max_size); + if(nextpos) + memset(nextpos, -1, sizeof(float) * buffer_max_size); + + memset(&m_alimiterCtx, 0, sizeof(m_alimiterCtx)); + + m_alimiterCtx.level_in = 1; + m_alimiterCtx.level_out = 32000 / 32768.0; + m_alimiterCtx.limit = 1; + m_alimiterCtx.attack = 5; + m_alimiterCtx.release = 50; + m_alimiterCtx.auto_release = 0; + m_alimiterCtx.asc_coeff = 0.5; + m_alimiterCtx.auto_level = 1; + + m_alimiterCtx.attack /= 1000; + m_alimiterCtx.release /= 1000; + m_alimiterCtx.att = 1; + m_alimiterCtx.asc_pos = -1; + m_alimiterCtx.asc_coeff = pow(0.5f, m_alimiterCtx.asc_coeff - 0.5f) * 2 * -1; + + m_alimiterCtx.buffer = buffer; + m_alimiterCtx.nextdelta = nextdelta; + m_alimiterCtx.nextpos = nextpos; + m_alimiterCtx.buffer_max_size = buffer_max_size; + m_alimiterCtx.buffer_size = buffer_size; +} + +int32_t Alimiter::GetLatecy() +{ + return m_alimiterCtx.buffer_size / m_nChannels; +} + +int32_t Alimiter::SetParam( int32_t fs, int32_t channels ) +{ + if((fs == m_nFs) && (channels == m_nChannels)) + return ERROR_SUPERSOUND_SUCCESS; + + m_nChannels = channels; + m_nFs = fs; + + return config_input(); +} + +void Alimiter::Filter( float * input, float * output, int32_t num ) +{ + num = num / m_nChannels; + int channels = m_nChannels; + int buffer_size = m_alimiterCtx.buffer_size; + float * buffer = m_alimiterCtx.buffer; + float release = m_alimiterCtx.release; + float limit = m_alimiterCtx.limit; + float * nextdelta = m_alimiterCtx.nextdelta; + float level = m_alimiterCtx.auto_level ? 1 / limit : 1; + float level_out = m_alimiterCtx.level_out; + float level_in = m_alimiterCtx.level_in; + int *nextpos = m_alimiterCtx.nextpos; + + float * buf; + float * dst; + float * src; + int n, c, i; + AudioLimiterContext * s = &m_alimiterCtx; + + dst = output; + src = input; + + for (n = 0; n < num; n++) { + float peak = 0; + + for (c = 0; c < channels; c++) { + float sample = src[c] * level_in; + + buffer[s->pos + c] = sample; + peak = MAX(peak, fabs(sample)); + } + + if (s->auto_release && peak > limit) { + s->asc += peak; + s->asc_c++; + } + + if (peak > limit) { + float patt = MIN(limit / peak, 1); + float rdelta = get_rdelta(s, release, m_nFs, + peak, limit, patt, 0); + float delta = (limit / peak - s->att) / buffer_size * channels; + int found = 0; + + if (delta < s->delta) { + s->delta = delta; + nextpos[0] = s->pos; + nextpos[1] = -1; + nextdelta[0] = rdelta; + s->nextlen = 1; + s->nextiter= 0; + } else { + for (i = s->nextiter; i < s->nextiter + s->nextlen; i++) { + int j = i % buffer_size; + float ppeak, pdelta; + + ppeak = fabs(buffer[nextpos[j]]) > fabs(buffer[nextpos[j] + 1]) ? 
+ fabs(buffer[nextpos[j]]) : fabs(buffer[nextpos[j] + 1]); + pdelta = (limit / peak - limit / ppeak) / (((buffer_size - nextpos[j] + s->pos) % buffer_size) / channels); + if (pdelta < nextdelta[j]) { + nextdelta[j] = pdelta; + found = 1; + break; + } + } + if (found) { + s->nextlen = i - s->nextiter + 1; + nextpos[(s->nextiter + s->nextlen) % buffer_size] = s->pos; + nextdelta[(s->nextiter + s->nextlen) % buffer_size] = rdelta; + nextpos[(s->nextiter + s->nextlen + 1) % buffer_size] = -1; + s->nextlen++; + } + } + } + + buf = &s->buffer[(s->pos + channels) % buffer_size]; + peak = 0; + for (c = 0; c < channels; c++) { + float sample = buf[c]; + + peak = MAX(peak, fabs(sample)); + } + + if (s->pos == s->asc_pos && !s->asc_changed) + s->asc_pos = -1; + + if (s->auto_release && s->asc_pos == -1 && peak > limit) { + s->asc -= peak; + s->asc_c--; + } + + s->att += s->delta; + + for (c = 0; c < channels; c++) + dst[c] = buf[c] * s->att; + + if ((s->pos + channels) % buffer_size == nextpos[s->nextiter]) { + if (s->auto_release) { + s->delta = get_rdelta(s, release, m_nFs, + peak, limit, s->att, 1); + if (s->nextlen > 1) { + int pnextpos = nextpos[(s->nextiter + 1) % buffer_size]; + float ppeak = fabs(buffer[pnextpos]) > fabs(buffer[pnextpos + 1]) ? + fabs(buffer[pnextpos]) : + fabs(buffer[pnextpos + 1]); + float pdelta = (limit / ppeak - s->att) / + (((buffer_size + pnextpos - + ((s->pos + channels) % buffer_size)) % + buffer_size) / channels); + if (pdelta < s->delta) + s->delta = pdelta; + } + } else { + s->delta = nextdelta[s->nextiter]; + s->att = limit / peak; + } + + s->nextlen -= 1; + nextpos[s->nextiter] = -1; + s->nextiter = (s->nextiter + 1) % buffer_size; + } + + if (s->att > 1.) { + s->att = 1.; + s->delta = 0.; + s->nextiter = 0; + s->nextlen = 0; + nextpos[0] = -1; + } + + if (s->att <= 0.) { + s->att = 0.000001f; + s->delta = (1 - s->att) / (m_nFs * release); + } + + if (s->att != 1 && (1 - s->att) < 0.000001f) + s->att = 1; + + if (s->delta != 0 && fabs(s->delta) < 0.000001f) + s->delta = 0; + + for (c = 0; c < channels; c++) + dst[c] = MIDDLE(dst[c], -limit, limit) * level * level_out; + + s->pos = (s->pos + channels) % buffer_size; + src += channels; + dst += channels; + } +} + +void Alimiter::Uninit() +{ + SAFE_DELETE_PTR(m_alimiterCtx.buffer); + SAFE_DELETE_PTR(m_alimiterCtx.nextdelta); + SAFE_DELETE_PTR(m_alimiterCtx.nextpos); +} + +int32_t Alimiter::config_input() +{ + int obuffer_size = int(m_nFs * m_nChannels * 100 / 1000. 
+ m_nChannels);
+    if(obuffer_size < m_nChannels)
+        return ERROR_SUPERSOUND_PARAM;
+
+    if(obuffer_size > m_alimiterCtx.buffer_max_size)
+    {
+        SAFE_DELETE_PTR(m_alimiterCtx.buffer);
+        m_alimiterCtx.buffer = new(std::nothrow) float[obuffer_size];
+        if(m_alimiterCtx.buffer == NULL)
+            return ERROR_SUPERSOUND_MEMORY;
+        memset(m_alimiterCtx.buffer, 0, sizeof(float) * obuffer_size);
+
+        SAFE_DELETE_PTR(m_alimiterCtx.nextdelta);
+        m_alimiterCtx.nextdelta = new(std::nothrow) float[obuffer_size];
+        if(m_alimiterCtx.nextdelta == NULL)
+            return ERROR_SUPERSOUND_MEMORY;
+        memset(m_alimiterCtx.nextdelta, 0, sizeof(float) * obuffer_size);
+
+        SAFE_DELETE_PTR(m_alimiterCtx.nextpos);
+        m_alimiterCtx.nextpos = new(std::nothrow) int32_t[obuffer_size];
+        if(m_alimiterCtx.nextpos == NULL)
+            return ERROR_SUPERSOUND_MEMORY;
+        memset(m_alimiterCtx.nextpos, -1, obuffer_size*sizeof(int32_t));
+
+        m_alimiterCtx.buffer_max_size = obuffer_size;
+    }
+
+    m_alimiterCtx.buffer_size = int(m_nFs * m_alimiterCtx.attack * m_nChannels);
+    m_alimiterCtx.buffer_size -= m_alimiterCtx.buffer_size % m_nChannels;
+
+    return ERROR_SUPERSOUND_SUCCESS;
+}
+
+float Alimiter::get_rdelta( AudioLimiterContext *s, float release, int sample_rate, float peak, float limit, float patt, int asc )
+{
+    float rdelta = (1 - patt) / (sample_rate * release);
+
+    if (asc && s->auto_release && s->asc_c > 0) {
+        float a_att = limit / (s->asc_coeff * s->asc) * (float)s->asc_c;
+
+        if (a_att > patt) {
+            float delta = MAX((a_att - patt) / (sample_rate * release), rdelta / 10);
+
+            if (delta < rdelta)
+                rdelta = delta;
+        }
+    }
+
+    return rdelta;
+}
+
+
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/CMakeLists.txt
new file mode 100644
index 0000000..6724db8
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/CMakeLists.txt
@@ -0,0 +1,183 @@
+cmake_minimum_required(VERSION 3.4)
+project(audio_effects_lib)
+#set(LIBRARY_OUTPUT_PATH ${PROJECT_SOURCE_DIR}/lib)
+set(CMAKE_CXX_STANDARD 11)
+set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=c++11")
+
+option(AELIB_BUILD_WHOLE_LIBS "Audio Effect Lib build as a whole lib" ON)
+option(WITH_FFT "Audio Effect Lib build with fft" ON)
+
+#add_definitions(-DAE_CONFUSE_CODE)
+include_directories(./)
+include_directories(inc common src)
+include_directories(ref)
+
+# Path to the local ffmpeg; not needed when building for ARM, since the repo ships its own copy
+#include_directories(/Users/yangjianli/starMaker/ffmpeg_lib/ffmpeg-4.3.1/mac/include)
+#set(FFMPEG_LIB /Users/yangjianli/starMaker/ffmpeg_lib/ffmpeg-4.3.1/mac/lib)
+
+IF(NOT AELIB_BUILD_WHOLE_LIBS)
+    # Subprojects
+    add_subdirectory(ref)
+
+    AUX_SOURCE_DIRECTORY(common SRC_COMMON_DIR)
+    file(GLOB_RECURSE CPP_SRC_DIR src/*cpp)
+    add_library(audio_effects_lib ${CPP_SRC_DIR} ${SRC_COMMON_DIR})
+ELSE()
+    include_directories(ref/al_reverb/inc)
+    include_directories(ref/al_reverb/src)
+    include_directories(ref/autotune/inc)
+    include_directories(ref/autotune/src)
+    include_directories(ref/iir_eq/inc)
+    include_directories(ref/iir_eq/src)
+    include_directories(ref/phonograph/inc)
+    include_directories(ref/phonograph/src)
+    include_directories(ref/reverb/inc)
+    include_directories(ref/reverb/src)
+    include_directories(ref/saudio_effects/inc)
+    include_directories(ref/saudio_effects/src)
+    include_directories(ref/slow_flanging/inc)
+    include_directories(ref/slow_flanging/src)
+    include_directories(ref/tone_shift/inc)
+    include_directories(ref/tone_shift/src)
+    #include_directories(ref/waves/inc)
+    #include_directories(ref/waves/src)
+
+    include_directories(ref/common)
+
+    include_directories(ref/al_reverb/src/biquad_filters)
+    include_directories(ref/al_reverb/src/fast_delay)
+    include_directories(ref/al_reverb/src/filter)
+    include_directories(ref/al_reverb/src/AlReverbApi.cpp)
+    include_directories(ref/al_reverb/src/al_reverb)
+    include_directories(ref/al_reverb/src/al_reverb_biquad)
+    include_directories(ref/al_reverb/src/al_reverb_common)
+    include_directories(ref/al_reverb/src/al_reverb_early_reflection)
+    include_directories(ref/al_reverb/src/al_reverb_echo)
+    include_directories(ref/al_reverb/src/al_reverb_late_allpass)
+    include_directories(ref/al_reverb/src/al_reverb_late_lowpass)
+    include_directories(ref/al_reverb/src/al_reverb_late_reverb)
+    include_directories(ref/al_reverb/src/al_reverb_modulation)
+
+    include_directories(ref/iir_eq/src/audacious_arma)
+    include_directories(ref/iir_eq/src/audacious_eq)
+
+    include_directories(ref/saudio_effects/src/all_plat ref/saudio_effects/src/audio_effect ref/saudio_effects/src/biquad
+            ref/saudio_effects/src/buffer ref/saudio_effects/src/damper ref/saudio_effects/src/delay ref/saudio_effects/src/delayi ref/saudio_effects/src/envelope_follower
+            ref/saudio_effects/src/equalizer ref/saudio_effects/src/reverb ref/saudio_effects/src/simple_delay_effect ref/saudio_effects/src/simple_reverb_effect)
+
+    include_directories(ref/tone_shift/src/aa_filter)
+    include_directories(ref/tone_shift/src/bpm_detect)
+    include_directories(ref/tone_shift/src/cpu_detect)
+    include_directories(ref/tone_shift/src/fifo_sample_buffer)
+    include_directories(ref/tone_shift/src/fir_filter)
+    include_directories(ref/tone_shift/src/peak_finder)
+    include_directories(ref/tone_shift/src/rate_transposer)
+    include_directories(ref/tone_shift/src/sound_touch)
+    include_directories(ref/tone_shift/src/td_stretch)
+
+    include_directories(ref/supersound/inc)
+    include_directories(ref/supersound/src)
+    include_directories(ref/supersound/src/common)
+    include_directories(ref/supersound/src/impulse)
+    include_directories(ref/supersound/ref)
+    include_directories(ref/supersound/ref/kiss_fft)
+
+#    include_directories(ref/audio_resample/inc)
+
+    AUX_SOURCE_DIRECTORY(common SRC_COMMON_DIR)
+    file(GLOB_RECURSE CPP_SRC_DIR src/*cpp)
+    file(GLOB_RECURSE CPP_REF_DIR ref/*cpp)
+    file(GLOB_RECURSE C_REF_DIR ref/*c)
+
+    include_directories(ref/waves/inc)
+#    include_directories(ref/audio_codec/inc)
+#    list(REMOVE_ITEM CPP_REF_DIR "${CMAKE_CURRENT_SOURCE_DIR}/ref/waves/src/STWaveFile.cpp")
+#    list(REMOVE_ITEM CPP_REF_DIR "${CMAKE_CURRENT_SOURCE_DIR}/ref/autotune/src/common/util/util.cpp")
+    list(REMOVE_ITEM CPP_REF_DIR "${CMAKE_CURRENT_SOURCE_DIR}/ref/audio_resample/src/FfmpegResampler.cpp")
+
+
+#    IF(NOT WITH_FFT)
+#        list(REMOVE_ITEM CPP_REF_DIR "${CMAKE_CURRENT_SOURCE_DIR}/ref/supersound/ref/kiss_fft/kiss_fft.cpp")
+#        list(REMOVE_ITEM CPP_REF_DIR "${CMAKE_CURRENT_SOURCE_DIR}/ref/supersound/ref/kiss_fft/kiss_fftr.cpp")
+#        list(REMOVE_ITEM CPP_REF_DIR "${CMAKE_CURRENT_SOURCE_DIR}/ref/supersound/ref/kiss_fft/kiss_fftnd.c")
+#    endif()
+
+    add_library(audio_effects_lib ${CPP_SRC_DIR} ${CPP_REF_DIR} ${C_REF_DIR} ${SRC_COMMON_DIR})
+
+#    set_target_properties(audio_effects_lib PROPERTIES CXX_VISIBILITY_PRESET hidden)
+ENDIF()
+
+
+#set_target_properties(audio_effects_lib PROPERTIES CXX_VISIBILITY_PRESET hidden)
+#add_executable(main example/main.cpp example/ae_server/CAeServer.cpp)
+
+
+# Force-link every object in the .a; otherwise the effect classes never self-register into the map and cannot be reached from outside
+# (when linking against a static library, the linker drops objects that are never referenced directly)
+#if(APPLE)
+#    target_link_libraries(main
+#            -Wl,-all_load ${LIBRARY_OUTPUT_PATH}/libaudio_codec.a -Wl,-noall_load
+#    )
+#    target_link_libraries(main
+#            -Wl,-all_load ${LIBRARY_OUTPUT_PATH}/libaudio_effects_lib.a -Wl,-noall_load
+#    )
+#else()
+#    target_link_libraries(main
+#            -Wl,--whole-archive ${LIBRARY_OUTPUT_PATH}/libaudio_codec.a -Wl,--no-whole-archive
+#    )
+#    target_link_libraries(main
+#            -Wl,-all_load ${LIBRARY_OUTPUT_PATH}/libaudio_effects_lib.a -Wl,-noall_load
+#    )
+#endif()
+
+
+#add_executable(effect_im_tool example/effect_im_tool.cpp example/ae_server/CAeServer.cpp ${CPP_SRC_DIR} ${CPP_REF_DIR} ${C_REF_DIR} ${SRC_COMMON_DIR})
+#if(APPLE)
+#    target_link_libraries(effect_im_tool
+#            -Wl,-all_load ${LIBRARY_OUTPUT_PATH}/libaudio_effects_lib.a -Wl,-noall_load
+#    )
+#else()
+#    target_link_libraries(effect_im_tool
+#            -Wl,--whole-archive ${LIBRARY_OUTPUT_PATH}/libaudio_effects_lib.a -Wl,--whole-archive
+#    )
+#endif()
+#target_link_libraries(effect_im_tool
+#        -lpthread -lz -lbz2 -ldl
+#        )
+
+#target_link_libraries(main
+#        ${LIBRARY_OUTPUT_PATH}/libaudio_effects_lib.a
+#        ${LIBRARY_OUTPUT_PATH}/libwaves.a
+#        ${LIBRARY_OUTPUT_PATH}/libiir_eq.a
+#        ${LIBRARY_OUTPUT_PATH}/libsaudio_effects.a
+#        ${LIBRARY_OUTPUT_PATH}/libautotune.a
+#        ${LIBRARY_OUTPUT_PATH}/libreverb.a
+#        ${LIBRARY_OUTPUT_PATH}/libal_reverb.a
+#        ${LIBRARY_OUTPUT_PATH}/libphonograph.a
+#        ${LIBRARY_OUTPUT_PATH}/libslow_flanging.a
+#        ${LIBRARY_OUTPUT_PATH}/libref_common.a
+#        ${LIBRARY_OUTPUT_PATH}/libtone_shift.a
+#        )
+#
+#target_link_libraries(main
+#        ${FFMPEG_LIB}/libavfilter.a
+#        ${FFMPEG_LIB}/libavformat.a
+#        ${FFMPEG_LIB}/libavcodec.a
+#        ${FFMPEG_LIB}/libswresample.a
+#        ${FFMPEG_LIB}/libswscale.a
+#        ${FFMPEG_LIB}/libavutil.a
+#        -lz -lbz2 -liconv -llzma
+#        "-framework VideoToolbox"
+#        "-framework Security"
+#        "-framework CoreFoundation"
+#        "-framework CoreMedia"
+#        "-framework CoreVideo"
+#        "-framework VideoDecodeAcceleration"
+#        "-framework AVFoundation"
+#        "-framework CoreGraphics"
+#        "-framework Foundation"
+#        "-framework CoreServices"
+#
+##        ${LIBRARY_OUTPUT_PATH}/libwaves.a
+#        )
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/README.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/README.txt
new file mode 100644
index 0000000..b5e2234
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/README.txt
@@ -0,0 +1,24 @@
+Project overview:
+    Audio-effects library; it mainly provides the various vocal effects plus equalizer presets.
+
+Code layout:
+    --inc       public headers
+    --src       source code
+        --audio_eq  a thin wrapper around each effect in ref, so they can all be used uniformly
+        --manager   effect registration and lookup of the registered effects
+    --common    parts shared across modules
+    --ref       subprojects -- [each individual effect is its own subproject]
+        --common    parts shared between the subprojects
+    --example   test folder for the project
+        --main.cpp      test entry point
+        --ae_server     sample wrapper showing how the library is used in the current product
+
+Usage:
+    Taking Android as an example:
+    run build_android.sh; the per-platform .a files appear under
+    ./build/libs/android/ and can be copied into the Android project.
+    Use the headers from inc.
+
+Adding a new effect:
+    Add a new subdirectory under ref [the new effect],
+    then add a wrapper for it to inc and src, following the existing effects.
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/build_android.sh b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/build_android.sh
new file mode 100755
index 0000000..6b81de3
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/build_android.sh
@@ -0,0 +1,64 @@
+#!/bin/sh
+
+# @Time    : 2019-06-18 17:50
+# @Author  : AlanWang
+# @FileName: build_android.sh
+
+# MY_NDK and MY_CMAKE must point at the matching directories of your own NDK install
+#MY_NDK="/Users/yangjianli/Library/Android/sdk/ndk-bundle"
+MY_CMAKE="/Users/yangjianli/Library/Android/sdk/cmake/3.6.4111459/bin/cmake"
+MY_NDK="/Users/yangjianli/android-ndk/android-ndk-r16b"
+#MY_CMAKE="/Users/wangjianjun/AndroidDev/sdk/cmake/3.10.2.4988404/bin/cmake"
+
+if [ 
-z "$MY_NDK" ]; then + echo "Please set MY_NDK to the Android NDK folder" + exit 1 +fi + +if [ -z "$MY_CMAKE" ]; then + echo "Please set MY_CMAKE to the Android CMake folder" + exit 1 +fi + +OUTPUT_LIBS="./build/libs/android" +# arme_abis=(armeabi armeabi-v7a arm64-v8a x86 x86_64 mips mips64) + +function build_with_armeabi() { + ARME_ABI=$1 + echo ${ARME_ABI} + ANDROID_NATIVE_API_LEVEL="android-$2" + echo ${ANDROID_NATIVE_API_LEVEL} + + BUILD_DIR="./build/android/${ARME_ABI}" + BUILD_REF_DIR="./build/android/${ARME_ABI}/ref" + OUTPUT_SO_DIR="${BUILD_DIR}/build/android/libs/${ARME_ABI}" + + PRE_EXE_DIR=$(pwd) + echo ${PRE_EXE_DIR} + + ${MY_CMAKE} \ + -H"./" \ + -B"${BUILD_DIR}" \ + -DANDROID_ABI="${ARME_ABI}" \ + -DANDROID_NDK="${MY_NDK}" \ + -DCMAKE_LIBRARY_OUTPUT_DIRECTORY="./build/android/libs/${ARME_ABI}" \ + -DCMAKE_BUILD_TYPE="Release" \ + -DCMAKE_TOOLCHAIN_FILE="${MY_NDK}/build/cmake/android.toolchain.cmake" \ + -DANDROID_NATIVE_API_LEVEL=${ANDROID_NATIVE_API_LEVEL} \ + -DANDROID_TOOLCHAIN="clang" \ + -DCMAKE_C_FLAGS="-fpic -fexceptions -frtti -Wno-narrowing" \ + -DCMAKE_CXX_FLAGS="-fpic -fexceptions -frtti -Wno-narrowing" \ + -DANDROID_STL="c++_static" \ + + + cd ${BUILD_DIR} + make + + cd ${PRE_EXE_DIR} + mkdir -p ${OUTPUT_LIBS}/${ARME_ABI}/ + mv ${PRE_EXE_DIR}/lib/* ${OUTPUT_LIBS}/${ARME_ABI}/ + rm -r ./build/android +} + +build_with_armeabi armeabi-v7a 16 +build_with_armeabi arm64-v8a 21 diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/build_ios.sh b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/build_ios.sh new file mode 100755 index 0000000..f228a1f --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/build_ios.sh @@ -0,0 +1,39 @@ +#!/bin/sh + +OUTPUT_LIBS="./build/libs/ios" + +function build_with_platform_and_armeabi() { + PLATFORM=$1 + ARME_ABI=$2 + echo ${PLATFORM} + echo ${ARME_ABI} + + BUILD_DIR="./build/ios/${ARME_ABI}" + PRE_EXE_DIR=$(pwd) + echo ${PRE_EXE_DIR} + + cmake \ + -H"./" \ + -B"${BUILD_DIR}" \ + -DCMAKE_BUILD_TYPE="Release" \ + -DCMAKE_TOOLCHAIN_FILE="./toolchain/ios.toolchain.cmake" \ + -DIOS_PLATFORM=${PLATFORM} \ +# -DIOS_ARCH=${ARME_ABI} + + # 生成目标文件 + cd ${BUILD_DIR} + make + + # 将目标文件移至指定目录 + cd ${PRE_EXE_DIR} + mkdir -p ${OUTPUT_LIBS}/${ARME_ABI}/ + mv ${PRE_EXE_DIR}/lib/* ${OUTPUT_LIBS}/${ARME_ABI}/ + rm -r ./build/ios +} + +build_with_platform_and_armeabi "OS" "all" +#build_with_platform_and_armeabi "OS" "armv7s" +#build_with_platform_and_armeabi "OS" "arm64" + +#build_with_platform_and_armeabi "SIMULATOR64" "x86_64" +#build_with_platform_and_armeabi "SIMULATOR" "i386" diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/ae_server/CAeServer.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/ae_server/CAeServer.cpp new file mode 100644 index 0000000..1406fad --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/ae_server/CAeServer.cpp @@ -0,0 +1,480 @@ +// +// Created by yangjianli on 2020-01-16. 
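+// CAeServer: product-side wrapper around the effect chain. It maps each AE_TYPE
+// to one chain instance, keeps mutually exclusive effects in groups so that
+// setting one replaces the others of its group, and caches impulse-response
+// parameters per effect file path.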
+// + +#include "CAeServer.h" +#include "cstring" +#include "WaveFile.h" + +#ifdef FFMEPG +#include "DecoderWrapper.h" +#endif + +//////////////////////////////////////////内部函数////////////////////////////////////////////////////////////// + +int32_t CAeServer::get_im_params_by_ffmpeg(void* params, Impulse_Param* new_param) +{ + AE_PARAMS_IM_EFFECT* cur_params = (AE_PARAMS_IM_EFFECT*) params; + + // 空字符串则直接返回一个结构出去 + if (cur_params->effect_path.empty()) + { + return AE_ERR_PARAMS_ERR; + } + + std::string audio_path(cur_params->effect_path); + if (m_im_path2params.find(audio_path) == m_im_path2params.end()) + { +#ifdef FFMPEG + // 载入数据 + CDecoderWrapper* m_decode_inst = new(std::nothrow) CDecoderWrapper(); + if (NULL == m_decode_inst) + { + return AE_ERR_NO_BUFFER; + } + MediaParam param; + param.duration = 0; + param.prelude_time = 0; + param.start_time = 0; + param.end_time = 0; + param.need_decrypt = false; + param.path = cur_params->effect_path.c_str(); + + MediaInfo info; + int errcode = m_decode_inst->init(¶m, m_sample_rate, m_channel, CONTEXT_FFMPEG, DECODER_FFMPEG, PROTOCOL_TYPE_FILE); + if(0 != errcode) + { + m_decode_inst->uninit(); + delete m_decode_inst; + return errcode; + } + m_decode_inst->get_media_info(&info); + + // 解码音频 + int frame_len = 512 * m_channel; + int cap_len = int(info.duration * m_sample_rate / 1000.0 * m_channel) + 10; + cap_len = (cap_len / frame_len + 1) * frame_len; + int out_len = 0; + float* out_buf = new float[cap_len]; + + AudioFrameBuffer m_tmp_buffer; + m_tmp_buffer.init(512 * m_channel); + errcode = m_decode_inst->decode(&m_tmp_buffer); + while(E_NATIVE_DECODER_SUCCESS == errcode) + { + // 这种情况基本不会出现 + if (cap_len < out_len + m_tmp_buffer.get_size()) + { + cap_len = out_len + m_tmp_buffer.get_size(); + float* tmp_out = new float[cap_len]; + memcpy(tmp_out, out_buf, sizeof(float) * out_len); + delete[] out_buf; + out_buf = tmp_out; + } + memcpy(out_buf+out_len, m_tmp_buffer.get_buffer(), sizeof(float) * m_tmp_buffer.get_size()); + out_len += m_tmp_buffer.get_size(); + memset(m_tmp_buffer.get_buffer(), 0, sizeof(float) * m_tmp_buffer.get_size()); + errcode = m_decode_inst->decode(&m_tmp_buffer); + } + + delete m_decode_inst; + if (errcode != E_NATIVE_DECODER_END) + { + delete [] out_buf; + return errcode; + } +#else + CWaveFile wave_im = CWaveFile(cur_params->effect_path.c_str(), false); + if(!wave_im.GetStatus()) + { + return AE_ERR_NO_BUFFER; + } + + int channel = wave_im.GetChannels(); + int sample_rate = wave_im.GetSampleRate(); + if (sample_rate != m_sample_rate || channel != m_channel) + { + printf("impluse params err!\n"); + return AE_ERR_NO_BUFFER; + } + int out_len = wave_im.GetTotalFrames() * channel; + float* out_buf = new float[out_len]; + wave_im.ReadFrameAsfloat(out_buf, out_len / channel); +#endif + Impulse_Param* im_params = new Impulse_Param(); + im_params->in_channels = m_channel; + im_params->out_channels = m_channel; + im_params->fs = m_sample_rate; + im_params->im_response = out_buf; + im_params->response_len = out_len / m_channel; + im_params->response_channels = m_channel; + // 一般最小是192的buffer_size,fft搞小一点,更合适 + im_params->window_bits = 9; + im_params->process_buffer_len = m_buffer_size; + im_params->high_performance = true; + im_params->effect_path = cur_params->effect_path; + m_im_path2params[audio_path] = im_params; + +// STCWaveFile wave_out = STCWaveFile("/Users/yangjianli/starmaker-work/research/tmp_code/音效相关/test1/t1.wav", true); +// wave_out.SetChannels(m_channel); +// wave_out.SetSampleRate(m_sample_rate); +// 
wave_out.SetSampleFormat(SF_IEEE_FLOAT); +// wave_out.SetupDone(); +// wave_out.WriteFrame(out_buf, out_len / m_channel); + } + copy_impluse_params(new_param, m_im_path2params[audio_path]); + return AE_ERR_SUCCESS; +} + +////////////////////////////////////////////////////////////////////////////////////////////////////////////// +CAeServer::CAeServer() +{ + m_chain = nullptr; + m_ae2group_id.clear(); + m_ae2inst_map.clear(); + m_ae_group.clear(); +} + +CAeServer::~CAeServer() +{ + uninit(); +} + +int32_t CAeServer::init(int sample_rate, int channel, int buffer_size) +{ + m_chain = ae_create_object(); + ae_init(m_chain, sample_rate, channel); + AE_TYPE ae_types[] = {AE_TYPE_NONE, AE_TYPE_KTV, AE_TYPE_AUTOTUNE,AE_TYPE_DISTANT, + AE_TYPE_WARM,AE_TYPE_PHONOGRAPH,AE_TYPE_MAGNETIC,AE_TYPE_ETHEREAL, + AE_TYPE_DIZZY,AE_TYPE_NEW_DISTANT,AE_TYPE_TONE_SHIFT,AE_TYPE_CUSTOM, + AE_TYPE_KARAOKE,SAE_POP,SAE_STUDIO, AE_TYPE_IM_EFFECT}; + + combine_group(ae_types, 16); + AE_TYPE ae_types1[] = {EQ_TYPE_BEGIN, EQ_TYPE_END}; + combine_group(ae_types1, 2); + m_sample_rate = sample_rate; + m_channel = channel; + m_buffer_size = buffer_size; + return AE_ERR_SUCCESS; +} + +int32_t CAeServer::uninit() +{ + if(nullptr != m_chain) + { + ae_destory_object(m_chain); + m_chain = nullptr; + } + m_ae_group.clear(); + m_ae2inst_map.clear(); + m_ae2group_id.clear(); + + // 删除im效果器中所有参数映射过的结果 + std::map::iterator itt; + for(itt = m_im_path2params.begin(); itt != m_im_path2params.end(); itt++) + { + if (itt->second != NULL) + { + if (itt->second->im_response != NULL) + { + delete[] itt->second->im_response; + itt->second->im_response = NULL; + } + delete itt->second; + itt->second = NULL; + } + } + m_im_path2params.clear(); + return AE_ERR_SUCCESS; +} + +int CAeServer::get_latency_ms() +{ + return ae_get_latency_ms(m_chain); +} + +int32_t CAeServer::reset() +{ + return ae_reset(m_chain); +} + +int32_t CAeServer::get_ae_effect_params(AE_TYPE ae_type, void *ae_params, AE_EFFECT_TYPE &ae_effect_type, void*& ret) +{ + pAECustomParam tp_custom; + AE_PARAMS_REVERB* tp_reverb; + int err_code = AE_ERR_SUCCESS; + switch(ae_type){ + case AE_TYPE_KTV: + ae_effect_type = AE_EFFECT_TYPE_REVERB; + ret = new AE_PARAMS_REVERB(); + memcpy(ret, &gs_ae_params_reverb_params[AE_PARAMS_TYPE_REVERB_ID_11 - AE_PARAMS_TYPE_RERVERB], + sizeof(AE_PARAMS_REVERB)); + break; + case AE_TYPE_AUTOTUNE: + ae_effect_type = AE_EFFECT_TYPE_AUTOTUNE; + break; + case AE_TYPE_DISTANT: + ae_effect_type = AE_EFFECT_TYPE_REVERB; + ret = new AE_PARAMS_REVERB(); + memcpy(ret, &gs_ae_params_reverb_params[AE_PARAMS_TYPE_REVERB_ID_15 - AE_PARAMS_TYPE_RERVERB], + sizeof(AE_PARAMS_REVERB)); + break; + case AE_TYPE_WARM: + ae_effect_type = AE_EFFECT_TYPE_AL_REVERB; + ret = new AE_PARAMS_AL_REVERB(); + memcpy(ret, &gs_ae_params_al_reverbs[AE_PARAMS_TYPE_AL_REVERB_CITY_STREETS - AE_PARAMS_TYPE_AL_REVERB], + sizeof(AE_PARAMS_AL_REVERB)); + break; + case AE_TYPE_PHONOGRAPH: + ae_effect_type = AE_EFFECT_TYPE_PHONOGRAPH; + break; + case AE_TYPE_MAGNETIC: + ae_effect_type = AE_EFFECT_TYPE_AL_REVERB; + ret = new AE_PARAMS_AL_REVERB(); + memcpy(ret, &gs_ae_params_al_reverbs[AE_PARAMS_TYPE_AL_REVERB_GENERIC_1 - AE_PARAMS_TYPE_AL_REVERB], + sizeof(AE_PARAMS_AL_REVERB)); + break; + case AE_TYPE_ETHEREAL: + ae_effect_type = AE_EFFECT_TYPE_AL_REVERB; + ret = new AE_PARAMS_AL_REVERB(); + memcpy(ret, &gs_ae_params_al_reverbs[AE_PARAMS_TYPE_AL_REVERB_CASTLE_COURTYARD - AE_PARAMS_TYPE_AL_REVERB], + sizeof(AE_PARAMS_AL_REVERB)); + break; + case AE_TYPE_DIZZY: + ae_effect_type = 
AE_EFFECT_TYPE_SLOWFLANGING; + break; + case AE_TYPE_NEW_DISTANT: + ae_effect_type = AE_EFFECT_TYPE_REVERB; + ret = new AE_PARAMS_REVERB(); + memcpy(ret, &gs_ae_params_reverb_params[AE_PARAMS_TYPE_REVERB_NEW_CONCERT - AE_PARAMS_TYPE_RERVERB], + sizeof(AE_PARAMS_REVERB)); + break; + case AE_TYPE_TONE_SHIFT: + ae_effect_type = AE_EFFECT_TYPE_TONE_SHIFT; + ret = new AE_PARAMS_TONE_SHIFT(); + ((AE_PARAMS_TONE_SHIFT*) ret)->shift_value = ((AEToneShiftParam*) ae_params)->tone_shift; + break; + case AE_TYPE_CUSTOM: + ae_effect_type = AE_EFFECT_TYPE_REVERB; + ret = new AE_PARAMS_REVERB(); + memcpy(ret, &gs_ae_params_reverb_params[AE_PARAMS_TYPE_REVERB_ID_18 - AE_PARAMS_TYPE_RERVERB], + sizeof(AE_PARAMS_REVERB)); + tp_custom = (pAECustomParam) ae_params; + tp_reverb = (AE_PARAMS_REVERB*) ret; + tp_reverb->wet = tp_custom->reverb_wet / 3.0; // 兼容android当前的使用方式 + tp_reverb->room_size = tp_custom->room_size; + break; + case AE_TYPE_KARAOKE: + ae_effect_type = AE_EFFECT_TYPE_REVERB; + ret = new AE_PARAMS_REVERB(); + memcpy(ret, &gs_ae_params_reverb_params[AE_PARAMS_TYPE_REVERB_ID_18 - AE_PARAMS_TYPE_RERVERB], + sizeof(AE_PARAMS_REVERB)); + break; + case SAE_POP: + ae_effect_type = AE_EFFECT_TYPE_SAE; + ret = new AE_PARAMS_SAE(); + ((AE_PARAMS_SAE*)ret)->params_list.assign( + gs_sae_params[AE_PARAMS_TYPE_SAE_POP - AE_PARAMS_TYPE_SAE].params_list.begin(), + gs_sae_params[AE_PARAMS_TYPE_SAE_POP - AE_PARAMS_TYPE_SAE].params_list.end() + ); + break; + case SAE_STUDIO: + ae_effect_type = AE_EFFECT_TYPE_SAE; + ret = new AE_PARAMS_SAE(); + ((AE_PARAMS_SAE*)ret)->params_list.assign( + gs_sae_params[AE_PARAMS_TYPE_SAE_STUDIO - AE_PARAMS_TYPE_SAE].params_list.begin(), + gs_sae_params[AE_PARAMS_TYPE_SAE_STUDIO - AE_PARAMS_TYPE_SAE].params_list.end() + ); + break; + case EQ_TYPE_END: + ae_effect_type = AE_EFFECT_TYPE_EQ; + ret = new AE_PARAMS_EQ(); + memcpy(ret, ae_params, sizeof(AE_PARAMS_EQ)); + break; + case AE_TYPE_IM_EFFECT: + ae_effect_type = AE_EFFECT_TYPE_IM_EFFECT; + ret = new Impulse_Param (); // 内部的对象地址是复制的,不会被释放,将由外部做释放 + err_code = get_im_params_by_ffmpeg(ae_params, (Impulse_Param*)ret); + break; + default: + ae_effect_type = AE_EFFECT_TYPE_NONE; + } + return err_code; +} + +int32_t CAeServer::combine_group(AE_TYPE *ae_types, int size) +{ + int group_id = m_ae_group.size(); + for(int i=0;i::iterator iter = m_ae2group_id.find(ae_type); + if(iter != m_ae2group_id.end()) + { + int group_id = iter->second; + if(group_id >= 0 && group_id < m_ae_group.size()) + { + // 删除ae2inst中效果 + std::map::iterator itt; + for(itt = m_ae2inst_map.begin(); itt != m_ae2inst_map.end(); itt++) + { + if(m_ae_group[group_id] == itt->second) + { + m_ae2inst_map.erase(itt); + break; + } + } + // 删除效果,去掉type2ins映射 + ae_delete_effect(m_chain, m_ae_group[group_id]); + m_ae_group[group_id] = nullptr; // 这块搞空 + } + } + return AE_ERR_SUCCESS; + } + + // 判断是否在效果链上 + std::map::iterator it = m_ae2inst_map.find(ae_type); + if(it != m_ae2inst_map.end()) + { + // 在效果链上 + ae_set_params(m_chain, it->second, ae_params); + }else + { + // 没在链上,添加效果 + void* new_effect_ptr = ae_add_effect(m_chain, effect_type); + if(nullptr == new_effect_ptr) + { + // 没有该效果 + if(nullptr != ae_params) + { + delete ae_params; + } + return AE_ERR_NO_EFFECTS; + } + ae_set_params(m_chain, new_effect_ptr, ae_params); + m_ae2inst_map.insert(std::make_pair(ae_type, new_effect_ptr)); + + // 删除该效果所在分组的其他效果 + std::map::iterator iter = m_ae2group_id.find(ae_type); + if(iter != m_ae2group_id.end()) + { + int group_id = iter->second; + if(group_id >= 0 && group_id < 
m_ae_group.size()) + { + // 删除分组音效,存放上自己的音效 + if(nullptr != m_ae_group[group_id]) + { + // 删除ae2inst中效果 + std::map::iterator itt; + for(itt = m_ae2inst_map.begin(); itt != m_ae2inst_map.end(); itt++) + { + if(m_ae_group[group_id] == itt->second) + { + m_ae2inst_map.erase(itt); + break; + } + } + + // 删除效果,去掉type2ins映射 + ae_delete_effect(m_chain, m_ae_group[group_id]); + m_ae_group[group_id] = nullptr; // 这块搞空 + } + + m_ae_group[group_id] = new_effect_ptr; + } + } + } + + // 在上面return 不需要处理的原因是,当出现上述条件时,ae_params + // 没有被创建 + if(nullptr != ae_params) + { + delete ae_params; + } + return AE_ERR_SUCCESS; +} + +int32_t CAeServer::get_params(AE_TYPE ae_type, void *params) +{ + std::map::iterator it = m_ae2inst_map.find(ae_type); + if(it != m_ae2inst_map.end()) + { + // 在效果链上才有结果 + // 根据对应的类型选择参数结构 + AE_EFFECT_TYPE effect_type; + void* cur_params = nullptr; + int err_code = get_ae_effect_params(ae_type, params, effect_type, cur_params); + if (cur_params == nullptr) + { + return err_code; + } + AE_PARAMS* ae_params = (AE_PARAMS*)cur_params; + ae_get_params(m_chain, it->second, (AE_PARAMS*) ae_params); + + switch (ae_type) + { + case AE_TYPE_TONE_SHIFT: + { + pAEToneShiftParam tp_server = (pAEToneShiftParam) params; + AE_PARAMS_TONE_SHIFT* tp_system = (AE_PARAMS_TONE_SHIFT*) ae_params; + tp_server->tone_shift = int(tp_system->shift_value); + tp_server->max_shift = int(tp_system->max_value); + tp_server->min_shift = int(tp_system->min_value); + break; + } + case AE_TYPE_CUSTOM: + { + pAECustomParam tp_server = (pAECustomParam) params; + AE_PARAMS_REVERB* tp_system = (AE_PARAMS_REVERB*) ae_params; + tp_server->reverb_wet = tp_system->wet; + tp_server->room_size = tp_system->room_size; + break; + } + case AE_TYPE_IM_EFFECT: + { + AE_PARAMS_IM_EFFECT* tp_server = (AE_PARAMS_IM_EFFECT*) params; + Impulse_Param * tp_system = (Impulse_Param*) ae_params; + tp_server->effect_path = tp_system->effect_path; + break; + } + case EQ_TYPE_END: + { + pAECustomEqParam tp_server = (pAECustomEqParam) params; + AE_PARAMS_EQ* tp_system = (AE_PARAMS_EQ*) ae_params; + memcpy(tp_server->params, tp_system->params, sizeof(float) * 10); + } + } + delete ae_params; + return AE_ERR_SUCCESS; + } + return AE_ERR_EFFECT_NOT_IN_CHAIN; +} + +int32_t CAeServer::process(float *in_buf, float *out_buf, int length) +{ + return ae_process(m_chain, in_buf, out_buf, length); +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/ae_server/CAeServer.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/ae_server/CAeServer.h new file mode 100644 index 0000000..844c525 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/ae_server/CAeServer.h @@ -0,0 +1,191 @@ +// +// Created by yangjianli on 2020-01-16. 
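+//
+// Minimal usage sketch (illustrative only; it assumes a 44.1 kHz stereo stream
+// processed in 1024-frame blocks over an interleaved float buffer `buf`, with
+// error handling omitted):
+//
+//     CAeServer ae;
+//     ae.init(44100, 2, 1024);
+//     AECustomParam p = { 0.8f, 0.8f };   // reverb_wet, room_size
+//     ae.set_params(AE_TYPE_CUSTOM, &p);
+//     ae.process(buf, buf, 1024 * 2);
+//     ae.uninit();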
+// + +#ifndef AUDIO_EFFECTS_LIB_CAESERVER_H +#define AUDIO_EFFECTS_LIB_CAESERVER_H + +/** + * 音效系统业务类  + * 这部分是参考当前业务场景给出的工作类 + * 可能会经常修改,跟业务代码一起编译 + * + * 当前的业务逻辑是: + * 每个AE_TYPE对应一个效果器,其中部分效果器互斥,内部互相不可以叠加, + * 与其他可叠加 + */ + +#include "CAudioEffectsChainApi.h" +#include "map" +#include "vector" + +enum AE_TYPE +{ + AE_TYPE_BEGIN, + AE_TYPE_NONE = AE_TYPE_BEGIN, + AE_TYPE_KTV, + AE_TYPE_AUTOTUNE, + AE_TYPE_DISTANT, + AE_TYPE_WARM, + AE_TYPE_PHONOGRAPH, + AE_TYPE_MAGNETIC, + AE_TYPE_ETHEREAL, + AE_TYPE_DIZZY, + AE_TYPE_NEW_DISTANT, + AE_TYPE_TONE_SHIFT, + AE_TYPE_CUSTOM, + AE_TYPE_SPEED_SHIFT, + AE_TYPE_KARAOKE, + SAE_POP, + SAE_STUDIO, + AE_TYPE_END, + AE_TYPE_IM_EFFECT, + EQ_TYPE_BEGIN = 10000, + EQ_TYPE_END = 20000, +}; + +// ToneShift 音效参数 +typedef struct _AEToneShiftParam +{ + //tone shift + int tone_shift; + int min_shift; + int max_shift; +}AEToneShiftParam, *pAEToneShiftParam; + +// custom 音效参数 +typedef struct _AECustomParam +{ + float reverb_wet; + float room_size; +}AECustomParam, *pAECustomParam; + +// 均衡器参数 +typedef struct _AECustomEqParam +{ + float params[10]; +}AECustomEqParam, *pAECustomEqParam; + + +class CAeServer +{ +public: + CAeServer(); + ~CAeServer(); + +public: + + /** + * 初始化函数 + * 作用: 初始化内部成员 + * 注意: 创建新类之后,必须进行init才可以进行其他操作 + * @param sample_rate 采样率 + * @param channel 通道数 + * @param buffer_size 单次处理的音频的buffer的长度[单声道*通道数] + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + int32_t init(int sample_rate, int channel, int buffer_size); + + /** + * 逆初始化函数 + * 作用: 销毁内部成员,释放空间 + * 注意:在结束类处理之前,必须进行uninit释放空间,否则可能会有内存泄漏的风险 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + int32_t uninit(); + + /** + * 重置函数 + * 作用: 清空内部缓存 + * 注意: 一般是在输入数据发生变化(比如播放音乐的seek操作)之后,使用该函数 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + int32_t reset(); + + /** + * 获取本系统的延迟时间(ms) + * 作用: 获取延迟时间 + * 注意: 在内部音效切换或者叠加时有可能引发音效延迟改变 + * @return 返回延迟时间(ms) + */ + int get_latency_ms(); + + /** + * 音效的添加修改或者删除 + * 作用: 系统中音效状态控制[增删改] + * 注意: 选择需要的音效添加即可[具体删除和修改参见combine_group] + * @param ae_type AE_TYPE + * @param params 根据AE_TYPE 选择具体结构体 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + int32_t set_params(AE_TYPE ae_type, void* params); + + /** + * 音效参数的获取 + * 作用: 获取目前已经在效果链上的给定音效的参数 + * 注意: 如果给定的音效不在效果链上,那么返回值不可信 + * @param ae_type AE_TYPE + * @param params 根据AE_TYPE 选择具体结构体 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + int32_t get_params(AE_TYPE ae_type, void* params); + + /** + * 处理函数 + * 作用: 音效系统主处理函数 + * 注意: in_buf和out_buf可以是同一块buf[建议不是同一块,防止之后添加新效果,新效果有此要求] + * in_buf 和 out_buf 必须一致,且长度为length + * 输入和输出是一致的 + * @param in_buf + * @param out_buf + * @param length buf长度 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + int32_t process(float* in_buf, float* out_buf, int length); + + /** + * 绑定音效组[每次输入需要绑定的一组音效] + * 作用: 将不同的音效绑定成为一组,同一组内的音效不能共存,不同组的音效可以叠加,同一个音效无法在多个组 + * 注意: 在init函数中已经根据Android App进行了一次预先绑定,需要的时候可以直接在init函数中修改 + * Tips: 通过在每一组中增加了一个None音效保证可以删除本组音效 + * @param ae_types + * @param size + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + int32_t combine_group(AE_TYPE* ae_types, int size); + +private: + + /** + * 获取外部音效类型与内部音效类型结构的转换函数[不对外暴露] + * 作用: 转化外部与内部结构 + * 注意: 新增音效时需要增加对应关系 + * @param ae_type + * @param ae_params + * @param ae_effect_type + * @param ret_params 内部创建空间(因为外部不知道具体类型) + * @return 0 表示正常 + */ + int32_t get_ae_effect_params(AE_TYPE ae_type,void* ae_params, AE_EFFECT_TYPE & ae_effect_type, void*& ret); + + + /** + * 根据外部输入的音频地址读取数据并进行处理 + * 1. 进行重采样 + * 2. 
+
+
+    /**
+     * Reads and prepares the audio at the externally supplied path:
+     * 1. resampling
+     * 2. channel-count conversion
+     * @param params AE_PARAMS_IM_EFFECT*, Impulse_Param* (out)
+     * @return 0 on success
+     */
+    int32_t get_im_params_by_ffmpeg(void* params, Impulse_Param* new_param);
+private:
+    void* m_chain;                                          // effect-chain instance
+    std::map<AE_TYPE, void*> m_ae2inst_map;                 // maps an effect type to its effect instance
+    std::map<AE_TYPE, int> m_ae2group_id;                   // group id each effect type belongs to
+    std::vector<void*> m_ae_group;                          // at most one effect per group is active, so storing one is enough
+    int32_t m_sample_rate;                                  // sampling rate
+    int32_t m_channel;                                      // channel count
+    int32_t m_buffer_size;                                  // per-channel length of each processed block
+    std::map<std::string, Impulse_Param*> m_im_path2params; // cached parameters for each local IM effect file
+};
+
+#endif //AUDIO_EFFECTS_LIB_CAESERVER_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/effect_im_tool.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/effect_im_tool.cpp
new file mode 100644
index 0000000..578e8e5
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/effect_im_tool.cpp
@@ -0,0 +1,72 @@
+//
+// Created by yangjianli on 2023/2/16.
+//
+
+#include "waves/inc/STWaveFile.h"
+#include "CAudioEffectsChainApi.h"
+#include "string"
+#include "ae_server/CAeServer.h"
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <math.h>
+#include <sys/time.h>
+void cae_server_float_im(std::string in_file, std::string effect_file, std::string out_file)
+{
+    STCWaveFile oWaveFile = STCWaveFile(in_file.c_str(), false);
+    int length = oWaveFile.GetTotalFrames() * oWaveFile.GetChannels();
+    int sample_rate = oWaveFile.GetSampleRate();
+    int channel = oWaveFile.GetChannels();
+    float* in_buf = new float[length];
+    oWaveFile.ReadFrameAsfloat(in_buf, oWaveFile.GetTotalFrames());
+
+    // Processing logic
+    int32_t process_buffer_len = 2048;
+    CAeServer cAeServer;
+    cAeServer.init(sample_rate, channel, process_buffer_len);
+
+    AE_PARAMS_IM_EFFECT im_params = {
+            .effect_path = effect_file,
+    };
+    int ret = cAeServer.set_params(AE_TYPE_IM_EFFECT, (void*) &im_params);
+    printf("set params: %d\n", ret);
+    int step = process_buffer_len * channel;
+
+    struct timeval start;
+    struct timeval end;
+    gettimeofday(&start, NULL);
+    for(int i=0,frame=0;i<length;i+=step,frame++)
+    {
+        if (i + step > length) step = length - i;
+        cAeServer.process(in_buf + i, in_buf + i, step);
+    }
+
+    cAeServer.get_params(AE_TYPE_IM_EFFECT, (void*)&im_params);
+    gettimeofday(&end, NULL);
+    printf("Out====>%s, %f latency=%d\n", im_params.effect_path.c_str(), (end.tv_sec - start.tv_sec) * 1000.0 + (end.tv_usec - start.tv_usec) / 1000.0, cAeServer.get_latency_ms());
+    cAeServer.uninit();
+
+    // Save the result
+    STCWaveFile out_file_inst = STCWaveFile(out_file.c_str(), true);
+    out_file_inst.SetSampleRate(sample_rate);
+    out_file_inst.SetSampleFormat(SF_IEEE_FLOAT);
+    out_file_inst.SetChannels(channel);
+    out_file_inst.SetupDone();
+    out_file_inst.WriteFrame(in_buf, length / 2);
+}
+
+int main(int argc, char* argv[])
+{
+
+    if(argc != 4)
+    {
+        printf("input err! ./main s_audio_path s_audio_im_path s_audio_out\n");
+        return -1;
+    }
+
+    std::string sAudio = argv[1];
+    std::string sAudioIm = argv[2];
+    std::string sAudioOut = argv[3];
+    cae_server_float_im(sAudio, sAudioIm, sAudioOut);
+    return 0;
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/main.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/main.cpp
new file mode 100644
index 0000000..728664b
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/example/main.cpp
@@ -0,0 +1,674 @@
+//
+// Created by yangjianli on 2020-01-09.
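+// Test driver for the effects library: each function below loads a wav, converts
+// the short samples to float, runs one effect (EQ presets, autotune, reverb,
+// phonograph, slow flanging, tone shift, AL reverb, SAE presets, impulse
+// responses, or a whole chain) block by block, and converts back.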
+// + +#include "CAudioEffectsChainApi.h" +#include "iir_eq/inc/CAudaciousEqApi.h" +#include "waves/inc/STWaveFile.h" +#include "string" +#include "saudio_effects/inc/SAudioEffectsApi.h" +#include "autotune/inc/ATndkWrapper.h" +#include "reverb/inc/CReverb.h" +#include "al_reverb/inc/AlReverbApi.h" +#include "phonograph/inc/CPhonograph.h" +#include "slow_flanging/inc/CSlowFlanging.h" +#include "tone_shift/inc/CToneShift.h" +#include "tone_shift/inc/CSpeedShift.h" +#include "ae_server/CAeServer.h" +#include +#include +#include +#include +#include +#define STYLES_LEN 25 +static const float STYLES[STYLES_LEN][10] = { + {4,2,0,-3,-6,-6,-3,0,1,3}, // pop 0 + {7,6,3,0,0,-4,-6,-6,0,0}, // dance 1 + {3,6,8,3,-2,0,4,7,9,10}, // blues 2 + {0,0,0,0,0,0,-6,-6,-6,-8}, // classic 3 + {0,0,1,4,4,4,0,1,3,3}, // jazz 4 + {5,4,2,0,-2,0,3,6,7,8}, // slow 5 + {6,5,0,-5,-4,0,6,8,8,7}, // electronica 6 + {7,4,-4,7,-2,1,5,7,9,9}, // rock 7 + {5,6,2,-5,1,1,-5,3,8,5}, // country 8 + {-2,-1,-1,0,3,4,3,0,0,1},// voice 9 + {5.8,5.8,3,0,-1.5,-1.5,0,0,0,0},//低音 10 + {13.8,12.6,6.3,0,-1.5,-1.5,0,0,0,0},//超重低音 11 + {5.8,5.8,3,0,-1.5,-1.5,0,1.5,5.8,5.8},//低音&高音 12 + {-3,-3,-3,-3,-1.5,-1.5,0,6.3,9.6,12.3},//高音 13 + {0,0,0,0,0,0,-3,-3,-3,-4.5},//经典 14 + {5.8,3.2,2.1,0,0,-2.7,-2,-2.2,-0.6,-0.1},//舞曲 15 + {5.8,3.2,1.3,-3,-2.3,2.2,3.6,5.8,5.8,5.8},//摇滚 16 + {5.8,5.8,0,-2.9,-2.1,0,3.6,7.4,7.7,7.5},//电子 17 + {-2.9,-2.9,2.5,3.6,4.8,4.7,6,6,3,3},//扬声器(响亮) 18 + {-4.5,-3.8,2.2,2.2,2.2,2.2,2.1,1.5,1.5,1.5},//现场 19 + {-4.5,-4.5,-1.5,-1.5,4.5,4.5,1.5,0,-4.5,-6},//中音 20 + {1.5,4.5,5.8,3,1.5,0,0,0,1.5,3},//流行 21 + {5.5,2.5,0.9,-2.6,-5,-10.6,-12.4,-13.3,-10.6,-6.7},//柔和 22 + {3,3,3,0,-3,-3,0,0,0,0},//柔和低音 23 + {0,0,-4.5,-4.5,-4.5,-4.5,-3,0,4.5,4.5},//柔和高音 24 +}; +#define MAX_IM_NUMS 9 +Impulse_Param impulseParam[MAX_IM_NUMS]; +std::string paths[MAX_IM_NUMS] = { + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/responses/impulse/2f82_l.wav", + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/responses/impulse/36af_l.wav", + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/responses/impulse/43e7.wav", + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/responses/impulse/4d11_l.wav", + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/responses/impulse/8da7_l.wav", + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/responses/impulse/b7c9.wav", + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/responses/impulse/c2e6.wav", + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/responses/impulse/d8d3_l.wav", + "/Users/yangjianli/starmaker-work/research/qh_code/av_tools/audio_effects/ImpluseEffecLibs/supersound/resource/impluse_test_2.wav", +}; + +void get_params() +{ + for(int i=0;iGetTotalFrames() * cWaveFile->GetChannels(); + float* response = new float[nLength]; + cWaveFile->ReadFrameAsfloat(response, nLength); + + impulseParam[i] = Impulse_Param(); + impulseParam[i].in_channels = 2; + impulseParam[i].out_channels = 2; + impulseParam[i].fs = 44100; + impulseParam[i].im_response = response; + impulseParam[i].response_len = nLength / cWaveFile->GetChannels(); + impulseParam[i].response_channels = cWaveFile->GetChannels(); + impulseParam[i].window_bits = 10; // 代表了单声道的BufferSize + + delete cWaveFile; + } +} + +void 
eq(short* pInBuf, int nLength, int nSampleRate, int nChannel) +{ + + CAudaciousEqApi eqApi; + eqApi.init(nSampleRate, nChannel); + eqApi.set_param(0); + + float* buf = new float[nLength]; + for(int i=0;i nLength) nStep = nLength - i; + if(nCnt % 100 == 0) + { + eqApi.reset(); + eqApi.set_param(nCnt % 26); + } + eqApi.process(buf + i, buf + i, nStep); + for(int j=0;jinit(nSampleRate, nChannel); + int nStep = 512 * nChannel; + for(int i=0, nCnt = 0;i nLength) nStep = nLength - i; + autotune->process(buf+i, buf+i, nStep, 0); + for(int j=0;juninit(); + delete autotune; + delete[] buf; +} + +void reverb(short* pInBuf, int nLength, int nSampleRate, int nChannel) +{ + float* buf = new float[nLength]; + for(int i=0;iinit(nSampleRate, nChannel); +// cReverb->set_type_id(KALA_VB_ID_11); + AE_PARAMS_REVERB rb = gs_ae_params_reverb_params[AE_PARAMS_TYPE_REVERB_ID_18 - AE_PARAMS_TYPE_RERVERB]; + rb.room_size = 0.8; + rb.wet = 0.8 / 3; + cReverb->set_params(&rb); + int nStep = 512 * nChannel; + for(int i=0, nCnt = 0;i nLength) nStep = nLength - i; +// printf("%d\n", nStep); + cReverb->process(buf + i, nStep, buf + i, nStep); + for(int j=0;juninit(); + delete cReverb; +} + +void phonograph(short* pInBuf, int nLength, int nSampleRate, int nChannel) +{ + float* buf = new float[nLength]; + for(int i=0;iinit(nSampleRate, nChannel); + int nStep = 512 * nChannel; + for(int i=0, nCnt = 0;i nLength) nStep = nLength - i; + printf("%d\n", nStep); + cReverb->process(buf + i, nStep); + for(int j=0;juninit(); + delete cReverb; +} + +void slow_flanging(short* pInBuf, int nLength, int nSampleRate, int nChannel) +{ + float* buf = new float[nLength]; + for(int i=0;iinit(nChannel, nSampleRate); + int nStep = 512 * nChannel; + for(int i=0, nCnt = 0;i nLength) nStep = nLength - i; + printf("%d\n", nStep); + cReverb->process(buf + i, buf + i, nStep); + for(int j=0;juninit(); + delete cReverb; +} + +void sound_touch(short* pInBuf, int nLength, int nSampleRate, int nChannel) +{ + float* buf = new float[nLength]; + float* buf_out = new float[nLength]; + for(int i=0;iinit(nSampleRate, nChannel); + cReverb->set_shift_value(2); + cReverb->reset(); + int nStep = 512 * nChannel; + for(int i=0, nCnt = 0;i nLength) nStep = nLength - i; + int ret = cReverb->process(buf + i, nStep, buf + i, nStep); + printf("%d %d\n", nStep, ret); + for(int j=0;juninit(); + delete cReverb; + delete[] buf; + delete[] buf_out; +} + +void al_reverb(short* pInBuf, int nLength, int nSampleRate, int nChannel) +{ + float* buf = new float[nLength]; + for(int i=0;iinit(nSampleRate,nChannel, 0); + AE_PARAMS_AL_REVERB aeParamsAlReverb = + gs_ae_params_al_reverbs[AE_PARAMS_TYPE_AL_REVERB_DIZZY_NEW - AE_PARAMS_TYPE_AL_REVERB]; +// cReverb->set_type_id(KALA_VB_ID_11); + cReverb->set_param(&aeParamsAlReverb); + int nStep = 512 * nChannel; + for(int i=0, nCnt = 0;i nLength) nStep = nLength - i; + printf("%d\n", nStep); + cReverb->process(buf+i, nStep); + for(int j=0;juninit(); + delete cReverb; +} + +//void sm_audio_effects_single(short* pInBuf, int nLength, int nSampleRate, int nChannel) +//{ +// AE_EFFECT_TYPE type = AE_EFFECT_TYPE_TONE_SHIFT; +// +// void* p = ae_create_object(); +// AE_EFFECT_TYPE tps[] = {type}; +// AE_PARAMS_TONE_SHIFT rb = { +// .shift_value = 2 +// }; +// +// ae_init(p,tps,1, nSampleRate, nChannel); +// ae_set_params(p, type, (AE_PARAMS*) (&rb)); +// float* buf = new float[nLength]; +// float* buf_out = new float[nLength]; +// for(int i=0;i nLength) nStep = nLength - i; +// if(nCnt % 500 == 0) +// { +// if(b_on) +// { +// b_on = false; +//// 
delete_effect(p, type); +// ae_set_params(p, type, nullptr); +// }else +// { +// b_on = true; +// int t = nLength / nStep * 12; +// rb.shift_value = t; +// ae_set_params(p, type, (AE_PARAMS*)&rb); +// } +// } +// ae_process(p, buf+i, buf_out+i, nStep); +// for(int j=0;jinit(nSampleRate, nChannel); + + float* buf = new float[nLength]; + for(int i=0;i nLength) nStep = nLength - i; + if(nCnt % 100 == 0) + { + if(type == AE_PARAMS_TYPE_SAE_POP) + { + type = AE_PARAMS_TYPE_SAE_STUDIO; + }else if(type == AE_PARAMS_TYPE_SAE_STUDIO) + { + type = AE_PARAMS_TYPE_SAE_POP; + } + const AE_PARAMS_SAE* saudio_effect_params = + &gs_sae_params[type - AE_PARAMS_TYPE_SAE]; + sAudioEffectsApi->set_audio_effect((AE_PARAMS*) saudio_effect_params); + } + sAudioEffectsApi->process(buf + i, buf + i, nStep); + for(int j=0;juninit(); + delete sAudioEffectsApi; + delete[] buf; +} + +void chain(short* in_buf, int length, int sample_rate, int channel) +{ + // 转换short->float + float* buf = new float[length]; + for(int i=0;i length) step = length - i; + if(frame == 400) + { + effects[elen++] = ae_add_effect(chain, AE_EFFECT_TYPE_AUTOTUNE); + ae_set_params(chain, effects[elen - 1], nullptr); + }else if(frame == 800) + { + effects[elen++] = ae_add_effect(chain, AE_EFFECT_TYPE_EQ); + ae_set_params(chain, effects[elen - 1], nullptr); + ae_delete_effect(chain, effects[0]); + } else if(frame == 1200) + { + AE_PARAMS_EQ params_eq; + memcpy(params_eq.params, STYLES[11], sizeof(float)*10); + ae_set_params(chain, effects[elen - 1], (AE_PARAMS *) ¶ms_eq); + } else if(frame == 1400) + { + effects[elen++] = ae_add_effect(chain, AE_EFFECT_TYPE_EQ); + AE_PARAMS_EQ params_eq; + memcpy(params_eq.params, STYLES[13], sizeof(float)*10); + ae_set_params(chain, effects[elen - 1], (AE_PARAMS *) ¶ms_eq); + } + ae_process(chain, buf + i, buf + i, step); + } + ae_destory_object(chain); + + // 转换float->short + for(int i=0;i length) nStep = length - i; +// if(nCnt % 400 == 0) +// { +// if(nCC % nums == nums - 1) +// { +// AE_PARAMS* tp = NULL; +//// set_params(p, AE_TYPE_EQ,tp); +// ae_set_params(p, AE_EFFECT_TYPE_AL_REVERB, tp); +//// delete_effect(p, AE_TYPE_SAE); +// +// }else +// { +//// memcpy(audioEffectsEqParams.params, STYLES[nCnt % 26], +//// sizeof(float) * 10); +//// set_params(p, AE_TYPE_EQ, +//// (AE_PARAMS*)&audioEffectsEqParams); +// const AE_PARAMS_AL_REVERB* saudio_effect_params = +// &gs_ae_params_al_reverbs[(AE_EFFECT_TYPE_AL_REVERB + nCC % nums) - AE_EFFECT_TYPE_AL_REVERB]; +// ae_set_params(p, AE_EFFECT_TYPE_AL_REVERB, (AE_PARAMS*)saudio_effect_params); +// } +// nCC++; +// } +// ae_process(p, buf + i, buf + i, nStep); +// for(int j=0;j length) nStep = length - i; +// if(nCnt % 400 == 0) +// { +// if(nCC % nums == nums - 1) +// { +// AE_PARAMS* tp = NULL; +// ae_set_params(p, AE_EFFECT_TYPE_AL_REVERB, tp); +// +// }else +// { +// const AE_PARAMS_AL_REVERB* saudio_effect_params = +// &gs_ae_params_al_reverbs[(AE_EFFECT_TYPE_AL_REVERB + nCC % nums) - AE_EFFECT_TYPE_AL_REVERB]; +// ae_set_params(p, AE_EFFECT_TYPE_AL_REVERB, (AE_PARAMS*)saudio_effect_params); +// } +// +// +// if(nCC % nums == 0) +// { +// // EQ +// AE_PARAMS_EQ eq; +// memcpy(eq.params, STYLES[2], sizeof(float) * 10); +// ae_set_params(p, AE_EFFECT_TYPE_EQ, (AE_PARAMS*) &eq); +// }else +// if(nCC % nums == 1) +// { +// ae_set_params(p, AE_EFFECT_TYPE_PHONOGRAPH, nullptr); +// }else if(nCC % nums == 2) +// { +// ae_set_params(p, AE_EFFECT_TYPE_AUTOTUNE, nullptr); +// } +// nCC++; +// } +// ae_process(p, buf + i, buf + i, nStep); +// for(int j=0;jfloat + float* buf 
= new float[length]; + for(int i=0;i length) step = length - i; + cAeServer.process(buf + i, buf + i, step); + fwrite(buf+i, sizeof(float) * step, 1, file); + } + + cAeServer.uninit(); + // 转换float->short + for(int i=0;i length) step = length - i; +// if (800 * 5 == frame) +// { +// im_params.effect_path = cd_string; +// cAeServer.set_params(AE_TYPE_IM_EFFECT, (void*) &im_params); +// } +// +// if (frame == 400 * 5) +// { +// im_params.effect_path = studio_string; +// cAeServer.set_params(AE_TYPE_IM_EFFECT, (void*) &im_params); +// } + cAeServer.process(in_buf + i, in_buf + i, step); + } + + im_params.effect_path = "dsdsd"; + cAeServer.get_params(AE_TYPE_IM_EFFECT, (void*)&im_params); + gettimeofday(&end, NULL); + printf("Out====>%s, %f latency=%d\n", im_params.effect_path.c_str(), (end.tv_sec - start.tv_sec) * 1000.0 + (end.tv_usec - start.tv_usec) / 1000.0, cAeServer.get_latency_ms()); + cAeServer.uninit(); + + // 保存起来 + STCWaveFile out_file_inst = STCWaveFile(out_file, true); + out_file_inst.SetSampleRate(sample_rate); + out_file_inst.SetSampleFormat(SF_IEEE_FLOAT); + out_file_inst.SetChannels(channel); + out_file_inst.SetupDone(); + out_file_inst.WriteFrame(in_buf, length / 2); +} + +void cae_server_float_im(std::string in_file, std::string effect_file, std::string out_file) +{ + STCWaveFile oWaveFile = STCWaveFile(in_file.c_str(), false); + int length = oWaveFile.GetTotalFrames() * oWaveFile.GetChannels(); + int sample_rate = oWaveFile.GetSampleRate(); + int channel = oWaveFile.GetChannels(); + float* in_buf = new float[length]; + oWaveFile.ReadFrameAsfloat(in_buf, oWaveFile.GetTotalFrames()); + + // 处理逻辑 + int32_t process_buffer_len = 2048; + CAeServer cAeServer; + cAeServer.init(sample_rate, channel, process_buffer_len); + + AE_PARAMS_IM_EFFECT im_params = { + .effect_path = effect_file, + }; + int ret = cAeServer.set_params(AE_TYPE_IM_EFFECT, (void*) &im_params); + printf("set params: %d\n", ret); + int step = process_buffer_len * channel; + + struct timeval start; + struct timeval end; + gettimeofday(&start, NULL); + for(int i=0,frame=0;i length) step = length - i; + cAeServer.process(in_buf + i, in_buf + i, step); + } + + cAeServer.get_params(AE_TYPE_IM_EFFECT, (void*)&im_params); + gettimeofday(&end, NULL); + printf("Out====>%s, %f latency=%d\n", im_params.effect_path.c_str(), (end.tv_sec - start.tv_sec) * 1000.0 + (end.tv_usec - start.tv_usec) / 1000.0, cAeServer.get_latency_ms()); + cAeServer.uninit(); + + // 保存起来 + STCWaveFile out_file_inst = STCWaveFile(out_file.c_str(), true); + out_file_inst.SetSampleRate(sample_rate); + out_file_inst.SetSampleFormat(SF_IEEE_FLOAT); + out_file_inst.SetChannels(channel); + out_file_inst.SetupDone(); + out_file_inst.WriteFrame(in_buf, length / 2); +} +int main(int argc, char* argv[]) +{ + + if(argc != 2) + { + printf("input err! ./main s_audio_path\n"); + return -1; + } + + std::string sAudio = argv[1]; + std::string sAudioIm = argv[2]; + std::string sAudioOut = argv[3]; + cae_server_float_im(sAudio, sAudioIm, sAudioOut); + return 0; +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/AudioEffectsConf.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/AudioEffectsConf.h new file mode 100644 index 0000000..2668156 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/AudioEffectsConf.h @@ -0,0 +1,112 @@ +// +// Created by yangjianli on 2020/10/27. 
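+// When AE_CONFUSE_CODE is defined, every public class name below is rewritten
+// through AE_NEW_NAME into an obfuscated symbol by token pasting, e.g.:
+//   #define AE_NEW_NAME(NAME) AE_ ## NAME
+//   #define AlReverb AE_NEW_NAME(C_ALR_30001)   // AlReverb -> AE_C_ALR_30001
+// presumably so that release binaries do not expose readable effect-class names.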
+// + +#ifndef AUDIO_EFFECTS_LIB_AUDIOEFFECTSCONF_H +#define AUDIO_EFFECTS_LIB_AUDIOEFFECTSCONF_H +#include +#include +//#define AE_CONFUSE_CODE +#ifdef AE_CONFUSE_CODE + #define AE_NEW_NAME(NAME) AE_ ## NAME + + // AlReverb + #define AlReverb AE_NEW_NAME(C_ALR_30001) + #define AlReverbApi AE_NEW_NAME(C_ALRA_30002) + #define AlReverbBiquad AE_NEW_NAME(C_ALRB_30003) + #define AlReverbBiquad AE_NEW_NAME(C_ALRB_30003) + #define AlReverbEarlyReflection AE_NEW_NAME(C_ALRER_30004) + #define AlReverbEcho AE_NEW_NAME(C_ALRE_30005) + #define AlReverbLateAllpass AE_NEW_NAME(C_ALRLA_30006) + #define AlReverbLateLowpass AE_NEW_NAME(C_ALRLL_30007) + #define AlReverbLateReverb AE_NEW_NAME(C_ALRLR_30008) + #define AlReverbModulation AE_NEW_NAME(C_ALRM_30009) + #define SuperSoundFastDelay AE_NEW_NAME(C_SSFD_30010) + #define CFilters AE_NEW_NAME(C_CF_30011) + + // autotune + #define CATndkWrapper AE_NEW_NAME(C_ATW_40001) + #define CAutoTuneWrapper AE_NEW_NAME(C_ATW_40002) + #define CAutoTune AE_NEW_NAME(C_AT_40003) + + // common + #define APFilter AE_NEW_NAME(C_APF_50001) + #define CBaseFilter AE_NEW_NAME(C_F_50002) + #define LPFilter AE_NEW_NAME(C_LPF_50003) + #define HPFilter AE_NEW_NAME(C_LPF_50004) + #define BPFilter AE_NEW_NAME(C_LPF_50005) + #define NTFilter AE_NEW_NAME(C_NTF_50006) + #define LSFilter AE_NEW_NAME(C_LSF_50007) + #define HSFilter AE_NEW_NAME(C_HSF_50008) + #define PKFilter AE_NEW_NAME(C_PKF_50009) + #define APFilter AE_NEW_NAME(C_APF_50010) + + // iir_eq + #define CAudaciousEq AE_NEW_NAME(C_AEQ_60000) + #define CAudaciousEqApi AE_NEW_NAME(C_AEQA_60001) + #define CAudaciousArma AE_NEW_NAME(C_AEQA_60002) + + // phonograph + #define CPhonograph AE_NEW_NAME(C_CPG_70000) + #define CPhonographFilters AE_NEW_NAME(C_CPGF_70001) + + // CReverb + #define CReverb AE_NEW_NAME(C_CRB_80001) + #define allpass AE_NEW_NAME(C_AP_80002) + #define comb AE_NEW_NAME(C_CB_80003) + #define revmodel AE_NEW_NAME(C_RM_80004) + + // Equalizer + #define Equalizer AE_NEW_NAME(C_EQ_90001) + #define SimpleDelayEffect AE_NEW_NAME(C_SDE_90002) + #define SimpleReverbEffect AE_NEW_NAME(C_SRE_90003) + #define SAudioEffectsApi AE_NEW_NAME(C_SEA_90004) + #define Allplat AE_NEW_NAME(C_AP_90005) + #define Parameter AE_NEW_NAME(C_PM_90006) + #define MidiContext AE_NEW_NAME(C_MC_90007) + #define FXConfigInfo AE_NEW_NAME(C_FCI_90008) + #define AudioEffect AE_NEW_NAME(C_AE_90009) + #define Biquad AE_NEW_NAME(C_BQ_90010) + #define Buffer AE_NEW_NAME(C_BF_90011) + #define Damper AE_NEW_NAME(C_DP_90012) + #define Delay AE_NEW_NAME(C_DL_90013) + #define DelayI AE_NEW_NAME(C_DLI_90014) + #define EnvelopeFollower AE_NEW_NAME(C_EF_90015) + #define Reverb AE_NEW_NAME(C_RB_90016) + + // CSlowFlanging + #define CSlowFlanging AE_NEW_NAME(C_CSF_100000) + + // ToneShift + #define CToneShift AE_NEW_NAME(C_CTS_110000) + #define ToneShiftInterface AE_NEW_NAME(C_TSI_110001) + #define CSpeedShift AE_NEW_NAME(C_CSS_110002) + #define SpeedShiftInterface AE_NEW_NAME(C_SSI_110003) + + // src + #define IAudioEffects AE_NEW_NAME(C_IAE_120000) + #define CAudioAlReverb AE_NEW_NAME(C_CAALR_120001) + #define CAudioAlReverbCreator AE_NEW_NAME(C_CAALRC_120002) + #define CAudioAutoTune AE_NEW_NAME(C_IAE_120003) + #define CAudioAutoTuneCreator AE_NEW_NAME(C_IAEC_120004) + #define CAudioEffectsChain AE_NEW_NAME(C_IAEC_120005) + #define CAudioEqApi AE_NEW_NAME(C_CAEQA_120006) + #define CEqApiCreator AE_NEW_NAME(C_CAEQAC_120007) + #define CAudioPhonograph AE_NEW_NAME(C_CAPG_120008) + #define CAudioPhonographCreator AE_NEW_NAME(C_CAPGC_120009) + #define 
CAudioReverbApi AE_NEW_NAME(C_CARA_120010) + #define CAudioReverbApiCreator AE_NEW_NAME(C_CARAC_120011) + #define CAudioSAudioEffectsApi AE_NEW_NAME(C_CASAEA_120012) + #define CAudioSAudioEffectsCreator AE_NEW_NAME(C_CASAEAC_120013) + #define CAudioSlowFlanging AE_NEW_NAME(C_CASF_120014) + #define CAudioSlowFlangingCreator AE_NEW_NAME(C_CASFC_120015) + #define CAudioSmoothWrapper AE_NEW_NAME(C_CASW_120016) + #define CAudioToneShift AE_NEW_NAME(C_CATS_120017) + #define CKeepVolumeSteady AE_NEW_NAME(C_CKVS_120018) + #define ICreator AE_NEW_NAME(C_IC_120019) + + // ae_server + #define CAeServer AE_NEW_NAME(C_CAS_130000) + +#endif +#endif //AUDIO_EFFECTS_LIB_AUDIOEFFECTSCONF_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/AudioEffectsDef.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/AudioEffectsDef.h new file mode 100644 index 0000000..c8ade5f --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/AudioEffectsDef.h @@ -0,0 +1,97 @@ +// +// Created by yangjianli on 2020-01-09. +// + +#ifndef AUDIO_EFFECTS_LIB_AUDIOEFFECTSDEF_H +#define AUDIO_EFFECTS_LIB_AUDIOEFFECTSDEF_H + +#include "AudioEffectsConf.h" +#include "SAudioEffectsParams.h" +#include "CReverbParams.h" +#include "CAlReverbParams.h" +#include "CImEffectParams.h" +#include "ae_defs.h" + +// 效果器类型 +enum AE_EFFECT_TYPE +{ + AE_EFFECT_TYPE_NONE = 0, // 无效果 + AE_EFFECT_TYPE_EQ = 1, + AE_EFFECT_TYPE_SAE = 10000, // 使用自定义参数 + AE_EFFECT_TYPE_AUTOTUNE = 20000, + AE_EFFECT_TYPE_REVERB, + AE_EFFECT_TYPE_AL_REVERB = 30000, + AE_EFFECT_TYPE_PHONOGRAPH = 40000, + AE_EFFECT_TYPE_SLOWFLANGING, // AE_TYPE_DIZZY + AE_EFFECT_TYPE_TONE_SHIFT, + AE_EFFECT_TYPE_IM_EFFECT, +}; + +// 参数预定义类型 +enum AE_PARAMS_TYPE +{ + // SAE + AE_PARAMS_TYPE_SAE = AE_EFFECT_TYPE::AE_EFFECT_TYPE_SAE + 1, + AE_PARAMS_TYPE_SAE_POP = AE_PARAMS_TYPE_SAE, + AE_PARAMS_TYPE_SAE_STUDIO, + + AE_PARAMS_TYPE_RERVERB = AE_EFFECT_TYPE::AE_EFFECT_TYPE_REVERB + 1, // 使用自定义参数 + AE_PARAMS_TYPE_REVERB_RECORD_STUDIO = AE_PARAMS_TYPE_RERVERB, + AE_PARAMS_TYPE_REVERB_KTV, + AE_PARAMS_TYPE_REVERB_CONCERT, + AE_PARAMS_TYPE_REVERB_THEATER, + AE_PARAMS_TYPE_REVERB_NEW_KTV, + AE_PARAMS_TYPE_REVERB_NEW_CONCERT, // AE_TYPE_NEW_DISTANT + AE_PARAMS_TYPE_REVERB_NEW_THEATER, + AE_PARAMS_TYPE_REVERB_ID_7, + AE_PARAMS_TYPE_REVERB_ID_8, + AE_PARAMS_TYPE_REVERB_ID_9, + AE_PARAMS_TYPE_REVERB_ID_10, + AE_PARAMS_TYPE_REVERB_ID_11, // AE_TYPE_KTV + AE_PARAMS_TYPE_REVERB_ID_12, + AE_PARAMS_TYPE_REVERB_ID_13, + AE_PARAMS_TYPE_REVERB_ID_14, + AE_PARAMS_TYPE_REVERB_ID_15, // AE_TYPE_DISTANT + AE_PARAMS_TYPE_REVERB_ID_16, + AE_PARAMS_TYPE_REVERB_ID_17, + AE_PARAMS_TYPE_REVERB_ID_18, // AE_TYPE_KARAOKE/ [AE_TYPE_CUSTOM, 更新其wet和dry] + + AE_PARAMS_TYPE_AL_REVERB = AE_EFFECT_TYPE::AE_EFFECT_TYPE_AL_REVERB + 1, + AE_PARAMS_TYPE_AL_REVERB_GENERIC = AE_PARAMS_TYPE_AL_REVERB, + AE_PARAMS_TYPE_AL_REVERB_GENERIC_1, // AE_TYPE_MAGNETIC + AE_PARAMS_TYPE_AL_REVERB_CITY_STREETS, // AE_TYPE_WRAM + AE_PARAMS_TYPE_AL_REVERB_CASTLE_COURTYARD, // AE_TYPE_ETHEREAL + AE_PARAMS_TYPE_AL_REVERB_CASTLE_HALL, + AE_PARAMS_TYPE_AL_REVERB_DIZZY_NEW, + AE_PARAMS_TYPE_AL_REVERB_CASTLE_HALL_NEW, +}; + +// 错误码 +enum AE_ERR +{ + AE_ERR_SUCCESS = 0, + AE_ERR_NO_BUFFER = -1, + AE_ERR_NO_EFFECTS = -2, // 没有该音效[两个原因:1有可能没有进行静态链接库使用全符号链接,2:某音效没有做全局变量] + AE_ERR_NO_INIT = -3, // 没有做初始化 + AE_ERR_EFFECT_NOT_IN_CHAIN = -4, // 该效果器不在链上 + AE_ERR_PARAMS_ERR = -5, // 参数设置错误 +}; + +ST_AE_LIB_API struct AE_PARAMS +{ + +}; + +// EQ 参数结构 +ST_AE_LIB_API struct AE_PARAMS_EQ +{ + float params[10]; +}; + +ST_AE_LIB_API struct 
AE_PARAMS_TONE_SHIFT +{ + float shift_value; // [-12,12] + float max_value; + float min_value; +}; +#endif //AUDIO_EFFECTS_LIB_AUDIOEFFECTSDEF_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CAlReverbParams.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CAlReverbParams.h new file mode 100644 index 0000000..a1b648c --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CAlReverbParams.h @@ -0,0 +1,256 @@ +// +// Created by yangjianli on 2020-01-14. +// + +#ifndef AUDIO_EFFECTS_LIB_CALREVERBPARAMS_H +#define AUDIO_EFFECTS_LIB_CALREVERBPARAMS_H + +#include "ae_defs.h" + +//需要传入的参数 +ST_AE_LIB_API typedef struct AE_PARAMS_AL_REVERB +{ + //采样率,单位 hz + int32_t fs; + //输入声道数 + int32_t in_channels; + //输出声道数,需和输入通道相同 + int32_t out_channels; + //密度 + float density; + //衍射 + float diffusion; + //混响增益 + float reverbGain; + //高低切增益 + float lowpass_gain; + float highpass_gain; + //衰减时间 + float decay_time; + //高切截止比例 + float highpass_ratio; + float lowpass_ratio; + //前期反射和后期混响增益 + float early_gain; + float late_gain; + //高低切频率 + float lowpass_reference; + float highpass_reference; + //回声时间和回声深度 + float echo_time; + float echo_depth; + //调制时间和调制深度 + float modulation_time; + float modulation_depth; + //前期反射和后期混响时间 + float early_delay; + float late_delay; + //低通空气衰减增益 + float lowpass_air_absorption_gain; + //是否启用低切衰减限制 + int32_t b_decay_lowpass_limit; + // 是否进行滤波 + bool b_need_filter; +}; +ST_AE_LIB_API const AE_PARAMS_AL_REVERB gs_ae_params_al_reverb_generic = +{ + .fs = 0, + .in_channels = 0, + .out_channels = 0, + .density=1.000000, + .diffusion=1.000000, + .reverbGain=0.010000, + .lowpass_gain=1.000000, + .highpass_gain=0.891300, + .decay_time=1.490000, + .highpass_ratio=0.830000, + .lowpass_ratio=1.000000, + .early_gain=0.050000, + .late_gain=1.258900, + .lowpass_reference=250.000000, + .highpass_reference=5000.000000, + .echo_time=0.250000, + .echo_depth=0.000000, + .modulation_time=0.250000, + .modulation_depth=0.000000, + .early_delay=0.007000, + .late_delay=0.011000, + .lowpass_air_absorption_gain=0.994300, + .b_decay_lowpass_limit=1, + .b_need_filter = false +}; +ST_AE_LIB_API const AE_PARAMS_AL_REVERB gs_ae_params_al_reverb_generic_1 = +{ + .fs = 0, + .in_channels = 0, + .out_channels = 0, + .density=1.000000, + .diffusion=1.000000, + .reverbGain=0.10000, + .lowpass_gain=1.000000, + .highpass_gain=0.891300, + .decay_time=1.490000, + .highpass_ratio=0.830000, + .lowpass_ratio=1.000000, + .early_gain=0.050000, + .late_gain=1.258900, + .lowpass_reference=250.000000, + .highpass_reference=5000.000000, + .echo_time=0.250000, + .echo_depth=0.000000, + .modulation_time=0.250000, + .modulation_depth=0.000000, + .early_delay=0.007000, + .late_delay=0.011000, + .lowpass_air_absorption_gain=0.994300, + .b_decay_lowpass_limit=1, + .b_need_filter = false +}; +ST_AE_LIB_API const AE_PARAMS_AL_REVERB gs_ae_params_al_reverb_city_streets = +{ + .fs = 0, + .in_channels = 0, + .out_channels = 0, + .density=1.000000, + .diffusion=0.780000, + .reverbGain=0.100000, + .lowpass_gain=0.891300, + .highpass_gain=0.707900, + .decay_time=1.790000, + .highpass_ratio=1.120000, + .lowpass_ratio=0.910000, + .early_gain=0.281800, + .late_gain=0.199500, + .lowpass_reference=250.000000, + .highpass_reference=5000.000000, + .echo_time=0.250000, + .echo_depth=0.200000, + .modulation_time=0.250000, + .modulation_depth=0.000000, + .early_delay=0.046000, + .late_delay=0.028000, + .lowpass_air_absorption_gain=0.994300, + .b_decay_lowpass_limit=1, + .b_need_filter = true +}; + +ST_AE_LIB_API 
const AE_PARAMS_AL_REVERB gs_ae_params_al_reverb_castle_countryard = +{ + .fs = 0, + .in_channels = 0, + .out_channels = 0, + .density=1.000000, + .diffusion=0.420000, + .reverbGain=0.116200, + .lowpass_gain=0.199500, + .highpass_gain=0.446700, + .decay_time=2.130000, + .highpass_ratio=0.610000, + .lowpass_ratio=0.230000, + .early_gain=0.223900, + .late_gain=0.707900, + .lowpass_reference=250.000000, + .highpass_reference=5000.000000, + .echo_time=0.250000, + .echo_depth=0.370000, + .modulation_time=0.250000, + .modulation_depth=0.000000, + .early_delay=0.160000, + .late_delay=0.036000, + .lowpass_air_absorption_gain=0.994300, + .b_decay_lowpass_limit=0, + .b_need_filter = false +}; +ST_AE_LIB_API const AE_PARAMS_AL_REVERB gs_ae_params_al_reverb_hall = +{ + .fs = 0, + .in_channels = 0, + .out_channels = 0, + .density=1.000000, + .diffusion=0.810000, + .reverbGain=0.116200, + .lowpass_gain=0.177800, + .highpass_gain=0.281800, + .decay_time=7.540000, + .highpass_ratio=0.790000, + .lowpass_ratio=0.620000, + .early_gain=0.177800, + .late_gain=1.122000, + .lowpass_reference=139.500000, + .highpass_reference=5168.600098, + .echo_time=0.250000, + .echo_depth=0.500000, + .modulation_time=0.250000, + .modulation_depth=0.000000, + .early_delay=0.056000, + .late_delay=0.024000, + .lowpass_air_absorption_gain=0.994300, + .b_decay_lowpass_limit=1, + .b_need_filter = false +}; +ST_AE_LIB_API const AE_PARAMS_AL_REVERB gs_ae_params_al_reverb_new = +{ + .fs = 0, + .in_channels = 0, + .out_channels = 0, + .density=0.364500, + .diffusion=0.600000, + .reverbGain=0.100000, + .lowpass_gain=1.000000, + .highpass_gain=0.631000, + .decay_time=6.230000, + .highpass_ratio=0.560000, + .lowpass_ratio=1.000000, + .early_gain=0.139200, + .late_gain=0.493700, + .lowpass_reference=250.000000, + .highpass_reference=5000.000000, + .echo_time=0.850000, + .echo_depth=0.600000, + .modulation_time=0.810000, + .modulation_depth=0.310000, + .early_delay=0.020000, + .late_delay=0.030000, + .lowpass_air_absorption_gain=0.994300, + .b_decay_lowpass_limit=0, + .b_need_filter = false +}; +ST_AE_LIB_API const AE_PARAMS_AL_REVERB gs_ae_params_al_reverb_hall_new = +{ + .fs = 0, + .in_channels = 0, + .out_channels = 0, + .density=1.000000, + .diffusion=0.810000, + .reverbGain=0.116200, + .lowpass_gain=0.177800, + .highpass_gain=0.281800, + .decay_time=10.400000, + .highpass_ratio=0.790000, + .lowpass_ratio=0.620000, + .early_gain=0.177800, + .late_gain=1.122000, + .lowpass_reference=139.500000, + .highpass_reference=5168.600098, + .echo_time=0.250000, + .echo_depth=0.950000, + .modulation_time=0.250000, + .modulation_depth=0.000000, + .early_delay=0.056000, + .late_delay=0.024000, + .lowpass_air_absorption_gain=0.994300, + .b_decay_lowpass_limit=1, + .b_need_filter = false +}; + +ST_AE_LIB_API const AE_PARAMS_AL_REVERB gs_ae_params_al_reverbs[] = +{ + gs_ae_params_al_reverb_generic, + gs_ae_params_al_reverb_generic_1, + gs_ae_params_al_reverb_city_streets, + gs_ae_params_al_reverb_castle_countryard, + gs_ae_params_al_reverb_hall, + gs_ae_params_al_reverb_new, + gs_ae_params_al_reverb_hall_new +}; +#endif //AUDIO_EFFECTS_LIB_CALREVERBPARAMS_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CAudioEffectsChainApi.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CAudioEffectsChainApi.h new file mode 100644 index 0000000..02242a4 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CAudioEffectsChainApi.h @@ -0,0 +1,131 @@ +// +// Created by yangjianli on 2020-01-09. 
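+// Minimal call-order sketch, adapted from chain() in example/main.cpp
+// (error checks omitted; buffers are interleaved float, and in/out may alias,
+// though separate buffers are recommended per the notes below):
+//   void* chain = ae_create_object();
+//   ae_init(chain, 44100, 2);
+//   void* eq = ae_add_effect(chain, AE_EFFECT_TYPE_EQ);
+//   AE_PARAMS_EQ eq_params;                      // 10-band gain table
+//   memcpy(eq_params.params, STYLES[0], sizeof(float) * 10);
+//   ae_set_params(chain, eq, (AE_PARAMS*)&eq_params);
+//   ae_process(chain, buf, buf, buf_len);
+//   ae_delete_effect(chain, eq);
+//   ae_uninit(chain);
+//   ae_destory_object(chain);
+// STYLES here is the EQ preset table defined in example/main.cpp.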
+// + +#ifndef AUDIO_EFFECTS_LIB_CAUDIOEFFECTSCHAINAPI_H +#define AUDIO_EFFECTS_LIB_CAUDIOEFFECTSCHAINAPI_H +/** + * 音效效果链使用方式 + * ae_create_object -> ae_init() -> 各项操作 ->ae_uninit()->ae_destory_object + */ +#include "AudioEffectsDef.h" +#include "ae_defs.h" + +#ifdef __cplusplus +extern "C" +{ +#endif + + /** + * 创建类实例 + * @return 获取类实例 + */ + ST_AE_LIB_API void* ae_create_object(); + + /** + * 销毁类释放空间 + * @param p ae_create_object中创建出的类 + */ + ST_AE_LIB_API void ae_destory_object(void *p); + + + /** + * 初始化类 + * 作用: 初始化内部成员 + * 注意: 创建新类之后,必须进行init才可以进行其他操作 + * @param p ae_create_object中创建出的类 + * @param sample_rate 采样率 + * @param channel 通道数 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + ST_AE_LIB_API AE_ERR ae_init(void *p, int sample_rate, int channel); + + /** + * 逆初始化类 + * 作用: 销毁类内部成员,释放空间 + * 注意: destory_object之前必须进行uninit释放空间 + * @param p ae_create_object中创建出的类 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + ST_AE_LIB_API AE_ERR ae_uninit(void *p); + + /** + * 重置函数 + * 作用: 清空类内部缓存buffer + * 注意: 一般是在输入数据发生变化(比如播放音乐的seek操作)之后,使用该函数 + * @param p ae_create_object中创建出的类 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + ST_AE_LIB_API AE_ERR ae_reset(void *p); + + /** + * 获取本系统的延迟时间(ms) + * 作用: 获取延迟时间 + * 注意: 在内部音效切换或者叠加时有可能引发音效延迟改变 + * @param p ae_create_object中创建出的类 + * @return 返回延迟时间(ms) + */ + ST_AE_LIB_API int ae_get_latency_ms(void *p); + + /** + * 对效果链上的音效参数进行设置 + * 作用: 修改音效参数,设置音效参数 + * @param p 效果链实例 + * @param casw 音效实例 + * @param params 需要设置的参数结构体 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + ST_AE_LIB_API AE_ERR ae_set_params(void *p, void *casw, AE_PARAMS *params); + + /** + * 获取效果链上的效果器参数 + * 作用: 获取效果器参数 + * 注意: 外部需要创建好空间 + * @param p 效果链实例 + * @param casw 音效实例 + * @param params 获取出的效果器参数 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + ST_AE_LIB_API AE_ERR ae_get_params(void *p, void *casw, AE_PARAMS *params); + + /** + * 处理函数 + * 作用: 音效系统主处理函数 + * 注意: inbuf和out_buf可以是同一块buf[建议不是同一块,防止之后添加新效果,新效果有此要求] + * in_buf 和 out_buf 必须一致,且长度为length + * @param p 效果链实例 + * @param in_buf 输入buf + * @param out_buf 输出buf + * @param length buf长度 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + ST_AE_LIB_API AE_ERR ae_process(void *p, float *in_buf, float *out_buf, int length); + + /** + * 添加音效 + * 作用: 创建一个效果器并添加到效果链上 + * 注意: 如果创建成功会添加到效果链并返回效果器地址,如果没有,则返回一个空指针 + * @param p 效果链实例 + * @param effects_number 效果器类型 + * @return 效果器的地址/nullptr + */ + ST_AE_LIB_API void* ae_add_effect(void *p, AE_EFFECT_TYPE effects_number); + + /** + * 删除音效 + * 作用: 关闭效果链上的效果器 + * 注意: 本函数只是关闭了效果器,并没有真正将其从效果链上删除,会在process的过程中自动删除 + * @param p 效果链实例 + * @param casw 效果器实例 + * @return 返回值是AE_ERR AE_ERR_SUCCESS是正常返回 + */ + ST_AE_LIB_API AE_ERR ae_delete_effect(void *p, void *casw); + +#ifdef __cplusplus +} +#endif + + + + +#endif //AUDIO_EFFECTS_LIB_CAUDIOEFFECTSCHAINAPI_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CImEffectParams.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CImEffectParams.h new file mode 100644 index 0000000..96f1358 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CImEffectParams.h @@ -0,0 +1,62 @@ +// +// Created by yangjianli on 2022/9/8. 
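+// Typical use through CAeServer, a sketch based on example/effect_im_tool.cpp
+// (the IR path is illustrative):
+//   AE_PARAMS_IM_EFFECT im_params = {
+//       .effect_path = "responses/impulse/2f82_l.wav", // IR, same fs as input
+//       .high_performance = false,  // true is faster but adds algorithm latency
+//   };
+//   cAeServer.set_params(AE_TYPE_IM_EFFECT, (void*)&im_params);
+// The server expands effect_path into a full Impulse_Param (see
+// get_im_params_by_ffmpeg() and m_im_path2params in CAeServer.h).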
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CIMEFFECTPARAMS_H
+#define AUDIO_EFFECTS_LIB_CIMEFFECTPARAMS_H
+#include "ae_defs.h"
+#include <string>
+#include <cstdint>
+
+ST_AE_LIB_API typedef struct _Impulse_Param
+{
+    //采样率,单位 hz
+    // 外围保证处理时的音频的采样率和卷积的采样率一致
+    int32_t fs;
+    //输入声道数
+    // 处理音频的输入通道数和初始化的时候一致即可[内部会自动赋值]
+    int32_t in_channels;
+    // 处理音频的输出通道数和初始化的时候一致即可[内部会自动赋值]
+    //输出声道数,需和输入通道相同
+    int32_t out_channels;
+    // 直接给10,后续在内部会根据输入长度做调整
+    //FIR 窗 bit 长度,最小为 10
+    int32_t window_bits;
+    //im 响应,外围需要保证其采样率和输入的采样率一致
+    float* im_response;
+    //响应的长度
+    int32_t response_len;
+    //响应的通道数,该通道数必须与输入通道数相同或为1,为1时表示输入的所有通道使用相同的响应
+    int32_t response_channels;
+    // 每次处理时输入的音频的长度(单声道的长度),用于计算延迟
+    int32_t process_buffer_len;
+    // true则高性能计算,存在算法延迟
+    bool high_performance;
+    // 音频文件地址
+    std::string effect_path;
+} Impulse_Param;
+
+inline void copy_impluse_params(Impulse_Param* dst, Impulse_Param* src)
+{
+    dst->fs = src->fs;
+    dst->in_channels = src->in_channels;
+    dst->out_channels = src->out_channels;
+    dst->window_bits = src->window_bits;
+    // 只拷贝首地址,减少拷贝时的内存消耗
+    dst->im_response = src->im_response;
+    dst->response_len = src->response_len;
+    dst->high_performance = src->high_performance;
+    dst->response_channels = src->response_channels;
+    dst->process_buffer_len = src->process_buffer_len;
+    dst->effect_path = src->effect_path;
+}
+
+ST_AE_LIB_API struct AE_PARAMS_IM_EFFECT
+{
+    // 音效的地址
+    std::string effect_path;
+    // true则高性能计算,存在算法延迟
+    bool high_performance;
+};
+
+#endif //AUDIO_EFFECTS_LIB_CIMEFFECTPARAMS_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CReverbParams.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CReverbParams.h
new file mode 100644
index 0000000..f9748cd
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/CReverbParams.h
@@ -0,0 +1,214 @@
+//
+// Created by yangjianli on 2020-01-13.
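+// The presets below are indexed by AE_PARAMS_TYPE offset, and individual
+// fields may be tweaked before applying, e.g. (from reverb() in example/main.cpp):
+//   AE_PARAMS_REVERB rb =
+//       gs_ae_params_reverb_params[AE_PARAMS_TYPE_REVERB_ID_18 - AE_PARAMS_TYPE_RERVERB];
+//   rb.room_size = 0.8;
+//   rb.wet = 0.8 / 3;
+//   cReverb->set_params(&rb);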
+// + +#ifndef AUDIO_EFFECTS_LIB_CREVERBPARAMS_H +#define AUDIO_EFFECTS_LIB_CREVERBPARAMS_H + +#include "ae_defs.h" + +ST_AE_LIB_API struct AE_PARAMS_REVERB +{ + float mode; + float room_size; + float damp; + float wet; + float dry; + float width; +}; + +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_record_studio = +{ + .mode=0.2f, + .room_size=0, + .damp=0, + .wet=0, + .dry=0.8f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_ktv = +{ + .mode=0.2f, + .room_size=0.35f, + .damp=0.5f, + .wet=0.20f, + .dry=0.5f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_concert = +{ + .mode=0.3f, + .room_size=0.50f, + .damp=0.6f, + .wet=0.3f, + .dry=0.6f, + .width=0.56f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_theater = +{ + .mode=0.0, + .room_size=0.6f, + .damp=0.2f, + .wet=0.4f, + .dry=0.5f, + .width=0.20f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_new_ktv = + { + .mode=0.2f, + .room_size=0.7f, + .damp=0.9f, + .wet=0.11f, + .dry=0.44f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_new_concert = +{ + .mode=0.3f, + .room_size=0.60f, + .damp=0.6f, + .wet=0.18f, + .dry=0.37f, + .width=0.56f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_new_theater = +{ + .mode=0.0, + .room_size=0.8f, + .damp=0.8f, + .wet=0.248f, + .dry=0.182f, + .width=0.50f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_7 = +{ + .mode=0.2f, + .room_size=0.35f, + .damp=0.5f, + .wet=0.20f, + .dry=0.5f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_8 = +{ + .mode=0.2f, + .room_size=0.35f, + .damp=0.5f, + .wet=0.20f, + .dry=0.5f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_9 = +{ + .mode=0.2f, + .room_size=0.35f, + .damp=0.5f, + .wet=0.20f, + .dry=0.5f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_10 = +{ + .mode=0.2f, + .room_size=0.35f, + .damp=0.5f, + .wet=0.20f, + .dry=0.5f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_11 = +{ + .mode=0.2f, + .room_size=0.35f, + .damp=0.5f, + .wet=0.20f, + .dry=0.5f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_12 = +{ + .mode=0.2f, + .room_size=0.4f, + .damp=0.69f, + .wet=0.14f, + .dry=0.22f, + .width=0.82f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_13 = + { + .mode=0.2f, + .room_size=0.41f, + .damp=0.18f, + .wet=0.16f, + .dry=0.24f, + .width=0.68f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_14 = +{ + .mode=0.2f, + .room_size=0.79f, + .damp=0.63f, + .wet=0.14f, + .dry=0.26f, + .width=0.92f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_15 = +{ + .mode=0.2f, + .room_size=0.84f, + .damp=0.25f, + .wet=0.12f, + .dry=0.22f, + .width=0.76f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_16 = +{ + .mode=0.2f, + .room_size=0.88f, + .damp=0.42f, + .wet=0.12f, + .dry=0.17f, + .width=0.84f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_17 = +{ + .mode=0.2f, + .room_size=0.35f, + .damp=0.5f, + .wet=0.20f, + .dry=0.5f, + .width=0.5f, +}; +ST_AE_LIB_API const AE_PARAMS_REVERB gs_reverb_id_18 = +{ + .mode=0.2f, + .room_size=0.65f, + .damp=0.25f, + .wet=0.25f, + .dry=0.6f, + .width=0.95f, +}; + +ST_AE_LIB_API const AE_PARAMS_REVERB gs_ae_params_reverb_params[] = { + gs_reverb_record_studio, + gs_reverb_ktv, + gs_reverb_concert, + gs_reverb_theater, + gs_reverb_new_ktv, + gs_reverb_new_concert, + gs_reverb_new_theater, + gs_reverb_id_7, + gs_reverb_id_8, + gs_reverb_id_9, + gs_reverb_id_10, + gs_reverb_id_11, + gs_reverb_id_12, + gs_reverb_id_13, + 
gs_reverb_id_14, + gs_reverb_id_15, + gs_reverb_id_16, + gs_reverb_id_17, + gs_reverb_id_18, +}; + +#endif //AUDIO_EFFECTS_LIB_CREVERBPARAMS_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/SAudioEffectsParams.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/SAudioEffectsParams.h new file mode 100644 index 0000000..1fcbe75 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/SAudioEffectsParams.h @@ -0,0 +1,322 @@ +// +// Created by yangjianli on 2020-01-10. +// + +#ifndef AUDIO_EFFECTS_LIB_SAUDIOEFFECTSPARAMS_H +#define AUDIO_EFFECTS_LIB_SAUDIOEFFECTSPARAMS_H + +/** + * 定义关于SAudioEffects的相关参数以及预定义的参数 + */ +#include "vector" +#include "string" +#include "ae_defs.h" + +// 定义参数需要的类名称,函数名称 +#define SAE_CLASS_EQ "Eq" +#define SAE_CLASS_DELAY "Delay" +#define SAE_CLASS_REVERB "Reverb" + +// 函数常量 +#define SAE_FUNC_CENTER_FREQ "Center Freq." +#define SAE_FUNC_GAIN "Gain" +#define SAE_FUNC_Q "Q" +#define SAE_FUNC_DELAY "Delay" +#define SAE_FUNC_FEEDBACK "Feedback" +#define SAE_FUNC_FEEDBACK_DAMPING "Feedback Damping" +#define SAE_FUNC_MIX "Mix" +#define SAE_FUNC_DECAY "Decay" +#define SAE_FUNC_DRY "Dry" +#define SAE_FUNC_INPUT_DAMPING "Input Damping" +#define SAE_FUNC_WET "Wet" +#define SAE_FUNC_IN_CH "In Ch." +#define SAE_FUNC_OUT_CH "Out Ch." + +// 根据方法名,选择对应类型的参数 +ST_AE_LIB_API struct AE_PARAMS_SAE_CONTENT +{ + std::string class_name; + std::string function_name; + int idx; + float f_value; + bool b_value; +}; + +// saudio_effects 参数 +ST_AE_LIB_API struct AE_PARAMS_SAE +{ + std::vector params_list; +}; + +ST_AE_LIB_API const AE_PARAMS_SAE_CONTENT gs_sae_pop[] = +{ + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_CENTER_FREQ, + .idx=0, + .f_value=25.0, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_CENTER_FREQ, + .idx=1, + .f_value=1204.0, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_CENTER_FREQ, + .idx=2, + .f_value=10000.000000, + .b_value= false, + + }, + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_GAIN, + .idx=0, + .f_value=-20.000000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_GAIN, + .idx=1, + .f_value=-3.500000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_GAIN, + .idx=2, + .f_value=2.200000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_Q, + .idx=0, + .f_value=1.000000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_Q, + .idx=1, + .f_value=3.100000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name= SAE_FUNC_Q, + .idx=2, + .f_value=1.000000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_DELAY, + .function_name= SAE_FUNC_DELAY, + .idx=0, + .f_value=160.000000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_DELAY, + .function_name= SAE_FUNC_FEEDBACK, + .idx=0, + .f_value=6.000000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_DELAY, + .function_name= SAE_FUNC_MIX, + .idx=0, + .f_value=5.500000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name= SAE_FUNC_DECAY, + .idx=0, + .f_value=0.700000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name= SAE_FUNC_DRY, + .idx=0, + .f_value=0.900000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name= SAE_FUNC_FEEDBACK_DAMPING, + .idx=0, + .f_value=0.000500, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + 
.function_name= SAE_FUNC_INPUT_DAMPING, + .idx=0, + .f_value=0.000500, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name= SAE_FUNC_WET, + .idx=0, + .f_value=0.100000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name= SAE_FUNC_IN_CH, + .idx=0, + .f_value=0.000000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name= SAE_FUNC_OUT_CH, + .idx=0, + .f_value=0.000000, + .b_value= true, + } +}; + +ST_AE_LIB_API const AE_PARAMS_SAE_CONTENT gs_sae_studio[] = +{ + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_CENTER_FREQ, + .idx = 0, + .f_value = 25.0, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_CENTER_FREQ, + .idx = 1, + .f_value = 2229.0, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_CENTER_FREQ, + .idx = 2, + .f_value = 8105.0, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_GAIN, + .idx = 0, + .f_value = -20.0, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_GAIN, + .idx = 1, + .f_value = 3.0, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_GAIN, + .idx = 2, + .f_value = 1.8, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_Q, + .idx = 0, + .f_value = 0.999000, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_Q, + .idx = 1, + .f_value = 0.6, + .b_value= false, + }, + { + .class_name = SAE_CLASS_EQ, + .function_name = SAE_FUNC_Q, + .idx = 2, + .f_value = 0.1, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name = SAE_FUNC_DECAY, + .idx = 0, + .f_value = 0.7, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name = SAE_FUNC_DRY, + .idx = 0, + .f_value = 0.7, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name = SAE_FUNC_FEEDBACK_DAMPING, + .idx = 0, + .f_value = 0.000500f, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name = SAE_FUNC_INPUT_DAMPING, + .idx = 0, + .f_value = 0.000500f, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name = SAE_FUNC_WET, + .idx = 0, + .f_value = 0.2, + .b_value= false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name = SAE_FUNC_IN_CH, + .idx = 0, + .f_value = 0.0, + .b_value = false, + }, + { + .class_name = SAE_CLASS_REVERB, + .function_name = SAE_FUNC_OUT_CH, + .idx = 0, + .f_value = 0.0, + .b_value = true, + }, +}; +ST_AE_LIB_API const AE_PARAMS_SAE gs_sae_params_pop = +{ + .params_list = std::vector(gs_sae_pop, + gs_sae_pop+19), +}; + +ST_AE_LIB_API const AE_PARAMS_SAE gs_sae_params_studio = +{ + .params_list = std::vector(gs_sae_studio, + gs_sae_studio+16), +}; + + +ST_AE_LIB_API const AE_PARAMS_SAE gs_sae_params[] = +{ + gs_sae_params_pop,gs_sae_params_studio +}; + +#endif //AUDIO_EFFECTS_LIB_SAUDIOEFFECTSPARAMS_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/ae_defs.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/ae_defs.h new file mode 100644 index 0000000..8c9aff1 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/inc/ae_defs.h @@ -0,0 +1,12 @@ +/** + * Author: AlanWang4523. + * Date: 2021/12/29 11:38. 
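+ *
+ * ST_AE_LIB_API expands to __attribute__((visibility("default"))), keeping the
+ * tagged symbols exported when the effect libraries are built with hidden
+ * symbol visibility (cf. the commented CXX_VISIBILITY_PRESET line in
+ * ref/al_reverb/CMakeLists.txt).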
+ * Mail: alanwang4523@gmail.com + */ + +#ifndef AVAUDIO_EFFECT_LIBS_DEFINES_H +#define AVAUDIO_EFFECT_LIBS_DEFINES_H + +#define ST_AE_LIB_API __attribute__ ((visibility("default"))) + +#endif //AVAUDIO_EFFECT_LIBS_DEFINES_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/py/1.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/py/1.txt new file mode 100644 index 0000000..f9865ec --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/py/1.txt @@ -0,0 +1,261 @@ + + /***************** v1.0, id 0~3, add here ************************************/ + case KALA_VB_RECORD_STUDIO: + { + pmd->setmode(0.2f); + pmd->setroomsize(0); + pmd->setdamp(0); + pmd->setwet(0); + pmd->setdry(0.8f); + pmd->setwidth(0.5f); + break; + } + case KALA_VB_KTV: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + + case KALA_VB_CONCERT: + { + // for concert ok + pmd->setmode(0.3f); + pmd->setroomsize(0.50f); + pmd->setdamp(0.6f); + pmd->setwet(0.3f); + pmd->setdry(0.6f); + pmd->setwidth(0.56f); + break; + } + + case KALA_VB_THEATER: + { + // for theater + pmd->setmode(0.0); + pmd->setroomsize(0.6f); + pmd->setdamp(0.2f); + pmd->setwet(0.4f); + pmd->setdry(0.5f); + pmd->setwidth(0.20f); + break; + } + /***************** kala v2.6, id 0\4\5\6, add here ************************************/ + case KALA_VB_NEW_KTV: + { + + // v2.2 + pmd->setmode(0.2f); + pmd->setroomsize(0.7f); + pmd->setdamp(0.9f); + pmd->setwet(0.11f); + pmd->setdry(0.44f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_NEW_CONCERT: + { + // v2.2 + pmd->setmode(0.3f); + pmd->setroomsize(0.60f); + pmd->setdamp(0.6f); + pmd->setwet(0.18f); + pmd->setdry(0.37f); + pmd->setwidth(0.56f); + + break; + } + case KALA_VB_NEW_THEATER: + { + + //old version + //pmd->setmode(0.0); + //pmd->setroomsize(0.6f); + //pmd->setdamp(0.2f); + //pmd->setwet(0.4f); + //pmd->setdry(0.5f); + //pmd->setwidth(0.20f); + + // new 1.0 + //pmd->setmode(0.0); + //pmd->setroomsize(0.8f); + //pmd->setdamp(0.8f); + //pmd->setwet(0.3f); + //pmd->setdry(0.4f); + //pmd->setwidth(0.50f); + + // v2.0 + //pmd->setmode(0.0); + //pmd->setroomsize(0.8f); + //pmd->setdamp(0.8f); + //pmd->setwet(0.22f); + //pmd->setdry(0.14f); + //pmd->setwidth(0.50f); + + //v2.2 + pmd->setmode(0.0); + pmd->setroomsize(0.8f); + pmd->setdamp(0.8f); + pmd->setwet(0.248f); + pmd->setdry(0.182f); + pmd->setwidth(0.50f); + + break; + } + /***************** kala v2.6, id 0\4\5\6, add here ************************************/ + case KALA_VB_ID_7: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_8: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_9: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_10: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_11: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case 
KALA_VB_ID_12: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.4f); + pmd->setdamp(0.69f); + pmd->setwet(0.14f); + pmd->setdry(0.22f); + pmd->setwidth(0.82f); + + break; + } + case KALA_VB_ID_13: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.41f); + pmd->setdamp(0.18f); + pmd->setwet(0.16f); + pmd->setdry(0.24f); + pmd->setwidth(0.68f); + + break; + } + case KALA_VB_ID_14: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.79f); + pmd->setdamp(0.63f); + pmd->setwet(0.14f); + pmd->setdry(0.26f); + pmd->setwidth(0.92f); + + break; + } + case KALA_VB_ID_15: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.84f); + pmd->setdamp(0.25f); + pmd->setwet(0.12f); + pmd->setdry(0.22f); + pmd->setwidth(0.76f); + + break; + } + case KALA_VB_ID_16: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.88f); + pmd->setdamp(0.42f); + pmd->setwet(0.12f); + pmd->setdry(0.17f); + pmd->setwidth(0.84f); + + break; + } + case KALA_VB_ID_17: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_18: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.65f); + pmd->setdamp(0.25f); + pmd->setwet(0.25f); + pmd->setdry(0.6f); + pmd->setwidth(0.95f); + + break; + } + default: + { + pmd->setmode(1); + break; + } \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/py/trans.py b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/py/trans.py new file mode 100644 index 0000000..fc65690 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/py/trans.py @@ -0,0 +1,49 @@ +import os + + +def read_file(file_path): + res = {} + current_key = "" + with open(file_path, "r") as f: + while True: + line = f.readline() + if not line: + return res + line = line.strip().split() + if not line: + continue + if line[0][0] not in ["p", "c"]: + continue + if line[0] == "case": + current_key = line[1].split(':')[0] + continue + + line = line[0].split('->')[1].replace('set', "").split(':')[0] + func, para = line.split('(') + para = str(para).replace(');', "") + if current_key not in res: + res[current_key] = {} + if func == "roomsize": + func = "room_size" + res[current_key][func] = para + return res + + +if __name__ == "__main__": + res = read_file("1.txt") + for k, v in res.items(): + print("const AE_PARAMS_REVERB gs_{}".format(k.lower().replace("kala_vb", "reverb"))) + print("{") + for kk, vv in v.items(): + print("\t.{}={},".format(kk, vv)) + print("};") + + print("AE_PARAMS_REVERB gs_reverb_params[] = {") + for k, v in res.items(): + print("gs_{},".format(k.lower().replace("kala_vb","reverb"))) + print("};") + + for k, v in res.items(): + print("AE_PARAMS_TYPE_{},".format(k.replace("KALA_VB", "REVERB"))) + + diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/CMakeLists.txt new file mode 100644 index 0000000..4e84812 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/CMakeLists.txt @@ -0,0 +1,12 @@ +include_directories(common) +add_subdirectory(common) +add_subdirectory(tone_shift) +add_subdirectory(slow_flanging) +add_subdirectory(phonograph) +add_subdirectory(al_reverb) +add_subdirectory(saudio_effects) +add_subdirectory(autotune) +add_subdirectory(waves) +add_subdirectory(iir_eq) +add_subdirectory(reverb) +add_executable(supersound) \ No newline at end of file diff --git 
a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/CMakeLists.txt new file mode 100644 index 0000000..7196bb9 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/CMakeLists.txt @@ -0,0 +1,23 @@ +include_directories(./) +include_directories(inc) + +include_directories(src) +include_directories(src/biquad_filters) +include_directories(src/fast_delay) +include_directories(src/filter) +include_directories(src/AlReverbApi.cpp) +include_directories(src/al_reverb) +include_directories(src/al_reverb_biquad) +include_directories(src/al_reverb_common) +include_directories(src/al_reverb_early_reflection) +include_directories(src/al_reverb_echo) +include_directories(src/al_reverb_late_allpass) +include_directories(src/al_reverb_late_lowpass) +include_directories(src/al_reverb_late_reverb) +include_directories(src/al_reverb_modulation) + + +file(GLOB_RECURSE SRC_ALREVERB_DIR src/*cpp) + +add_library(al_reverb ${SRC_ALREVERB_DIR}) +#set_target_properties(al_reverb PROPERTIES CXX_VISIBILITY_PRESET hidden) \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/inc/AlReverbApi.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/inc/AlReverbApi.h new file mode 100644 index 0000000..87ae900 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/inc/AlReverbApi.h @@ -0,0 +1,47 @@ +// +// Created by yangjianli on 2020-01-14. +// + +#ifndef AUDIO_EFFECTS_LIB_ALREVERBAPI_H +#define AUDIO_EFFECTS_LIB_ALREVERBAPI_H + +#include "AlReverbDefs.h" +#include "vector" + +class CFilters; +namespace SUPERSOUND +{ +namespace ALREVERB +{ +class AlReverb; +class AlReverbApi +{ +public: + AlReverbApi(); + ~AlReverbApi(); + +public: + void flush(); + int32_t get_latency(); + int32_t set_param(AE_PARAMS_AL_REVERB *param); + + // 线上接口 + int32_t init(int32_t sample_rate, int32_t channel, int32_t n_type_id); + void reset(); + int32_t process(float *data, int len); + int32_t uninit(); +private: + AlReverb * m_reverb; + CFilters * m_filter; + + int m_sample_rate; + int m_channel; + + bool m_need_filter; // 是否需要滤波 + bool m_need_process; // 是否需要处理 +}; +} +} + + +#endif //AUDIO_EFFECTS_LIB_ALREVERBAPI_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/inc/AlReverbDefs.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/inc/AlReverbDefs.h new file mode 100755 index 0000000..df0a4c1 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/inc/AlReverbDefs.h @@ -0,0 +1,138 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//在 alreverb 工程中使用到的常量和结构 + +#ifndef __AL_REVERB_TYPES_H__ +#define __AL_REVERB_TYPES_H__ + +#include +#include "CAlReverbParams.h" +#include "AudioEffectsConf.h" +class Arp_param +{ +public: + float fl_density; + float fl_diffusion; + float fl_gain; + float fl_gain_hf; + float fl_gain_lf; + float fl_decay_time; + float fl_decayhf_ratio; + float fl_decay_lf_ratio; + float fl_reflections_gain; + float fl_reflections_delay; + float fl_reflections_pan[3]; + float fl_late_reverb_gain; + float fl_late_reverb_delay; + float fl_late_reverb_pan[3]; + float fl_echo_time; + float fl_echo_depth; + float fl_modulation_time; + float fl_modulation_depth; + float fl_air_absorption_gain_hf; + float fl_hf_reference; + float fl_lf_reference; + float fl_room_rolloff_factor; + int i_decay_hf_limit; +}; + +namespace SUPERSOUND +{ + + +//安全删除指针 +#ifndef SAFE_DELETE_PTR +#define SAFE_DELETE_PTR(a) \ +{ \ + if(a) \ + { \ + delete [] a; \ + a = NULL; \ + } \ +} +#endif /* SAFE_DELETE_PTR */ + +#ifndef SAFE_DELETE_OBJ +#define SAFE_DELETE_OBJ(a) \ +{ \ + if(a) \ + { \ + delete a; \ + a = NULL; \ + } \ +} +#endif /* SAFE_DELETE_OBJ */ + +#ifndef MIN +#define MIN(a,b) (((a) < (b)) ? (a) : (b)) +#endif /* MIN */ + +#ifndef MAX +#define MAX(a,b) (((a) > (b)) ? (a) : (b)) +#endif /* MAX */ + +//将 a 规范到 [b, c] 之间 +#ifndef MIDDLE +#define MIDDLE(a, b, c) (MIN(c, MAX(a, b))) +#endif /* MIDDLE */ + +#ifndef M_PI +#define M_PI 3.14159265358979323846 +#endif /* M_PI */ + +#ifndef FLOAT_EQUAL +#define FLOAT_EQUAL(a, b) (fabs((a) - (b)) <= 1E-5) +#endif /* FLOAT_EQUAL */ + +//必须是 2 的幂次,这样方便计算一些 +#define SUPERSOUND_WAV_BUF_STEP_LEN 1024 +#define SUPERSOUND_DEFAULT_FFT_LEN SUPERSOUND_WAV_BUF_STEP_LEN +#define SUPERSOUND_CHANNEL_PROC_LEN SUPERSOUND_DEFAULT_FFT_LEN + +} + +//成功 +#define ERROR_SUPERSOUND_SUCCESS 0 + +//输入参数有误 +#define ERROR_SUPERSOUND_PARAM 2000 +//内存不够 +#define ERROR_SUPERSOUND_MEMORY 2001 + +enum ALRB_ERR { + ALRB_ERR_SUCCESS = 0, + ALRB_ERR_PARAM = -1, + ALRB_ERR_BASE_H_MALLOC_NULL = -2, +}; + + +#endif /* __AL_REVERB_TYPES_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/AlReverbApi.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/AlReverbApi.cpp new file mode 100644 index 0000000..78e253a --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/AlReverbApi.cpp @@ -0,0 +1,103 @@ +// +// Created by yangjianli on 2020-01-14. 
+// + +#include "AlReverbApi.h" +#include "AlReverb.h" +#include "filter/CFilters.h" +namespace SUPERSOUND +{ + namespace ALREVERB + { + AlReverbApi::AlReverbApi() + { + m_reverb = nullptr; + m_filter = nullptr; + } + + AlReverbApi::~AlReverbApi() + { + uninit(); + } + + int32_t AlReverbApi::init(int32_t sample_rate, int32_t channel, int32_t n_type_id) + { + m_sample_rate = sample_rate; + m_channel = channel; + + m_reverb = new AlReverb(); + m_reverb->init(channel, sample_rate, n_type_id); + + m_filter = new CFilters(); + m_filter->Init(sample_rate, channel); + m_filter->setFilterType(LOW_PASS_FILTER); + m_need_filter = false; + m_need_process = false; + return ALRB_ERR_SUCCESS; + } + + int32_t AlReverbApi::uninit() + { + if(nullptr != m_reverb) + { + m_reverb->uninit(); + delete m_reverb; + m_reverb = nullptr; + } + + if(nullptr != m_filter) + { + m_filter->Uninit(); + delete m_filter; + m_filter = nullptr; + } + return ALRB_ERR_SUCCESS; + } + + void AlReverbApi::reset() + { + m_filter->Reset(); + m_reverb->reset(); + } + + int32_t AlReverbApi::set_param(AE_PARAMS_AL_REVERB *param) + { + if(nullptr == param) + { + m_need_process = false; + return ALRB_ERR_SUCCESS; + } + m_need_process = true; + m_need_filter = param->b_need_filter; + param->fs = m_sample_rate; + param->in_channels = m_channel; + param->out_channels = m_channel; + return m_reverb->set_param(param); + } + + void AlReverbApi::flush() + { + m_filter->Reset(); + m_reverb->flush(); + } + + int32_t AlReverbApi::get_latency() + { + return m_reverb->get_latecy(); + } + + int32_t AlReverbApi::process(float *data, int len) + { + if(!m_need_process) + { + return ALRB_ERR_SUCCESS; + } + + if(m_need_filter) + { + m_filter->Process(data, len); + } + return m_reverb->process(data, len); + } + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb/AlReverb.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb/AlReverb.cpp new file mode 100755 index 0000000..fce36e3 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb/AlReverb.cpp @@ -0,0 +1,415 @@ + +#include "AlReverb.h" +#include "AlReverbDefs.h" +#include "AlReverbCommon.h" +#include +#include +#include +#include + +#define ARP_EFFECT_ID_MAX 8 +namespace SUPERSOUND +{ +namespace ALREVERB +{ + +static Arp_param aEaxPreset[ARP_EFFECT_ID_MAX] = + { + // EFX_REVERB_PRESET_GENERIC 0 + { 1.0000f, 1.0000f, 0.01f, 0.8913f, 1.0000f, 1.4900f, 0.8300f, 1.0000f, 0.0500f, 0.0070f, { 0.0000f, 0.0000f, 0.0000f }, 1.2589f, 0.0110f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, +// { 1.0000f, 1.0000f, 0.3162f, 0.8913f, 1.0000f, 1.4900f, 0.8300f, 1.0000f, 0.0500f, 0.0070f, { 0.0000f, 0.0000f, 0.0000f }, 1.2589f, 0.0110f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, + //{ 1.0000f, 1.0000f, 0.1f, 0.8913f, 1.0000f, 1.4900f, 0.8300f, 1.0000f, 0.0500f, 0.0070f, { 0.0000f, 0.0000f, 0.0000f }, 1.2589f, 0.0110f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, + //EFX_REVERB_PRESET_GENERIC + { 1.0000f, 1.0000f, 0.1f, 0.8913f, 1.0000f, 1.4900f, 0.8300f, 1.0000f, 0.0500f, 0.0070f, { 0.0000f, 0.0000f, 0.0000f }, 1.2589f, 0.0110f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, + + 
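+        // Row layout follows Arp_param (AlReverbDefs.h): density, diffusion,
+        // gain, gain_hf, gain_lf, decay_time, decay_hf_ratio, decay_lf_ratio,
+        // reflections_gain, reflections_delay, reflections_pan[3],
+        // late_reverb_gain, late_reverb_delay, late_reverb_pan[3], echo_time,
+        // echo_depth, modulation_time, modulation_depth,
+        // air_absorption_gain_hf, hf_reference, lf_reference,
+        // room_rolloff_factor, decay_hf_limit.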
//EFX_REVERB_PRESET_CITY_STREETS + { 1.0000f, 0.7800f, 0.1f, 0.7079f, 0.8913f, 1.7900f, 1.1200f, 0.9100f, 0.2818f, 0.0460f, { 0.0000f, 0.0000f, 0.0000f }, 0.1995f, 0.0280f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.2000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, + + //EFX_REVERB_PRESET_GENERIC + { 1.0000f, 1.0000f, 0.1f, 0.8913f, 1.0000f, 1.4900f, 0.8300f, 1.0000f, 0.0500f, 0.0070f, { 0.0000f, 0.0000f, 0.0000f }, 1.2589f, 0.0110f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, + + //EFX_REVERB_PRESET_CASTLE_COURTYARD + { 1.0000f, 0.4200f, 0.1162f, 0.4467f, 0.1995f, 2.1300f, 0.6100f, 0.2300f, 0.2239f, 0.1600f, { 0.0000f, 0.0000f, 0.0000f }, 0.7079f, 0.0360f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.3700f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x0 }, + + //EFX_REVERB_PRESET_CASTLE_HALL + { 1.0000f, 0.8100f, 0.1162f, 0.2818f, 0.1778f, 7.5400f, 0.7900f, 0.6200f, 0.1778f, 0.0560f, { 0.0000f, 0.0000f, 0.0000f }, 1.1220f, 0.0240f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.5000f, 0.2500f, 0.0000f, 0.9943f, 5168.6001f, 139.5000f, 0.0000f, 0x1 }, + + + //EFX_REVERB_PRESET_DIZZY_NEW + { 0.3645f, 0.6000f, 0.1f, 0.6310f, 1.0000f, 6.2300f, 0.5600f, 1.0000f, 0.1392f, 0.0200f, { 0.0000f, 0.0000f, 0.0000f }, 0.4937f, 0.0300f, { 0.0000f, 0.0000f, 0.0000f }, 0.8500f, 0.6000f, 0.8100f, 0.3100f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x0 }, + + //EFX_REVERB_PRESET_CASTLE_HALL_NEW + { 1.0000f, 0.8100f, 0.1162f, 0.2818f, 0.1778f, 10.400f, 0.7900f, 0.6200f, 0.1778f, 0.0560f, { 0.0000f, 0.0000f, 0.0000f }, 1.1220f, 0.0240f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.9500f, 0.2500f, 0.0000f, 0.9943f, 5168.6001f, 139.5000f, 0.0000f, 0x1 }, + + + // EFX_REVERB_PRESET_ROOM 2 + //{ 0.4287f, 1.0000f, 0.3162f, 0.5929f, 1.0000f, 0.4000f, 0.8300f, 1.0000f, 0.1503f, 0.0020f, { 0.0000f, 0.0000f, 0.0000f }, 1.0629f, 0.0030f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, + + // EFX_REVERB_PRESET_CONCERTHALL 7 + //{ 1.0000f, 1.0000f, 0.3162f, 0.5623f, 1.0000f, 3.9200f, 0.7000f, 1.0000f, 0.2427f, 0.0200f, { 0.0000f, 0.0000f, 0.0000f }, 0.9977f, 0.0290f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, + + // EFX_REVERB_PRESET_ARENA 9 + //{ 1.0000f, 1.0000f, 0.3162f, 0.4477f, 1.0000f, 7.2400f, 0.3300f, 1.0000f, 0.2612f, 0.0200f, { 0.0000f, 0.0000f, 0.0000f }, 1.0186f, 0.0300f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, + + // EFX_REVERB_PRESET_ICEPALACE_HALL 49 + //{ 1.0000f, 0.7600f, 0.3162f, 0.4467f, 0.5623f, 5.4900f, 1.5300f, 0.3800f, 0.1122f, 0.0540f, { 0.0000f, 0.0000f, 0.0000f }, 0.6310f, 0.0520f, { 0.0000f, 0.0000f, 0.0000f }, 0.2260f, 0.1100f, 0.2500f, 0.0000f, 0.9943f, 12428.5000f, 99.6000f, 0.0000f, 0x1 }, + + // EFX_REVERB_PRESET_SPACESTATION_CUPBOARD 59 + //{ 0.1715f, 0.5600f, 0.3162f, 0.7079f, 0.8913f, 0.7900f, 0.8100f, 0.5500f, 1.4125f, 0.0070f, { 0.0000f, 0.0000f, 0.0000f }, 1.7783f, 0.0180f, { 0.0000f, 0.0000f, 0.0000f }, 0.1810f, 0.3100f, 0.2500f, 0.0000f, 0.9943f, 3316.1001f, 458.2000f, 0.0000f, 0x1 }, + + + // EFX_REVERB_PRESET_STONEROOM 5 + //{ 1.0000f, 1.0000f, 0.3162f, 0.7079f, 1.0000f, 2.3100f, 0.6400f, 1.0000f, 0.4411f, 0.0120f, { 0.0000f, 0.0000f, 0.0000f }, 1.1003f, 0.0170f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 }, 
+
+	// EFX_REVERB_PRESET_AUDITORIUM 6
+	//{ 1.0000f, 1.0000f, 0.3162f, 0.5781f, 1.0000f, 4.3200f, 0.5900f, 1.0000f, 0.4032f, 0.0200f, { 0.0000f, 0.0000f, 0.0000f }, 0.7170f, 0.0300f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 },
+
+	// EFX_REVERB_PRESET_CAVE 8
+	//{ 1.0000f, 1.0000f, 0.3162f, 1.0000f, 1.0000f, 2.9100f, 1.3000f, 1.0000f, 0.5000f, 0.0150f, { 0.0000f, 0.0000f, 0.0000f }, 0.7063f, 0.0220f, { 0.0000f, 0.0000f, 0.0000f }, 0.2500f, 0.0000f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x0 },
+
+	// EFX_REVERB_PRESET_ALLEY 14
+	//{ 1.0000f, 0.3000f, 0.3162f, 0.7328f, 1.0000f, 1.4900f, 0.8600f, 1.0000f, 0.2500f, 0.0070f, { 0.0000f, 0.0000f, 0.0000f }, 0.9954f, 0.0110f, { 0.0000f, 0.0000f, 0.0000f }, 0.1250f, 0.9500f, 0.2500f, 0.0000f, 0.9943f, 5000.0000f, 250.0000f, 0.0000f, 0x1 },
+
+	// EFX_REVERB_PRESET_FACTORY_LARGEROOM 38, // Factory, large room; used here as a stand-in for a parking garage
+	//{ 0.4287f, 0.7500f, 0.2512f, 0.7079f, 0.6310f, 4.2400f, 0.5100f, 1.3100f, 0.1778f, 0.0390f, { 0.0000f, 0.0000f, 0.0000f }, 1.1220f, 0.0230f, { 0.0000f, 0.0000f, 0.0000f }, 0.2310f, 0.0700f, 0.2500f, 0.0000f, 0.9943f, 3762.6001f, 362.5000f, 0.0000f, 0x1 },
+
+	// EFX_REVERB_PRESET_CITY_LIBRARY 107, // City, library
+	//{ 1.0000f, 0.8200f, 0.3162f, 0.2818f, 0.0891f, 2.7600f, 0.8900f, 0.4100f, 0.3548f, 0.0290f, { 0.0000f, 0.0000f, -0.0000f }, 0.8913f, 0.0200f, { 0.0000f, 0.0000f, 0.0000f }, 0.1300f, 0.1700f, 0.2500f, 0.0000f, 0.9943f, 2854.3999f, 107.5000f, 0.0000f, 0x0 },
+
+	};
+
+AlReverb::AlReverb()
+{
+	m_late_desity_gain = 1;
+	m_b_update = true;
+	m_current_id = 0;
+	memset(&m_current_param, 0, sizeof(m_current_param));
+	// Default configuration (the values mirror the CONCERTHALL preset)
+	m_new_param.fs = 44100;
+	m_new_param.in_channels = 2;
+	m_new_param.out_channels = 2;
+	m_new_param.density = 1;
+	m_new_param.diffusion = 1;
+	m_new_param.reverbGain = 0.3162f;
+	m_new_param.lowpass_gain = 0.5623f;
+	m_new_param.highpass_gain = 1;
+	m_new_param.decay_time = 3.92f;
+	m_new_param.lowpass_ratio = 0.7f;
+	m_new_param.highpass_ratio = 0.7f; // was left uninitialized, but update() reads it before any preset is applied
+	m_new_param.early_gain = 0.2427f;
+	m_new_param.late_gain = 0.9977f;
+	m_new_param.lowpass_reference = 5000;
+	m_new_param.highpass_reference = 250;
+	m_new_param.echo_time = 0.25f;
+	m_new_param.echo_depth = 0;
+	m_new_param.modulation_time = 0.25f;
+	m_new_param.modulation_depth = 0;
+	m_new_param.early_delay = 0.02f;
+	m_new_param.late_delay = 0.029f;
+	m_new_param.lowpass_air_absorption_gain = 0.9943f;
+	m_new_param.b_decay_lowpass_limit = 1;
+}
+
+AlReverb::~AlReverb()
+{
+
+}
+
+void AlReverb::flush()
+{
+	m_lowpass.flush();
+	m_highpass.flush();
+	m_modulation.flush();
+	m_early_delay.flush();
+	m_late_delay.flush();
+	m_early_reflection.flush();
+	m_late_reverb.flush();
+	m_echo.flush();
+
+	for(int32_t i = 0; i < 3; i++)
+	{
+		m_decorrelator[i].flush();
+	}
+}
+
+int32_t AlReverb::get_latecy()
+{
+	// The dry signal is passed straight through, so no latency is reported
+	return 0;
+}
+
+void AlReverb::control_update()
+{
+	m_b_update = true;
+}
+
+int32_t AlReverb::set_param(AE_PARAMS_AL_REVERB *param)
+{
+	m_new_param = *param;
+	control_update();
+	return ERROR_SUPERSOUND_SUCCESS;
+}
+
+int32_t AlReverb::process(std::vector<float *> &buf_vector, int32_t in_num)
+{
+	int32_t nRet = ERROR_SUPERSOUND_SUCCESS;
+
+	float early[4], late[4];
+	float taps[4];
+	float in;
+	float * left = buf_vector[0];
+	float * right = NULL;
+
+	// Re-derive the internal filters if the parameters changed
+	if(m_b_update)
+	{
+		nRet = update();
+		m_b_update = false;
+		if(nRet != ERROR_SUPERSOUND_SUCCESS)
+			return nRet;
+	}
+
+	// Bind the right channel for stereo input
+	if(m_current_param.in_channels == 2)
+		right = buf_vector[1];
+
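+	// Per-sample signal flow (see the loop below): mono downmix ->
+	// shelving EQ (m_lowpass / m_highpass) -> modulation -> early delay
+	// feeding the 4-tap early reflections -> late delay feeding three
+	// decorrelation taps and the 4-line FDN late reverb -> echo, after
+	// which the wet taps are mixed back onto the dry input.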
+	// The block was originally sized for stereo; the input is downmixed to
+	// mono here before entering the reverb network
+	for(int32_t i = 0; i < in_num; i++)
+	{
+		if(right == NULL)
+			in = left[i] / 4;
+		else
+			in = (left[i] + right[i]) / 8;
+
+		in = m_lowpass.filtef(in);
+		in = m_highpass.filtef(in);
+
+		in = m_modulation.filter(in);
+		// Early reflection stage
+		in = m_early_delay.filter(in);
+		m_early_reflection.filter(in, early);
+		// Late reverb stage
+		in = m_late_delay.filter(in);
+		taps[0] = in * m_late_desity_gain;
+		taps[1] = m_decorrelator[0].filter(taps[0]);
+		taps[2] = m_decorrelator[1].filter(taps[0]);
+		taps[3] = m_decorrelator[2].filter(taps[0]);
+
+		m_late_reverb.filter(taps, late);
+		m_echo.Filter(in, late);
+		if(right == NULL)
+		{
+			left[i] = left[i] + (early[2] + late[2]) * 4;
+		}
+		else
+		{
+			left[i] = left[i] + (early[0] + late[0]) * 8;
+			right[i] = right[i] + (early[1] + late[1]) * 8;
+		}
+	}
+	return nRet;
+}
+
+int32_t AlReverb::update()
+{
+	int32_t nRet = ERROR_SUPERSOUND_SUCCESS;
+
+	// Low-pass leg (a high shelf acting above highpass_reference)
+	nRet = m_lowpass.set_high_shelf_param(m_new_param.fs,
+		m_new_param.highpass_reference,
+		m_new_param.highpass_gain,
+		0.75f);
+
+	if(nRet != ERROR_SUPERSOUND_SUCCESS)
+		return nRet;
+
+	// High-pass leg (a low shelf acting below lowpass_reference)
+	nRet = m_highpass.set_low_shelf_param(m_new_param.fs,
+		m_new_param.lowpass_reference,
+		m_new_param.lowpass_gain,
+		0.75f);
+	if(nRet != ERROR_SUPERSOUND_SUCCESS)
+		return nRet;
+
+	// One-sample delay
+	nRet = m_modulation.set_param(m_new_param.fs,
+		m_new_param.modulation_time,
+		m_new_param.modulation_depth);
+	if(nRet != ERROR_SUPERSOUND_SUCCESS)
+		return nRet;
+
+	// Early delay
+	nRet = m_early_delay.set_delay_len(int32_t(float(m_new_param.fs * m_new_param.early_delay)));
+	if(nRet != ERROR_SUPERSOUND_SUCCESS)
+		return nRet;
+
+	// Late delay
+	nRet = m_late_delay.set_delay_len(int32_t(m_new_param.fs * m_new_param.late_delay));
+	if(nRet != ERROR_SUPERSOUND_SUCCESS)
+		return nRet;
+
+	// Early reflections
+	nRet = m_early_reflection.set_param(m_new_param.fs,
+		m_new_param.reverbGain,
+		m_new_param.early_gain,
+		m_new_param.late_delay);
+	if(nRet != ERROR_SUPERSOUND_SUCCESS)
+		return nRet;
+
+	// Compute hfRatio
+	float hfRatio = m_new_param.highpass_ratio;
+	if(m_new_param.b_decay_lowpass_limit && (m_new_param.lowpass_air_absorption_gain < 1))
+	{
+		hfRatio = calc_limited_hf_ratio(hfRatio, m_new_param.lowpass_air_absorption_gain, m_new_param.decay_time);
+	}
+
+	// Late reverb
+	nRet = m_late_reverb.set_param(m_new_param.fs,
+		m_new_param.reverbGain,
+		m_new_param.late_gain,
+		m_new_param.density,
+		m_new_param.decay_time,
+		m_new_param.diffusion,
+		hfRatio,
+		m_new_param.highpass_reference);
+	if(nRet != ERROR_SUPERSOUND_SUCCESS)
+		return nRet;
+
+	// Echo
+	nRet = m_echo.set_param(m_new_param.fs,
+		m_new_param.reverbGain,
+		m_new_param.late_gain,
+		m_new_param.echo_time,
+		m_new_param.decay_time,
+		m_new_param.diffusion,
+		m_new_param.echo_depth,
+		hfRatio,
+		m_new_param.lowpass_reference);
+	if(nRet != ERROR_SUPERSOUND_SUCCESS)
+		return nRet;
+
+	// Decorrelation taps
+	for(int32_t i = 0; i < 3; i++)
+	{
+		float length = (0.15f * pow(2, (float)i)) * (1 + m_new_param.density * 4) * 0.0211f;
+		nRet = m_decorrelator[i].set_delay_len(int32_t(length * m_new_param.fs));
+		if(nRet != ERROR_SUPERSOUND_SUCCESS)
+			return nRet;
+	}
+
+	m_late_desity_gain = m_late_reverb.get_density_gain();
+
+	m_current_param = m_new_param;
+
+	return nRet;
+}
+
+/**
+ * Switch the effect id & reload its parameters
+ * @param n_type_id
+ * @return
+ */
+int32_t AlReverb::reset_effect_id(int n_type_id, bool is_init)
+{
+	// Reject out-of-range effect ids
+	if(n_type_id >= ARP_EFFECT_ID_MAX || n_type_id < 0)
+	{
+		return ERROR_SUPERSOUND_PARAM;
+	}
+
+	if(m_current_id != n_type_id || is_init)
+	{
+		// Load the preset parameters
+		m_new_param.density = 
aEaxPreset[n_type_id].fl_density; + m_new_param.diffusion = aEaxPreset[n_type_id].fl_diffusion; + m_new_param.reverbGain = aEaxPreset[n_type_id].fl_gain; + m_new_param.highpass_gain = aEaxPreset[n_type_id].fl_gain_hf; + m_new_param.lowpass_gain = aEaxPreset[n_type_id].fl_gain_lf; + m_new_param.decay_time = aEaxPreset[n_type_id].fl_decay_time; + m_new_param.highpass_ratio = aEaxPreset[n_type_id].fl_decayhf_ratio; + m_new_param.lowpass_ratio = aEaxPreset[n_type_id].fl_decay_lf_ratio; + m_new_param.early_gain = aEaxPreset[n_type_id].fl_reflections_gain; + m_new_param.early_delay = aEaxPreset[n_type_id].fl_reflections_delay; + m_new_param.late_gain = aEaxPreset[n_type_id].fl_late_reverb_gain; + m_new_param.late_delay = aEaxPreset[n_type_id].fl_late_reverb_delay; + m_new_param.echo_time = aEaxPreset[n_type_id].fl_echo_time; + m_new_param.echo_depth = aEaxPreset[n_type_id].fl_echo_depth; + m_new_param.modulation_time = aEaxPreset[n_type_id].fl_modulation_time; + m_new_param.modulation_depth = aEaxPreset[n_type_id].fl_modulation_depth; + m_new_param.lowpass_air_absorption_gain = aEaxPreset[n_type_id].fl_air_absorption_gain_hf; + m_new_param.highpass_reference = aEaxPreset[n_type_id].fl_hf_reference; + m_new_param.lowpass_reference = aEaxPreset[n_type_id].fl_lf_reference; + m_new_param.b_decay_lowpass_limit = aEaxPreset[n_type_id].i_decay_hf_limit; + m_new_param.in_channels = m_channels; + m_new_param.out_channels = m_channels; + m_new_param.fs = m_freq; + m_current_id = n_type_id; + control_update(); + } + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t AlReverb::init(int32_t channels, int32_t freq, int32_t n_type_id) +{ + m_channels = channels; + m_freq = freq; + reset_effect_id(n_type_id, true); + m_current_param = m_new_param; // 保证代码一致 + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t AlReverb::uninit() +{ + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t AlReverb::process(float *data, int len) +{ + std::vector buf_vector; + int nStep = SUPERSOUND_CHANNEL_PROC_LEN; + int nRet = ERROR_SUPERSOUND_SUCCESS; + for(int i=0;i_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//实现 openal 中的 reverb 效果 +//这里的早起反射和后期延迟和正常的想法有点出入,主要是这里将声道进行了合并,导致了需要多声道输出 +//但是实际应该每个通道,单独处理的 + +#ifndef __AL_REVERB_H__ +#define __AL_REVERB_H__ + +#include "AlReverbBiquad.h" +#include "AlReverbDefs.h" +#include "AlReverbEarlyReflection.h" +#include "AlReverbLateReverb.h" +#include "AlReverbEcho.h" +#include "AlReverbModulation.h" +#include + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + +#define ALR_MAX_PROCESS_BLOCK 4096 +class AlReverb +{ +public: + AlReverb(); + ~AlReverb(); + +public: + void flush(); + int32_t get_latecy(); + void control_update(); + int32_t set_param(AE_PARAMS_AL_REVERB *param); + int32_t process(std::vector &buf_vector, int32_t in_num); + + // 线上接口 + int32_t init(int32_t channels, int32_t freq, int32_t n_type_id); + void reset(); + int32_t reset_effect_id(int n_type_id, bool is_init = false); + int32_t process(float *data, int len); + int32_t uninit(); + +private: + int32_t update(); +private: + AE_PARAMS_AL_REVERB m_current_param; + AE_PARAMS_AL_REVERB m_new_param; + + //高低切 + AlReverbBiquad m_lowpass; + AlReverbBiquad m_highpass; + //调制过程 + AlReverbModulation m_modulation; + //前期反射和后期混响延迟 + SuperSoundFastDelay m_early_delay; + SuperSoundFastDelay m_late_delay; + //前期反射和后期混响 + AlReverbEarlyReflection m_early_reflection; + AlReverbLateReverb m_late_reverb; + //回声效果 + AlReverbEcho m_echo; + //解相关 + SuperSoundFastDelay m_decorrelator[3]; + + float m_late_desity_gain; + bool m_b_update; + + //左右声道 + float m_left[ALR_MAX_PROCESS_BLOCK]; + float m_right[ALR_MAX_PROCESS_BLOCK]; + + // 基础参数 + int32_t m_channels; + int32_t m_freq; + int32_t m_current_id; +}; + + +} +} + +#endif /* __AL_REVERB_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_biquad/AlReverbBiquad.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_biquad/AlReverbBiquad.cpp new file mode 100755 index 0000000..5901c8f --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_biquad/AlReverbBiquad.cpp @@ -0,0 +1,89 @@ + +#include "AlReverbBiquad.h" +#include "AlReverbDefs.h" +#include + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +AlReverbBiquad::AlReverbBiquad() +{ + m_a1 = 0; + m_a2 = 0; + //输入什么输出什么 + m_b0 = 1; + m_b1 = 0; + m_b2 = 0; + + flush(); +} + +AlReverbBiquad::~AlReverbBiquad() +{ + +} + +void AlReverbBiquad::flush() +{ + m_x1 = 0; + m_x2 = 0; + m_y1 = 0; + m_y2 = 0; +} + +int32_t AlReverbBiquad::get_latecy() +{ + return 0; +} + +int32_t AlReverbBiquad::set_high_shelf_param(int32_t fs, float f0, float A, float S) +{ + float w0 = float(2 * M_PI * f0 / fs); + A = MAX(A, 0.00001f); + float alpha = sin(w0) / 2 * sqrt((A + 1 / A)*(1 / S - 1) + 2); + float a0 = (A + 1) - (A - 1) * cos(w0) + 2 * sqrt(A) * alpha; + + m_b0 = (A * ((A + 1) + (A - 1) * cos(w0) + 2 * sqrt(A) * alpha)) / a0; + m_b1 = (-2 * A * ((A - 1) + (A + 1) * cos(w0))) / a0; + m_b2 = (A * ((A + 1) + (A - 1) * cos(w0) - 2 * sqrt(A) * alpha)) / a0; + m_a1 = (2 * ((A - 1) - (A + 1) * cos(w0))) / a0; + m_a2 = ((A + 1) - (A - 1) * cos(w0) - 2 * sqrt(A) * alpha) / a0; + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t AlReverbBiquad::set_low_shelf_param(int32_t fs, float f0, float A, float S) +{ + float w0 = float(2 * M_PI * f0 / fs); + A = MAX(A, 
0.00001f); + float alpha = sin(w0) / 2 * sqrt((A + 1 / A) * (1 / S - 1) + 2); + float a0 = (A + 1) + (A - 1) * cos(w0) + 2 * sqrt(A) * alpha; + + m_b0 = (A * ((A + 1) - (A - 1) * cos(w0) + 2 * sqrt(A) * alpha)) / a0; + m_b1 = (2 * A * ((A - 1) - (A + 1) * cos(w0))) / a0; + m_b2 = (A * ((A + 1) - (A - 1) * cos(w0) - 2 * sqrt(A) * alpha)) / a0; + m_a1 = (-2 * ((A - 1) + (A + 1) * cos(w0))) / a0; + m_a2 = ((A + 1) + (A - 1) * cos(w0) - 2 * sqrt(A) * alpha) / a0; + + return ERROR_SUPERSOUND_SUCCESS; +} + +float AlReverbBiquad::filtef(float in) +{ + float out = m_b0 * in + m_b1 * m_x1 + m_b2 * m_x2 - + m_a1 * m_y1 - m_a2 * m_y2; + + m_x2 = m_x1; + m_x1 = in; + m_y2 = m_y1; + m_y1 = out; + + return out; +} + + +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_biquad/AlReverbBiquad.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_biquad/AlReverbBiquad.h new file mode 100755 index 0000000..6890ac6 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_biquad/AlReverbBiquad.h @@ -0,0 +1,75 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//这里和 AuidoEQCookBook 相同,主要使用了 Shelf 滤波器 + +#ifndef __AL_REVERB_BIQUAD_H__ +#define __AL_REVERB_BIQUAD_H__ + +#include +#include "AudioEffectsConf.h" + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +class AlReverbBiquad +{ +public: + AlReverbBiquad(); + ~AlReverbBiquad(); + +public: + void flush(); + int32_t get_latecy(); + int32_t set_high_shelf_param(int32_t fs, float f0, float A, float S); + int32_t set_low_shelf_param(int32_t fs, float f0, float A, float S); + float filtef(float in); + +private: + float m_x1; + float m_x2; + float m_y1; + float m_y2; + float m_a1; + float m_a2; + float m_b0; + float m_b1; + float m_b2; +}; + + +} +} + +#endif /* __AL_REVERB_BIQUAD_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_common/AlReverbCommon.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_common/AlReverbCommon.cpp new file mode 100755 index 0000000..3239e82 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_common/AlReverbCommon.cpp @@ -0,0 +1,112 @@ + +#include "AlReverbCommon.h" +#include "AlReverbDefs.h" +#include + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +float calc_decay_coeff(float length, float decay_time) +{ + // -60dB 就是 0.001 + return pow(0.001f, length / decay_time); +} + +// Calculate a decay length from a coefficient and the time until the decay +// reaches -60 dB. 
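+// Inverse of calc_decay_coeff: since coeff = 0.001^(length / decay_time),
+// solving for length gives length = log(coeff) * decay_time / log(0.001).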
+float calc_decay_length(float coeff, float decay_time)
+{
+	return log(coeff) * decay_time / log(0.001f)/*-60 dB*/;
+}
+
+float calc_damping_coeff(int32_t fs, float hf_ratio, float length, float decay_time, float f0)
+{
+	float coeff = 0;
+	float gain;
+	float cw;
+
+	// A ratio greater than 1 would turn the damping into a boost
+	if(hf_ratio < 1)
+	{
+		gain = calc_decay_coeff(length, decay_time * hf_ratio) / calc_decay_coeff(length, decay_time);
+		cw = (float)cos(2 * M_PI * f0 / fs);
+
+		// The filter is single-pole, so the gain has to be squared
+		gain *= gain;
+
+		// Compare against 1 approximately (using 1 - epsilon)
+		if(gain < 0.9999f)
+		{
+			// A gain below -60 dB would push the coefficient towards 1 and
+			// end up flattening the signal, so floor it
+			gain = MAX(gain, 0.001f);
+			coeff = (1 - gain * cw - sqrt(2 * gain * (1 - cw) - gain * gain * (1 - cw * cw))) / (1 - gain);
+		}
+
+		// Very small decay times would otherwise produce almost no output,
+		// so cap the coefficient at 0.98
+		coeff = MIN(coeff, 0.98f);
+	}
+
+	return coeff;
+}
+
+float lerp( float val1, float val2, float mu )
+{
+	return val1 + (val2 - val1) * mu;
+}
+
+float calc_density_gain(float a)
+{
+	/* The energy of a signal can be obtained by finding the area under the
+	 * squared signal. This takes the form of Sum(x_n^2), where x is the
+	 * amplitude for the sample n.
+	 *
+	 * Decaying feedback matches exponential decay of the form Sum(a^n),
+	 * where a is the attenuation coefficient, and n is the sample. The area
+	 * under this decay curve can be calculated as: 1 / (1 - a).
+	 *
+	 * Modifying the above equation to find the squared area under the curve
+	 * (for energy) yields: 1 / (1 - a^2). Input attenuation can then be
+	 * calculated by inverting the square root of this approximation,
+	 * yielding: 1 / sqrt(1 / (1 - a^2)), simplified to: sqrt(1 - a^2).
+	 */
+	return sqrt(1 - (a * a));
+}
+
+// Calculate the mixing matrix coefficients given a diffusion factor.
+void calc_matrix_coeffs(float diffusion, float *x, float *y)
+{
+	float n, t;
+
+	// The matrix is of order 4, so n is sqrt(4 - 1).
+	n = sqrt(3.0f);
+	t = diffusion * atan(n);
+
+	// Calculate the first mixing matrix coefficient.
+	*x = cos(t);
+	// Calculate the second mixing matrix coefficient.
+	*y = sin(t) / n;
+}
+
+// Calculate the limited HF ratio for use with the late reverb low-pass
+// filters.
+float calc_limited_hf_ratio(float hf_ratio, float air_absorption_gain_hf, float decay_time)
+{
+	float limitRatio;
+
+	/* Find the attenuation due to air absorption in dB (converting delay
+	 * time to meters using the speed of sound). Then reversing the decay
+	 * equation, solve for HF ratio. The delay length is cancelled out of
+	 * the equation, so it can be calculated once for all lines.
+	 */
+	limitRatio = 1.0f / (calc_decay_length(air_absorption_gain_hf, decay_time) *
+		343.3f/*SPEEDOFSOUNDMETRESPERSEC*/);
+	/* Using the limit calculated above, apply the upper bound to the HF
+	 * ratio. Also need to limit the result to a minimum of 0.1, just like the
+	 * HF ratio parameter.
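+ * (Assuming the MIDDLE macro returns the median of its three arguments,
+ * this is hf_ratio clamped to the range [0.1, limitRatio].)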
*/ + return MIDDLE(limitRatio, 0.1f, hf_ratio); +} +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_common/AlReverbCommon.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_common/AlReverbCommon.h new file mode 100755 index 0000000..27af5f9 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_common/AlReverbCommon.h @@ -0,0 +1,68 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//包含 openal reverb 库中需要处理的一些基础函数 + +#ifndef __AL_REVERB_COMMON_H__ +#define __AL_REVERB_COMMON_H__ + + + +#include + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +//第一个参数是延迟长度,也就是多久算一次,第二个是 T60 衰减时间 +float calc_decay_coeff(float length, float decay_time); + +float calc_decay_length(float coeff, float decay_time); + +//计算高通(甚至低通)的衰减系数 +float calc_damping_coeff(int32_t fs, float hf_ratio, float length, float decay_time, float f0); + +//线性插值的 lerp 函数 +float lerp(float val1, float val2, float mu); + +//计算密度衰减增益 +float calc_density_gain(float a); + +//计算混合矩阵系数 +void calc_matrix_coeffs(float diffusion, float *x, float *y); + +float calc_limited_hf_ratio(float hf_ratio, float air_absorption_gain_hf, float decay_time); +} +} + +#endif /* __AL_REVERB_COMMON_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_early_reflection/AlReverbEarlyReflection.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_early_reflection/AlReverbEarlyReflection.cpp new file mode 100755 index 0000000..fcfcb18 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_early_reflection/AlReverbEarlyReflection.cpp @@ -0,0 +1,90 @@ + +#include "AlReverbEarlyReflection.h" +#include "AlReverbCommon.h" + +#include "AlReverbDefs.h" +#include + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +// 4 个早期反射的延迟量 +const static float gs_early_delay[4] = { + 0.0015f, 0.0045f, 0.0135f, 0.0405f +}; + +AlReverbEarlyReflection::AlReverbEarlyReflection() +{ + memset(m_decay, 0, sizeof(m_decay)); + m_gain = 1; +} + +AlReverbEarlyReflection::~AlReverbEarlyReflection() +{ + +} + +void AlReverbEarlyReflection::flush() +{ + for(int32_t i = 0; i < 4; i++) + { + m_delay[i].flush(); + } +} + +int32_t AlReverbEarlyReflection::get_latency() +{ + int32_t latecy = m_delay[0].get_latecy(); + + for(int32_t i = 0; i < 4; i++) + { + latecy = MIN(latecy, m_delay[i].get_latecy()); + } + + return latecy; +} + +int32_t AlReverbEarlyReflection::set_param(int32_t fs, float reverb_gain, float early_gain, float late_delay) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + m_gain = 
0.5f * reverb_gain * early_gain; + + for(int32_t i = 0; i < 4; i++) + { + nRet = m_delay[i].set_delay_len(int32_t(fs * gs_early_delay[i])); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + + m_decay[i] = calc_decay_coeff(gs_early_delay[i], late_delay); + } + + return nRet; +} + +void AlReverbEarlyReflection::filter(float in, float (&out)[4]) +{ + float sum = 0; + + for(int32_t i = 0; i < 4; i++) + { + out[i] = m_delay[i].get_now() * m_decay[i]; + sum += out[i]; + } + + sum = sum * 0.5f + in; + + for(int32_t i = 0; i < 4; i++) + { + out[i] = sum - out[i]; + m_delay[i].put_now(out[i]); + out[i] *= m_gain; + } +} + + +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_early_reflection/AlReverbEarlyReflection.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_early_reflection/AlReverbEarlyReflection.h new file mode 100755 index 0000000..756e826 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_early_reflection/AlReverbEarlyReflection.h @@ -0,0 +1,72 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//实现早期反射模型的类,本来应该是单纯的梳状滤波器组的,但是这里将梳状滤波叠加延迟,增加了混响强度 + +#ifndef __AL_REVERB_EARLY_REFLECTION_H__ +#define __AL_REVERB_EARLY_REFLECTION_H__ + +#include "fast_delay/SupersoundFastDelay.h" + +namespace SUPERSOUND +{ + +namespace ALREVERB +{ + + +class AlReverbEarlyReflection +{ +public: + AlReverbEarlyReflection(); + ~AlReverbEarlyReflection(); + +public: + void flush(); + int32_t get_latency(); + int32_t set_param(int32_t fs, float reverb_gain, float early_gain, float late_delay); + //这个有点蛋碎,和正常的滤波器不是那么一致 + void filter(float in, float (&out)[4]); + +private: + //利用无损衍射的waveguide理论创建最大的漫反射效果,也就是延迟反馈网络 + SuperSoundFastDelay m_delay[4]; + //每个延迟的衰减系数,也就是计算到衰减-60dB,每次衰减需要衰减多少 + float m_decay[4]; + //最后的输出增益 + float m_gain; +}; + + +} +} + +#endif /* __AL_REVERB_EARLY_REFLECTION_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_echo/AlReverbEcho.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_echo/AlReverbEcho.cpp new file mode 100755 index 0000000..983f2f0 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_echo/AlReverbEcho.cpp @@ -0,0 +1,94 @@ + +#include "AlReverbEcho.h" +#include "AlReverbDefs.h" +#include "AlReverbCommon.h" +#include + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +// When diffusion is above 0, an all-pass filter is used to take the edge off +// the echo effect. It uses the following line length (in seconds). 
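+// The all-pass decays with the same T60 as the echo itself; see how
+// set_param below passes decay_time to both. (0.0133 s is roughly 587
+// samples at 44.1 kHz.)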
+#define ECHO_ALLPASS_LENGTH 0.0133f + +AlReverbEcho::AlReverbEcho() +{ + m_coeff = 0; + m_densityGain = 0; + memset(m_mixCoeff, 0, sizeof(m_mixCoeff)); +} + +AlReverbEcho::~AlReverbEcho() +{ + +} + +void AlReverbEcho::flush() +{ + m_delay.flush(); + m_lowpass.flush(); + m_allpass.flush(); +} + +int32_t AlReverbEcho::get_latecy() +{ + return m_delay.get_latecy() + m_lowpass.get_latecy() + m_allpass.get_latecy(); +} + +int32_t AlReverbEcho::set_param(int32_t fs, float reverb_gain, float late_gain, float echo_time, + float decay_time, float diffusion, float echo_depth, float hf_ratio, float f0) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + m_coeff = calc_decay_coeff(echo_time, decay_time); + + m_densityGain = calc_density_gain(m_coeff); + + nRet = m_delay.set_delay_len(int32_t(fs * echo_time)); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + nRet = m_allpass.set_param(fs, diffusion, ECHO_ALLPASS_LENGTH, decay_time); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + nRet = m_lowpass.set_param(fs, hf_ratio, echo_time, decay_time, f0); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + /* Calculate the echo mixing coefficients. The first is applied to the + * echo itself. The second is used to attenuate the late reverb when + * echo depth is high and diffusion is low, so the echo is slightly + * stronger than the decorrelated echos in the reverb tail. + */ + m_mixCoeff[0] = reverb_gain * late_gain * echo_depth; + m_mixCoeff[1] = 1 - (echo_depth * 0.5f * (1 - diffusion)); + + return nRet; +} + +void AlReverbEcho::Filter( float in, float (&in_out)[4] ) +{ + float feed = m_delay.get_now() * m_coeff; + float out = m_mixCoeff[0] * feed; + + for(int32_t i = 0; i < 4; i++) + { + in_out[i] = m_mixCoeff[1] * in_out[i] + out; + } + + feed += m_densityGain * in; + + feed = m_lowpass.filter(feed); + + feed = m_allpass.filter(feed); + + m_delay.put_now(feed); +} + + +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_echo/AlReverbEcho.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_echo/AlReverbEcho.h new file mode 100755 index 0000000..136bf34 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_echo/AlReverbEcho.h @@ -0,0 +1,73 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//实现一个回声效果 + +#ifndef __AL_REVERB_ECHO_H__ +#define __AL_REVERB_ECHO_H__ + +#include "fast_delay/SupersoundFastDelay.h" +#include "AlReverbLateAllpass.h" +#include "AlReverbLateLowpass.h" + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +class AlReverbEcho +{ +public: + AlReverbEcho(); + ~AlReverbEcho(); + +public: + void flush(); + int32_t get_latecy(); + int32_t set_param(int32_t fs, float reverb_gain, float late_gain, float echo_time, + float decay_time, float diffusion, float echo_depth, float hf_ratio, float f0); + void Filter(float in, float (&in_out)[4]); + +private: + SuperSoundFastDelay m_delay; + AlReverbLateLowpass m_lowpass; + AlReverbLateAllpass m_allpass; + float m_coeff; + float m_densityGain; + float m_mixCoeff[2]; +}; + + +} +} + +#endif /* __AL_REVERB_ECHO_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_allpass/AlReverbLateAllpass.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_allpass/AlReverbLateAllpass.cpp new file mode 100755 index 0000000..56afbcb --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_allpass/AlReverbLateAllpass.cpp @@ -0,0 +1,54 @@ + +#include "AlReverbLateAllpass.h" +#include "AlReverbCommon.h" +#include + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +AlReverbLateAllpass::AlReverbLateAllpass() +{ + m_coeff = 0; + m_feedCoeff = 0; +} + +AlReverbLateAllpass::~AlReverbLateAllpass() +{ + +} + +void AlReverbLateAllpass::flush() +{ + m_delay.flush(); +} + +int32_t AlReverbLateAllpass::get_latecy() +{ + return m_delay.get_latecy(); +} + +int32_t AlReverbLateAllpass::set_param(int32_t fs, float diffusion, float length, float decay_time) +{ + m_feedCoeff = 0.5f * pow(diffusion, 2); + + m_coeff = calc_decay_coeff(length, decay_time); + + return m_delay.set_delay_len(int32_t(float(fs * length))); +} + +float AlReverbLateAllpass::filter(float in) +{ + float out = m_delay.get_now(); + float feed = m_feedCoeff * in; + + m_delay.put_now(m_feedCoeff * (out - feed) + in); + + return m_coeff * out - feed; +} + + +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_allpass/AlReverbLateAllpass.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_allpass/AlReverbLateAllpass.h new file mode 100755 index 0000000..a9ebee6 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_allpass/AlReverbLateAllpass.h @@ -0,0 +1,67 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//实现后延迟中的全通滤波器,特么和延迟器混叠在一起的,醉了 + +#ifndef __AL_REVERB_LATE_ALLPASS_H__ +#define __AL_REVERB_LATE_ALLPASS_H__ + +#include "fast_delay/SupersoundFastDelay.h" + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +class AlReverbLateAllpass +{ +public: + AlReverbLateAllpass(); + ~AlReverbLateAllpass(); + +public: + void flush(); + int32_t get_latecy(); + int32_t set_param(int32_t fs, float diffusion, float length, float decay_time); + float filter(float in); + +private: + SuperSoundFastDelay m_delay; + float m_coeff; + float m_feedCoeff; +}; + + +} +} + +#endif /* __AL_REVERB_LATE_ALLPASS_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_lowpass/AlReverbLateLowpass.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_lowpass/AlReverbLateLowpass.cpp new file mode 100755 index 0000000..8e7f458 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_lowpass/AlReverbLateLowpass.cpp @@ -0,0 +1,52 @@ + +#include "AlReverbLateLowpass.h" +#include "AlReverbCommon.h" +#include "AlReverbDefs.h" + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +AlReverbLateLowpass::AlReverbLateLowpass() +{ + m_coeff = 1; + + flush(); +} + +AlReverbLateLowpass::~AlReverbLateLowpass() +{ + +} + +void AlReverbLateLowpass::flush() +{ + m_y1 = 0; +} + +int32_t AlReverbLateLowpass::get_latecy() +{ + return 0; +} + +int32_t AlReverbLateLowpass::set_param(int32_t fs, float hf_ratio, float length, float decay_time, float f0) +{ + m_coeff = calc_damping_coeff(fs, hf_ratio, length, decay_time, f0); + + return ERROR_SUPERSOUND_SUCCESS; +} + +float AlReverbLateLowpass::filter(float in) +{ + float out = lerp(in, m_y1, m_coeff); + + m_y1 = out; + + return out; +} + + +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_lowpass/AlReverbLateLowpass.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_lowpass/AlReverbLateLowpass.h new file mode 100755 index 0000000..4e38a85 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_lowpass/AlReverbLateLowpass.h @@ -0,0 +1,66 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / /
+//+ =====`-.____`.___ \_____/___.-`___.-'=====
+//+ `=---='
+//+
+//+
+//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+//+
+//+ 佛祖保佑 永无BUG
+//+ ----------------------------------------------------+
+
+// Implements the low-pass inside the late reverb path; it uses the same
+// formula as an ordinary one-pole low-pass
+
+#ifndef __AL_REVERB_LATE_LOWPASS_H__
+#define __AL_REVERB_LATE_LOWPASS_H__
+
+#include <stdint.h>	// int32_t
+#include "AudioEffectsConf.h"
+namespace SUPERSOUND
+{
+namespace ALREVERB
+{
+
+
+class AlReverbLateLowpass
+{
+public:
+	AlReverbLateLowpass();
+	~AlReverbLateLowpass();
+
+public:
+	void flush();
+	int32_t get_latecy();
+	int32_t set_param(int32_t fs, float hf_ratio, float length, float decay_time, float f0);
+	float filter(float in);
+
+private:
+	float m_coeff;
+	float m_y1;
+};
+
+
+}
+}
+
+#endif /* __AL_REVERB_LATE_LOWPASS_H__ */
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_reverb/AlReverbLateReverb.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_reverb/AlReverbLateReverb.cpp
new file mode 100755
index 0000000..7428593
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_reverb/AlReverbLateReverb.cpp
@@ -0,0 +1,143 @@
+
+#include "AlReverbLateReverb.h"
+#include "AlReverbDefs.h"
+#include "AlReverbCommon.h"
+#include <string.h>	// memset
+
+namespace SUPERSOUND
+{
+namespace ALREVERB
+{
+
+
+// Delay lengths (in seconds) of the 4 late reverb lines
+const static float gs_late_delay[4] = {
+	0.0211f, 0.0311f, 0.0461f, 0.0680f
+};
+
+const static float gs_allpass_length[4] = {
+	0.0151f, 0.0167f, 0.0183f, 0.0200f,
+};
+
+#define LATE_LINE_MULTIPLIER 4
+
+AlReverbLateReverb::AlReverbLateReverb()
+{
+	m_mixCoeff = 1;
+
+	memset(m_coeff, 0, sizeof(m_coeff));
+
+	m_gain = 1;
+
+	m_density_gain = 1;
+}
+
+AlReverbLateReverb::~AlReverbLateReverb()
+{
+
+}
+
+void AlReverbLateReverb::flush()
+{
+	for(int32_t i = 0; i < 4; i++)
+	{
+		m_delay[i].flush();
+		m_lowpass[i].flush();
+		m_allpass[i].flush();
+	}
+}
+
+int32_t AlReverbLateReverb::get_latecy()
+{
+	int32_t latecy = m_delay[0].get_latecy() +
+		m_lowpass[0].get_latecy() +
+		m_allpass[0].get_latecy();
+
+	// Report the smallest end-to-end latency across the four lines
+	for(int32_t i = 1; i < 4; i++)
+	{
+		int32_t len = 0;
+		len += m_delay[i].get_latecy();
+		len += m_lowpass[i].get_latecy();
+		len += m_allpass[i].get_latecy();
+		latecy = MIN(latecy, len);
+	}
+
+	return latecy;
+}
+
+int32_t AlReverbLateReverb::set_param(int32_t fs, float reverb_gain, float late_gain,
+	float density, float decay_time, float diffusion, float hf_ratio, float hfcutoff)
+{
+	int32_t nRet = ERROR_SUPERSOUND_SUCCESS;
+	float length;
+	float x, y;
+
+	calc_matrix_coeffs(diffusion, &x, &y);
+	m_mixCoeff = y / x;
+
+	m_gain = reverb_gain * late_gain * x;
+
+	length = (gs_late_delay[0] + gs_late_delay[1] + gs_late_delay[2] + gs_late_delay[3]) / 4;
+	length *= 1 + (density * LATE_LINE_MULTIPLIER);
+	m_density_gain = calc_density_gain(calc_decay_coeff(length, decay_time));
+
+	for(int32_t i = 0; i < 4; i++)
+	{
+		length = gs_late_delay[i] * (1 + density * LATE_LINE_MULTIPLIER);
+
+		nRet = m_delay[i].set_delay_len(int32_t(length * fs));
+		if(ERROR_SUPERSOUND_SUCCESS != nRet)
+			return nRet;
+
+		nRet = m_lowpass[i].set_param(fs, hf_ratio, length, decay_time, hfcutoff);
+		if(ERROR_SUPERSOUND_SUCCESS != nRet)
+			return nRet;
+
+		nRet = m_allpass[i].set_param(fs, diffusion, gs_allpass_length[i], decay_time);
+		if(ERROR_SUPERSOUND_SUCCESS != nRet)
+			return nRet;
+
+		m_coeff[i] = calc_decay_coeff(length, decay_time) * x;
+	}
+
+	return nRet;
+}
+
+void 
AlReverbLateReverb::filter(float (&in)[4], float (&out)[4]) +{ + float d[4]; + + d[0] = m_lowpass[2].filter(in[2] + m_delay[2].get_now() * m_coeff[2]); + d[1] = m_lowpass[0].filter(in[0] + m_delay[0].get_now() * m_coeff[0]); + d[2] = m_lowpass[3].filter(in[3] + m_delay[3].get_now() * m_coeff[3]); + d[3] = m_lowpass[1].filter(in[1] + m_delay[1].get_now() * m_coeff[1]); + + d[0] = m_allpass[0].filter(d[0]); + d[1] = m_allpass[1].filter(d[1]); + d[2] = m_allpass[2].filter(d[2]); + d[3] = m_allpass[3].filter(d[3]); + + out[0] = d[0] + (m_mixCoeff * ( d[1] + -d[2] + d[3])); + out[1] = d[1] + (m_mixCoeff * (-d[0] + d[2] + d[3])); + out[2] = d[2] + (m_mixCoeff * ( d[0] + -d[1] + d[3])); + out[3] = d[3] + (m_mixCoeff * (-d[0] + -d[1] + -d[2] )); + + m_delay[0].put_now(out[0]); + m_delay[1].put_now(out[1]); + m_delay[2].put_now(out[2]); + m_delay[3].put_now(out[3]); + + out[0] = m_gain * out[0]; + out[1] = m_gain * out[1]; + out[2] = m_gain * out[2]; + out[3] = m_gain * out[3]; +} + +float AlReverbLateReverb::get_density_gain() +{ + return m_density_gain; +} + + +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_reverb/AlReverbLateReverb.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_reverb/AlReverbLateReverb.h new file mode 100755 index 0000000..abc381d --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_late_reverb/AlReverbLateReverb.h @@ -0,0 +1,103 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//实现后期反射 +/* Late reverb is done with a modified feed-back delay network (FDN) +* topology. Four input lines are each fed through their own all-pass +* filter and then into the mixing matrix. The four outputs of the +* mixing matrix are then cycled back to the inputs. Each output feeds +* a different input to form a circlular feed cycle. +* +* The mixing matrix used is a 4D skew-symmetric rotation matrix derived +* using a single unitary rotational parameter: +* +* [ d, a, b, c ] 1 = a^2 + b^2 + c^2 + d^2 +* [ -a, d, c, -b ] +* [ -b, -c, d, a ] +* [ -c, b, -a, d ] +* +* The rotation is constructed from the effect's diffusion parameter, +* yielding: 1 = x^2 + 3 y^2; where a, b, and c are the coefficient y +* with differing signs, and d is the coefficient x. The matrix is thus: +* +* [ x, y, -y, y ] n = sqrt(matrix_order - 1) +* [ -y, x, y, y ] t = diffusion_parameter * atan(n) +* [ y, -y, x, y ] x = cos(t) +* [ -y, -y, -y, x ] y = sin(t) / n +* +* To reduce the number of multiplies, the x coefficient is applied with +* the cyclical delay line coefficients. 
Thus only the y coefficient is +* applied when mixing, and is modified to be: y / x. +*/ + +#ifndef __AL_REVERB_LATE_REVERB_H__ +#define __AL_REVERB_LATE_REVERB_H__ + +#include "fast_delay/SupersoundFastDelay.h" +#include "AlReverbLateAllpass.h" +#include "AlReverbLateLowpass.h" + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +class AlReverbLateReverb +{ +public: + AlReverbLateReverb(); + ~AlReverbLateReverb(); + +public: + void flush(); + int32_t get_latecy(); + int32_t set_param(int32_t fs, float reverb_gain, float late_gain, + float density, float decay_time, float diffusion, float hf_ratio, float hfcutoff); + void filter(float (&in)[4], float (&out)[4]); + float get_density_gain(); + +private: + SuperSoundFastDelay m_delay[4]; + AlReverbLateLowpass m_lowpass[4]; + AlReverbLateAllpass m_allpass[4]; + + float m_mixCoeff; + float m_coeff[4]; + float m_gain; + float m_density_gain; +}; + + +} +} + +#endif /* __AL_REVERB_LATE_REVERB_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_modulation/AlReverbModulation.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_modulation/AlReverbModulation.cpp new file mode 100755 index 0000000..7cffac1 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_modulation/AlReverbModulation.cpp @@ -0,0 +1,44 @@ + +#include "AlReverbModulation.h" +#include "AlReverbDefs.h" + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +AlReverbModulation::AlReverbModulation() +{ + +} + +AlReverbModulation::~AlReverbModulation() +{ + +} + +void AlReverbModulation::flush() +{ + m_delay.flush(); +} + +int32_t AlReverbModulation::get_latecy() +{ + return m_delay.get_latecy(); +} + +int32_t AlReverbModulation::set_param(int32_t fs, float time, float depth) +{ + m_delay.set_delay_len(1); + return ERROR_SUPERSOUND_SUCCESS; +} + +float AlReverbModulation::filter(float in) +{ + return m_delay.filter(in); +} + + +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_modulation/AlReverbModulation.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_modulation/AlReverbModulation.h new file mode 100755 index 0000000..2bf57dc --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/al_reverb_modulation/AlReverbModulation.h @@ -0,0 +1,66 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//主要是实现一个调制器,本来调制器应该实现一个类似于重采样的功能,解决 +//因为因为采样率等变化带来的瞬态颤音问题,这里直接都略过了 + +#ifndef __AL_REVERB_MODULATION_H__ +#define __AL_REVERB_MODULATION_H__ + +#include "fast_delay/SupersoundFastDelay.h" + +namespace SUPERSOUND +{ +namespace ALREVERB +{ + + +class AlReverbModulation +{ +public: + AlReverbModulation(); + ~AlReverbModulation(); + +public: + void flush(); + int32_t get_latecy(); + int32_t set_param(int32_t fs, float time, float depth); + float filter(float in); + +private: + SuperSoundFastDelay m_delay; +}; + + +} +} + +#endif /* __AL_REVERB_MODULATION_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/fast_delay/SupersoundFastDelay.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/fast_delay/SupersoundFastDelay.cpp new file mode 100755 index 0000000..fb59aa2 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/fast_delay/SupersoundFastDelay.cpp @@ -0,0 +1,155 @@ + +#include "SupersoundFastDelay.h" +#include "AlReverbDefs.h" +#include "AlReverbCommon.h" +#include +#include +#include + +namespace SUPERSOUND +{ + + +SuperSoundFastDelay::SuperSoundFastDelay() +{ + m_len = -1; + m_idx = 0; + + m_cache = NULL; + m_mask = -1; +} + +SuperSoundFastDelay::~SuperSoundFastDelay() +{ + SAFE_DELETE_PTR(m_cache); + m_mask = -1; +} + +void SuperSoundFastDelay::flush() +{ + for(int32_t i = 0; i < m_len; i++) + { + put_now(0); + } +} + +int32_t SuperSoundFastDelay::get_latecy() +{ + return m_len; +} + +int32_t SuperSoundFastDelay::set_delay_len(int32_t len) +{ + //相等就直接返回 + if(len == m_len) + return ERROR_SUPERSOUND_SUCCESS; + + //重新申请一段新的内存空间 + int32_t delay = len; + len = supersound_next_power_2(delay + 1); + float * cache = new(std::nothrow) float[len]; + if(NULL == cache) + { + return ERROR_SUPERSOUND_MEMORY; + } + memset(cache, 0, sizeof(float) * len); + + //如果原始有数据的话,采用线性插值的方式来减少破音 + if(m_cache != NULL) + { + resample(cache, delay); + } + + //重新更新各个参量 + m_cache = cache; + m_len = delay; + m_mask = len - 1; + m_idx = 0; + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t SuperSoundFastDelay::set_param(int32_t fs, float ms) +{ + return set_delay_len(int32_t(fs * ms / 1000)); +} + +float SuperSoundFastDelay::filter(float in) +{ + int32_t idx = (m_idx + m_len) & m_mask; + + float out = m_cache[m_idx]; + m_cache[idx] = in; + + + m_idx = (m_idx + 1) & m_mask; + + return out; +} + +float SuperSoundFastDelay::get_now() +{ + return m_cache[m_idx]; +} + +void SuperSoundFastDelay::put_now(float in) +{ + int32_t idx = (m_idx + m_len) & m_mask; + + m_cache[idx] = in; + + m_idx = (m_idx + 1) & m_mask; +} + +float SuperSoundFastDelay::get_data(int32_t pos) +{ + int32_t idx = (pos + m_idx) & m_mask; + return m_cache[idx]; +} + +void SuperSoundFastDelay::resample(float *cache, int32_t delay) +{ + //数据较少的话就使用拷贝,否则使用重采样的方式 + if((m_len <= 2) || (delay <= 2)) + { + for(int32_t i = 0; i < (delay / 2); i++) + { + cache[i] = get_data(m_len / 2); + } + for(int32_t i = delay / 2; i < delay; i++) + { + cache[i] = get_data(MAX(0, m_len - 1)); + } + } + else + { + int32_t isample; + float istep = (float(m_len - 2)) / (delay - 2); + float s1, s2; + float alpha; + for(int32_t i = 0; i < (delay - 1); i++) + { + isample = int32_t(i * istep); + alpha = i * istep - isample; + s1 = 
get_data(isample); + s2 = get_data(isample + 1); + cache[i] = s1 * alpha + s2 * (1 - alpha); + } + cache[delay - 1] = get_data(m_len - 1); + } +} + +int32_t SuperSoundFastDelay::supersound_next_power_2(int32_t x) +{ + if(x > 0) +{ + x--; + x |= x >> 1; + x |= x >> 2; + x |= x >> 4; + x |= x >> 8; + x |= x >> 16; +} +return x + 1; +} +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/fast_delay/SupersoundFastDelay.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/fast_delay/SupersoundFastDelay.h new file mode 100755 index 0000000..410d376 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/fast_delay/SupersoundFastDelay.h @@ -0,0 +1,76 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//开发一个快速延迟器 + +#ifndef __AL_REVERB_FAST_DELAY_H__ +#define __AL_REVERB_FAST_DELAY_H__ + +#include +#include "AudioEffectsConf.h" + +namespace SUPERSOUND +{ + + +class SuperSoundFastDelay +{ +public: + SuperSoundFastDelay(); + ~SuperSoundFastDelay(); + +public: + void flush(); + int32_t get_latecy(); + int32_t set_delay_len(int32_t len); + int32_t set_param(int32_t fs, float ms); + float filter(float in); + //这两个接口主要是为梳状滤波等需要取和放不同步的问题 + float get_now(); + void put_now(float in); + +private: + float get_data(int32_t pos); + void resample(float *cache, int32_t delay); + //用来将一个数转为大于它的最小的2的n次方数 + int32_t supersound_next_power_2(int32_t x); +private: + int32_t m_len; + int32_t m_idx; + float * m_cache; + //缓存的长度,为 2 的 n 次幂减 1 + int32_t m_mask; +}; + + +} + +#endif /* __AL_REVERB_FAST_DELAY_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/filter/CFilters.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/filter/CFilters.cpp new file mode 100644 index 0000000..7404089 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/filter/CFilters.cpp @@ -0,0 +1,403 @@ +/************************************************************************/ +/* Phonograph Eimulator */ +/* written by evieng, 7.21,2013 */ +/* last modifiey by evieng, 6.6,2013 */ +/* copy right reserved */ +/************************************************************************/ + +#include "math.h" +#include "stdlib.h" +#include "stdio.h" +#include "memory.h" +#include "AlReverbDefs.h" +#include "filter/CFilters.h" +//#include "audio_score/Score/KTYPED.h" +#include "biquad_filters/BiquadFilter.h" + +// This is a trick. 
When enabled, all channels refer to the 1st channel +// #define PSEUDO_MULTICHANNELS 1 // defined in KTYPED.h +#ifdef _MSC_VER +// MSVC build for Windows, and it's (expected to be) able to handle true stereo in real time +#define PSEUDO_MULTICHANNELS 0 +#else +#define PSEUDO_MULTICHANNELS 1 +#endif +#define VERSION_ID_NUMBER 100 /* 7.21,2013 */ + +using std::vector; +using namespace BiquadFilter; + + +#define HPF_FREQ (2000.0f / 44100.0f) +#define LPF_FREQ (6000.0f / 44100.0f) +#define HPFQ 0.5f +#define LPFQ 0.5f + +#define BPF_LOW_EDGE (600.0f / 44100.0f) +#define BPF_HIGH_EDGE (8000.0f / 44100.0f) + +class CBaseFilters +{ +public: + CBaseFilters(); + virtual ~CBaseFilters(); + void reset(); + + bool isAllocated() const; + int setFilterType(int ftype) + { + if (ftype < LOW_PASS_FILTER) + { + m_fType = LOW_PASS_FILTER; + } + else if (ftype > BAND_PASS_FILTER) + { + m_fType = BAND_PASS_FILTER; + } + else + m_fType = ftype; + return 0; + } + + void filtering(std::vector *x); + +private: + LPFilter* lpf; + HPFilter* hpf; + BPFilter* bpf; + int m_fType; +}; + +bool CBaseFilters::isAllocated() const +{ + return lpf != NULL && hpf != NULL && bpf != NULL; +} + + + +void CBaseFilters::filtering(std::vector *x) +{ + if (m_fType == LOW_PASS_FILTER) + { + lpf->filtering(x); + } + else if (m_fType == HIGH_PASS_FILTER) + { + hpf->filtering(x); + } + else if (m_fType == BAND_PASS_FILTER) + { + bpf->filtering(x); + } + else + lpf->filtering(x); + //hpf->filtering(x); +} + + + +CBaseFilters::CBaseFilters() +{ + m_fType = LOW_PASS_FILTER; + hpf = new HPFilter(HPF_FREQ, HPFQ); + lpf = new LPFilter(LPF_FREQ, LPFQ); + bpf = new BPFilter(BPF_LOW_EDGE, BPF_HIGH_EDGE); + + if (!hpf || !lpf || !bpf) + { + if (hpf) + { + delete hpf; + hpf = NULL; + } + if (lpf) + { + delete lpf; + lpf = NULL; + } + if (bpf) + { + delete bpf; + bpf = NULL; + } + } +} + +void CBaseFilters::reset() +{ + if (hpf) + { + hpf->reset(); + } + if (lpf) + { + lpf->reset(); + } + if (bpf) + { + bpf->reset(); + } +} + +CBaseFilters::~CBaseFilters() +{ + delete lpf; + delete hpf; + delete bpf; + lpf = NULL; + hpf = NULL; + bpf = NULL; +} + +CFilters::CFilters() +{ + m_samplerate = 0; + m_channels = 0; + handles = NULL; +} + +CFilters::~CFilters() +{ + Uninit(); +} + +int CFilters::Init(int inSampleRate, int inChannel) +{ + m_samplerate = inSampleRate; + m_channels = inChannel; + + + handles = new CBaseFilters*[m_channels]; + + if (!handles) + { + return ALRB_ERR_BASE_H_MALLOC_NULL; + } + + for (int chn = 0; chn < m_channels; chn++) + { + CBaseFilters* filters = new CBaseFilters(); + + ((CBaseFilters**)handles)[chn] = filters; + + if (!filters->isAllocated()) + { + do{ + CBaseFilters* filters = ((CBaseFilters**)handles)[chn]; + delete filters; + + } while (chn--); + + delete [] (CBaseFilters**)handles; + handles = NULL; + + return ALRB_ERR_BASE_H_MALLOC_NULL; + } + + } + + return 0; +} + +void CFilters::Reset() +{ + if (handles) + { + for (int chn = 0; chn < m_channels; chn++) + { + CBaseFilters* filters = ((CBaseFilters**)handles)[chn]; + + if (filters) + { + filters->reset(); + } + + } + } +} + +void CFilters::Uninit() +{ + if (handles) + { + for (int chn = 0; chn < m_channels; chn++) + { + CBaseFilters* filters = ((CBaseFilters**)handles)[chn]; + + if (filters) + { + delete filters; + } + + } + + delete [] (CBaseFilters**)handles; + handles = NULL; + } +} +int CFilters::setFilterType(int fType) +{ + if (handles) + { + for (int chn = 0; chn < m_channels; chn++) + { + CBaseFilters* filters = ((CBaseFilters**)handles)[chn]; + + if (filters) + 
{ + filters->setFilterType(fType); + } + + } + return 0; + } + else + return ALRB_ERR_BASE_H_MALLOC_NULL; +} + +int CFilters::ProcessLRIndependent(float * inLeft, float * inRight, int inOutSize) +{ + if (2 != m_channels) + { + return ALRB_ERR_PARAM; + } + data.reserve(inOutSize); + data.resize(inOutSize); + if (handles) { + data.assign(inLeft, inLeft + inOutSize); + CBaseFilters* filters = ((CBaseFilters**)handles)[0]; + filters->filtering(&data); + for (unsigned int i = 0; i < data.size(); i++) { + inLeft[i] = data[i]; + } + + data.assign(inRight, inRight + inOutSize); + filters = ((CBaseFilters**)handles)[1]; + filters->filtering(&data); + for (unsigned int i = 0; i < data.size(); i++) { + inRight[i] = data[i]; + } + } + return inOutSize; +} + +int CFilters::Process(float* inBuffer, int inSize) +{ + if (0 != (inSize % m_channels)) + { + return ALRB_ERR_PARAM; + } + + if (handles) + { + + data.reserve(inSize / m_channels); + data.resize(inSize / m_channels); + + for (int chn = 0; chn < m_channels; chn++) + { + CBaseFilters* filters = ((CBaseFilters**)handles)[chn]; + float* audio = inBuffer + chn; + + if (filters) + { + if (PSEUDO_MULTICHANNELS && chn > 0) + { + float* audioref = inBuffer; + + for (unsigned int i = 0; i < data.size(); i++){ + audio[0] = audioref[0]; + audio += m_channels; + audioref += m_channels; + } + } + else + { + + for (unsigned int i = 0; i < data.size(); i++){ + // data[i]= audio[i * m_channels + chn] / 32768.0; + data[i] = audio[0]; + audio += m_channels; + } + + filters->filtering(&data); + + float* audio = inBuffer + chn; + + for (unsigned int i = 0; i < data.size(); i++){ + *audio = data[i]; + audio += m_channels; + } + } // if (PSEUDO_MULTICHANNELS && chn>0) + + } + + } + } + return ALRB_ERR_SUCCESS; +} + +int CFilters::Process(char* inBuffer, int inSize) +{ + if (0 != (inSize % (sizeof(short) * m_channels))) + { + return ALRB_ERR_PARAM; + } + + if (handles) + { + + data.reserve(inSize / sizeof(short) / m_channels); + data.resize(inSize / sizeof(short) / m_channels); + + for (int chn = 0; chn < m_channels; chn++) + { + CBaseFilters* filters = ((CBaseFilters**)handles)[chn]; + short* audio = chn + (short*)inBuffer; + + if (filters) + { + if (PSEUDO_MULTICHANNELS && chn>0) + { + short* audioref = (short*)inBuffer; + + for (unsigned int i = 0; i < data.size(); i++){ + audio[0] = audioref[0]; + audio += m_channels; + audioref += m_channels; + } + } + else + { + + for (unsigned int i = 0; i < data.size(); i++){ + // data[i]= audio[i * m_channels + chn] / 32768.0; + data[i]= audio[0] / 32768.0f; + audio += m_channels; + } + + filters->filtering(&data); + + short* audio = chn + (short*)inBuffer; + + for (unsigned int i = 0; i < data.size(); i++){ + int sample = (int)(32767.0f * data[i]); + + if (sample>32767) + sample = 32767; + else if (sample<-32768) + sample = -32768; + + // audio[i * m_channels + chn] = (short)sample; + audio[0] = (short)sample; + audio += m_channels; + } + } // if (PSEUDO_MULTICHANNELS && chn>0) + + } + + } + } + + return inSize; +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/filter/CFilters.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/filter/CFilters.h new file mode 100644 index 0000000..be681db --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/al_reverb/src/filter/CFilters.h @@ -0,0 +1,35 @@ +#ifndef KALA_AUDIOBASE_FILTERS_H +#define KALA_AUDIOBASE_FILTERS_H + +#include +#include "AudioEffectsConf.h" + +#define LOW_PASS_FILTER 0 
+#define HIGH_PASS_FILTER 1 +#define BAND_PASS_FILTER 2 + + +class CFilters +{ +public: + CFilters(); + virtual ~CFilters(); + + int Init(int inSampleRate, int inChannel); // set sample rate, channel and filter type; + void Reset(); + void Uninit(); // uninit + int setFilterType(int fType); + + // process input buffer and output size. + int Process(char* inBuffer, int inSize); + int Process(float* inBuffer, int inSize); + + int ProcessLRIndependent(float * inLeft, float * inRight, int inOutSize); + +private: + void* handles; + int m_samplerate; + int m_channels; + std::vector data; +}; +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/DecoderCommon.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/DecoderCommon.h new file mode 100644 index 0000000..25d5395 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/DecoderCommon.h @@ -0,0 +1,220 @@ +// +// Created by yangjianli on 2021/1/7. +// + +#ifndef AUDIO_CODEC_DECODERCOMMON_H +#define AUDIO_CODEC_DECODERCOMMON_H +#include +#include +#include "ac_defs.h" + +#ifdef ST_DEBUG +#include +#define ASSERT(e) assert(e) +#else +#define ASSERT(e) +#endif + +//安全关闭文件 +#ifndef SAFE_CLOSE_FILE +#define SAFE_CLOSE_FILE(file) \ +{ \ + if(file) \ + { \ + fclose(file); \ + file = NULL; \ + } \ +} +#endif //SAFE_CLOSE_FILE + +//安全释放内存 +#ifndef SAFE_FREE +#define SAFE_FREE(ptr) \ +{ \ + if(ptr) \ + { \ + free(ptr); \ + ptr = NULL; \ + } \ +} +#endif //SAFE_FREE + +//安全删除对象 +#ifndef SAFE_DELETE_OBJ +#define SAFE_DELETE_OBJ(obj) \ +{ \ + if(obj) \ + { \ + delete obj; \ + obj = NULL; \ + } \ +} +#endif //SAFE_DELETE_OBJ + +//安全逆初始化并删除对象 +#ifndef SAFE_UNINIT_DELETE_OBJ +#define SAFE_UNINIT_DELETE_OBJ(obj) \ +{ \ + if(obj) \ + { \ + obj->uninit(); \ + delete obj; \ + obj = NULL; \ + } \ +} +#endif //SAFE_UNINIT_DELETE_OBJ + +#ifndef SAFE_CLOSE_DELETE_OBJ +#define SAFE_CLOSE_DELETE_OBJ(obj) \ +{ \ + if(obj) \ + { \ + obj->close(); \ + delete obj; \ + obj = NULL; \ + } \ +} +#endif //SAFE_CLOSE_DELETE_OBJ + +//安全删除数组 +#ifndef SAFE_DELETE_ARRAY +#define SAFE_DELETE_ARRAY(array) \ +{ \ + if(array) \ + { \ + delete [] array; \ + array = NULL; \ + } \ +} +#endif //SAFE_DELETE_ARRAY + +//取大值 +#ifndef GLOBAL_MAX +#define GLOBAL_MAX(a, b) (((a) > (b)) ? (a) : (b)) +#endif + +//取小值 +#ifndef GLOBAL_MIN +#define GLOBAL_MIN(a,b) (((a) < (b)) ? (a) : (b)) +#endif + +//取中间 +#ifndef GLOBAL_MID +#define GLOBAL_MID(a, b, c) (GLOBAL_MAX(a, GLOBAL_MIN(b, c))) +#endif + +//取绝对值 +#ifndef GLOBAL_ABS +#define GLOBAL_ABS(a) ((a) < 0 ? 
(-(a)) : (a)) +#endif + + +#ifndef CHECK_FLOAT_EQUAL +#define CHECK_FLOAT_EQUAL(a, b) (fabs(a - b) < 0.001f) +#endif + +// 错误码 +enum +{ + E_NATIVE_DECODER_SUCCESS, + + //继续,说明可以继续往下调用 + E_NATIVE_DECODER_COMMON_CONTINUE = 10000, + E_NATIVE_DECODER_MEMORY, + + E_NATIVE_DECODER_NO_MEMORY = 30000, + E_NATIVE_DECODER_FORMAT, + E_NATIVE_DECODER_STREAM, + E_NATIVE_DECODER_NO_DECODER, + E_NATIVE_DECODER_DECODER_OPEN, + E_NATIVE_DECODER_ALREADY_INIT, + E_NATIVE_DECODER_RESAMPLE, + E_NATIVE_DECODER_CONTINUE, + E_NATIVE_DECODER_SEEK, + E_NATIVE_DECODER_END, + + //协议部分产生的错误码 + E_NATIVE_PROTOCOL_PATH_OPEN = 40000, + E_NATIVE_NO_PROTOCOL, + E_NATIVE_NO_CONTEXT, + E_NATIVE_NO_DECODER, +}; + +// 类型 +//底层获取的音频文件的参数,文件内部的参数,如采样率之类的 +ST_AC_LIB_API typedef struct _MediaInfo +{ + //音频的时长 + double duration; + //音频的采样率 + int sample_rate; + //音频的通道数 + int channels; + //码率 + int bit_rate; +}MediaInfo, *pMediaInfo; + +//上层设置的音频文件的参数,也就是当成的参数,不是文件内部的参数 +ST_AC_LIB_API typedef struct _MediaParam +{ + //音频文件的位置 + const char * path; + //开始播放的时间,单位是ms + double start_time; + //截止播放的时间,单位是ms,默认和 duration 一致 + double end_time; + //播放的长度,单位是ms,如果小于等于0,则认为播放全曲 + double duration; + //前奏时间,方便跳过前奏处理 + double prelude_time; + //是否需要解密,因为导唱就不需要解密操作 + bool need_decrypt; + //多人同框时加入的时间点ms + double multi_join_time; + // 音频响度,单位:db + double loudness; + //是否是hook模式 + bool is_seek_delay_record; +}MediaParam, *pMediaParam; + + +#ifndef DEF_AUDIO_FRAME_BUFFER +#define DEF_AUDIO_FRAME_BUFFER +//自定义的一帧音频数据 +template +class ST_AC_LIB_API AudioFrameBuffer +{ +public: + AudioFrameBuffer() + : m_buffer(NULL) + , m_size(0) + , m_postion(0) + , m_duration(0) { } + + ~AudioFrameBuffer() { uninit(); } + +public: + inline int init(int size) { m_buffer = new T [size]; m_size = size; return E_NATIVE_DECODER_SUCCESS; } + inline T * get_buffer() { return m_buffer; } + inline int get_size() { return m_size; } + inline void set_postion(double postion) { m_postion = postion; } + inline double get_postion() { return m_postion; } + inline void set_duration(double duration) { m_duration = duration; } + inline double get_duration() { return m_duration; } + inline void uninit() { SAFE_DELETE_ARRAY(m_buffer); m_size = 0; m_postion = 0; m_duration = 0; } + +private: + //音频数据 + T * m_buffer; + //音频数据长度 + int m_size; + //音频数据的开始时间点,ms + double m_postion; + //音频的持续时间,ms + double m_duration; +}; +#endif + + + +#endif //AUDIO_CODEC_DECODERCOMMON_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/DecoderWrapper.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/DecoderWrapper.h new file mode 100644 index 0000000..6842415 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/DecoderWrapper.h @@ -0,0 +1,59 @@ +// +// Created by 杨将 on 2017/8/14. +// + +#ifndef __DECODERWRAPPER_H__ +#define __DECODERWRAPPER_H__ + +#include "DecoderCommon.h" +#include "IProtocol.h" +#include "IContext.h" +#include "IDecoder.h" +#include +#include "ac_defs.h" +//协议、解密、解码、重采样的一个控制封装 + +class IEnDeCrypt; +ST_AC_LIB_API class CDecoderWrapper +{ +public: + CDecoderWrapper(); + ~CDecoderWrapper(); + +public: + int init(pMediaParam param, int samplerate, int channel, + int context_type, + int decoder_type, + int protocol_type); + int init(pMediaParam param, int samplerate, int channel, + int context_type=CONTEXT_FFMPEG, + int decoder_type=DECODER_FFMPEG) { + + int protocol_type = strncmp(param->path, "stmedia:", 8) == 0 ? ANDROID_PROTOCOL_TYPE_ST_MEDIA : (param->need_decrypt ? 
PROTOCOL_TYPE_FILE : PROTOCOL_ACCOMPANY_TYPE_FILE); + return init(param, samplerate, channel, context_type, decoder_type, protocol_type); + } + void get_media_info(pMediaInfo media_info); + //如果解码结束,则会将frame中的数据置0 + int decode(AudioFrameBuffer * frame); + int seek(double pos); + int set_start_end_time(double start_time, double end_time); + void uninit(); + +private: + IEnDeCrypt * m_crypt; + IProtocol * m_protocol; + IContext * m_context; + IDecoder * m_decoder; + + double m_start_time; + double m_end_time; + + //下一次解码的开始时间 + double m_next_time; + //decode出来的采样率 + int m_samplerate; + //decode出来的通道数 + int m_channel; +}; + +#endif //__DECODERWRAPPER_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IContext.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IContext.h new file mode 100644 index 0000000..fd71278 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IContext.h @@ -0,0 +1,37 @@ +// +// Created by 杨将 on 2017/6/28. +// + +#ifndef __ICONTEXT_H__ +#define __ICONTEXT_H__ + +//上下文,相当于c中的void*,我们这里统一用这个来代替 +#include "InstanceFactory.h" +class IContext +{ +public: + IContext() { }; + virtual ~IContext() { }; +public: + virtual void set_protocol(IProtocol * protocol) = 0; + virtual IProtocol * get_protocol() = 0; + virtual void set_samplerate(int samplerate) = 0; + virtual int get_samplerate() = 0; + virtual void set_channels(int channels) = 0; + virtual int get_channels() = 0; +}; + +ST_AC_LIB_API class IContextCreator +{ +public: + IContextCreator() = delete; + explicit IContextCreator(int type) + { + registered_context(type, this); + }; + +public: + virtual IContext* get_inst() = 0; +}; + +#endif //__ICONTEXT_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IDecoder.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IDecoder.h new file mode 100644 index 0000000..2901c18 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IDecoder.h @@ -0,0 +1,45 @@ +// +// Created by 杨将 on 2017/7/25. +// + +#ifndef __IDECODER_H__ +#define __IDECODER_H__ + +#include "DecoderCommon.h" +#include "InstanceFactory.h" +//外部需要考虑这些函数不能多线程的问题 + +class IContext; + +class IDecoder +{ +public: + IDecoder() { } + virtual ~IDecoder() { } + +public: + //传入解码所需的上下文,包含协议等 + virtual int init(IContext * context) = 0; + //获取音频文件的内部信息 + virtual void get_media_info(pMediaInfo media_info) = 0; + //获取一段固定长度的数据,给frame中的数据填充数据,这里的长度不一定是编码里面的帧 + virtual int decode(AudioFrameBuffer * frame) = 0; + //跳转到某个精确的位置,这里需要在内部转换到固定的点上,ms数 + virtual int seek(double pos) = 0; + //释放掉所有在初始化中申请的资源,回到未初始化的状态 + virtual void uninit() = 0; +}; + +ST_AC_LIB_API class IDecoderCreator +{ +public: + IDecoderCreator() = delete; + explicit IDecoderCreator(int type) + { + registered_decoder(type, this); + }; + +public: + virtual IDecoder* get_inst() = 0; +}; +#endif //__IDECODER_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IProtocol.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IProtocol.h new file mode 100644 index 0000000..a2d891c --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/IProtocol.h @@ -0,0 +1,41 @@ +// +// Created by 杨将 on 2017/7/25. 
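+// Editor's note: IProtocol, declared below, hides the byte source (plain
+// file, encrypted file, platform media stream) behind open/read/write/seek/
+// close so decoders never touch storage directly. A minimal plain-file
+// implementation might look like this (illustrative sketch, not part of
+// this library):
+#if 0
+class CPlainFileProtocol : public IProtocol
+{
+public:
+    CPlainFileProtocol() : m_fp(NULL) { }
+    virtual ~CPlainFileProtocol() { close(); }
+    virtual int open(const char * url, IEnDeCrypt * /* crypt unused */)
+    {
+        m_fp = fopen(url, "rb");
+        return m_fp ? 0 : -1;
+    }
+    virtual int read(unsigned char * buf, int size)
+    {
+        // bytes read; 0 on error or end of stream, per the interface contract
+        return m_fp ? (int)fread(buf, 1, (size_t)size, m_fp) : 0;
+    }
+    virtual int write(const unsigned char *, int) { return -1; } // read-only
+    virtual int seek(int offset, int whence)
+    {
+        if (m_fp && 0 == fseek(m_fp, offset, whence))
+            return (int)ftell(m_fp);
+        return -1;
+    }
+    virtual void close() { if (m_fp) { fclose(m_fp); m_fp = NULL; } }
+private:
+    FILE * m_fp;
+};
+#endif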
+// + +#ifndef __IPROTOCOL_H__ +#define __IPROTOCOL_H__ +#include "InstanceFactory.h" +class IEnDeCrypt; +class IProtocol +{ +public: + IProtocol() { } + virtual ~IProtocol() { } + +public: + //打开一个url地址,获取数据,返回错误码 + virtual int open(const char * url, IEnDeCrypt * crypt) = 0; + //读取数据,返回读取到多少数据,如果出错或者读到结尾则返回0 + virtual int read(unsigned char * buf, int size) = 0; + //写数据,返回还有多少数据没写,如果出错则返回-1 + virtual int write(const unsigned char * buf, int size) = 0; + //跳转,返回跳转后的位置,如果失败则返回-1 + virtual int seek(int offset, int whence) = 0; + //关闭url链接 + virtual void close() = 0; +}; + +ST_AC_LIB_API class IProtocolCreator +{ +public: + IProtocolCreator() = delete; + explicit IProtocolCreator(int type) + { + registered_protocol(type, this); + }; + +public: + virtual IProtocol* get_inst() = 0; +}; + +#endif //__IPROTOCOL_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/InstanceFactory.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/InstanceFactory.h new file mode 100644 index 0000000..4911bb2 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/InstanceFactory.h @@ -0,0 +1,60 @@ +// +// Created by yangjianli on 2021/1/7. +// + +#ifndef AUDIO_CODEC_INSTANCEFACTORY_H +#define AUDIO_CODEC_INSTANCEFACTORY_H + +#include "ac_defs.h" + +class IProtocol; +class IProtocolCreator; +class IContext; +class IContextCreator; +class IDecoder; +class IDecoderCreator; + + +ST_AC_LIB_API void registered_protocol(int type, IProtocolCreator* creator); +ST_AC_LIB_API IProtocol* get_protocol_inst(int type); + +ST_AC_LIB_API void registered_context(int type, IContextCreator* creator); +ST_AC_LIB_API IContext* get_context_inst(int type); + +ST_AC_LIB_API void registered_decoder(int type, IDecoderCreator* creator); +ST_AC_LIB_API IDecoder* get_decoder_inst(int type); + + +#define REGISTER_CREATOR(BaseCreator,BaseClass, ClassName, type) \ + class ClassName##Creator : public BaseCreator { \ + public: \ + ClassName##Creator(int type) : BaseCreator(type) {}; \ + public: \ + BaseClass * get_inst() { \ + return new ClassName(); \ + } \ + }; \ + static ClassName##Creator ClassName##type##Creator(type); + +// 公有的类型 +enum PROTOCOL_TYPE +{ + PROTOCOL_TYPE_FILE, + PROTOCOL_IOS, + ANDROID_PROTOCOL_TYPE_ST_MEDIA, + PROTOCOL_ACCOMPANY_TYPE_FILE +}; + +enum CONTEXT_TYPE +{ + CONTEXT_FFMPEG, + CONTEXT_IOS +}; + +enum DECODER_TYPE +{ + DECODER_FFMPEG, + DECODER_IOS +}; + +#endif //AUDIO_CODEC_INSTANCEFACTORY_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/ac_defs.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/ac_defs.h new file mode 100644 index 0000000..7518327 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_codec/inc/ac_defs.h @@ -0,0 +1,11 @@ +/** + * Author: AlanWang4523. + * Date: 2021/12/29 11:38. 
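+ * Editor's note (appended): the REGISTER_CREATOR macro in InstanceFactory.h
+ * above works by defining a creator class plus one static instance of it;
+ * the static object's constructor runs at load time and self-registers with
+ * the factory. For a hypothetical FFmpeg decoder class CFfmpegDecoder, the
+ * expansion of
+ *     REGISTER_CREATOR(IDecoderCreator, IDecoder, CFfmpegDecoder, DECODER_FFMPEG)
+ * is roughly:
+ *     class CFfmpegDecoderCreator : public IDecoderCreator {
+ *     public:
+ *         CFfmpegDecoderCreator(int type) : IDecoderCreator(type) {};
+ *         IDecoder * get_inst() { return new CFfmpegDecoder(); }
+ *     };
+ *     static CFfmpegDecoderCreator CFfmpegDecoderDECODER_FFMPEGCreator(DECODER_FFMPEG);
+ * after which get_decoder_inst(DECODER_FFMPEG) can hand back new instances.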
+ * Mail: alanwang4523@gmail.com + */ + +#ifndef AVAUDIO_CODEC_LIBS_DEFINES_H +#define AVAUDIO_CODEC_LIBS_DEFINES_H + +#define ST_AC_LIB_API __attribute__ ((visibility("default"))) +#endif //AVAUDIO_CODEC_LIBS_DEFINES_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/CMakeLists.txt new file mode 100644 index 0000000..7a7e712 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/CMakeLists.txt @@ -0,0 +1,10 @@ +cmake_minimum_required(VERSION 2.8) +project(audio_resampler) +set(LIBRARY_OUTPUT_PATH ${PROJECT_SOURCE_DIR}/lib) +include_directories(./) +include_directories(inc src) + +# ffmpeg-mac +#include_directories(/Users/yangjianli/starMaker/ffmpeg_lib/ffmpeg-4.3.1/mac/include) +#set(FFMPEG_LIB /Users/yangjianli/starMaker/ffmpeg_lib/ffmpeg-4.3.1/mac/lib) +add_library(audio_resample ${RESAMPLE_SRC_CPP}) \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/inc/FfmpegResampler.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/inc/FfmpegResampler.h new file mode 100644 index 0000000..c39e185 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/inc/FfmpegResampler.h @@ -0,0 +1,35 @@ +// +// Created by 杨将 on 2017/9/4. +// + +#ifndef __FFMPEGRESAMPLER_H__ +#define __FFMPEGRESAMPLER_H__ + +#include "IResampler.h" + +class SwrContext; + +class CFfmpegResampler : public IResampler +{ +public: + CFfmpegResampler(); + virtual ~CFfmpegResampler(); + +public: + virtual int init(int in_samplerate, int out_samplerate, int in_channel=1, int out_channel=1); + virtual int get_out_samples(int num); + virtual int get_latency(); + virtual void reset(); + virtual int resample(float * in_buf, int in_num, float * out_buf, int & out_num); + virtual void uninit(); + +private: + SwrContext * m_swr_context; + //重采样的buffer和长度 + unsigned char * m_swr_buffer; + int m_swr_bufsize; + int m_in_channel; + int m_out_channel; +}; + +#endif //__FFMPEGRESAMPLER_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/inc/IResampler.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/inc/IResampler.h new file mode 100644 index 0000000..93baf9b --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/inc/IResampler.h @@ -0,0 +1,67 @@ +// +// Created by 杨将 on 2017/9/4. 
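+// Editor's note: a minimal driving loop for the IResampler interface
+// declared below, using the FFmpeg-backed CFfmpegResampler declared above
+// (rates, channel counts and the in_buf/in_num variables are illustrative;
+// error handling abbreviated):
+#if 0
+CFfmpegResampler rs;
+if (E_RESAMPLER_SUCCESS == rs.init(32000, 44100, 1, 1))
+{
+    int out_num = rs.get_out_samples(in_num);   // worst-case output length
+    std::vector<float> out_buf((size_t)out_num);
+    // on input out_num is the capacity, on output the samples written
+    if (E_RESAMPLER_SUCCESS == rs.resample(in_buf, in_num, out_buf.data(), out_num))
+    {
+        // consume out_num samples per channel from out_buf
+    }
+    rs.uninit();
+}
+#endif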
+// +/** + * 基于ffmpeg的重采样模块 + */ +#ifndef __IRESAMPLER_H__ +#define __IRESAMPLER_H__ + +enum +{ + E_RESAMPLER_SUCCESS = 0, + E_RESAMPLER_NO_MEMORY = 10000, + E_RESAMPLER_NUM_ZERO, +}; +class IResampler +{ +public: + IResampler() { } + virtual ~IResampler() { } + +public: + /** + * 初始化函数 + * @param in_samplerate 输入数据的采样率 + * @param out_samplerate 输出数据的采样率 + * @param in_channel + * @param out_channel + * @return 0 表示正常 + */ + virtual int init(int in_samplerate, int out_samplerate, int in_channel=1, int out_channel=1) = 0; + + /** + * 当输入每个通道采样点数为num长度的数据时,从resample可以获取到的输出数据的最大长度 + * @param num 本次将要输入的数据长度[单通道采样点数量] + * @return 单通道采样点数量,负数表示异常 + */ + virtual int get_out_samples(int num) = 0; + + /** + * 获取延迟延迟时间,采样点级别 + * @return + */ + virtual int get_latency() = 0; + + /** + * 重设,清空内部缓存数据[当输入数据源切换时,需要进行设置] + */ + virtual void reset() = 0; + + /** + * 重采样函数 + * @param in_buf 输入数据[多通道时,交错方式的存储][in] + * @param in_num 输入数据单个通道的采样点数量[in] + * @param out_buf 输出数据[多通道时,交错方式的存储][in][注意:需要外部开辟好空间,可以使用get_out_samples获取需要开辟的最大长度] + * @param out_num 输出数据单个通道的采样点数量[out][注意: out_buf真实被写入的单通道采样点数量] + * @return 0表示正常 + */ + virtual int resample(float * in_buf, int in_num, float * out_buf, int & out_num) = 0; + + /** + * 销毁函数 + */ + virtual void uninit() = 0; +}; + +#endif //__IRESAMPLER_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/src/FfmpegResampler.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/src/FfmpegResampler.cpp new file mode 100644 index 0000000..3fb8d98 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/audio_resample/src/FfmpegResampler.cpp @@ -0,0 +1,138 @@ +// +// Created by 杨将 on 2017/9/4. +// + +#include "FfmpegResampler.h" + +#ifdef __cplusplus +extern "C" { +#endif + +#include "libswresample/swresample.h" +#include "libavutil/channel_layout.h" + +#ifdef __cplusplus +}; +#endif + +CFfmpegResampler::CFfmpegResampler() +{ + m_swr_context = NULL; + m_swr_buffer = NULL; + m_swr_bufsize = 0; +} + +CFfmpegResampler::~CFfmpegResampler() +{ + uninit(); +} + +int CFfmpegResampler::init(int in_samplerate, int out_samplerate, int in_channel, int out_channel) +{ + if(in_samplerate != out_samplerate) + { + m_swr_context = swr_alloc_set_opts( + NULL, + av_get_default_channel_layout(out_channel), + AV_SAMPLE_FMT_FLT, + out_samplerate, + av_get_default_channel_layout(in_channel), + AV_SAMPLE_FMT_FLT, + in_samplerate, + 0, + NULL + ); + + if((NULL == m_swr_context) || swr_init(m_swr_context)) + { + return E_RESAMPLER_NO_MEMORY; + } + } + m_in_channel = in_channel; + m_out_channel = out_channel; + return E_RESAMPLER_SUCCESS; +} + +int CFfmpegResampler::get_out_samples(int num) +{ + if(m_swr_context) + { + return swr_get_out_samples(m_swr_context, num); + } + else + { + return num; + } +} + +int CFfmpegResampler::get_latency() +{ + return 0; +} + +void CFfmpegResampler::reset() +{ + if(m_swr_context && m_swr_buffer) + { + swr_convert(m_swr_context, &m_swr_buffer, m_swr_bufsize, 0, 0); + } +} + +int CFfmpegResampler::resample(float * in_buf, int in_num, float * out_buf, int & out_num) +{ + if(m_swr_context) + { + //看之前申请的内存空间是否足够,不足的话,就进行申请空间 + if(out_num > m_swr_bufsize) + { + unsigned char * buffer = NULL; + if(av_samples_alloc(&buffer, NULL, m_out_channel, out_num, AV_SAMPLE_FMT_FLT, 0) < 0) + { + return E_RESAMPLER_NO_MEMORY; + } + m_swr_bufsize = out_num; + if(m_swr_buffer) + { + av_freep(&m_swr_buffer); + } + m_swr_buffer = buffer; + } + + out_num = swr_convert( + m_swr_context, + &m_swr_buffer, + out_num, + (const 
uint8_t **)(&in_buf), + in_num + ); + if(out_num < 0) + { + out_num = 0; + return E_RESAMPLER_NUM_ZERO; + } + + memcpy(out_buf, m_swr_buffer, out_num * sizeof(float) * m_out_channel); + } + else if(in_buf == out_buf) + { + out_num = in_num; + } + else + { + memcpy(out_buf, in_buf, out_num * sizeof(float) * m_out_channel); + } + return E_RESAMPLER_SUCCESS; +} + +void CFfmpegResampler::uninit() +{ + if(m_swr_context) + { + swr_free(&m_swr_context); + } + if(m_swr_buffer) + { + av_freep(&m_swr_buffer); + } + m_swr_bufsize = 0; +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/CMakeLists.txt new file mode 100644 index 0000000..2a32277 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/CMakeLists.txt @@ -0,0 +1,9 @@ +include_directories(./) +include_directories(inc) +include_directories(src) + +file(GLOB_RECURSE AUTOTUNE_SRC_CPP_FILES src/*cpp) +file(GLOB_RECURSE AUTOTUNE_SRC_C_FILES src/*c) + +add_library(autotune ${AUTOTUNE_SRC_CPP_FILES} ${AUTOTUNE_SRC_C_FILES}) +#set_target_properties(autotune PROPERTIES CXX_VISIBILITY_PRESET hidden) diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/inc/ATndkWrapper.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/inc/ATndkWrapper.h new file mode 100644 index 0000000..6f6ade5 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/inc/ATndkWrapper.h @@ -0,0 +1,54 @@ +// +// Created by 杨将 on 2017/7/12. +// + +#ifndef __ATNDKWRAPPER_H__ +#define __ATNDKWRAPPER_H__ +#include "AudioEffectsConf.h" +#include + +//keychange的参数 +typedef struct _KeyChangeParam +{ + //更新的开始时间点,单位ms + float * times; + //更新的key值 + int * keys; + //更新的scale值 + int * scales; + //总共的个数 + int count; +}KeyChangeParam, *pKeyChangeParam; + +class CAutoTuneWrapper; + +class CATndkWrapper +{ +public: + CATndkWrapper(); + ~CATndkWrapper(); + +public: + int init(int samplerate, int channels); + int set_key_change(pKeyChangeParam param); + void reset(); + int process(short * input, short * output, int samples, double ms); + int process(float * input, float * output, int samples, double ms); + int get_latency_time_ms(); + void uninit(); + +private: + void quick_set_key_change(double ms); + void destroy_key_change(); + +private: + CAutoTuneWrapper * m_autotune; + KeyChangeParam m_keychange; + int m_current_idx; + int m_channels; + float * m_float_buffer; + int m_last_sample_num_of_float; + +}; + +#endif //__ATNDKWRAPPER_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/inc/AutoTuneDef.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/inc/AutoTuneDef.h new file mode 100644 index 0000000..c5a4b68 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/inc/AutoTuneDef.h @@ -0,0 +1,17 @@ +// +// Created by yangjianli on 2020-01-13. 
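+// Editor's note: a sketch of how the CATndkWrapper declared in
+// ATndkWrapper.h above is driven (all values illustrative; a real caller
+// fills KeyChangeParam from the song's key/scale timeline):
+#if 0
+CATndkWrapper at;
+if (AT_ERR_SUCCESS == at.init(44100, 1))
+{
+    float times[1] = { 0.0f };                 // change points, ms
+    int keys[1] = { 0 }, scales[1] = { 0 };
+    KeyChangeParam kc = { times, keys, scales, 1 };
+    at.set_key_change(&kc);   // a second call returns AT_ERR_HAS_SET_PARAM
+    // per audio block: samples mono samples starting at position ms
+    at.process(in, out, samples, ms);
+    at.uninit();
+}
+#endif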
+// + +#ifndef AUDIO_EFFECTS_LIB_AOTOTUNEDEF_H +#define AUDIO_EFFECTS_LIB_AOTOTUNEDEF_H +#include "AudioEffectsConf.h" +enum AT_ERR { + AT_ERR_SUCCESS = 0, + AT_ERR_NO_MEMORY = -1, + AT_ERR_PARAM = -2, + AT_ERR_HAS_SET_PARAM = -3, + AT_ERR_AUTOTUNE_INIT = -4, + AT_ERR_BASE_H_NULL = -5, + AT_ERR_BASE_H_MALLOC_NULL = -6, +}; +#endif //AUDIO_EFFECTS_LIB_AOTOTUNEDEF_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ATndkWrapper.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ATndkWrapper.cpp new file mode 100644 index 0000000..ca1563c --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ATndkWrapper.cpp @@ -0,0 +1,243 @@ +// +// Created by 杨将 on 2017/7/12. +// + +#include +#include +#include +#include "common/util/util.h" +#include "ATndkWrapper.h" +#include "AutoTuneDef.h" +#include "common/common.h" +#include "autotune/CAutoTuneWrapper.h" + +CATndkWrapper::CATndkWrapper() +{ + m_autotune = NULL; + + m_keychange.times = NULL; + m_keychange.keys = NULL; + m_keychange.scales = NULL; + m_keychange.count = 0; + + m_current_idx = 0; + m_channels = 1; + + m_float_buffer = NULL; + m_last_sample_num_of_float = 0; +} + +CATndkWrapper::~CATndkWrapper() +{ + uninit(); +} + +int CATndkWrapper::init(int samplerate, int channels) +{ + int nRet = AT_ERR_SUCCESS; + + m_channels = channels; + + m_autotune = new(std::nothrow) CAutoTuneWrapper(); + if(NULL == m_autotune) + { + nRet = AT_ERR_NO_MEMORY; + goto exit; + } + + nRet = m_autotune->init(samplerate, channels); + if(AT_ERR_SUCCESS != nRet) + { + nRet = AT_ERR_AUTOTUNE_INIT; + goto exit; + } +exit: + if(AT_ERR_SUCCESS != nRet) + { + uninit(); + } + return nRet; +} + +int CATndkWrapper::set_key_change(pKeyChangeParam param) +{ + //已经设置了参数直接返回,这里会有两个出口,切记 + if(m_keychange.count > 0) + { + return AT_ERR_HAS_SET_PARAM; + } + + //必须在init之后才能调用set参数接口 + int nRet = AT_ERR_SUCCESS; + + m_keychange.count = param->count; + + m_keychange.times = new(std::nothrow) float[m_keychange.count]; + if(NULL == m_keychange.times) + { + nRet = AT_ERR_NO_MEMORY; + goto exit; + } + memcpy(m_keychange.times, param->times, m_keychange.count * sizeof(float)); + + m_keychange.keys = new(std::nothrow) int[m_keychange.count]; + if(NULL == m_keychange.keys) + { + nRet = AT_ERR_NO_MEMORY; + goto exit; + } + memcpy(m_keychange.keys, param->keys, m_keychange.count * sizeof(int)); + + m_keychange.scales = new(std::nothrow) int[m_keychange.count]; + if(NULL == m_keychange.scales) + { + nRet = AT_ERR_NO_MEMORY; + goto exit; + } + memcpy(m_keychange.scales, param->scales, m_keychange.count * sizeof(int)); + +exit: + if(AT_ERR_SUCCESS != nRet) + { + destroy_key_change(); + } + + return nRet; +} + +void CATndkWrapper::reset() +{ + m_autotune->reset(); +} + +int CATndkWrapper::process(short * input, short * output, int samples, double ms) +{ + //如果当前的m_float_buffer空间不足则重新申请 + if (m_last_sample_num_of_float < samples) + { + float * last_buffer = m_float_buffer; + + m_float_buffer = (float *) malloc(samples * sizeof(float)); + if (NULL == m_float_buffer) + { + return AT_ERR_NO_MEMORY; + } + + //释放之前分配的内存 + SAFE_FREE(last_buffer); + m_last_sample_num_of_float = samples; + } + + //查找当前的key 和 scale + quick_set_key_change(ms); + + short_to_float(input, m_float_buffer, samples); + + m_autotune->process(m_float_buffer, m_float_buffer, samples); + + //返回输出的数据 + float_to_short(m_float_buffer, output, samples); + + return AT_ERR_SUCCESS; +} + +int CATndkWrapper::process(float *input, float * output, int samples, double ms) 
+{ + + //如果当前的m_float_buffer空间不足则重新申请 + if (m_last_sample_num_of_float < samples) + { + float * last_buffer = m_float_buffer; + + m_float_buffer = (float *) malloc(samples * sizeof(float)); + if (NULL == m_float_buffer) + { + return AT_ERR_NO_MEMORY; + } + + //释放之前分配的内存 + SAFE_FREE(last_buffer); + m_last_sample_num_of_float = samples; + } + + //查找当前的key 和 scale + quick_set_key_change(ms); + + memcpy(m_float_buffer, input, samples * sizeof(float)); + + m_autotune->process(m_float_buffer, output, samples); + + return AT_ERR_SUCCESS; +} + +int CATndkWrapper::get_latency_time_ms() +{ + return m_autotune->get_latency(); +} + +void CATndkWrapper::uninit() +{ + SAFE_DELETE_OBJ(m_autotune); + + SAFE_FREE(m_float_buffer); + m_last_sample_num_of_float = 0; + + destroy_key_change(); + + m_current_idx = 0; +} + +void CATndkWrapper::quick_set_key_change(double ms) +{ + int idx = m_current_idx; + float * times = m_keychange.times; + int count = m_keychange.count - 1; + + //如果没有设置过keychange这个时候要返回 + if(NULL == times) + { + return ; + } + + //本来应该如果重置过了,说明跳转了或者切换过了,因此进行二分查找 + //否则进行直接往后查找 + //简单点,直接当前位置前后查找 + if(times[idx] <= ms) + { + while(idx < count) + { + if((times[idx + 1] > ms) && (times[idx] <= ms)) + { + break; + } + ++idx; + } + } + else + { + while(idx > 0) + { + if((times[idx - 1] <= ms) && (times[idx] > ms)) + { + --idx; + break; + } + --idx; + } + } + + if(idx != m_current_idx) + { + bool notes[12]; + m_current_idx = idx; +// m_autotune->Set_notes_from_key_and_scale(notes, m_keychange.keys[m_current_idx], m_keychange.scales[m_current_idx]); + } +} + +void CATndkWrapper::destroy_key_change() +{ + SAFE_DELETE_ARRAY(m_keychange.times); + SAFE_DELETE_ARRAY(m_keychange.keys); + SAFE_DELETE_ARRAY(m_keychange.scales); + m_keychange.count = 0; +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTune.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTune.cpp new file mode 100644 index 0000000..cd9394a --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTune.cpp @@ -0,0 +1,509 @@ + +#include +#include +#include +#include +#include "ref/CircularBuffer.h" +#include "pitch/PitchDetector.h" +#include "formant_corrector/FormantCorrector.h" +#include "pitch/PitchShifter.h" +#include "autotune/CAutoTune.h" +#include "AutoTuneDef.h" + +extern "C" +{ +#include "ref/fftwrap.h" +} + +#if 0 +//ndef WIN32 + +#include +#include +#include "logutil.h" + +//void androidLog(int, const char*, ...); + +#define LOG_TAG "CAUTOTUNE_NATIVE" +#define LOGD(...) androidLog(ANDROID_LOG_DEBUG,LOG_TAG,__VA_ARGS__) +#define LOGI(...) androidLog(ANDROID_LOG_INFO,LOG_TAG,__VA_ARGS__) +#define LOGW(...) androidLog(ANDROID_LOG_WARN,LOG_TAG,__VA_ARGS__) +#define LOGE(...) androidLog(ANDROID_LOG_ERROR,LOG_TAG,__VA_ARGS__) + +#else + +#define LOGE(...) 
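+// Editor's note: L2SC below is 1 / log10(2), so the detector's semitone
+// conversion  -12 * log10(aref * pperiod) * L2SC  is just
+// -12 * log2(aref * pperiod): aref * pperiod expresses the detected pitch
+// period in A-reference cycles, and -12*log2 of that is the pitch in
+// semitones relative to the reference (e.g. pperiod = 1/220 s with
+// aref = 440 Hz gives -12, one octave below A440).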
+ +#endif + + +#define PI (float)3.14159265358979323846 +#define L2SC (float)3.32192809488736218171 + + +typedef struct { + + float m_fTune; + float m_fFixed; + float m_fPull; + float m_fAmount; + float m_fSmooth; + float m_fShift; + int m_iScwarp; + int m_iLfoquant; + float m_fMix; + float m_fLatency; + fft_vars* fmembvars; // member variables for fft routine + + unsigned long fs; // Sample rate + + + int noverlap; + + + // VARIABLES FOR LOW-RATE SECTION + float aref; // A tuning reference (Hz) + + + float lfophase; + + CircularBuffer buffer; + PitchDetector pdetector; + FormantCorrector fcorrector; + PitchShifter pshifter; + +} Autotalent; + +int CAutoTune::init(unsigned long samplerate, const int* suggestion) +{ + + Autotalent* membvars = (Autotalent*)malloc(sizeof(Autotalent)); + if (membvars == NULL) + { + return AT_ERR_BASE_H_MALLOC_NULL; + } + int ti; + membvars->aref = 440.0f; + membvars->fs = samplerate; + int ret = 0; + ret = instantiate_circular_buffer(&membvars->buffer, samplerate); + if (ret != 0) + { + if (membvars != NULL) + { + free(membvars); + membvars = NULL; + } + return ret; + } + membvars->fmembvars = fft_con((int)membvars->buffer.cbsize); + if (membvars->fmembvars == NULL) + { + if (membvars != NULL) + { + free(membvars); + membvars = NULL; + } + return AT_ERR_BASE_H_MALLOC_NULL; + } + ret = instantiate_pitch_detector(&membvars->pdetector, membvars->fmembvars, membvars->buffer.cbsize, + (int) samplerate); + if (ret != 0) + { + if (membvars != NULL) + { + free(membvars); + membvars = NULL; + } + return ret; + } + + ret = formant_corrector_init(&membvars->fcorrector, samplerate, (int) membvars->buffer.cbsize); + if (ret != 0) + { + if (membvars != NULL) + { + free(membvars); + membvars = NULL; + } + return ret; + } + membvars->noverlap = 4; + + membvars->lfophase = 0; + + ret = pitch_shifter_init(&membvars->pshifter, samplerate, membvars->buffer.cbsize); + if (ret != 0) + { + if (membvars != NULL) + { + free(membvars); + membvars = NULL; + } + return ret; + } + membvars->m_fTune = 440.0f; + membvars->m_fFixed = 0.0f; + membvars->m_fPull = 0.0f; + + for (ti = 0; ti < 12; ti++) + { + m_originalSeq[ti] = m_iNotes[ti] = suggestion[(ti - 3 + 12)%12];//g_ScalePara[scale][ti]; + //m_originalSeq[ti] = suggestion[ti]; + + LOGE("sugg:%02d/%d", ti, m_originalSeq[ti]); + } + + membvars->m_fAmount = 1.0f; + membvars->m_fSmooth = 0.5f; + membvars->m_fShift = 0.0f; + membvars->m_iScwarp = 0; + membvars->m_iLfoquant = 1; + membvars->fcorrector.iFcorr = 0; + membvars->fcorrector.fFwarp = 0.0f; + membvars->m_fMix = 1.0f; + + + + membvars->pdetector.confidence = 0.0f; + + membvars->m_fLatency = membvars->buffer.cbsize - 1; + + update_formant_warp(&membvars->fcorrector); + m_membvars = membvars; + + scaleSemitoneConversion(); + + inpitch = 0.0f; + outpitch = 0.0f; +// m_scale = 0;//scale; + + return 0; +} + +int CAutoTune::updateScale(int scale) +{ + + int ti; + for (ti = 0; ti < 12; ti++) + { + m_iNotes[ti] = m_originalSeq[(-scale+ti+12)%12]; +// m_originalSeq[ti] = suggestion[ti]; + } + + return scaleSemitoneConversion(); + +} +// Called every time we get a new chunk of audio +void CAutoTune::process(float *indata, float *outdata, unsigned long SampleCount) +{ + Autotalent* psAutotalent = (Autotalent *)m_membvars; + + for (unsigned long lSampleIndex = 0; lSampleIndex < SampleCount; lSampleIndex++) + { + + // load data into circular buffer + tf = (float)*(indata++); + ti4 = psAutotalent->buffer.cbiwr; + psAutotalent->buffer.cbi[ti4] = tf; + + if (psAutotalent->fcorrector.iFcorr >= 1) + { 
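+            // Formant correction enabled: the adaptive pre-filter strips the
+            // formant envelope before pitch manipulation; add_formants() on
+            // the output path below re-applies it. (Editor's note: init()
+            // sets fcorrector.iFcorr = 0, so this branch is disabled by
+            // default in this build.)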
+ remove_formants(&psAutotalent->fcorrector, &psAutotalent->buffer, tf); + } + else + { + psAutotalent->buffer.cbf[ti4] = tf; + } + // Input write pointer logic + psAutotalent->buffer.cbiwr++; + if (psAutotalent->buffer.cbiwr >= psAutotalent->buffer.cbsize) + { + psAutotalent->buffer.cbiwr = 0; + } + + // Every N/noverlap samples, run pitch estimation / manipulation code + if ((psAutotalent->buffer.cbiwr) % (psAutotalent->buffer.cbsize / psAutotalent->noverlap) == 0) + { + + // ---- Obtain autocovariance ---- + bbtain_autocovariance(&psAutotalent->pdetector, psAutotalent->fmembvars, &psAutotalent->buffer, + psAutotalent->buffer.cbsize, psAutotalent->buffer.corrsize); + + get_pitch_conf(&psAutotalent->pdetector, psAutotalent->fmembvars, psAutotalent->buffer.corrsize, + psAutotalent->fs, psAutotalent->aref, inpitch); + + outpitch = inpitch; + + // Pull to fixed pitch + outpitch = (1 - psAutotalent->m_fPull)*outpitch + psAutotalent->m_fPull*psAutotalent->m_fFixed; + + // -- Convert from semitones to scale notes -- + ti = (int)(outpitch / 12 + 32) - 32; // octave + tf = outpitch - ti * 12; // semitone in octave + ti2 = (int)tf; + ti3 = ti2 + 1; + // a little bit of pitch correction logic, since it's a convenient place for it + if (m_iNotes[ti2 % 12]<0 || m_iNotes[ti3 % 12]<0) + { // if between 2 notes that are more than a semitone apart + lowersnap = 1; + uppersnap = 1; + } + else + { + lowersnap = 0; + uppersnap = 0; + if (m_iNotes[ti2 % 12] == 1) + { // if specified by user + lowersnap = 1; + } + if (m_iNotes[ti3 % 12] == 1) + { // if specified by user + uppersnap = 1; + } + } + // (back to the semitone->scale conversion) + // finding next lower pitch in scale + while (m_iNotes[(ti2 + 12) % 12]<0) + { + ti2 = ti2 - 1; + } + // finding next higher pitch in scale + while (m_iNotes[ti3 % 12]<0) + { + ti3 = ti3 + 1; + } + tf = (tf - ti2) / (ti3 - ti2) + m_iPitch2Note[(ti2 + 12) % 12]; + if (ti2<0) + { + tf = tf - m_numNotes; + } + outpitch = tf + m_numNotes*ti; + // -- Done converting to scale notes -- + + // The actual pitch correction + ti = (int)(outpitch + 128) - 128; + tf = outpitch - ti - 0.5; + ti2 = ti3 - ti2; + if (ti2>2) + { // if more than 2 semitones apart, put a 2-semitone-like transition halfway between + tf2 = (float)ti2 / 2; + } + else + { + tf2 = (float)1; + } + + if ((psAutotalent->m_fSmooth * 0.8)<0.001) + { + tf2 = tf*tf2 / 0.001; + } + else + { + tf2 = tf*tf2 / (psAutotalent->m_fSmooth * 0.8); + } + if (tf2<-0.5) tf2 = -0.5; + if (tf2>0.5) tf2 = 0.5; + tf2 = 0.5*sin(PI*tf2) + 0.5; // jumping between notes using horizontally-scaled sine segment + tf2 = tf2 + ti; + if ((tf<0.5 && lowersnap) || (tf >= 0.5 && uppersnap)) + { + outpitch = psAutotalent->m_fAmount*tf2 + ((float)1 - psAutotalent->m_fAmount)*outpitch; + } + + // Add in pitch shift + outpitch = outpitch + psAutotalent->m_fShift; + + // LFO logic + //tf = psAutotalent->m_fLforate*psAutotalent->buffer.cbsize / (psAutotalent->noverlap*psAutotalent->fs); + //if (tf>1) + // tf = 1; + //psAutotalent->lfophase = psAutotalent->lfophase + tf; + //if (psAutotalent->lfophase > 1) + // psAutotalent->lfophase = psAutotalent->lfophase - 1; + //float lfoval = psAutotalent->lfophase; + //tf = (psAutotalent->m_fLfosymm + 1) / 2; + //if (tf <= 0 || tf >= 1) + //{ + // if (tf <= 0) + // lfoval = 1 - lfoval; + //} + //else + //{ + // if (lfoval <= tf) + // { + // lfoval = lfoval / tf; + // } + // else + // { + // lfoval = 1 - (lfoval - tf) / (1 - tf); + // } + //} + //if (psAutotalent->m_fLfoshape >= 0) + //{ + // // linear combination 
of cos and line + // lfoval = (0.5 - 0.5*cos(lfoval*PI))*psAutotalent->m_fLfoshape + lfoval*(1 - psAutotalent->m_fLfoshape); + // lfoval = psAutotalent->m_fLfoamp*(lfoval * 2 - 1); + //} + //else + //{ + // // smoosh the sine horizontally until it's squarish + // tf = 1 + psAutotalent->m_fLfoshape; + // if (tf<0.001) + // { + // lfoval = (lfoval - 0.5) * 2 / 0.001; + // } + // else + // { + // lfoval = (lfoval - 0.5) * 2 / tf; + // } + // if (lfoval>1) lfoval = 1; + // if (lfoval < -1) lfoval = -1; + // lfoval = psAutotalent->m_fLfoamp*sin(lfoval*PI*0.5); + //} + // add in quantized LFO + if (psAutotalent->m_iLfoquant >= 1) + { + outpitch = outpitch + (int)(/*m_numNotes*lfoval +*/ m_numNotes + 0.5) - m_numNotes; + } + + + // Convert back from scale notes to semitones + outpitch = outpitch + m_iScwarp; // output scale rotate implemented here + ti = (int)(outpitch / m_numNotes + 32) - 32; + tf = outpitch - ti*m_numNotes; + ti2 = (int)tf; + ti3 = ti2 + 1; + outpitch = m_iNote2Pitch[ti3%m_numNotes] - m_iNote2Pitch[ti2]; + if (ti3 >= m_numNotes) + { + outpitch = outpitch + 12; + } + outpitch = outpitch*(tf - ti2) + m_iNote2Pitch[ti2]; + outpitch = outpitch + 12 * ti; + outpitch = outpitch - (m_iNote2Pitch[m_iScwarp] - m_iNote2Pitch[0]); //more scale rotation here + + // add in unquantized LFO + if (psAutotalent->m_iLfoquant <= 0) + { + //outpitch = outpitch;// + lfoval * 2; + } + + + if (outpitch<-36) outpitch = -48; + if (outpitch>24) outpitch = 24; + + + // ---- END Modify pitch in all kinds of ways! ---- + + // Compute variables for pitch shifter that depend on pitch + psAutotalent->pshifter.inphinc = psAutotalent->aref*pow(2, inpitch / 12) / psAutotalent->fs; + psAutotalent->pshifter.outphinc = psAutotalent->aref*pow(2, outpitch / 12) / psAutotalent->fs; + psAutotalent->pshifter.phincfact = psAutotalent->pshifter.outphinc / psAutotalent->pshifter.inphinc; + } + + tf = shift_pitch(&psAutotalent->pshifter, &psAutotalent->buffer, psAutotalent->buffer.cbsize); + + + ti4 = (psAutotalent->buffer.cbiwr + 2) % psAutotalent->buffer.cbsize; + if (psAutotalent->fcorrector.iFcorr >= 1) + { + tf = add_formants(&psAutotalent->fcorrector, tf, ti4); + } + else + { + psAutotalent->fcorrector.fmute = 0; + } + + + *(outdata++) = (float)psAutotalent->m_fMix*tf + (1 - psAutotalent->m_fMix)*psAutotalent->buffer.cbi[ti4]; + + } + // Tell the host the algorithm latency + psAutotalent->m_fLatency = (float)(psAutotalent->buffer.cbsize - 1); +} + +int CAutoTune::getLatency() +{ + Autotalent* psAutotalent = (Autotalent *)m_membvars; + return (int)(1000.0f * psAutotalent->m_fLatency / psAutotalent->fs); +} + +void CAutoTune::reset() +{ + Autotalent* psAutotalent = (Autotalent *)m_membvars; + + // circlebuffer reset + memset(psAutotalent->buffer.cbi, 0, sizeof(float) * psAutotalent->buffer.cbsize); + memset(psAutotalent->buffer.cbf, 0, sizeof(float) * psAutotalent->buffer.cbsize); + psAutotalent->buffer.cbiwr = 0; + + //formant_corrector_init reset + // Initialize formant corrector + int i; + for (i=0; ifcorrector.ford; i++) + { + memset(psAutotalent->fcorrector.flevels[i].buff, 0, sizeof(float) * psAutotalent->buffer.cbsize); + } + memset(psAutotalent->fcorrector.ftvec, 0, sizeof(float) * psAutotalent->fcorrector.ford); + + //pitch_shifter + memset(psAutotalent->pshifter.frag, 0, sizeof(float) * psAutotalent->buffer.cbsize); + psAutotalent->pshifter.fragsize = 0; + + memset(psAutotalent->pshifter.cbo, 0, sizeof(float) * psAutotalent->buffer.cbsize); + psAutotalent->pshifter.cbord = 0; +} + +void CAutoTune::unInit() +{ 
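+    // Editor's note: teardown mirrors init(): the FFT state, circular
+    // buffers, window/autocorrelation tables and formant corrector buffers
+    // are C-allocated (malloc/calloc) by their instantiate_*/init helpers,
+    // which is why they are released here with free() rather than delete.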
+ fft_des(((Autotalent*)m_membvars)->fmembvars); + free(((Autotalent*)m_membvars)->buffer.cbi); + free(((Autotalent*)m_membvars)->buffer.cbf); + free(((Autotalent*)m_membvars)->pshifter.cbo); + free(((Autotalent*)m_membvars)->pdetector.cbwindow); + free(((Autotalent*)m_membvars)->pshifter.hannwindow); + free(((Autotalent*)m_membvars)->pdetector.acwinv); + free(((Autotalent*)m_membvars)->pshifter.frag); + + cleanup_formant_corrector(&((Autotalent *) m_membvars)->fcorrector); + free((Autotalent*)m_membvars); +} + +int CAutoTune::scaleSemitoneConversion() +{ + // Some logic for the semitone->scale and scale->semitone conversion + // If no notes are selected as being in the scale, instead snap to all notes + int ti2 = 0; + for (ti = 0; ti<12; ti++) + { + if (m_iNotes[ti] >= 0) + { + m_iPitch2Note[ti] = ti2; + m_iNote2Pitch[ti2] = ti; + ti2 = ti2 + 1; + } + else + { + m_iPitch2Note[ti] = -1; + } + } + m_numNotes = ti2; + while (ti2<12) + { + m_iNote2Pitch[ti2] = -1; + ti2 = ti2 + 1; + } + if (m_numNotes == 0) + { + for (ti = 0; ti<12; ti++) + { + m_iNotes[ti] = 1; + m_iPitch2Note[ti] = ti; + m_iNote2Pitch[ti] = ti; + } + m_numNotes = 12; + } + m_iScwarp = (((Autotalent*)m_membvars)->m_iScwarp + m_numNotes * 5) % m_numNotes; + return 0; +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTune.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTune.h new file mode 100644 index 0000000..ebc5c23 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTune.h @@ -0,0 +1,50 @@ +#ifndef __AUTO_TUNE_H_ +#define __AUTO_TUNE_H_ +#include "AudioEffectsConf.h" + + +class CAutoTune +{ +public: + int init(unsigned long samplerate, const int* suggestion); + + void + process(float *indata, float *outdata, + unsigned long SampleCount); + void + unInit(); + void reset(); + int updateScale(int scale); // Key Shift + int getLatency(); + +private: + int scaleSemitoneConversion(); + +private: + void* m_membvars; + int m_iNotes[12]; + int m_iPitch2Note[12]; + int m_iNote2Pitch[12]; + int m_originalSeq[12]; + int m_iScwarp; + int m_numNotes; + //int m_scale; + + long int ti; + long int ti2; + long int ti3; + long int ti4; + float tf; + float tf2; + + // Variables for cubic spline interpolator + + int lowersnap; + int uppersnap; + float inpitch; + float outpitch; + +}; + + +#endif // !__AUTO_TUNE_H_ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTuneWrapper.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTuneWrapper.cpp new file mode 100644 index 0000000..2c2c041 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTuneWrapper.cpp @@ -0,0 +1,95 @@ +// +// Created by wangjianjun on 18/8/21. 
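+// Editor's note on the stereo path of process() below: for 2-channel input
+// the wrapper downmixes the interleaved frames to mono in place ((L+R)/2),
+// runs the mono autotune once, then copies the corrected signal to both
+// output channels, so stereo imaging is intentionally discarded during
+// pitch correction and the input buffer is clobbered as scratch space.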
+// + +#include +#include +#include "CAutoTuneWrapper.h" +#include "AutoTuneDef.h" + +CAutoTuneWrapper::CAutoTuneWrapper() +{ + m_autotune = NULL; + m_channels = 1; +} + +CAutoTuneWrapper::~CAutoTuneWrapper() +{ + uninit(); +} + +void CAutoTuneWrapper::uninit() +{ + if (m_autotune) + { + m_autotune->unInit(); + delete m_autotune; + m_autotune = NULL; + } + m_channels = 1; +} + +int CAutoTuneWrapper::init(int samplerate, int channels) +{ + int res = 0; + m_channels = channels; + + m_autotune = new CAutoTune(); + if (m_autotune == NULL) + { + return AT_ERR_BASE_H_MALLOC_NULL; + } + + int suggestion[12] = {1,-1,1,-1,1,1,-1,1,-1,1,-1,1};//默认C大调 + res = m_autotune->init(samplerate, suggestion); + if (res != 0) + { + goto exit; + } +exit: + if (res != 0) + { + uninit(); + } + return res; +} + +int CAutoTuneWrapper::update_scale(int scale) { + if (m_autotune == NULL) { + return AT_ERR_BASE_H_NULL; + } + return m_autotune->updateScale(scale); +} + +int CAutoTuneWrapper::process(float *inData, float *outData, unsigned int count) +{ + if (m_channels == 1) + { + m_autotune->process(inData, outData, count); + } + else if (m_channels == 2) + { + for (size_t i = 0; i < count / 2; i++) + { + inData[i] = (inData[2 * i] + inData[2 * i + 1]) / 2.0f; + } + m_autotune->process(inData, outData + count / 2, count / 2); + + for (size_t i = 0; i < count / 2; i++) + { + outData[2 * i] = outData[count / 2 + i]; + outData[2 * i + 1] = outData[count / 2 + i]; + } + } + return count; +} + + +int CAutoTuneWrapper::get_latency() { + return m_autotune->getLatency(); +} + +void CAutoTuneWrapper::reset() +{ + m_autotune->reset(); +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTuneWrapper.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTuneWrapper.h new file mode 100644 index 0000000..5042a11 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/autotune/CAutoTuneWrapper.h @@ -0,0 +1,29 @@ +// +// Created by wangjianjun on 18/8/21. +// + +#ifndef CAUDIODECODER_CAUTOTUNEWRAPPER_H +#define CAUDIODECODER_CAUTOTUNEWRAPPER_H + +#include "CAutoTune.h" + +class CAutoTuneWrapper { +public: + CAutoTuneWrapper(); + ~CAutoTuneWrapper(); + +public: + int init(int samplerate, int channels); + int process(float *inData, float *outData, unsigned int count); + int update_scale(int scale); + int get_latency(); + void reset(); +private: + void uninit(); +private: + CAutoTune * m_autotune; + int m_channels; +}; + + +#endif //CAUDIODECODER_CAUTOTUNEWRAPPER_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/common/common.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/common/common.h new file mode 100644 index 0000000..779f0fc --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/common/common.h @@ -0,0 +1,150 @@ +// +// Created by 杨将 on 2017/6/27. 
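+// Editor's note: GLOBAL_MID(a, b, c) below clamps b into [a, c] via
+// GLOBAL_MAX(a, GLOBAL_MIN(b, c)); e.g. float_to_short() in util.cpp
+// saturates with GLOBAL_MID(-32768, in[i] * 32767, 32767) before casting
+// to short.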
+// + +#ifndef __COMMON_H__ +#define __COMMON_H__ +// +//#ifdef __APPLE__ +//#include +//#else +//#include "malloc.h" +//#endif + +#include +#include + +#ifdef ST_DEBUG +#include +#define ASSERT(e) assert(e) +#else +#define ASSERT(e) +#endif + + +//定义一些常用的宏或者常量等 + +//录制、播放、解码的缓存buffer的时间长度,单位ms +#define RECORDER_CIRCLE_BUFFER_TIME ((int)200) + +//默认写入文件的人声采样率 +#define FILE_VOCAL_SAMPLERATE ((int)44100) + +//跳转在多少ms以内不需要进行跳转 +#define SEEK_NO_OPRATE (1.01) + +//文件读取的基本长度 +#define FILE_OPERATE_LEN ((int)2048) +//人声文件中进行fade的最大长度 +#define FILE_FADE_LEN ((int)240) +//最大声道数,这个值不能改动,可以改成1 +#define MAX_CHANNEL ((int)2) + +//底层音量的中值 +#define DEFAULT_VOLUME ((int)50) + +//伴奏音量的基准值(分贝) +#define DEFAULT_BASELINE_DB ((float)-14.57f) + +//安全关闭文件 +#ifndef SAFE_CLOSE_FILE +#define SAFE_CLOSE_FILE(file) \ +{ \ + if(file) \ + { \ + fclose(file); \ + file = NULL; \ + } \ +} +#endif //SAFE_CLOSE_FILE + +//安全释放内存 +#ifndef SAFE_FREE +#define SAFE_FREE(ptr) \ +{ \ + if(ptr) \ + { \ + free(ptr); \ + ptr = NULL; \ + } \ +} +#endif //SAFE_FREE + +//安全删除对象 +#ifndef SAFE_DELETE_OBJ +#define SAFE_DELETE_OBJ(obj) \ +{ \ + if(obj) \ + { \ + delete obj; \ + obj = NULL; \ + } \ +} +#endif //SAFE_DELETE_OBJ + +//安全逆初始化并删除对象 +#ifndef SAFE_UNINIT_DELETE_OBJ +#define SAFE_UNINIT_DELETE_OBJ(obj) \ +{ \ + if(obj) \ + { \ + obj->uninit(); \ + delete obj; \ + obj = NULL; \ + } \ +} +#endif //SAFE_UNINIT_DELETE_OBJ + +#ifndef SAFE_CLOSE_DELETE_OBJ +#define SAFE_CLOSE_DELETE_OBJ(obj) \ +{ \ + if(obj) \ + { \ + obj->close(); \ + delete obj; \ + obj = NULL; \ + } \ +} +#endif //SAFE_CLOSE_DELETE_OBJ + +//安全删除数组 +#ifndef SAFE_DELETE_ARRAY +#define SAFE_DELETE_ARRAY(array) \ +{ \ + if(array) \ + { \ + delete [] array; \ + array = NULL; \ + } \ +} +#endif //SAFE_DELETE_ARRAY + +//取大值 +#ifndef GLOBAL_MAX +#define GLOBAL_MAX(a, b) (((a) > (b)) ? (a) : (b)) +#endif + +//取小值 +#ifndef GLOBAL_MIN +#define GLOBAL_MIN(a,b) (((a) < (b)) ? (a) : (b)) +#endif + +//取中间 +#ifndef GLOBAL_MID +#define GLOBAL_MID(a, b, c) (GLOBAL_MAX(a, GLOBAL_MIN(b, c))) +#endif + +//取绝对值 +#ifndef GLOBAL_ABS +#define GLOBAL_ABS(a) ((a) < 0 ? (-(a)) : (a)) +#endif + + +#ifndef CHECK_FLOAT_EQUAL +#define CHECK_FLOAT_EQUAL(a, b) (fabs(a - b) < 0.001f) +#endif + +#define TYPE_PLAY_ORIGIN 1 +#define TYPE_PLAY_CORRECTION 2 + +#endif //__COMMON_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/common/util/util.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/common/util/util.cpp new file mode 100644 index 0000000..b69e696 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/common/util/util.cpp @@ -0,0 +1,206 @@ +// +// Created by 杨将 on 2017/6/27. 
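+// Editor's note: a quick round-trip reference for the PCM conversion
+// helpers defined below (buffer contents illustrative):
+#if 0
+short pcm[4] = { 0, 16384, -16384, 32767 };
+float f[4];
+short_to_float(pcm, f, 4);   // divides by 32768 -> 0.0, 0.5, -0.5, ~0.99997
+float_to_short(f, pcm, 4);   // scales by 32767 and clamps to [-32768, 32767]
+#endif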
+// + +#include "util.h" +#include "common/common.h" +#include +#include +#ifdef __ANDROID__ +#include +#else +#include +#endif +#include + +void short_fade_in(short * buffer, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + buffer[i] = (short)(buffer[i] * i / size); + } + } + else + { + for(int i = 0; i < size; i += 2) + { + buffer[i] = (short)(buffer[i] * i / size); + buffer[i + 1] = (short)(buffer[i + 1] * i / size); + } + } +} + +void float_fade_in(float * buffer, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + buffer[i] = buffer[i] * i / size; + } + } + else + { + for(int i = 0; i < size; i += 2) + { + buffer[i] = buffer[i] * i / size; + buffer[i + 1] = buffer[i + 1] * i / size; + } + } +} + +void short_fade_out(short * buffer, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + buffer[i] = (short)(buffer[i] * (size - i) / size); + } + } + else + { + for(int i = 0; i < size; i += 2) + { + buffer[i] = (short)(buffer[i] * (size - i) / size); + buffer[i + 1] = (short)(buffer[i + 1] * (size - i) / size); + } + } +} + +void float_fade_out(float * buffer, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + buffer[i] = buffer[i] * (size - i) / size; + } + } + else + { + for(int i = 0; i < size; i += 2) + { + buffer[i] = buffer[i] * (size - i) / size; + buffer[i + 1] = buffer[i + 1] * (size - i) / size; + } + } +} + +void float_to_short(float * in, short * out, int num) +{ + for(int i = 0; i < num; i++) + { + out[i] = (short)GLOBAL_MID(-32768, in[i] * 32767, 32767); + } +} + +void short_to_float(short * in, float * out, int num) +{ + for(int i = 0; i < num; i++) + { + out[i] = in[i] / 32768.0f; + } +} +//立体声转单声道 +void short_stereo_to_mono(short * in, short * out, int num) +{ + for(int i = 0; i < num; i++) + { + out[i] = in[i*2]; + } +} +//双声道转单声道 +void float_stereo_to_mono(float * in, float * out, int num) +{ + for(int i = 0; i < num; i++) + { + out[i] = in[i*2]; + } +} + +void float_crossfade(float * fadein_buf, float * fadeout_buf, float * out, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + out[i] = fadein_buf[i] + fadeout_buf[i] * (size - i) / size; + } + } + else + { + for(int i = 0; i < size; i += 2) + { + out[i] = fadein_buf[i] + fadeout_buf[i] * (size - i) / size; + out[i + 1] = fadein_buf[i + 1] + fadeout_buf[i + 1] * (size - i) / size; + } + } +} + +double get_current_time_ms() +{ + struct timeval now; + if(0 == gettimeofday(&now, NULL)) + { + return 1000.0 * now.tv_sec + now.tv_usec / 1000.0; + } + else + { + return 0; + } +} + +long get_file_size(const char * path) { + int32_t file_size = -1; + + struct stat statbuf; + if (stat(path, &statbuf) >= 0) + { + file_size = statbuf.st_size; + } + return file_size; +} + +int getSdkVersion() { +#ifdef __ANDROID__ + static int sCachedSdkVersion = -1; + if (sCachedSdkVersion == -1) { + char sdk[PROP_VALUE_MAX] = {0}; + if (__system_property_get("ro.build.version.sdk", sdk) != 0) { + sCachedSdkVersion = atoi(sdk); + } + } + return sCachedSdkVersion; +#endif + return -1; +} + +float calc_rms(float *in, int len, int channel) +{ + float rms = 0; + // 只取用第一个声道数据 + for(int i=0;idst_gain增益平滑增长 +void float_gain_crossfade(float src_gain, float dst_gain, float* in, int size, int channel); + +#endif //__UTIL_H__ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/formant_corrector/FormantCorrector.cpp 
b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/formant_corrector/FormantCorrector.cpp new file mode 100644 index 0000000..1795ce4 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/formant_corrector/FormantCorrector.cpp @@ -0,0 +1,192 @@ +#include "FormantCorrector.h" +#include "AutoTuneDef.h" + +int formant_corrector_init(FormantCorrector *fcorrector, unsigned long sample_rate, int cbsize) +{ + // Initialize formant corrector + fcorrector->ford = 7; // should be sufficient to capture formants + fcorrector->falph = pow(0.001f, (float) 80 / (sample_rate)); + fcorrector->flamb = -(0.8517*sqrt(atan(0.06583*sample_rate))-0.1916); // or about -0.88 @ 44.1kHz + fcorrector->flevels = (FormantLevel*)calloc(fcorrector->ford, sizeof(FormantLevel)); + if (fcorrector->flevels == NULL) + { + return AT_ERR_BASE_H_MALLOC_NULL; + } + fcorrector->fhp = 0; + fcorrector->flp = 0; + fcorrector->flpa = pow(0.001f, (float) 10 / (sample_rate)); + fcorrector->ftvec = (float*)calloc(fcorrector->ford, sizeof(float)); + if (fcorrector->ftvec == NULL) + { + if (fcorrector->flevels != NULL) + { + free(fcorrector->flevels); + fcorrector->flevels = NULL; + } + return AT_ERR_BASE_H_MALLOC_NULL; + } + int i; + for (i=0; iford; i++) + { + fcorrector->flevels[i].buff = (float*)calloc(cbsize, sizeof(float)); + if (fcorrector->flevels[i].buff == NULL) + { + + i--; + for (; i >= 0; i--) + { + if (fcorrector->flevels[i].buff != NULL) + { + free(fcorrector->flevels[i].buff); + fcorrector->flevels[i].buff = NULL; + } + } + if (fcorrector->flevels != NULL) + { + free(fcorrector->flevels); + fcorrector->flevels = NULL; + } + if (fcorrector->ftvec != NULL) + { + free(fcorrector->ftvec); + fcorrector->ftvec = NULL; + } + return AT_ERR_BASE_H_MALLOC_NULL; + } + } + fcorrector->fmute = 1; + fcorrector->fmutealph = powf(0.001f, (float)1 / (sample_rate)); + return 0; +} + + +float FormantRemovalIteration(FormantLevel* level, float falph, float flamb, float *fa, float* fb) +{ + float foma=(1-falph); + level->fsig = (*fa)*(*fa)*foma + level->fsig*falph; + float fc = (*fb-(level->fc))*(flamb) + level->fb; + + level->fc=fc; + level->fb=*fb; + float fk_tmp = (*fa)*fc*foma + level->fk*falph; + level->fk = fk_tmp; + float result = fk_tmp/(level->fsig + 0.000001); + result = result*foma + level->fsmooth*falph; + level->fsmooth = result; + *fb = fc - result*(*fa); + *fa = *fa - result*fc; + return result; +} +// tf is signal input +void remove_formants(FormantCorrector *fcorrector, CircularBuffer *buffer, float tf) +{ + // Somewhat experimental formant corrector + // formants are removed using an adaptive pre-filter and + // re-introduced after pitch manipulation using post-filter + + float fa = tf - fcorrector->fhp; // highpass pre-emphasis filter + fcorrector->fhp = tf; + float fb = fa; + + int i; + for (i=0; i<(fcorrector->ford); i++) + { + FormantLevel* level=&fcorrector->flevels[i]; + level->buff[buffer->cbiwr]=FormantRemovalIteration(level,fcorrector->falph, fcorrector->flamb,&fa,&fb); + } + buffer->cbf[buffer->cbiwr] = fa; + // Now hopefully the formants are reduced + // More formant correction code at the end of the DSP loops +} +float FormantCorrectorIteration(FormantCorrector* fcorrector, float fa, long int writepoint) +{ + float fb=fa; + for (int i=0; iford; i++) + { + FormantLevel level=fcorrector->flevels[i]; + float fc = (fb-level.frc)*fcorrector->frlamb + level.frb; + float tf = level.buff[writepoint]; + fb = fc - tf*fa; + fcorrector->ftvec[i] = tf*fc; + fa = fa - 
fcorrector->ftvec[i]; + } + + float tf = -fa; + for (int i = fcorrector->ford - 1; i >= 0; i--) + { + tf = tf + fcorrector->ftvec[i]; + } + return tf; +} +float add_formants(FormantCorrector *fcorrector, float in, long int writepoint) +{ + // The second part of the formant corrector + // This is a post-filter that re-applies the formants, designed + // to result in the exact original signal when no pitch + // manipulation is performed. + // tf is signal input + // gotta run it 3 times because of a pesky delay free loop + // first time: compute 0-response + float f0resp = FormantCorrectorIteration(fcorrector,0,writepoint); + // second time: compute 1-response + float f1resp = FormantCorrectorIteration(fcorrector,1,writepoint); + // now solve equations for output, based on 0-response and 1-response + float tf = (float)2 * in; + float tf2 = tf; + tf = ((float)1 - f1resp + f0resp); + if (tf != 0) + { + tf2 = (tf2 + f0resp) / tf; + } + else + { + tf2 = 0; + } + // third time: update delay registers + float fa = tf2; + float fb = fa; + for (int ti = 0; tiford; ti++) + { + float fc = (fb - fcorrector->flevels[ti].frc)*fcorrector->frlamb + fcorrector->flevels[ti].frb; + fcorrector->flevels[ti].frc = fc; + fcorrector->flevels[ti].frb = fb; + tf = fcorrector->flevels[ti].buff[writepoint]; + fb = fc - tf*fa; + fa = fa - tf*fc; + } + tf = tf2; + tf = tf + fcorrector->flpa * fcorrector->flp; // lowpass post-emphasis filter + fcorrector->flp = tf; + // Bring up the gain slowly when formant correction goes from disabled + // to enabled, while things stabilize. + if (fcorrector->fmute>0.5) + { + tf = tf*(fcorrector->fmute - 0.5) * 2; + } + else + { + tf = 0; + } + tf2 = fcorrector->fmutealph; + fcorrector->fmute = (1 - tf2) + tf2*fcorrector->fmute; + // now tf is signal output + // ...and we're done messing with formants + return tf; +} + +void update_formant_warp(FormantCorrector *fcorrector) +{ + float f = pow((float)2,(fcorrector->fFwarp)/2)*(1+fcorrector->flamb)/(1-fcorrector->flamb); + fcorrector->frlamb = (f - 1)/(f + 1); +} + +void cleanup_formant_corrector(FormantCorrector *fcorrector) +{ + int i; + for (i=0; iford; i++) + { + free(fcorrector->flevels[i].buff); + } + free(fcorrector->flevels); + free(fcorrector->ftvec); +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/formant_corrector/FormantCorrector.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/formant_corrector/FormantCorrector.h new file mode 100644 index 0000000..faea0f7 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/formant_corrector/FormantCorrector.h @@ -0,0 +1,44 @@ +#ifndef __FORMANT_CORRECTOR_H_ +#define __FORMANT_CORRECTOR_H_ + +#include +#include +#include "ref/CircularBuffer.h" + // VARIABLES FOR FORMANT CORRECTOR + +typedef struct { + float fk; + float fb; + float fc; + float frb; + float frc; + float fsig; + float fsmooth; + float* buff; +} FormantLevel; + + typedef struct { + int iFcorr; + float fFwarp; + + int ford; + float falph; + float flamb; + float frlamb; + FormantLevel* flevels; + float fhp; + float flp; + float flpa; + float fmute; + float fmutealph; + float *ftvec; +} FormantCorrector; + + +int formant_corrector_init(FormantCorrector *fcorrector, unsigned long sample_rate, int cbsize); +void remove_formants(FormantCorrector *fcorrector, CircularBuffer *buffer, float tf); +void update_formant_warp(FormantCorrector *fcorrector); +float add_formants(FormantCorrector *fcorrector, float in, long int 
writepoint); +void cleanup_formant_corrector(FormantCorrector *fcorrector); + +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchDetector.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchDetector.cpp new file mode 100644 index 0000000..937bde3 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchDetector.cpp @@ -0,0 +1,173 @@ +#include "PitchDetector.h" +#include "AutoTuneDef.h" +#include + +#define L2SC (float)3.32192809488736218171 +void bbtain_autocovariance(PitchDetector *pdetector, fft_vars *fftvars, CircularBuffer *buffer, long int N, long int Nf) { + + // Window and fill FFT buffer + unsigned long ti2 = buffer->cbiwr; + long ti = 0; + for (long ti = 0; ti < N; ti++) + { + fftvars->ffttime[ti] = (float)(buffer->cbi[(ti2 - ti + N) % N] * pdetector->cbwindow[ti]); + } + + // Calculate FFT + fft_forward(fftvars, fftvars->ffttime, fftvars->fftfreqre, fftvars->fftfreqim); + + // Remove DC + fftvars->fftfreqre[0] = 0; + fftvars->fftfreqim[0] = 0; + + // Take magnitude squared + for (ti = 1; ti < Nf; ti++) + { + fftvars->fftfreqre[ti] = (fftvars->fftfreqre[ti])*(fftvars->fftfreqre[ti]) + (fftvars->fftfreqim[ti])*(fftvars->fftfreqim[ti]); + fftvars->fftfreqim[ti] = 0; + } + + // Calculate IFFT + fft_inverse(fftvars, fftvars->fftfreqre, fftvars->fftfreqim, fftvars->ffttime); + + // Normalize + float tf = fabs(fftvars->ffttime[0]) < FLT_EPSILON ? 0.0f : (float)1 / fftvars->ffttime[0]; + for (ti = 1; ti < N; ti++) + { + fftvars->ffttime[ti] = fftvars->ffttime[ti] * tf; + } + fftvars->ffttime[0] = 1; + +} + +void get_pitch_conf(PitchDetector *pdetector, fft_vars *fftvars, unsigned long Nf, float fs, float aref, float &inpitch) +{ + // Calculate pitch period + + //MPM Algorithm, thanks to Philip McLeod, and Geoff Wyvill, adapted from their GPL Tartini program + // Calculate pitch period + // Pitch period is determined by the location of the max (biased) + // peak within a given range + // Confidence is determined by the corresponding unbiased height + long ti2 = 0; + long ti3 = 0; + long ti4 = 0; + long ti = 0; + float tf = 0.0f; + float tf2 = 0.0f; + float pperiod = pdetector->pmin; + for (ti = pdetector->nmin; ti < pdetector->nmax; ti++) //here is 63~630 + { + ti2 = ti - 1; + ti3 = ti + 1; + if (ti2<0) //check + { + ti2 = 0; + } + if (ti3>Nf) //check + { + ti3 = Nf; + } + tf = fftvars->ffttime[ti]; + + if (tf > fftvars->ffttime[ti2] && tf >= fftvars->ffttime[ti3] && tf > tf2) + { + tf2 = tf; + ti4 = ti; + } + } + float conf = 0.0f; + if (tf2 > 0) + { + conf = tf2*pdetector->acwinv[ti4]; + if (ti4 > 0 && ti4 < Nf) + { + // Find the center of mass in the vicinity of the detected peak + tf = fftvars->ffttime[ti4 - 1] * (ti4 - 1); + tf = tf + fftvars->ffttime[ti4] * (ti4); + tf = tf + fftvars->ffttime[ti4 + 1] * (ti4 + 1); + tf = fabs(fftvars->ffttime[ti4 - 1] + fftvars->ffttime[ti4] + fftvars->ffttime[ti4 + 1]) < FLT_EPSILON ? 
(float)ti4 : tf / (fftvars->ffttime[ti4 - 1] + fftvars->ffttime[ti4] + fftvars->ffttime[ti4 + 1]); + pperiod = tf / fs; + } + else + { + pperiod = (float)ti4 / fs; + } + } + + // Convert to semitones + tf = (float)-12 * log10((float)aref*pperiod)*L2SC; + if (conf >= pdetector->vthresh) + { + inpitch = tf; + pdetector->inpitch = tf; // update pitch only if voiced + } + pdetector->confidence = conf; + + // ---- END Calculate pitch and confidence ---- +} + +int instantiate_pitch_detector(PitchDetector *pdetector, fft_vars *fftvars, unsigned long cbsize, int samplerate) { + //pdetector->ppickthresh=0.9;//I have no idea what this should be, except the MPM paper suggested between 0.8 and 1, so I am taking the average :P + unsigned long corrsize=cbsize/2+1; + + pdetector->pmax = 1/(float)70; // max and min periods (s) + pdetector->pmin = 1/(float)700; // eventually may want to bring these out as sliders + + pdetector->nmax = (unsigned long)(samplerate * pdetector->pmax); + if (pdetector->nmax > corrsize) { + pdetector->nmax = corrsize; + } + pdetector->nmin = (unsigned long)(samplerate * pdetector->pmin); + pdetector->vthresh = 0.7; // The voiced confidence (unbiased peak) threshold level + // Generate a window with a single raised cosine from N/4 to 3N/4 + pdetector->cbwindow = (float*)calloc(cbsize, sizeof(float)); + if (pdetector->cbwindow == NULL) + { + return AT_ERR_BASE_H_MALLOC_NULL; + } + unsigned long ti = 0; + for (ti = 0; ti < (cbsize / 2); ti++) { + pdetector->cbwindow[ti + cbsize / 4] = -0.5*cos(4 * PI*ti / (cbsize - 1)) + 0.5; + } + + + + //fftvars = fft_con(cbsize); + + + + // ---- Calculate autocorrelation of window ---- + pdetector->acwinv = (float*)calloc(cbsize, sizeof(float)); + if (pdetector->acwinv == NULL) + { + if (pdetector->cbwindow != NULL) + { + free(pdetector->cbwindow); + pdetector->cbwindow = NULL; + } + return AT_ERR_BASE_H_MALLOC_NULL; + } + for (ti = 0; ti < cbsize; ti++) { + fftvars->ffttime[ti] = pdetector->cbwindow[ti]; + } + fft_forward(fftvars, pdetector->cbwindow, fftvars->fftfreqre, fftvars->fftfreqim); + for (ti = 0; ti < corrsize; ti++) { + fftvars->fftfreqre[ti] = (fftvars->fftfreqre[ti])*(fftvars->fftfreqre[ti]) + (fftvars->fftfreqim[ti])*(fftvars->fftfreqim[ti]); + fftvars->fftfreqim[ti] = 0; + } + fft_inverse(fftvars, fftvars->fftfreqre, fftvars->fftfreqim, fftvars->ffttime); + for (ti = 1; ti<corrsize; ti++) { + pdetector->acwinv[ti] = fftvars->ffttime[ti] / fftvars->ffttime[0]; + if (pdetector->acwinv[ti] > 0.000001) { + pdetector->acwinv[ti] = (float)1 / pdetector->acwinv[ti]; + } + else { + pdetector->acwinv[ti] = 0; + } + } + pdetector->acwinv[0] = 1; + return 0; + // ---- END Calculate autocorrelation of window ---- + +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchDetector.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchDetector.h new file mode 100644 index 0000000..76008b2 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchDetector.h @@ -0,0 +1,38 @@ +#ifndef __PITCH_DETECTOR_H_ +#define __PITCH_DETECTOR_H_ + +#include <stdio.h> +#include "ref/CircularBuffer.h" +extern "C" +{ +#include "ref/fftwrap.h" +} + +#include <stdlib.h> +#include <math.h> + + + +#define PI (float)3.14159265358979323846 + +typedef struct +{ + float pmax; // Maximum allowable pitch period (seconds) + float pmin; // Minimum allowable pitch period (seconds) + unsigned long nmax; // Maximum period index for pitch prd est + unsigned long nmin; // Minimum period index for pitch prd est + float inpitch; + float 
confidence; + float* cbwindow; //cosine window; + float* acwinv; // inverse of autocorrelation of window + + float vthresh; // Voiced speech threshold + //float ppickthresh; +} PitchDetector; + +void bbtain_autocovariance(PitchDetector *pdetector, fft_vars *fftvars, CircularBuffer *buffer, long int N, long int Nf); + +void get_pitch_conf(PitchDetector *pdetector, fft_vars *fftvars, unsigned long Nf, float fs, float aref, float &inpitch); + +int instantiate_pitch_detector(PitchDetector *pdetector, fft_vars *fftvars, unsigned long cbsize, int samplerate); +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchShifter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchShifter.cpp new file mode 100644 index 0000000..0c08db3 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchShifter.cpp @@ -0,0 +1,124 @@ +#include "pitch/PitchShifter.h" +#include "AutoTuneDef.h" +#include <math.h> +int pitch_shifter_init(PitchShifter *pshifter, unsigned long sampleRate, unsigned long cbsize) { + // Pitch shifter initialization + pshifter->phprdd = 0.01; // Default period + pshifter->inphinc = (float)1/(pshifter->phprdd * sampleRate); + pshifter->phincfact = 1; + pshifter->phasein = 0; + pshifter->phaseout = 0; + pshifter->frag = (float*)calloc(cbsize, sizeof(float)); + if (pshifter->frag == NULL) + { + return AT_ERR_BASE_H_MALLOC_NULL; + } + pshifter->fragsize = 0; + + // Standard raised cosine window, max height at N/2 + pshifter->hannwindow = (float*)calloc(cbsize, sizeof(float)); + if (pshifter->hannwindow == NULL) + { + if (pshifter->frag != NULL) + { + free(pshifter->frag); + pshifter->frag = NULL; + } + return AT_ERR_BASE_H_MALLOC_NULL; + } + long int i; + for (i=0; i<cbsize; i++) + { + pshifter->hannwindow[i] = -0.5*cos(2*PI*i/cbsize) + 0.5; + } + + pshifter->cbo = (float*)calloc(cbsize, sizeof(float)); + pshifter->cbord = 0; + pshifter->active = 0; + pshifter->outphinc = 0; + return 0; +} + +void compute_pitch_shifter_variables(PitchShifter *pshifter, float inpperiod, float outpperiod, float fs) { + float invinphinc=inpperiod*fs; + pshifter->inphinc = 1/invinphinc; //This is like the fraction of a period every sample is. + pshifter->outphinc = 1/(outpperiod*fs); + pshifter->phincfact = pshifter->outphinc*invinphinc; + +} + +float shift_pitch(PitchShifter *pshifter, CircularBuffer *buffer, long int N) +{ + // Pitch shifter (kind of like a pitch-synchronous version of Fairbanks' technique) + // Note: pitch estimate is naturally N/2 samples old + pshifter->phasein = pshifter->phasein + pshifter->inphinc; //This is like the total amount of the period we've been through. 
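// A worked numeric example of the phase bookkeeping here (illustrative values,
// not taken from this codebase): compute_pitch_shifter_variables() above sets
// inphinc = 1/(inpperiod*fs) and outphinc = 1/(outpperiod*fs), so
// phincfact = outphinc/inphinc = inpperiod/outpperiod is the pitch ratio.
//   fs = 44100 Hz, detected period 1/220 s (A3):  inphinc  = 220/44100    ~ 0.0049886
//   target one semitone up, period 1/233.08 s:    outphinc = 233.08/44100 ~ 0.0052853
//   phincfact ~ 1.0595 = 2^(1/12)
// phasein therefore wraps roughly every 200 samples, and each wrap below pulls
// a fresh period-long fragment out of the input ring buffer.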
+ + pshifter->phaseout = pshifter->phaseout + pshifter->outphinc; //likewise for output + + // When input phase resets, take a snippet from N/2 samples in the past + if (pshifter->phasein >= 1) { + pshifter->phasein = pshifter->phasein - 1; + long fragment_beginning= buffer->cbiwr - N/2; + +// copy one window-length snippet out of the ring buffer into frag[] +#define FRAGCOPYLOOP(lower,upper,index) {\ + for (long i=lower; i<upper; i++) {\ + pshifter->frag[index] = buffer->cbf[(i + fragment_beginning + N)%N];\ + }\ +} + + FRAGCOPYLOOP(-N/2,0,i+N) + FRAGCOPYLOOP(0,N/2,i) + } + + // When output phase resets, put a snippet N/2 samples in the future + if (pshifter->phaseout >= 1) { + pshifter->fragsize = pshifter->fragsize*2; + if (pshifter->fragsize > N) { + pshifter->fragsize = N; + } + pshifter->phaseout = pshifter->phaseout - 1; + long int ti3 = (long int)(((float)pshifter->fragsize) / pshifter->phincfact); + + //Interpolator + interpolate(pshifter, ti3, N); + pshifter->fragsize = 0; + } + pshifter->fragsize++; + + // Get output signal from buffer + float tf = pshifter->cbo[pshifter->cbord]; // read buffer + + pshifter->cbo[pshifter->cbord] = 0; // erase for next cycle + pshifter->cbord++; // increment read pointer + if (pshifter->cbord >= N) { + pshifter->cbord = 0; + } + return tf; +} + +void interpolate(PitchShifter *pshifter, long int bounds, long int N) +{ + if (bounds>=N/2) { + bounds = N/2 - 1; + } + long int i; + for (i=-bounds/2; i<(bounds/2); i++) + { + float tf = pshifter->hannwindow[(long int)N/2 + i*(long int)N/bounds]; + // 3rd degree polynomial interpolator - based on eqns from Hal Chamberlin's book + float indd = pshifter->phincfact*i; + int ind1 = (int)indd; + int ind2 = ind1+1; + int ind3 = ind1+2; + int ind0 = ind1-1; + float val0 = pshifter->frag[(ind0+N)%N]; + float val1 = pshifter->frag[(ind1+N)%N]; + float val2 = pshifter->frag[(ind2+N)%N]; + float val3 = pshifter->frag[(ind3+N)%N]; + float vald = 0; + vald = vald - (float)0.166666666667 * val0 * (indd - ind1) * (indd - ind2) * (indd - ind3); + vald = vald + (float)0.5 * val1 * (indd - ind0) * (indd - ind2) * (indd - ind3); + vald = vald - (float)0.5 * val2 * (indd - ind0) * (indd - ind1) * (indd - ind3); + vald = vald + (float)0.166666666667 * val3 * (indd - ind0) * (indd - ind1) * (indd - ind2); + pshifter->cbo[(i + pshifter->cbord + 3*N/2)%N] = pshifter->cbo[(i + pshifter->cbord + 3*N/2)%N] + vald*tf; + } +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchShifter.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchShifter.h new file mode 100644 index 0000000..f276e66 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/pitch/PitchShifter.h @@ -0,0 +1,39 @@ +#ifndef __PITCH_SHIFTER_H_ +#define __PITCH_SHIFTER_H_ + + +#include <stdlib.h> +#include <math.h> +#include "PitchDetector.h" +#include "ref/CircularBuffer.h" + typedef struct + { +// VARIABLES FOR PITCH SHIFTER + float phprdd; // default (unvoiced) phase period + double inphinc; // input phase increment + double outphinc; // output phase increment + double phincfact; // factor determining output phase increment + + double phasein; + double phaseout; + + float* frag; // windowed fragment of speech + unsigned long fragsize; // size of fragment in samples + + float* hannwindow; // length-N hann + + float* cbo; // circular output buffer + unsigned long cbord; //read index for circular buffer; + + int active; +} PitchShifter; + + +int pitch_shifter_init(PitchShifter *pshifter, unsigned long sampleRate, unsigned long cbsize); + +void compute_pitch_shifter_variables(PitchShifter 
*pshifter, float inpperiod, float outpperiod, float fs); + +float shift_pitch(PitchShifter *pshifter, CircularBuffer *buffer, long int N); + +void interpolate(PitchShifter *pshifter, long int bounds, long int N); +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/CircularBuffer.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/CircularBuffer.cpp new file mode 100644 index 0000000..8008681 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/CircularBuffer.cpp @@ -0,0 +1,30 @@ +#include "ref/CircularBuffer.h" +#include "AutoTuneDef.h" + +int instantiate_circular_buffer(CircularBuffer *buffer, unsigned long samplerate) { + if (samplerate>=88200) { + buffer->cbsize = 4096; + } + else { + buffer->cbsize = 2048; + } + buffer->corrsize = buffer->cbsize / 2 + 1; + + buffer->cbi = (float*)calloc(buffer->cbsize, sizeof(float)); + if (buffer->cbi == NULL) + { + return AT_ERR_BASE_H_MALLOC_NULL; + } + buffer->cbf = (float*)calloc(buffer->cbsize, sizeof(float)); + if (buffer->cbf == NULL) + { + if (buffer->cbi != NULL) + { + free(buffer->cbi); + buffer->cbi = NULL; + } + return AT_ERR_BASE_H_MALLOC_NULL; + } + buffer->cbiwr = 0; + return 0; +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/CircularBuffer.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/CircularBuffer.h new file mode 100644 index 0000000..47826cc --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/CircularBuffer.h @@ -0,0 +1,14 @@ +#ifndef __CIRCULAR_BUFFER_H_ +#define __CIRCULAR_BUFFER_H_ +#include + +typedef struct { + unsigned long cbsize; // size of circular buffer + unsigned long corrsize; // cbsize/2 + 1 + unsigned long cbiwr; //write pointer; + float* cbi; + float* cbf; // circular formant correction buffer +} CircularBuffer; + +int instantiate_circular_buffer(CircularBuffer *buffer, unsigned long samplerate); +#endif \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/fftwrap.c b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/fftwrap.c new file mode 100644 index 0000000..dbbd653 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/fftwrap.c @@ -0,0 +1,99 @@ + +#include + +#include "ref/fftwrap.h" +#include "ref/mayer_fft.h" + +fft_vars* fft_con(int nfft) +{ + fft_vars* membvars = (fft_vars*)malloc(sizeof(fft_vars)); + if (membvars == NULL) + { + return NULL; + } + + membvars->nfft = nfft; + membvars->numfreqs = nfft / 2 + 1; + + membvars->fft_data = (float*)calloc(nfft, sizeof(float)); + membvars->ffttime = (float*)calloc(nfft, sizeof(float)); + membvars->fftfreqre = (float*)calloc(nfft, sizeof(float)); + membvars->fftfreqim = (float*)calloc(nfft, sizeof(float)); + return membvars; +} + +// Destructor for FFT routine +void fft_des(fft_vars* membvars) +{ + free(membvars->fft_data); + free(membvars->ffttime); + free(membvars->fftfreqre); + free(membvars->fftfreqim); + free(membvars); +} + +// Perform forward FFT of real data +// Accepts: +// membvars - pointer to struct of FFT variables +// input - pointer to an array of (real) input values, size nfft +// output_re - pointer to an array of the real part of the output, +// size nfft/2 + 1 +// output_im - pointer to an array of the imaginary part of the output, +// size nfft/2 + 1 +void fft_forward(fft_vars* membvars, float* input, float* output_re, float* output_im) +{ + int 
ti; + int nfft; + int hnfft; + int numfreqs; + + nfft = membvars->nfft; + hnfft = nfft / 2; + numfreqs = membvars->numfreqs; + + for (ti = 0; ti < nfft; ti++) { + membvars->fft_data[ti] = input[ti]; + } + + mayer_realfft(nfft, membvars->fft_data); + + output_im[0] = 0; + for (ti = 0; ti < hnfft; ti++) { + output_re[ti] = membvars->fft_data[ti]; + output_im[ti + 1] = membvars->fft_data[nfft - 1 - ti]; + } + output_re[hnfft] = membvars->fft_data[hnfft]; + output_im[hnfft] = 0; +} + +// Perform inverse FFT, returning real data +// Accepts: +// membvars - pointer to struct of FFT variables +// input_re - pointer to an array of the real part of the output, +// size nfft/2 + 1 +// input_im - pointer to an array of the imaginary part of the output, +// size nfft/2 + 1 +// output - pointer to an array of (real) input values, size nfft +void fft_inverse(fft_vars* membvars, float* input_re, float* input_im, float* output) +{ + int ti; + int nfft; + int hnfft; + int numfreqs; + + nfft = membvars->nfft; + hnfft = nfft / 2; + numfreqs = membvars->numfreqs; + + for (ti = 0; ti < hnfft; ti++) { + membvars->fft_data[ti] = input_re[ti]; + membvars->fft_data[nfft - 1 - ti] = input_im[ti + 1]; + } + membvars->fft_data[hnfft] = input_re[hnfft]; + + mayer_realifft(nfft, membvars->fft_data); + + for (ti = 0; ti < nfft; ti++) { + output[ti] = membvars->fft_data[ti]; + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/fftwrap.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/fftwrap.h new file mode 100644 index 0000000..528157e --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/fftwrap.h @@ -0,0 +1,41 @@ +#ifndef __FFT_WRAP_H_ +#define __FFT_WRAP_H_ + +// Variables for FFT routine +typedef struct +{ + int nfft; // size of FFT + int numfreqs; // number of frequencies represented (nfft/2 + 1) + float* ffttime; + float* fftfreqre; + float* fftfreqim; + float* fft_data; // array for writing/reading to/from FFT function +} fft_vars; + +// Constructor for FFT routine +fft_vars* fft_con(int nfft); + +// Destructor for FFT routine +void fft_des(fft_vars* membvars); + +// Perform forward FFT of real data +// Accepts: +// membvars - pointer to struct of FFT variables +// input - pointer to an array of (real) input values, size nfft +// output_re - pointer to an array of the real part of the output, +// size nfft/2 + 1 +// output_im - pointer to an array of the imaginary part of the output, +// size nfft/2 + 1 +void fft_forward(fft_vars* membvars, float* input, float* output_re, float* output_im); + +// Perform inverse FFT, returning real data +// Accepts: +// membvars - pointer to struct of FFT variables +// input_re - pointer to an array of the real part of the output, +// size nfft/2 + 1 +// input_im - pointer to an array of the imaginary part of the output, +// size nfft/2 + 1 +// output - pointer to an array of (real) input values, size nfft +void fft_inverse(fft_vars* membvars, float* input_re, float* input_im, float* output); +#endif + diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/mayer_fft.c b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/mayer_fft.c new file mode 100644 index 0000000..a93698e --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/autotune/src/ref/mayer_fft.c @@ -0,0 +1,419 @@ +/* This is the FFT routine taken from PureData, a great piece of +software by Miller S. Puckette. 
+http://crca.ucsd.edu/~msp/software.html */ + +/* +** FFT and FHT routines +** Copyright 1988, 1993; Ron Mayer +** +** mayer_fht(fz,n); +** Does a hartley transform of "n" points in the array "fz". +** mayer_fft(n,real,imag) +** Does a fourier transform of "n" points of the "real" and +** "imag" arrays. +** mayer_ifft(n,real,imag) +** Does an inverse fourier transform of "n" points of the "real" +** and "imag" arrays. +** mayer_realfft(n,real) +** Does a real-valued fourier transform of "n" points of the +** "real" array. The real part of the transform ends +** up in the first half of the array and the imaginary part of the +** transform ends up in the second half of the array. +** mayer_realifft(n,real) +** The inverse of the realfft() routine above. +** +** +** NOTE: This routine uses at least 2 patented algorithms, and may be +** under the restrictions of a bunch of different organizations. +** Although I wrote it completely myself, it is kind of a derivative +** of a routine I once authored and released under the GPL, so it +** may fall under the free software foundation's restrictions; +** it was worked on as a Stanford Univ project, so they claim +** some rights to it; it was further optimized at work here, so +** I think this company claims parts of it. The patents are +** held by R. Bracewell (the FHT algorithm) and O. Buneman (the +** trig generator), both at Stanford Univ. +** If it were up to me, I'd say go do whatever you want with it; +** but it would be polite to give credit to the following people +** if you use this anywhere: +** Euler - probable inventor of the fourier transform. +** Gauss - probable inventor of the FFT. +** Hartley - probable inventor of the hartley transform. +** Buneman - for a really cool trig generator +** Mayer(me) - for authoring this particular version and +** including all the optimizations in one package. +** Thanks, +** Ron Mayer; mayer@acuson.com +** +*/ + +/* This is a slightly modified version of Mayer's contribution; write +* msp@ucsd.edu for the original code. Kudos to Mayer for a fine piece +* of work. 
-msp +*/ + +#define REAL float +#define GOOD_TRIG + +#ifdef GOOD_TRIG +#else +#define FAST_TRIG +#endif + +#if defined(GOOD_TRIG) +#define FHT_SWAP(a,b,t) {(t)=(a);(a)=(b);(b)=(t);} +#define TRIG_VARS \ + int t_lam=0; +#define TRIG_INIT(k,c,s) \ + { \ + int i; \ + for (i=2 ; i<=k ; i++) \ + {coswrk[i]=costab[i];sinwrk[i]=sintab[i];} \ + t_lam = 0; \ + c = 1; \ + s = 0; \ + } +#define TRIG_NEXT(k,c,s) \ + { \ + int i,j; \ + (t_lam)++; \ + for (i=0 ; !((1<1) \ + { \ + for (j=k-i+2 ; (1<>1; (!((k2^=k)&k)); k>>=1); + if (k1>k2) + { + aa=fz[k1];fz[k1]=fz[k2];fz[k2]=aa; + } + } + for ( k=0 ; (1<> 1; + fi = fz; + gi = fi + kx; + fn = fz + n; + do + { + REAL g0,f0,f1,g1,f2,g2,f3,g3; + f1 = fi[0 ] - fi[k1]; + f0 = fi[0 ] + fi[k1]; + f3 = fi[k2] - fi[k3]; + f2 = fi[k2] + fi[k3]; + fi[k2] = f0 - f2; + fi[0 ] = f0 + f2; + fi[k3] = f1 - f3; + fi[k1] = f1 + f3; + g1 = gi[0 ] - gi[k1]; + g0 = gi[0 ] + gi[k1]; + g3 = SQRT2 * gi[k3]; + g2 = SQRT2 * gi[k2]; + gi[k2] = g0 - g2; + gi[0 ] = g0 + g2; + gi[k3] = g1 - g3; + gi[k1] = g1 + g3; + gi += k4; + fi += k4; + } while (fi + +using std::vector; + +namespace BiquadFilter { + APFilter::APFilter(float cutoff, float Q){ + this->cutoff = cutoff; + this->Q = Q; + + alloc(); + + //init filter coefficient + float omega = 2.0 * M_PI* cutoff; + float alpha = sin(omega) / 2.0 * Q; + + a[0] = 1.0 + alpha; + a[1] = -2.0 * cos(omega); + a[2] = 1.0 - alpha; + b[0] = 1.0 - alpha; + b[1] = -2.0 * cos(omega); + b[2] = 1.0 + alpha; + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BPFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BPFilter.cpp new file mode 100644 index 0000000..8994f32 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BPFilter.cpp @@ -0,0 +1,40 @@ +//BPFilter.cpp +#define _USE_MATH_DEFINES + +#include "biquad_filters/BiquadFilter.h" +#include + +using std::vector; + +/** +#ifndef _MSC_VER + +static float log2(float x) +{ + return log(x) / log(2.0); +} + +#endif // _MSC_VER +**/ + +namespace BiquadFilter{ + BPFilter::BPFilter(float low_edge, float high_edge){ + this->low_edge = low_edge; + this->high_edge = high_edge; + + alloc(); + + //init filter coefficient + float bw = log2(high_edge / low_edge); + float cutoff = low_edge * pow(2, bw/2); + float omega = 2.0 * M_PI* cutoff; + float alpha = sin(omega) * sinh(log(2.0)) / 2.0 * bw * omega / sin(omega); + + a[0] = 1.0 + alpha; + a[1] = -2.0 * cos(omega); + a[2] = 1.0 - alpha; + b[0] = alpha; + b[1] = 0.0; + b[2] = -alpha; + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BiquadFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BiquadFilter.cpp new file mode 100644 index 0000000..942b6b6 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BiquadFilter.cpp @@ -0,0 +1,59 @@ +//BiquadFilter.cpp + +#include "biquad_filters/BiquadFilter.h" + +//using +using std::vector; + + +namespace BiquadFilter{ + + CBaseFilter::CBaseFilter() + { + reset(); + } + + CBaseFilter::~CBaseFilter(){} + + void CBaseFilter::filtering(vector *x){ + vector &in = *x; + vector out(in.size()); + + float b00 = b[0] / a[0]; + float b10 = b[1] / a[0]; + float b20 = b[2] / a[0]; + float a10 = a[1] / a[0]; + float a20 = a[2] / a[0]; + + for (unsigned int i = 0; i < out.size(); i++){ + out[i] = b00 * in[i] + b10 * bin1 + b20 * bin2 - a10 * bout1 - 
a20 * bout2; +// out[i] = (b[0] / a[0]) * in[i] + (b[1] / a[0]) * bin1 + (b[2] / a[0]) * bin2 - (a[1] / a[0]) * bout1 - (a[2] / a[0]) * bout2; + //update input buf + bin2 = bin1; + bin1 = in[i]; + //update output buf + bout2 = bout1; + bout1 = out[i]; + } + + //copy + for (unsigned int i = 0; i < in.size(); i++){ + in[i] = out[i]; + } + + } + + void CBaseFilter::alloc(){ + a.resize(3); + b.resize(3); + } + + void CBaseFilter::reset() + { + bin1 = 0; //= 0.0, bin2 = 0.0; + bout1 = 0;// = 0.0, bout2 = 0.0; + bin2 = 0; //= 0.0, bin2 = 0.0; + bout2 = 0;// = 0.0, bout2 = 0.0; + } + +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BiquadFilter.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BiquadFilter.h new file mode 100644 index 0000000..c1c53df --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/BiquadFilter.h @@ -0,0 +1,103 @@ +#ifndef __BIQUADFILTER_H__ +#define __BIQUADFILTER_H__ + +#include +#include "AudioEffectsConf.h" + +namespace BiquadFilter +{ + class CBaseFilter{ + public: + CBaseFilter(); + virtual ~CBaseFilter(); + void filtering(std::vector *x); + void reset(); + protected: + void alloc(); + + protected: + + std::vector a; + std::vector b; + private: + float bin1; //= 0.0, bin2 = 0.0; + float bout1;// = 0.0, bout2 = 0.0; + float bin2; //= 0.0, bin2 = 0.0; + float bout2;// = 0.0, bout2 = 0.0; + }; + + + class LPFilter : public CBaseFilter{ + public: + LPFilter(float cutoff, float Q); + private: + float cutoff; + + float Q; + }; + + + class HPFilter : public CBaseFilter{ + public: + HPFilter(float cutoff, float Q); + private: + float cutoff; + + float Q; + }; + + class BPFilter : public CBaseFilter{ + public: + BPFilter(float low_edge, float high_edge); + private: + float low_edge; + float high_edge; + }; + + class NTFilter : public CBaseFilter{ + public: + NTFilter(float low_edge, float high_edge); + private: + float low_edge; + float high_edge; + }; + + + class LSFilter : public CBaseFilter{ + public: + LSFilter(float cutoff, float Q, float gain); + private: + float cutoff; + float Q; + float gain; + }; + + + class HSFilter : public CBaseFilter{ + public: + HSFilter(float cutoff, float Q, float gain); + private: + float cutoff; + float Q; + float gain; + }; + + class PKFilter : public CBaseFilter{ + public: + PKFilter(float low_edge, float high_edge, float gain); + private: + float low_edge; + float high_edge; + float gain; + }; + + class APFilter : public CBaseFilter{ + public: + APFilter(float cutoff, float Q); + private: + float cutoff; + float Q; + }; +} + +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/HPFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/HPFilter.cpp new file mode 100644 index 0000000..cfb8103 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/HPFilter.cpp @@ -0,0 +1,27 @@ +//LPFilter.cpp +#define _USE_MATH_DEFINES + +#include "biquad_filters/BiquadFilter.h" +#include + +using std::vector; + +namespace BiquadFilter{ + HPFilter::HPFilter(float cutoff, float Q){ + this->cutoff = cutoff; + this->Q = Q; + + alloc(); + + //init filter coefficient + float omega = 2.0 * M_PI* cutoff; + float alpha = sin(omega) / (2.0*Q); + + a[0] = 1.0 + alpha; + a[1] = -2.0 * cos(omega); + a[2] = 1.0 - alpha; + b[0] = (1.0 + cos(omega)) / 2.0; + b[1] = -(1.0 + cos(omega)); + b[2] = (1.0 + cos(omega)) / 2.0; + } +} \ 
No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/HSFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/HSFilter.cpp new file mode 100644 index 0000000..57de803 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/HSFilter.cpp @@ -0,0 +1,29 @@ +//HSFilter.cpp +#define _USE_MATH_DEFINES + +#include "biquad_filters/BiquadFilter.h" +#include + +using std::vector; + +namespace BiquadFilter{ + HSFilter::HSFilter(float cutoff, float Q, float gain){ + this->cutoff = cutoff; + this->Q = Q; + this->gain = gain; + + alloc(); + + //init filter coefficient + float omega = 2.0 * M_PI* cutoff; + float A = pow(10.0, (gain / 40.0)); + float beta = sqrt(A) / Q; + + a[0] = (A + 1.0) - (A - 1.0) * cos(omega) + beta * sin(omega); + a[1] = 2.0 * ((A - 1.0) - (A + 1.0) * cos(omega)); + a[2] = (A + 1.0) - (A - 1.0) * cos(omega) - beta * sin(omega); + b[0] = A * ((A + 1.0) + (A - 1.0) * cos(omega) + beta * sin(omega)); + b[1] = -2.0 * A * ((A - 1.0) + (A + 1.0) * cos(omega)); + b[2] = A * ((A + 1.0) + (A - 1.0) * cos(omega) - beta * sin(omega)); + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/LPFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/LPFilter.cpp new file mode 100644 index 0000000..6315592 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/LPFilter.cpp @@ -0,0 +1,27 @@ +//LPFilter.cpp +#define _USE_MATH_DEFINES + +#include "biquad_filters/BiquadFilter.h" +#include + +using std::vector; + +namespace BiquadFilter{ + LPFilter::LPFilter(float cutoff, float Q){ + this->cutoff = cutoff; + this->Q = Q; + + alloc(); + + //init filter coefficient + float omega = 2.0 * M_PI* cutoff; + float alpha = sin(omega) / (2.0*Q); + + a[0] = 1.0 + alpha; + a[1] = -2.0 * cos(omega); + a[2] = 1.0 - alpha; + b[0] = (1.0 - cos(omega)) / 2.0; + b[1] = 1.0 - cos(omega); + b[2] = (1.0 - cos(omega)) / 2.0; + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/LSFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/LSFilter.cpp new file mode 100644 index 0000000..a0e85ae --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/LSFilter.cpp @@ -0,0 +1,29 @@ +//LSFilter.cpp +#define _USE_MATH_DEFINES + +#include "biquad_filters/BiquadFilter.h" +#include + +using std::vector; + +namespace BiquadFilter{ + LSFilter::LSFilter(float cutoff, float Q, float gain){ + this->cutoff = cutoff; + this->Q = Q; + this->gain = gain; + + alloc(); + + //init filter coefficient + float omega = 2.0 * M_PI* cutoff; + float A = pow(10.0, (gain / 40.0)); + float beta = sqrt(A) / Q; + + a[0] = (A + 1.0) + (A - 1.0) * cos(omega) + beta * sin(omega); + a[1] = -2.0 * ((A - 1.0) + (A + 1.0) * cos(omega)); + a[2] = (A + 1.0) + (A - 1.0) * cos(omega) - beta * sin(omega); + b[0] = A * ((A + 1.0) - (A - 1.0) * cos(omega) + beta * sin(omega)); + b[1] = 2.0 * A * ((A - 1.0) - (A + 1.0) * cos(omega)); + b[2] = A * ((A + 1.0) - (A - 1.0) * cos(omega) - beta * sin(omega)); + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/NTFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/NTFilter.cpp new file mode 100644 index 0000000..d385ddd --- 
/dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/NTFilter.cpp @@ -0,0 +1,40 @@ +//NotchFilter.cpp +#define _USE_MATH_DEFINES + +#include "biquad_filters/BiquadFilter.h" +#include + +/** +#ifndef _MSC_VER + +static float log2(float x) +{ + return log(x) / log(2.0); +} + +#endif // _MSC_VER +*/ + +using std::vector; + +namespace BiquadFilter{ + NTFilter::NTFilter(float low_edge, float high_edge){ + this->low_edge = low_edge; + this->high_edge = high_edge; + + alloc(); + + //init filter coefficient + float bw = log2(high_edge / low_edge); + float cutoff = low_edge * pow(2, bw / 2); + float omega = 2.0 * M_PI* cutoff; + float alpha = sin(omega) * sinh(log(2.0)) / 2.0 * bw * omega / sin(omega); + + a[0] = 1.0 + alpha; + a[1] = -2.0 * cos(omega); + a[2] = 1.0 - alpha; + b[0] = 1.0; + b[1] = -2.0 * cos(omega); + b[2] = 1.0; + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/PKFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/PKFilter.cpp new file mode 100644 index 0000000..4f0345d --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/common/biquad_filters/PKFilter.cpp @@ -0,0 +1,42 @@ +//PKFilter.cpp +#define _USE_MATH_DEFINES + +#include "biquad_filters/BiquadFilter.h" +#include + +using std::vector; + +/** +#ifndef _MSC_VER + +static float log2(float x) +{ + return log(x) / log(2.0); +} + +#endif // _MSC_VER +**/ + +namespace BiquadFilter{ + PKFilter::PKFilter(float low_edge, float high_edge, float gain){ + this->low_edge = low_edge; + this->high_edge = high_edge; + this->gain = gain; + + alloc(); + + //init filter coefficient + float bw = log2(high_edge / low_edge); + float cutoff = low_edge * pow(2, bw / 2); + float omega = 2.0 * M_PI* cutoff; + float alpha = sin(omega) * sinh(log(2.0)) / 2.0 * bw * omega / sin(omega); + float A = pow(10.0, (gain/40.0)); + + a[0] = 1.0 + alpha / A; + a[1] = -2.0 * cos(omega); + a[2] = 1.0 - alpha / A; + b[0] = 1.0 + alpha * A; + b[1] = -2.0 * cos(omega); + b[2] = 1.0 - alpha * A; + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/CMakeLists.txt new file mode 100644 index 0000000..47a9c3d --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/CMakeLists.txt @@ -0,0 +1,15 @@ +#cmake_minimum_required(VERSION 2.8) +#project(iir_eq) +#set(LIBRARY_OUTPUT_PATH ${PROJECT_SOURCE_DIR}/lib) +set(CMAKE_CXX_STANDARD 11) + +include_directories(./) +include_directories(inc) +include_directories(src) +include_directories(src/audacious_arma) +include_directories(src/audacious_eq) + +file(GLOB_RECURSE SRC_IIR_EQ_SRC src/*cpp) + +add_library(iir_eq ${SRC_IIR_EQ_SRC}) +#set_target_properties(iir_eq PROPERTIES CXX_VISIBILITY_PRESET hidden) diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/build_bash.sh b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/build_bash.sh new file mode 100755 index 0000000..1cc5d56 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/build_bash.sh @@ -0,0 +1,62 @@ +#!/bin/sh + +# @Time : 2019-06-18 17:50 +# @Author : AlanWang +# @FileName: build_android.sh + +# MY_NDK 和 MY_CMAKE 需要改成自己对应的 ndk 中的目录 +# MY_NDK="/Users/wangjianjun/AndroidDev/sdk/ndk-bundle" +# MY_NDK="/Users/yangjianli/Library/Android/sdk/ndk-bundle" +MY_NDK="/Users/yangjianli/Library/Android/sdk/ndk-bundle" 
+MY_CMAKE="/Users/yangjianli/Library/Android/sdk/cmake/3.6.4111459/bin/cmake" + +if [ -z "$MY_NDK" ]; then + echo "Please set MY_NDK to the Android NDK folder" + exit 1 +fi + +if [ -z "$MY_CMAKE" ]; then + echo "Please set MY_CMAKE to the Android CMake folder" + exit 1 +fi + +OUTPUT_LIBS="./build/libs/android" +ANDROID_NATIVE_API_LEVEL="android-16" + +# arme_abis=(armeabi armeabi-v7a arm64-v8a x86 x86_64 mips mips64) +arme_abis=(armeabi-v7a arm64-v8a x86 x86_64) + +function build_with_armeabi() { + ARME_ABI=$1 + echo ${ARME_ABI} + + BUILD_DIR="./build/android/${ARME_ABI}" + PRE_EXE_DIR=$(pwd) + echo ${PRE_EXE_DIR} + + ${MY_CMAKE} \ + -H"./" \ + -B"${BUILD_DIR}" \ + -DANDROID_ABI="${ARME_ABI}" \ + -DANDROID_NDK="${MY_NDK}" \ + -DCMAKE_LIBRARY_OUTPUT_DIRECTORY="./build/android/libs/${ARME_ABI}" \ + -DCMAKE_BUILD_TYPE="Release" \ + -DCMAKE_TOOLCHAIN_FILE="${MY_NDK}/build/cmake/android.toolchain.cmake" \ + -DANDROID_NATIVE_API_LEVEL=${ANDROID_NATIVE_API_LEVEL} \ + -DANDROID_TOOLCHAIN="clang" \ + -DCMAKE_C_FLAGS="-fpic -fexceptions -frtti -Wno-narrowing" \ + -DCMAKE_CXX_FLAGS="-fpic -fexceptions -frtti -Wno-narrowing" \ + -DANDROID_STL="c++_static" \ + + cd ${BUILD_DIR} + make + + cd ${PRE_EXE_DIR} + mkdir -p ${OUTPUT_LIBS}/${ARME_ABI}/ + mv ${PRE_EXE_DIR}/lib/* ${OUTPUT_LIBS}/${ARME_ABI}/ + rm -r ./build/android +} + +for i in ${arme_abis[@]}; do + build_with_armeabi $i +done \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/inc/CAudaciousEqApi.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/inc/CAudaciousEqApi.h new file mode 100644 index 0000000..61a519c --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/inc/CAudaciousEqApi.h @@ -0,0 +1,42 @@ +// +// Created by yangjianli on 2019-10-17. +// +/*** + * 封装eq,支持多个声道的音频 + */ +#ifndef IIR_EQ_ALL_AUDACIOUS_EQ_API_H +#define IIR_EQ_ALL_AUDACIOUS_EQ_API_H + +#include "stdio.h" +#include "CAudaciousEqDef.h" + +namespace SUPERSOUND +{ + class CAudaciousEq; +} + +class CAudaciousEqApi +{ + +public: + CAudaciousEqApi(); + ~CAudaciousEqApi(); +public: + int init(int sample_rate, int channel); + int uninit(); + int32_t set_param(const float *bands); // length is 10 + int32_t set_param(int nType); + int32_t reset(); + int32_t process(float *in, float *out, int length); + int32_t get_latency_ms(); // 返回第一个声道的延迟 + +private: + bool m_b_need_eq; + int m_sample_rate; + int m_channel; + SUPERSOUND::CAudaciousEq* m_eqs; + +}; + + +#endif //IIR_EQ_ALL_AUDACIOUS_EQ_API_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/inc/CAudaciousEqDef.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/inc/CAudaciousEqDef.h new file mode 100644 index 0000000..2244062 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/inc/CAudaciousEqDef.h @@ -0,0 +1,15 @@ +// +// Created by yangjianli on 2020-01-10. 
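// A minimal usage sketch for the CAudaciousEqApi declared above (sample rate,
// channel count, buffer names/length and the preset index are illustrative;
// in/out are assumed to be interleaved float PCM):
//
//   CAudaciousEqApi eq;
//   if (eq.init(44100, 2) == AUDACIOUS_EQ_ERROR_CODE_SUCCESS)
//   {
//       eq.set_param(0);                    // preset index into the STYLES table (0 is commented as "pop")
//       eq.process(in_buf, out_buf, len);   // len = frames * channels
//       eq.uninit();
//   }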
+// + +#ifndef AUDIO_EFFECTS_LIB_CAUDACIOUSEQDEF_H +#define AUDIO_EFFECTS_LIB_CAUDACIOUSEQDEF_H +#include "AudioEffectsDef.h" +// 错误码 +enum AUDACIOUS_EQ_ERROR_CODE { + AUDACIOUS_EQ_ERROR_CODE_SUCCESS = 0, + AUDACIOUS_EQ_ERROR_CODE_INPUT_ERROR = -1, + AUDACIOUSEQAPI_ERROR_INIT_ERROR = -2, +}; + +#endif //AUDIO_EFFECTS_LIB_CAUDACIOUSEQDEF_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/CAudaciousEqApi.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/CAudaciousEqApi.cpp new file mode 100644 index 0000000..62521ae --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/CAudaciousEqApi.cpp @@ -0,0 +1,148 @@ +// +// Created by yangjianli on 2019-10-17. +// + +#include "CAudaciousEq.h" +#include "CAudaciousEqApi.h" +#include "cstring" +#include "iostream" + +CAudaciousEqApi::CAudaciousEqApi() +{ + m_eqs = NULL; +} + +CAudaciousEqApi::~CAudaciousEqApi() +{ + uninit(); +} + +/** + * 初始化,每个channel一个10段均衡器 + * @param sample_rate + * @param channel + * @return + */ +int CAudaciousEqApi::init(int sample_rate, int channel) +{ + m_sample_rate = sample_rate; + m_channel = channel; + m_b_need_eq = false; + if(channel <= 0) + { + return AUDACIOUS_EQ_ERROR_CODE_INPUT_ERROR; + } + m_eqs = new (std::nothrow) SUPERSOUND::CAudaciousEq[channel]; + if(NULL == m_eqs ) + { + return AUDACIOUSEQAPI_ERROR_INIT_ERROR; + } + return AUDACIOUS_EQ_ERROR_CODE_SUCCESS; +} + +/** + * 释放空间 + */ +int CAudaciousEqApi::uninit() +{ + if(m_eqs != NULL) + { + delete [] m_eqs; + m_eqs = NULL; + } + return AUDACIOUS_EQ_ERROR_CODE_SUCCESS; +} + +/** + * 清空缓存数据 + * @return + */ +int CAudaciousEqApi::reset() +{ + for(int i=0;i0 ? m_eqs[0].get_latency_ms() : 0; +} + +/** + * 设置参数 + * @param nType + * @return + */ +int CAudaciousEqApi::set_param(int nType) +{ + for(int i=0;i + +namespace SUPERSOUND +{ + + +CAudaciousArma::CAudaciousArma() +{ + m_a0 = 0; + m_a1 = 0; + m_b0 = 0; + m_b1 = 0; + + reset(); +} + +CAudaciousArma::~CAudaciousArma() +{ + +} + +void CAudaciousArma::reset() +{ + m_y0 = 0; + m_y1 = 0; +} + +int32_t CAudaciousArma::get_latency_ms() +{ + return 0; +} + +int32_t CAudaciousArma::set_param(int32_t fs, float f0, float Q, float gain) +{ + m_gain = pow(10, gain / 20) - 1; + + float th = float(2 * M_PI * f0 / fs); + float C = (1 - tan(th * Q / 2)) / (1 + tan(th * Q / 2)); + + m_a0 = (1 + C) * cosf (th); + m_a1 = -C; + m_b0 = (1 - C) / 2; + m_b1 = -1.005f; + + return AUDACIOUS_EQ_ERROR_CODE_SUCCESS; +} + +float CAudaciousArma::process(float in) +{ + float y0 = in * m_b0 + m_y0 * m_a0 + m_y1 * m_a1; + + in += (y0 + m_y1 * m_b1) * m_gain; + + m_y1 = m_y0; + m_y0 = y0; + + return in; +} + + +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_arma/CAudaciousArma.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_arma/CAudaciousArma.h new file mode 100755 index 0000000..7b7c4a0 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_arma/CAudaciousArma.h @@ -0,0 +1,68 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. 
+ +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//封装开源库 audacious 中的 IIR 的双二阶滤波器带通部分 +//这里只是使用了 ARMA 模型来做,其实也可以改成 AudioCookBook + +#ifndef __AUDACIOUS_ARMA_H__ +#define __AUDACIOUS_ARMA_H__ + +#include +#include "CAudaciousEqDef.h" +namespace SUPERSOUND +{ + + +class CAudaciousArma +{ +public: + CAudaciousArma(); + ~CAudaciousArma(); + +public: + void reset(); + int32_t get_latency_ms(); + int32_t set_param(int32_t fs, float f0, float Q, float gain); + float process(float in); + +private: + float m_a0; + float m_a1; + float m_b0; + float m_b1; + float m_y0; + float m_y1; + float m_gain; +}; + +} + +#endif /* __AUDACIOUS_ARMA_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_eq/CAudaciousEq.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_eq/CAudaciousEq.cpp new file mode 100755 index 0000000..b94d713 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_eq/CAudaciousEq.cpp @@ -0,0 +1,107 @@ + +#include "CAudaciousEq.h" + +namespace SUPERSOUND +{ + + +static const float CF[10] = { + 31.25, 62.5, 125, 250, 500, + 1000, 2000, 4000, 8000, 16000 +}; +static const int STYLES_LEN = 25; +// 线上应用 +// 0 2 3 4 7 8 10 13 17 22 +static const float STYLES[STYLES_LEN][10] = { + {4,2,0,-3,-6,-6,-3,0,1,3}, // pop 0 + {7,6,3,0,0,-4,-6,-6,0,0}, // dance 1 + {3,6,8,3,-2,0,4,7,9,10}, // blues 2 + {0,0,0,0,0,0,-6,-6,-6,-8}, // classic 3 + {0,0,1,4,4,4,0,1,3,3}, // jazz 4 + {5,4,2,0,-2,0,3,6,7,8}, // slow 5 + {6,5,0,-5,-4,0,6,8,8,7}, // electronica 6 + {7,4,-4,7,-2,1,5,7,9,9}, // rock 7 + {5,6,2,-5,1,1,-5,3,8,5}, // country 8 + {-2,-1,-1,0,3,4,3,0,0,1},// voice 9 + {5.8,5.8,3,0,-1.5,-1.5,0,0,0,0},//低音 10 + {13.8,12.6,6.3,0,-1.5,-1.5,0,0,0,0},//超重低音 11 + {5.8,5.8,3,0,-1.5,-1.5,0,1.5,5.8,5.8},//低音&高音 12 + {-3,-3,-3,-3,-1.5,-1.5,0,6.3,9.6,12.3},//高音 13 + {0,0,0,0,0,0,-3,-3,-3,-4.5},//经典 14 + {5.8,3.2,2.1,0,0,-2.7,-2,-2.2,-0.6,-0.1},//舞曲 15 + {5.8,3.2,1.3,-3,-2.3,2.2,3.6,5.8,5.8,5.8},//摇滚 16 + {5.8,5.8,0,-2.9,-2.1,0,3.6,7.4,7.7,7.5},//电子 17 + {-2.9,-2.9,2.5,3.6,4.8,4.7,6,6,3,3},//扬声器(响亮) 18 + {-4.5,-3.8,2.2,2.2,2.2,2.2,2.1,1.5,1.5,1.5},//现场 19 + {-4.5,-4.5,-1.5,-1.5,4.5,4.5,1.5,0,-4.5,-6},//中音 20 + {1.5,4.5,5.8,3,1.5,0,0,0,1.5,3},//流行 21 + {5.5,2.5,0.9,-2.6,-5,-10.6,-12.4,-13.3,-10.6,-6.7},//柔和 22 + {3,3,3,0,-3,-3,0,0,0,0},//柔和低音 23 + {0,0,-4.5,-4.5,-4.5,-4.5,-3,0,4.5,4.5},//柔和高音 24 +}; + +CAudaciousEq::CAudaciousEq() +{ + +} + +CAudaciousEq::~CAudaciousEq() +{ + +} + +void CAudaciousEq::reset() +{ + for(int32_t i = 0; i < 10; i++) + { + m_arma[i].reset(); + } +} + +int32_t CAudaciousEq::get_latency_ms() +{ + int32_t latecy = 0; + + for(int32_t i = 0; i < 10; i++) + { + latecy += m_arma[i].get_latency_ms(); + } + + return latecy; +} + +int32_t CAudaciousEq::set_param(int32_t fs, const float *fBands) +{ + int32_t nRet = AUDACIOUS_EQ_ERROR_CODE_SUCCESS; + + for(int32_t i = 0; i < 10; i++) + { + nRet = m_arma[i].set_param(fs, CF[i], 1.2247449f, fBands[i]); + if(nRet != AUDACIOUS_EQ_ERROR_CODE_SUCCESS) + return nRet; + } + + return 
nRet; +} + +int32_t CAudaciousEq::set_param(int32_t fs, int nType) { + int32_t nRet = AUDACIOUS_EQ_ERROR_CODE_SUCCESS; + if(nType >= STYLES_LEN || nType < 0) + { + return AUDACIOUSEQAPI_ERROR_INIT_ERROR; + } + nRet = set_param(fs, STYLES[nType]); + return nRet; +} + +float CAudaciousEq::process(float in) +{ + for(int32_t i = 0; i < 10; i++) + { + in = m_arma[i].process(in); + } + return in; +} + + +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_eq/CAudaciousEq.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_eq/CAudaciousEq.h new file mode 100755 index 0000000..1cf3f01 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/iir_eq/src/audacious_eq/CAudaciousEq.h @@ -0,0 +1,63 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//封装开源库 audacious 中的 IIR 的 10 段 Eq 部分 + +#ifndef __AUDACIOUS_EQ_H__ +#define __AUDACIOUS_EQ_H__ + +#include "CAudaciousArma.h" + +namespace SUPERSOUND +{ + +class CAudaciousEq +{ +public: + CAudaciousEq(); + ~CAudaciousEq(); + +public: + void reset(); + int32_t get_latency_ms(); + //外围保证带长为 10 + int32_t set_param(int32_t fs, const float *fBands); + int32_t set_param(int32_t fs, int nType); // 使用预先设置好的类型 + float process(float in); + +private: + // 10 段均衡器 + CAudaciousArma m_arma[10]; +}; + +} + +#endif /* __AUDACIOUS_EQ_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/CMakeLists.txt new file mode 100644 index 0000000..2fc7827 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/CMakeLists.txt @@ -0,0 +1,4 @@ +include_directories(./ inc src) +file(GLOB_RECURSE PHONOGRAPH_SRC_FILES src/*cpp) +add_library(phonograph ${PHONOGRAPH_SRC_FILES}) +#set_target_properties(phonograph PROPERTIES CXX_VISIBILITY_PRESET hidden) \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/inc/CPhonograph.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/inc/CPhonograph.h new file mode 100644 index 0000000..5316aba --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/inc/CPhonograph.h @@ -0,0 +1,30 @@ +#ifndef KALA_AUDIOBASE_PHONOGRAPH_H +#define KALA_AUDIOBASE_PHONOGRAPH_H + +#include +#include "CPhonographDef.h" + +class CPhonograph +{ +public: + CPhonograph(); + virtual ~CPhonograph(); + void reset(); + + int init(int sample_rate, int channel); // set sample rate and channel; + void uninit(); // uninit + + // process input buffer and output size. 
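// A minimal usage sketch (rate, channel count and buffer length are
// illustrative; the short overload filters in place and clips to
// [-32768, 32767], see CPhonograph.cpp):
//
//   CPhonograph pg;
//   if (pg.init(44100, 2) == 0)
//   {
//       pg.process(pcm, n_frames * 2);  // band-limit to the ~1.7-2.2 kHz "phonograph" band
//       pg.uninit();
//   }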
+ int process(short* in_buffer, int in_size); + + int process(float * in_buffer, int in_size); + + int process_lr_independent(float *in_left, float *in_right, int in_out_size); + +private: + void* handles; + int m_samplerate; + int m_channels; + std::vector data; +}; +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/inc/CPhonographDef.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/inc/CPhonographDef.h new file mode 100644 index 0000000..8acf064 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/inc/CPhonographDef.h @@ -0,0 +1,14 @@ +// +// Created by yangjianli on 2020-01-14. +// + +#ifndef AUDIO_EFFECTS_LIB_PHONOGRAPHDEF_H +#define AUDIO_EFFECTS_LIB_PHONOGRAPHDEF_H +#include "AudioEffectsDef.h" +enum PG_ERR { + PG_ERR_SUCCESS = 0, + PG_ERR_PARAM = -1, + PG_ERR_BASE_H_MALLOC_NULL = -2, +}; + +#endif //AUDIO_EFFECTS_LIB_PHONOGRAPHDEF_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/src/CPhonograph.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/src/CPhonograph.cpp new file mode 100644 index 0000000..b0da905 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/phonograph/src/CPhonograph.cpp @@ -0,0 +1,309 @@ +/************************************************************************/ +/* Phonograph Eimulator */ +/* copy right reserved */ +/************************************************************************/ + +#include "math.h" +#include "stdlib.h" +#include "stdio.h" +#include "memory.h" +#include "CPhonograph.h" +#include "biquad_filters/BiquadFilter.h" + +// This is a trick. When enabled, all channels refer to the 1st channel +#define PSEUDO_MULTICHANNELS 0 // defined in KTYPED.h + +#define VERSION_ID_NUMBER 100 /* 7.21,2013 */ + +using std::vector; +using namespace BiquadFilter; + + +#define HPF_FREQ 1712 / 44100.0f +#define LPF_FREQ 2222 / 44100.0f +#define HPFQ 2.1f +#define LPFQ 2.1f + + +class CPhonographFilters +{ +public: + CPhonographFilters(); + virtual ~CPhonographFilters(); + void reset(); + + bool isAllocated() const; + + void filtering(std::vector *x); + +private: + LPFilter* lpf; + HPFilter* hpf; +}; + +bool CPhonographFilters::isAllocated() const +{ + return lpf != NULL && hpf != NULL; +} + + + +void CPhonographFilters::filtering(std::vector *x) +{ + hpf->filtering(x); + lpf->filtering(x); +} + + + +CPhonographFilters::CPhonographFilters() +{ + hpf = new HPFilter(HPF_FREQ, HPFQ); + lpf = new LPFilter(LPF_FREQ, LPFQ); + + if (!hpf || !lpf) + { + if (hpf) + { + delete hpf; + hpf = NULL; + } + if (lpf) + { + delete lpf; + lpf = NULL; + } + } +} + +void CPhonographFilters::reset() +{ + if (hpf) + { + hpf->reset(); + } + if (lpf) + { + lpf->reset(); + } +} + +CPhonographFilters::~CPhonographFilters() +{ + delete lpf; + delete hpf; + + lpf = NULL; + hpf = NULL; +} + +CPhonograph::CPhonograph() +{ + m_samplerate = 0; + m_channels = 0; + handles = NULL; +} + +void CPhonograph::reset() +{ + if (handles) + { + for (int chn = 0; chn < m_channels; chn++) + { + CPhonographFilters* filters = ((CPhonographFilters**)handles)[chn]; + + if (filters) + { + filters->reset(); + } + + } + } +} + +CPhonograph::~CPhonograph() +{ + uninit(); +} + +int CPhonograph::init(int sample_rate, int channel) +{ + m_samplerate = sample_rate; + m_channels = channel; + + + handles = new CPhonographFilters*[m_channels]; + + if (!handles) + { + return PG_ERR_BASE_H_MALLOC_NULL; + } + + for (int chn = 0; chn < m_channels; chn++) + { + CPhonographFilters* 
filters = new CPhonographFilters(); + + ((CPhonographFilters**)handles)[chn] = filters; + + if (!filters->isAllocated()) + { + do{ + CPhonographFilters* filters = ((CPhonographFilters**)handles)[chn]; + delete filters; + + } while (chn--); + + delete [] (CPhonographFilters**)handles; + handles = NULL; + + return PG_ERR_BASE_H_MALLOC_NULL; + } + + } + + return 0; +} + +void CPhonograph::uninit() +{ + if (handles) + { + for (int chn = 0; chn < m_channels; chn++) + { + CPhonographFilters* filters = ((CPhonographFilters**)handles)[chn]; + + if (filters) + { + delete filters; + } + + } + + delete [] (CPhonographFilters**)handles; + handles = NULL; + } +} + +int CPhonograph::process(short* inBuffer, int inSize) +{ + if (0 != (inSize % m_channels)) + { + return PG_ERR_PARAM; + } + + if (handles) + { + + data.reserve(inSize / m_channels); + data.resize(inSize / m_channels); + + for (int chn = 0; chn < m_channels; chn++) + { + CPhonographFilters* filters = ((CPhonographFilters**)handles)[chn]; + short* audio = chn + inBuffer; + + if (filters) + { + if (PSEUDO_MULTICHANNELS && chn>0) + { + short* audioref = (short*)inBuffer; + + for (unsigned int i = 0; i < data.size(); i++){ + audio[0] = audioref[0]; + audio += m_channels; + audioref += m_channels; + } + } + else + { + + for (unsigned int i = 0; i < data.size(); i++){ + // data[i]= audio[i * m_channels + chn] / 32768.0; + data[i]= audio[0] / 32768.0f; + audio += m_channels; + } + + filters->filtering(&data); + + short* audio = chn + inBuffer; + + for (unsigned int i = 0; i < data.size(); i++){ + int sample = (int)(32767.0f * data[i]); +// int sample = (int)(20767.0f * data[i]); +#if 1 + if (sample>32767) + sample = 32767; + else if (sample<-32768) + sample = -32768; +#endif + // audio[i * m_channels + chn] = (short)sample; + audio[0] = (short)sample; + audio += m_channels; + } + } // if (PSEUDO_MULTICHANNELS && chn>0) + + } + + } + } + + return inSize; +} + +int CPhonograph::process_lr_independent(float *in_left, float *in_right, int in_out_size) +{ + if (2 != m_channels) + { + return PG_ERR_PARAM; + } + data.reserve(in_out_size); + data.resize(in_out_size); + if (handles) { + data.assign(in_left, in_left + in_out_size); + CPhonographFilters* filters = ((CPhonographFilters**)handles)[0]; + filters->filtering(&data); + for (unsigned int i = 0; i < data.size(); i++) { + in_left[i] = data[i]; + } + + data.assign(in_right, in_right + in_out_size); + filters = ((CPhonographFilters**)handles)[1]; + filters->filtering(&data); + for (unsigned int i = 0; i < data.size(); i++) { + in_right[i] = data[i]; + } + } + return in_out_size; +} + +int CPhonograph::process(float* inBuffer, int inSize) { + if (handles) { + data.reserve(inSize / m_channels); + data.resize(inSize / m_channels); + for (int chn = 0; chn < m_channels; chn++) { + CPhonographFilters* filters = ((CPhonographFilters**)handles)[chn]; + float* audio = chn + inBuffer; + if (filters) { + for (unsigned int i = 0; i < data.size(); i++) { + data[i]= audio[0]; + audio += m_channels; + } + filters->filtering(&data); + float* audio = chn + inBuffer; + for (unsigned int i = 0; i < data.size(); i++) { + float sample = data[i]; +// float sample = (20767.0f / 32768) * data[i]; +#if 1 + if (sample > (32767.0f / 32768)) + sample = 32767.0f / 32768; + else if (sample < -1.0f) + sample = -1.0f; +#endif + audio[0] = sample; + audio += m_channels; + } + } + } + } + return inSize; +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/CMakeLists.txt 
b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/CMakeLists.txt new file mode 100644 index 0000000..57010ef --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/CMakeLists.txt @@ -0,0 +1,4 @@ +include_directories(./ inc) +file(GLOB_RECURSE REVERB_SRC_FILES src/*cpp) +add_library(reverb ${REVERB_SRC_FILES}) +#set_target_properties(reverb PROPERTIES CXX_VISIBILITY_PRESET hidden) \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/inc/CReverb.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/inc/CReverb.h new file mode 100644 index 0000000..caa6446 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/inc/CReverb.h @@ -0,0 +1,81 @@ +#ifndef C_REVERB_RATION_H +#define C_REVERB_RATION_H +/************************************************************************/ +/* reverberation */ +/************************************************************************/ + +//#include "KalaInterfaces.h" +#include +#include "CReverbDef.h" +/* version before kala v2.6, only 0\4\5\6 used. kala 1.0 use id [0,3]*/ +#define KALA_VB_RECORD_STUDIO 0 // lu yin peng +#define KALA_VB_KTV 1 // KTV +#define KALA_VB_CONCERT 2 // yan chang hui +#define KALA_VB_THEATER 3 // ju chang +#define KALA_VB_NEW_KTV 4 // new ktv +#define KALA_VB_NEW_CONCERT 5 // new concert +#define KALA_VB_NEW_THEATER 6 // new theater + +/* id not used */ +#define KALA_VB_ID_7 7 // lu yin pen +#define KALA_VB_ID_8 8 // lu yin pen +#define KALA_VB_ID_9 9 // lu yin pen + +/* id used for kala v3.0's quick version */ +#define KALA_VB_ID_10 10 // +#define KALA_VB_ID_11 11 // +#define KALA_VB_ID_12 12 // +#define KALA_VB_ID_13 13 // +#define KALA_VB_ID_14 14 // +#define KALA_VB_ID_15 15 // +#define KALA_VB_ID_16 16 // +#define KALA_VB_ID_17 17 // +#define KALA_VB_ID_18 18 // + +#include "CReverbParams.h" + +class CReverb +{ +public: + CReverb(); + ~CReverb(); + +public: + int init(int sample_rate, int channel); + void reset(); + void uninit(); + + void get_id_range(int *max_val, int *min_val); + int get_id_default(); + + int set_type_id(int type_id); + int set_params(AE_PARAMS_REVERB* param); + int get_type_id(); + char * get_name_by_id(int type_id); + + int set_room_size(float room_size); + int set_wet(float wet); + + float get_room_size(); + float get_wet(); + + int get_latency(); + + int process(short *in_buffer, int in_size, short *out_buffer, int out_size); + int process(float *in_buffer, int in_size, float *out_buffer, int out_size); + + int process_lr_independent(float *in_left, float *in_right, float *out_left, float *out_right, int in_out_size); + +private: + int m_id; + int m_sampleRate; + int m_channel; + bool m_need_process; + void* m_pvb; +}; + + + +#endif + + diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/inc/CReverbDef.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/inc/CReverbDef.h new file mode 100644 index 0000000..7b55dc5 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/inc/CReverbDef.h @@ -0,0 +1,24 @@ +// +// Created by yangjianli on 2020-01-13. 
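// A minimal usage sketch for the CReverb wrapper declared above (sample rate,
// buffer length and the preset choice are illustrative; ids are the KALA_VB_*
// defines from CReverb.h):
//
//   CReverb rb;
//   if (rb.init(44100, 2) == 0)
//   {
//       rb.set_type_id(KALA_VB_NEW_KTV);       // pick a preset
//       rb.process(in_pcm, n, out_pcm, n);     // n interleaved samples in/out
//       rb.uninit();
//   }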
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CREVERBDEF_H
+#define AUDIO_EFFECTS_LIB_CREVERBDEF_H
+
+#include "stdlib.h"
+#include "AudioEffectsConf.h"
+enum RB_ERR {
+    RB_ERR_SUCCESS = 0,
+    RB_ERR_NO_MEMORY = -1,
+    RB_ERR_PARAM = -2,
+    RB_ERR_HAS_SET_PARAM = -3,
+    RB_ERR_AUTOTUNE_INIT = -4,
+    RB_ERR_BASE_H_NULL = -5,
+    RB_ERR_BASE_H_MALLOC_NULL = -6,
+};
+
+#ifndef safe_free
+#define safe_free(p) { if(p) { free(p); (p)=NULL; } }
+#endif
+
+#endif //AUDIO_EFFECTS_LIB_CREVERBDEF_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/CReverb.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/CReverb.cpp
new file mode 100644
index 0000000..b8a6f44
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/CReverb.cpp
@@ -0,0 +1,663 @@
+#include "CReverbDef.h"
+#include "CReverb.h"
+#include "verb/revmodel.h"
+
+#define MAX_VERB_VALUE 19
+#define MIN_VERB_VALUE 0
+#define MAX_NUMBER_OF_VERB (MAX_VERB_VALUE + 1)
+const char g_p_verb_id_names[][64] = {
+    { "studio" },
+    { "KTV" },
+    { "concert" },
+    { "theater" },
+    { "ktv 2" },
+    { "concert 2" },
+    { "theater 2" },
+    { "7" },
+    { "8" },
+    { "9" },
+    { "10" },
+    { "11" },
+    { "12" },
+    { "13" },
+    { "14" },
+    { "15" },
+    { "16" },
+    { "17" },
+    { "distant" },
+    { "custom" }
+};
+
+#ifndef SHORTMAX
+#define SHORTMAX 32767
+#endif
+#ifndef SHORTMIN
+#define SHORTMIN -32768
+#endif
+
+#ifndef Clip_short
+#define Clip_short(x) (short)((x)>SHORTMAX?SHORTMAX:((x)<SHORTMIN?SHORTMIN:(x)))
+#endif
+
+CReverb::CReverb()
+{
+    m_id = KALA_VB_RECORD_STUDIO;
+    m_sampleRate = 0;
+    m_channel = 0;
+    m_need_process = false;
+    m_pvb = NULL;
+}
+
+CReverb::~CReverb()
+{
+    uninit();
+}
+
+int CReverb::init(int sample_rate, int channel)
+{
+    revmodel* pmd = new revmodel();
+    if (pmd == NULL)
+    {
+        return RB_ERR_NO_MEMORY;
+    }
+    pmd->mute();
+
+    m_channel = channel;
+    m_sampleRate = sample_rate;
+
+    m_pvb = (void*)pmd;
+    m_need_process = false;
+    return 0;
+}
+
+void CReverb::reset()
+{
+    revmodel* pmv = (revmodel*)m_pvb;
+    if (pmv != NULL)
+    {
+        pmv->mute();
+    }
+    return;
+}
+
+void CReverb::uninit()
+{
+    revmodel* pmv = (revmodel*)m_pvb;
+    if (pmv != NULL)
+    {
+        delete pmv;
+        pmv = NULL;
+
+        m_pvb = NULL;
+        m_need_process = false;
+    }
+}
+
+int CReverb::get_latency()
+{
+    return 0;
+}
+
+void CReverb::get_id_range(int *max_val, int *min_val)
+{
+    *max_val = MAX_VERB_VALUE;
+    *min_val = MIN_VERB_VALUE;
+}
+
+int CReverb::get_id_default()
+{
+    return KALA_VB_RECORD_STUDIO;
+}
+
+int CReverb::set_room_size(float room_size)
+{
+    if (room_size > 1.0f || room_size < 0.0f)
+        return RB_ERR_PARAM;
+
+    revmodel* pmd = (revmodel*)m_pvb;
+    if (pmd == NULL)
+    {
+        return RB_ERR_BASE_H_NULL;
+    }
+    pmd->setroomsize(room_size);
+    return 0;
+}
+
+float CReverb::get_room_size()
+{
+    revmodel* pmd = (revmodel*)m_pvb;
+    float roomSize = pmd->getroomsize();
+    return roomSize;
+}
+
+int CReverb::set_wet(float wet)
+{
+    if (wet > 1.0f || wet < 0.0f)
+        return RB_ERR_PARAM;
+    revmodel* pmd = (revmodel*)m_pvb;
+    if (pmd == NULL)
+    {
+        return RB_ERR_BASE_H_NULL;
+    }
+    pmd->setwet(wet/3.0f);
+    return 0;
+}
+
+float CReverb::get_wet()
+{
+    revmodel* pmd = (revmodel*)m_pvb;
+    float wet = pmd->getwet();
+    wet *= 3.0f;
+    return wet;
+}
+
+int CReverb::set_type_id(int type_id)
+{
+    m_need_process = true;
+    revmodel* pmd = (revmodel*)m_pvb;
+    if (pmd == NULL)
+    {
+        return RB_ERR_BASE_H_NULL;
+    }
+
+    // check input: clamp into [MIN_VERB_VALUE, MAX_VERB_VALUE]
+    if (type_id < MIN_VERB_VALUE)
+    {
+        type_id = MIN_VERB_VALUE;
+    }
+    else if (type_id > MAX_VERB_VALUE)
+    {
+        type_id = MAX_VERB_VALUE;
+    }
+
+    m_id = type_id;
+
+    /* an id-indexed parameter table would be cleaner than this switch; left as a later optimization */
+    switch (m_id)
+    {
+    /***************** v1.0, id 0~3, add here ************************************/
+    case KALA_VB_RECORD_STUDIO:
+    {
+        pmd->setmode(0.2f);
+        pmd->setroomsize(0);
+        pmd->setdamp(0);
+        pmd->setwet(0);
+        pmd->setdry(0.8f);
+        pmd->setwidth(0.5f);
+        break;
+    }
+    case KALA_VB_KTV:
+    {
+        // for ktv
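+        // All of the presets in this switch differ only in these six
+        // freeverb-style controls, each normalized to [0, 1]: mode
+        // (values >= freezemode, i.e. 0.5, freeze the reverb tail --
+        // see tuning.h), room size, damping, wet level, dry level and
+        // stereo width.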
pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + + case KALA_VB_CONCERT: + { + // for concert ok + pmd->setmode(0.3f); + pmd->setroomsize(0.50f); + pmd->setdamp(0.6f); + pmd->setwet(0.3f); + pmd->setdry(0.6f); + pmd->setwidth(0.56f); + break; + } + + case KALA_VB_THEATER: + { + // for theater + pmd->setmode(0.0); + pmd->setroomsize(0.6f); + pmd->setdamp(0.2f); + pmd->setwet(0.4f); + pmd->setdry(0.5f); + pmd->setwidth(0.20f); + break; + } + /***************** kala v2.6, id 0\4\5\6, add here ************************************/ + case KALA_VB_NEW_KTV: + { + + // v2.2 + pmd->setmode(0.2f); + pmd->setroomsize(0.7f); + pmd->setdamp(0.9f); + pmd->setwet(0.11f); + pmd->setdry(0.44f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_NEW_CONCERT: + { + // v2.2 + pmd->setmode(0.3f); + pmd->setroomsize(0.60f); + pmd->setdamp(0.6f); + pmd->setwet(0.18f); + pmd->setdry(0.37f); + pmd->setwidth(0.56f); + + break; + } + case KALA_VB_NEW_THEATER: + { + + //old version + //pmd->setmode(0.0); + //pmd->setroomsize(0.6f); + //pmd->setdamp(0.2f); + //pmd->setwet(0.4f); + //pmd->setdry(0.5f); + //pmd->setwidth(0.20f); + + // new 1.0 + //pmd->setmode(0.0); + //pmd->setroomsize(0.8f); + //pmd->setdamp(0.8f); + //pmd->setwet(0.3f); + //pmd->setdry(0.4f); + //pmd->setwidth(0.50f); + + // v2.0 + //pmd->setmode(0.0); + //pmd->setroomsize(0.8f); + //pmd->setdamp(0.8f); + //pmd->setwet(0.22f); + //pmd->setdry(0.14f); + //pmd->setwidth(0.50f); + + //v2.2 + pmd->setmode(0.0); + pmd->setroomsize(0.8f); + pmd->setdamp(0.8f); + pmd->setwet(0.248f); + pmd->setdry(0.182f); + pmd->setwidth(0.50f); + + break; + } + /***************** kala v2.6, id 0\4\5\6, add here ************************************/ + case KALA_VB_ID_7: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_8: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_9: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_10: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_11: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.35f); + pmd->setdamp(0.5f); + pmd->setwet(0.20f); + pmd->setdry(0.5f); + pmd->setwidth(0.5f); + + break; + } + case KALA_VB_ID_12: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.4f); + pmd->setdamp(0.69f); + pmd->setwet(0.14f); + pmd->setdry(0.22f); + pmd->setwidth(0.82f); + + break; + } + case KALA_VB_ID_13: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.41f); + pmd->setdamp(0.18f); + pmd->setwet(0.16f); + pmd->setdry(0.24f); + pmd->setwidth(0.68f); + + break; + } + case KALA_VB_ID_14: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.79f); + pmd->setdamp(0.63f); + pmd->setwet(0.14f); + pmd->setdry(0.26f); + pmd->setwidth(0.92f); + + break; + } + case KALA_VB_ID_15: + { + // for ktv + pmd->setmode(0.2f); + pmd->setroomsize(0.84f); + pmd->setdamp(0.25f); + pmd->setwet(0.12f); + pmd->setdry(0.22f); + pmd->setwidth(0.76f); + + break; + } + case KALA_VB_ID_16: + { + 
// for ktv
+        pmd->setmode(0.2f);
+        pmd->setroomsize(0.88f);
+        pmd->setdamp(0.42f);
+        pmd->setwet(0.12f);
+        pmd->setdry(0.17f);
+        pmd->setwidth(0.84f);
+
+        break;
+    }
+    case KALA_VB_ID_17:
+    {
+        // for ktv
+        pmd->setmode(0.2f);
+        pmd->setroomsize(0.35f);
+        pmd->setdamp(0.5f);
+        pmd->setwet(0.20f);
+        pmd->setdry(0.5f);
+        pmd->setwidth(0.5f);
+
+        break;
+    }
+    case KALA_VB_ID_18:
+    {
+        // for ktv
+        pmd->setmode(0.2f);
+        pmd->setroomsize(0.65f);
+        pmd->setdamp(0.25f);
+        pmd->setwet(0.25f);
+        pmd->setdry(0.6f);
+        pmd->setwidth(0.95f);
+
+        break;
+    }
+    default:
+    {
+        pmd->setmode(1);
+        break;
+    }
+    }
+
+    return 0;
+}
+
+int CReverb::get_type_id()
+{
+    return m_id;
+}
+
+char* CReverb::get_name_by_id(int type_id)
+{
+    if (type_id < 0)
+    {
+        type_id = 0;
+    }
+    else if (type_id > MAX_VERB_VALUE - 1)
+    {
+        type_id = MAX_VERB_VALUE - 1;
+    }
+
+    return (char*)g_p_verb_id_names[type_id];
+}
+
+int CReverb::process(short *in_buffer, int in_size, short *out_buffer, int out_size)
+{
+    if(!m_need_process)
+    {
+        if(in_buffer != out_buffer)
+        {
+            // bypass: copy the input through unchanged
+            memcpy(out_buffer, in_buffer, sizeof(short) * out_size);
+        }
+        return RB_ERR_SUCCESS;
+    }
+
+    /* check input */
+    revmodel* pmd = (revmodel*)m_pvb;
+    if (pmd == NULL)
+    {
+        return RB_ERR_BASE_H_NULL;
+    }
+
+    if (in_size != out_size)
+    {
+        return RB_ERR_PARAM;
+    }
+
+    in_size /= m_channel;
+    out_size /= m_channel;
+
+    /* for mono */
+    if (m_channel == 1)
+    {
+        int j;
+        short* pInSample = in_buffer;
+        short* pOutSample = out_buffer;
+
+        for (j = 0; j < in_size; j++)
+        {
+            float saminL;
+            float samoutL;
+
+            saminL = pInSample[j]/32768.0f;
+            pmd->processMono(&saminL, &samoutL, 1, 0);
+
+            pOutSample[j] = (short)Clip_short((int)(samoutL*32768.0f));
+        }
+    }
+    else if (m_channel == 2)
+    {
+        int j;
+        short* pInSample = in_buffer;
+        short* pOutSample = out_buffer;
+
+        for (j = 0; j < in_size; j++)
+        {
+            float saminL,saminR;
+            float samoutL,samoutR;
+
+            saminL = pInSample[j+j]/32768.0f;
+            saminR = pInSample[j+j+1]/32768.0f;
+
+            pmd->processreplace(&saminL,&saminR,&samoutL,&samoutR, 1,0);
+
+            pOutSample[j+j] = (short)Clip_short((int)(samoutL*32768.0f));
+            pOutSample[j+j+1] = (short)Clip_short((int)(samoutR*32768.0f));
+        }
+    }
+
+    return out_size;
+}
+
+int CReverb::process_lr_independent(float *in_left, float *in_right, float *out_left, float *out_right, int in_out_size)
+{
+    if(!m_need_process)
+    {
+        if(in_left != out_left)
+        {
+            memcpy(out_left, in_left, sizeof(float) * in_out_size);
+        }
+        if(in_right != out_right)
+        {
+            memcpy(out_right, in_right, sizeof(float) * in_out_size);
+        }
+        return RB_ERR_SUCCESS;
+    }
+
+    if (2 != m_channel)
+    {
+        return RB_ERR_PARAM;
+    }
+    /* check input */
+    revmodel* pmd = (revmodel*)m_pvb;
+    if (pmd == NULL)
+    {
+        return RB_ERR_BASE_H_NULL;
+    }
+
+    int j;
+    for (j = 0; j < in_out_size; j++)
+    {
+        pmd->processreplace(in_left + j, in_right + j, out_left + j, out_right + j, 1, 0);
+    }
+    return in_out_size;
+}
+
+int CReverb::process(float *in_buffer, int in_size, float *out_buffer, int out_size)
+{
+    if(!m_need_process)
+    {
+        if(in_buffer != out_buffer)
+        {
+            // bypass: copy the input through unchanged
+            memcpy(out_buffer, in_buffer, sizeof(float) * out_size);
+        }
+        return RB_ERR_SUCCESS;
+    }
+
+    /* check input */
+    revmodel* pmd = (revmodel*)m_pvb;
+    if (pmd == NULL)
+    {
+        return RB_ERR_BASE_H_NULL;
+    }
+
+    if (in_size != out_size)
+    {
+        return RB_ERR_PARAM;
+    }
+
+    in_size /= m_channel;
+    out_size /= m_channel;
+
+    /* for mono */
+    if (m_channel == 1)
+    {
+        int j;
+        float* pInSample = in_buffer;
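+        // Mono path: one sample per call through processMono()
+        // (numsamples = 1, skip = 0, i.e. no interleave stride).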
+        float* pOutSample = out_buffer;
+
+        for (j = 0; j < in_size; j++)
+        {
+            float saminL;
+            float samoutL;
+
+            saminL = pInSample[j];
+            pmd->processMono(&saminL, &samoutL, 1, 0);
+
+            pOutSample[j] = samoutL;
+        }
+    }
+    else if (m_channel == 2)
+    {
+        int j;
+        float* pInSample = in_buffer;
+        float* pOutSample = out_buffer;
+
+        for (j = 0; j < in_size; j++)
+        {
+            float saminL,saminR;
+            float samoutL,samoutR;
+
+            saminL = pInSample[j+j];
+            saminR = pInSample[j+j+1];
+
+            pmd->processreplace(&saminL,&saminR,&samoutL,&samoutR, 1,0);
+
+            pOutSample[j+j] = samoutL;
+            pOutSample[j+j+1] = samoutR;
+        }
+    }
+
+    return out_size;
+}
+
+int CReverb::set_params(AE_PARAMS_REVERB *param)
+{
+    revmodel* pmd = (revmodel*)m_pvb;
+    if (pmd == NULL)
+    {
+        return RB_ERR_BASE_H_NULL;
+    }
+    if(NULL == param)
+    {
+        pmd->setmode(1);
+        m_need_process = false;
+        return RB_ERR_SUCCESS;
+    }
+
+    pmd->setmode(param->mode);
+    pmd->setroomsize(param->room_size);
+    pmd->setdamp(param->damp);
+    pmd->setwet(param->wet);
+    pmd->setdry(param->dry);
+    pmd->setwidth(param->width);
+
+    m_need_process = true;
+    return RB_ERR_SUCCESS;
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/allpass.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/allpass.cpp
new file mode 100644
index 0000000..850337e
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/allpass.cpp
@@ -0,0 +1,36 @@
+// Allpass filter implementation
+//
+// Written by Jezar at Dreampoint, June 2000
+// http://www.dreampoint.co.uk
+// This code is public domain
+
+#include "allpass.h"
+
+allpass::allpass()
+{
+    bufidx = 0;
+}
+
+void allpass::setbuffer(float *buf, int size)
+{
+    buffer = buf;
+    bufsize = size;
+}
+
+void allpass::mute()
+{
+    for (int i=0; i<bufsize; i++)
+        buffer[i] = 0;
+}
+
+void allpass::setfeedback(float val)
+{
+    feedback = val;
+}
+
+float allpass::getfeedback()
+{
+    return feedback;
+}
+
+//ends
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/allpass.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/allpass.h
new file mode 100644
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/allpass.h
+// Allpass filter declaration
+//
+// Written by Jezar at Dreampoint, June 2000
+// http://www.dreampoint.co.uk
+// This code is public domain
+
+#ifndef _allpass_
+#define _allpass_
+
+class allpass
+{
+public:
+    allpass();
+    void setbuffer(float *buf, int size);
+    inline float process(float inp);
+    void mute();
+    void setfeedback(float val);
+    float getfeedback();
+private:
+    float feedback;
+    float *buffer;
+    int bufsize;
+    int bufidx;
+};
+
+// Big to inline - but crucial for speed
+inline float allpass::process(float input)
+{
+    float output;
+    float bufout;
+
+    bufout = buffer[bufidx];
+
+    output = -input + bufout;
+    buffer[bufidx] = input + (bufout*feedback);
+
+    if(++bufidx>=bufsize) bufidx = 0;
+
+    return output;
+}
+
+#endif//_allpass
+
+//ends
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/comb.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/comb.cpp
new file mode 100644
index 0000000..62be706
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/comb.cpp
@@ -0,0 +1,48 @@
+// Comb filter implementation
+//
+// Written by Jezar at Dreampoint, June 2000
+// http://www.dreampoint.co.uk
+// This code is public domain
+
+#include "comb.h"
+
+comb::comb()
+{
+    filterstore = 0;
+    bufidx = 0;
+}
+
+void comb::setbuffer(float *buf, int size)
+{
+    buffer = buf;
+    bufsize = size;
+}
+
+void comb::mute()
+{
+    for (int i=0; i<bufsize; i++)
+        buffer[i] = 0;
+}
+
+void comb::setdamp(float val)
+{
+    damp1 = val;
+    damp2 = 1-val;
+}
+
+float comb::getdamp()
+{
+    return damp1;
+}
+
+void comb::setfeedback(float val)
+{
+    feedback = val;
+}
+
+float comb::getfeedback()
+{
+    return feedback;
+}
+
+//ends
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/comb.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/comb.h
new file mode 100644
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/comb.h
+// Comb filter declaration
+//
+// Written by Jezar at Dreampoint, June 2000
+// http://www.dreampoint.co.uk
+// This code is public domain
+
+#ifndef _comb_
+#define _comb_
+
+class comb
+{
+public:
+    comb();
+    void setbuffer(float *buf, int size);
+    inline float process(float inp);
+    void mute();
+    void setdamp(float val);
+    float getdamp();
+    void setfeedback(float val);
+    float getfeedback();
+private:
+    float feedback;
+    float filterstore;
+    float damp1;
+    float damp2;
+    float *buffer;
+    int bufsize;
+    int bufidx;
+};
+
+// Big to inline - but crucial for speed
+inline float comb::process(float input)
+{
+    float output;
+
+    output = buffer[bufidx];
+
+    filterstore = (output*damp2) + (filterstore*damp1);
+
+    buffer[bufidx] = input + (filterstore*feedback);
+
+    if(++bufidx>=bufsize) bufidx = 0;
+
+    return output;
+}
+
+#endif //_comb_
+
+//ends
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/revmodel.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/revmodel.cpp
new file mode 100644
index 0000000..c2d0ea6
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/revmodel.cpp
@@ -0,0 +1,493 @@
+// Reverb model implementation
+//
+// Written by Jezar at Dreampoint, June 2000
+// http://www.dreampoint.co.uk
+// This code is public domain
+
+#include "revmodel.h"
+//#include "MSdcommon.h"
+#include "CReverbDef.h"
+#include <string.h>
+
+revmodel::revmodel()
+{
+    //
+    mallocBuffers();
+
+    // Tie the components to their buffers
+    combL[0].setbuffer(bufcombL1,combtuningL1);
+    combR[0].setbuffer(bufcombR1,combtuningR1);
+    combL[1].setbuffer(bufcombL2,combtuningL2);
+    combR[1].setbuffer(bufcombR2,combtuningR2);
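+    // (wiring continues below) Each channel owns numcombs (8) parallel
+    // combs and numallpasses (4) series allpasses; every right-channel
+    // buffer is stereospread (23) samples longer than its left twin
+    // (see tuning.h) so the two channels decorrelate.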
+ combL[2].setbuffer(bufcombL3,combtuningL3); + combR[2].setbuffer(bufcombR3,combtuningR3); + combL[3].setbuffer(bufcombL4,combtuningL4); + combR[3].setbuffer(bufcombR4,combtuningR4); + combL[4].setbuffer(bufcombL5,combtuningL5); + combR[4].setbuffer(bufcombR5,combtuningR5); + combL[5].setbuffer(bufcombL6,combtuningL6); + combR[5].setbuffer(bufcombR6,combtuningR6); + combL[6].setbuffer(bufcombL7,combtuningL7); + combR[6].setbuffer(bufcombR7,combtuningR7); + combL[7].setbuffer(bufcombL8,combtuningL8); + combR[7].setbuffer(bufcombR8,combtuningR8); + allpassL[0].setbuffer(bufallpassL1,allpasstuningL1); + allpassR[0].setbuffer(bufallpassR1,allpasstuningR1); + allpassL[1].setbuffer(bufallpassL2,allpasstuningL2); + allpassR[1].setbuffer(bufallpassR2,allpasstuningR2); + allpassL[2].setbuffer(bufallpassL3,allpasstuningL3); + allpassR[2].setbuffer(bufallpassR3,allpasstuningR3); + allpassL[3].setbuffer(bufallpassL4,allpasstuningL4); + allpassR[3].setbuffer(bufallpassR4,allpasstuningR4); + + // Set default values + allpassL[0].setfeedback(0.5f); + allpassR[0].setfeedback(0.5f); + allpassL[1].setfeedback(0.5f); + allpassR[1].setfeedback(0.5f); + allpassL[2].setfeedback(0.5f); + allpassR[2].setfeedback(0.5f); + allpassL[3].setfeedback(0.5f); + allpassR[3].setfeedback(0.5f); + setwet(initialwet); + setroomsize(initialroom); + setdry(initialdry); + setdamp(initialdamp); + setwidth(initialwidth); + setmode(initialmode); + + // Buffer will be full of rubbish - so we MUST mute them + mute(); +} + +revmodel::~revmodel() +{ + safe_free(bufallpassL1); + safe_free(bufallpassL2); + safe_free(bufallpassL3); + safe_free(bufallpassL4); + safe_free(bufallpassR1); + safe_free(bufallpassR2); + safe_free(bufallpassR3); + safe_free(bufallpassR4); + + safe_free(bufcombL1); + safe_free(bufcombL2); + safe_free(bufcombL3); + safe_free(bufcombL4); + safe_free(bufcombL5); + safe_free(bufcombL6); + safe_free(bufcombL7); + safe_free(bufcombL8); + + safe_free(bufcombR1); + safe_free(bufcombR2); + safe_free(bufcombR3); + safe_free(bufcombR4); + safe_free(bufcombR5); + safe_free(bufcombR6); + safe_free(bufcombR7); + safe_free(bufcombR8); + +} + +int revmodel::mallocBuffers() +{ + //int ires; + + bufallpassL1 = NULL; + bufallpassL2 = NULL; + bufallpassL3 = NULL; + bufallpassL4 = NULL; + bufallpassR1 = NULL; + bufallpassR2 = NULL; + bufallpassR3 = NULL; + bufallpassR4 = NULL; + + bufcombL1 = NULL; + bufcombL2 = NULL; + bufcombL3 = NULL; + bufcombL4 = NULL; + bufcombL5 = NULL; + bufcombL6 = NULL; + bufcombL7 = NULL; + bufcombL8 = NULL; + + bufcombR1 = NULL; + bufcombR2 = NULL; + bufcombR3 = NULL; + bufcombR4 = NULL; + bufcombR5 = NULL; + bufcombR6 = NULL; + bufcombR7 = NULL; + bufcombR8 = NULL; + + bufcombL1 = (float*)malloc(combtuningL1*sizeof(float)); + bufcombL2 = (float*)malloc(combtuningL2*sizeof(float)); + bufcombL3 = (float*)malloc(combtuningL3*sizeof(float)); + bufcombL4 = (float*)malloc(combtuningL4*sizeof(float)); + bufcombL5 = (float*)malloc(combtuningL5*sizeof(float)); + bufcombL6 = (float*)malloc(combtuningL6*sizeof(float)); + bufcombL7 = (float*)malloc(combtuningL7*sizeof(float)); + bufcombL8 = (float*)malloc(combtuningL8*sizeof(float)); + + bufcombR1 = (float*)malloc(combtuningR1*sizeof(float)); + bufcombR2 = (float*)malloc(combtuningR2*sizeof(float)); + bufcombR3 = (float*)malloc(combtuningR3*sizeof(float)); + bufcombR4 = (float*)malloc(combtuningR4*sizeof(float)); + bufcombR5 = (float*)malloc(combtuningR5*sizeof(float)); + bufcombR6 = (float*)malloc(combtuningR6*sizeof(float)); + bufcombR7 = 
(float*)malloc(combtuningR7*sizeof(float));
+    bufcombR8 = (float*)malloc(combtuningR8*sizeof(float));
+
+    bufallpassL1 = (float*)malloc(allpasstuningL1*sizeof(float));
+    bufallpassL2 = (float*)malloc(allpasstuningL2*sizeof(float));
+    bufallpassL3 = (float*)malloc(allpasstuningL3*sizeof(float));
+    bufallpassL4 = (float*)malloc(allpasstuningL4*sizeof(float));
+    bufallpassR1 = (float*)malloc(allpasstuningR1*sizeof(float));
+    bufallpassR2 = (float*)malloc(allpasstuningR2*sizeof(float));
+    bufallpassR3 = (float*)malloc(allpasstuningR3*sizeof(float));
+    bufallpassR4 = (float*)malloc(allpasstuningR4*sizeof(float));
+
+    memset(bufcombL1,0,combtuningL1*sizeof(float));
+    memset(bufcombL2,0,combtuningL2*sizeof(float));
+    memset(bufcombL3,0,combtuningL3*sizeof(float));
+    memset(bufcombL4,0,combtuningL4*sizeof(float));
+    memset(bufcombL5,0,combtuningL5*sizeof(float));
+    memset(bufcombL6,0,combtuningL6*sizeof(float));
+    memset(bufcombL7,0,combtuningL7*sizeof(float));
+    memset(bufcombL8,0,combtuningL8*sizeof(float));
+    memset(bufcombR1,0,combtuningR1*sizeof(float));
+    memset(bufcombR2,0,combtuningR2*sizeof(float));
+    memset(bufcombR3,0,combtuningR3*sizeof(float));
+    memset(bufcombR4,0,combtuningR4*sizeof(float));
+    memset(bufcombR5,0,combtuningR5*sizeof(float));
+    memset(bufcombR6,0,combtuningR6*sizeof(float));
+    memset(bufcombR7,0,combtuningR7*sizeof(float));
+    memset(bufcombR8,0,combtuningR8*sizeof(float));
+
+    memset(bufallpassL1,0,allpasstuningL1*sizeof(float));
+    memset(bufallpassL2,0,allpasstuningL2*sizeof(float));
+    memset(bufallpassL3,0,allpasstuningL3*sizeof(float));
+    memset(bufallpassL4,0,allpasstuningL4*sizeof(float));
+    memset(bufallpassR1,0,allpasstuningR1*sizeof(float));
+    memset(bufallpassR2,0,allpasstuningR2*sizeof(float));
+    memset(bufallpassR3,0,allpasstuningR3*sizeof(float));
+    memset(bufallpassR4,0,allpasstuningR4*sizeof(float));
+
+    return 0;
+
+    //float bufcombL1[combtuningL1];
+    //float bufcombR1[combtuningR1];
+    //float bufcombL2[combtuningL2];
+    //float bufcombR2[combtuningR2];
+    //float bufcombL3[combtuningL3];
+    //float bufcombR3[combtuningR3];
+    //float bufcombL4[combtuningL4];
+    //float bufcombR4[combtuningR4];
+    //float bufcombL5[combtuningL5];
+    //float bufcombR5[combtuningR5];
+    //float bufcombL6[combtuningL6];
+    //float bufcombR6[combtuningR6];
+    //float bufcombL7[combtuningL7];
+    //float bufcombR7[combtuningR7];
+    //float bufcombL8[combtuningL8];
+    //float bufcombR8[combtuningR8];
+
+    //// Buffers for the allpasses
+    //float bufallpassL1[allpasstuningL1];
+    //float bufallpassR1[allpasstuningR1];
+    //float bufallpassL2[allpasstuningL2];
+    //float bufallpassR2[allpasstuningR2];
+    //float bufallpassL3[allpasstuningL3];
+    //float bufallpassR3[allpasstuningR3];
+    //float bufallpassL4[allpasstuningL4];
+    //float bufallpassR4[allpasstuningR4];
+}
+
+void revmodel::mute()
+{
+    int i;
+    if (getmode() >= freezemode)
+        return;
+
+    for (i=0;i<numcombs;i++)
+    {
+        combL[i].mute();
+        combR[i].mute();
+    }
+    for (i=0;i<numallpasses;i++)
+    {
+        allpassL[i].mute();
+        allpassR[i].mute();
+    }
+}
+
+void revmodel::processMono(float *inputL, float *outputL, long numsamples, int skip)
+{
+    float outL,input;
+
+    while(numsamples-- > 0)
+    {
+        int i;
+        outL = 0;
+        input = (*inputL + *inputL) * gain;
+
+        for(i=0; i<numcombs; i++)
+        {
+            outL += combL[i].process(input);
+        }
+
+        for(i=0; i<numallpasses; i++)
+        {
+            outL = allpassL[i].process(outL);
+        }
+
+        *outputL = outL*wet1 + *inputL*dry;
+
+        inputL += skip;
+        outputL += skip;
+    }
+}
+
+void revmodel::processmix(float *inputL, float *inputR, float *outputL, float *outputR, long numsamples, int skip)
+{
+    float outL,outR,input;
+
+    while(numsamples-- > 0)
+    {
+        int i;
+        outL = outR = 0;
+        input = (*inputL + *inputR) * gain;
+
+        // Accumulate comb filters in parallel
+        for(i=0; i<numcombs; i++)
+        {
+            outL += combL[i].process(input);
+            outR += combR[i].process(input);
+        }
+
+        // Feed through allpasses in series
+        for(i=0; i<numallpasses; i++)
+        {
+            outL = allpassL[i].process(outL);
+            outR = allpassR[i].process(outR);
+        }
+
+        // Calculate output MIXING with anything already there
+        *outputL += outL*wet1 + outR*wet2 + *inputL*dry;
+        *outputR += outR*wet1 + outL*wet2 + *inputR*dry;
+
+        // Increment sample pointers, allowing for interleave (if any)
+        inputL += skip;
+        inputR += skip;
+        outputL += skip;
+        outputR += skip;
+    }
+}
+
+void revmodel::processreplace(float *inputL, float *inputR, float *outputL, float *outputR, long numsamples, int skip)
+{
+    float outL,outR,input;
+
+    while(numsamples-- > 0)
+    {
+        int i;
+        outL = outR = 0;
+        input = (*inputL + *inputR) * gain;
+
+        // Accumulate comb filters in parallel
+        for(i=0; i<numcombs; i++)
+        {
+            outL += combL[i].process(input);
+            outR += combR[i].process(input);
+        }
+
+        // Feed through allpasses in series
+        for(i=0; i<numallpasses; i++)
+        {
+            outL = allpassL[i].process(outL);
+            outR = allpassR[i].process(outR);
+        }
+
+        // Calculate output REPLACING anything already there
+        *outputL = outL*wet1 + outR*wet2 + *inputL*dry;
+        *outputR = outR*wet1 + outL*wet2 + *inputR*dry;
+
+        // Increment sample pointers, allowing for interleave (if any)
+        inputL += skip;
+        inputR += skip;
+        outputL += skip;
+        outputR += skip;
+    }
+}
+
+void revmodel::update()
+{
+// Recalculate internal values after parameter change
+
+    int i;
+
+    wet1 = wet*(width/2 + 0.5f);
+    wet2 = wet*((1-width)/2);
+
+    if (mode >= freezemode)
+    {
+        roomsize1 = 1;
+        damp1 = 0;
+        gain = muted;
+    }
+    else
+    {
+        roomsize1 = roomsize;
+        damp1 = damp;
+        gain = fixedgain;
+    }
+
+    for(i=0; i<numcombs; i++)
+    {
+        combL[i].setfeedback(roomsize1);
+        combR[i].setfeedback(roomsize1);
+    }
+
+    for(i=0; i<numcombs; i++)
+    {
+        combL[i].setdamp(damp1);
+        combR[i].setdamp(damp1);
+    }
+}
+
+// The following get/set functions are not inlined, because
+// speed is never an issue when calling them.
+
+void revmodel::setroomsize(float value)
+{
+    roomsize = (value*scaleroom) + offsetroom;
+    update();
+}
+
+float revmodel::getroomsize()
+{
+    return (roomsize-offsetroom)/scaleroom;
+}
+
+void revmodel::setdamp(float value)
+{
+    damp = value*scaledamp;
+    update();
+}
+
+float revmodel::getdamp()
+{
+    return damp/scaledamp;
+}
+
+void revmodel::setwet(float value)
+{
+    wet = value*scalewet;
+    update();
+}
+
+float revmodel::getwet()
+{
+    return wet/scalewet;
+}
+
+void revmodel::setdry(float value)
+{
+    dry = value*scaledry;
+}
+
+float revmodel::getdry()
+{
+    return dry/scaledry;
+}
+
+void revmodel::setwidth(float value)
+{
+    width = value;
+    update();
+}
+
+float revmodel::getwidth()
+{
+    return width;
+}
+
+void revmodel::setmode(float value)
+{
+    mode = value;
+    update();
+}
+
+float revmodel::getmode()
+{
+    if (mode >= freezemode)
+        return 1;
+    else
+        return 0;
+}
+
+int revmodel::setverbID(int iID)
+{
+    int i;
+    int j;
+    float fval;
+    float pParam[MAX_VERB_ID_NUMBER][6] =
+    {
+        //{0.0f, 0.846f, 0.36f, 0.23f, 3.225f, 0.618f}, // 0,big room
+        //{0.2f, 0.721f, 0.20f, 0.16f, 2.337f, 0.618f}, // 1,medium room
+        //{0.1f, 0.720f, 0.06f, 0.0f,  1.786f, 0.618f}, // 2,small room
+        //{0.0f, 0.944f, 0.81f, 0.93f, -2.55f, 0.618f}, // 3,church
+        //{0.0f, 0.929f, 0.83f, 0.92f, -5.62f, 0.618f}, // 4,theater
+        //{0.4f, 0.942f, 0.13f, 0.32f, 0.886f, 0.618f}, // 5,tunnel
+        //{0.4f, 0.912f, 0.66f, 0.36f, 3.225f, 0.618f}, // 6,music hall
+        //{0.4f, 0.882f, 0.42f, 0.22f, -0.479f,0.618f}, // 7,cinema
+        //{0.2f, 0.925f, 1.00f, 1.00f, -5.621f,0.618f}  // 8,bathroom
+
+        {0.0f, 0.846f, 0.36f, 0.23f, 0.0f,   1.0f  }, // 0,big room
+        {0.0f, 0.846f, 0.36f, 0.23f, 2.425f, 0.418f}, // 1,big room
+        {0.2f, 0.721f, 0.20f, 0.16f, 2.107f, 0.418f}, // 2,medium room
+        {0.1f, 0.720f, 0.06f, 0.0f,  1.786f, 0.418f}, // 3,small room
+        {0.0f, 0.944f, 0.81f, 0.93f, 1.05f,  0.118f}, // 4,church
+        {0.0f, 0.929f, 0.83f, 0.92f, 0.82f,  0.218f}, // 5,theater
+        {0.4f, 0.942f, 0.13f, 0.32f, 0.886f, 0.618f}, // 6,tunnel
+        {0.4f, 0.912f, 0.66f, 0.36f, 1.225f, 0.318f}, // 7,music hall
+        {0.4f, 0.882f, 0.42f, 0.22f, -0.479f,0.618f}, // 8,cinema
+        {0.2f, 0.925f, 1.00f, 1.00f, 0.901f, 0.018f}  // 9,bathroom
+    };
+
+    if ((iID < 0) || (iID >= MAX_VERB_ID_NUMBER))
+    {
+        return -2;
+    }
+
+    i = iID;
+    j = 0;
+    //setwet(pParam[i][j++]);
+    //setroomsize(pParam[i][j++]);
+    //setdry(pParam[i][j++]);
+    //setdamp(pParam[i][j++]);
+    //setwidth(pParam[i][j++]);
+    //setmode(pParam[i][j++]);
+
+    setmode(pParam[i][j++]);
+    fval = (pParam[i][j++] - 0.7f)/0.28f;
+    setroomsize(fval);
+    //setroomsize(pParam[i][j++]);
+    setdamp(pParam[i][j++]);
+    setwidth(pParam[i][j++]);
+
+    fval = (pParam[i][j++]/3);
+    setwet(fval);
+
+    fval = (pParam[i][j++]/2);
+    setdry(fval);
+
+    return 0;
+}
+
+//ends
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/revmodel.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/revmodel.h
new file mode 100644
index 0000000..56c6c46
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/revmodel.h
@@ -0,0 +1,120 @@
+// Reverb model declaration
+//
+// Written by Jezar at Dreampoint, June 2000
+// http://www.dreampoint.co.uk
+// This code is public domain
+
+#ifndef _revmodel_
+#define _revmodel_
+
+#include "comb.h"
+#include "allpass.h"
+#include "tuning.h"
+
+#define MAX_VERB_ID_NUMBER 10 // fixed verb id number
+
+class revmodel
+{
+public:
+    revmodel();
+    ~revmodel();
+    void mute();
+    void processmix(float *inputL, float *inputR, float *outputL, float *outputR, long numsamples, int skip);
+    void processreplace(float *inputL, float *inputR, float *outputL, float *outputR, long numsamples, int skip);
+    void processMono(float* inputL, float* outputL, long numsamples, int skip);
+    void setroomsize(float value);
+    float getroomsize();
+    void setdamp(float value);
+    float getdamp();
+    void setwet(float value);
+    float getwet();
+    void setdry(float value);
+    float getdry();
+    void setwidth(float value);
+    float getwidth();
+    void setmode(float value);
+    float getmode();
+    int setverbID(int iID);
+private:
+    void update();
+    int mallocBuffers();
+private:
+    float gain;
+    float roomsize,roomsize1;
+    float damp,damp1;
+    float wet,wet1,wet2;
+    float dry;
+    float width;
+    float mode;
+
+    // The following are all declared inline
+    // to remove the need for dynamic allocation
+    // with its subsequent error-checking messiness
+
+    // Comb filters
+    comb combL[numcombs];
+    comb combR[numcombs];
+
+    // Allpass filters
+    allpass allpassL[numallpasses];
+    allpass allpassR[numallpasses];
+
+    //
Buffers for the combs + //float bufcombL1[combtuningL1]; + //float bufcombR1[combtuningR1]; + //float bufcombL2[combtuningL2]; + //float bufcombR2[combtuningR2]; + //float bufcombL3[combtuningL3]; + //float bufcombR3[combtuningR3]; + //float bufcombL4[combtuningL4]; + //float bufcombR4[combtuningR4]; + //float bufcombL5[combtuningL5]; + //float bufcombR5[combtuningR5]; + //float bufcombL6[combtuningL6]; + //float bufcombR6[combtuningR6]; + //float bufcombL7[combtuningL7]; + //float bufcombR7[combtuningR7]; + //float bufcombL8[combtuningL8]; + //float bufcombR8[combtuningR8]; + + //// Buffers for the allpasses + //float bufallpassL1[allpasstuningL1]; + //float bufallpassR1[allpasstuningR1]; + //float bufallpassL2[allpasstuningL2]; + //float bufallpassR2[allpasstuningR2]; + //float bufallpassL3[allpasstuningL3]; + //float bufallpassR3[allpasstuningR3]; + //float bufallpassL4[allpasstuningL4]; + //float bufallpassR4[allpasstuningR4]; + + float* bufcombL1; + float* bufcombR1; + float* bufcombL2; + float* bufcombR2; + float* bufcombL3; + float* bufcombR3; + float* bufcombL4; + float* bufcombR4; + float* bufcombL5; + float* bufcombR5; + float* bufcombL6; + float* bufcombR6; + float* bufcombL7; + float* bufcombR7; + float* bufcombL8; + float* bufcombR8; + + // Buffers for the all passes + float* bufallpassL1; + float* bufallpassR1; + float* bufallpassL2; + float* bufallpassR2; + float* bufallpassL3; + float* bufallpassR3; + float* bufallpassL4; + float* bufallpassR4; +}; + +#endif//_revmodel_ + +//ends diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/tuning.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/tuning.h new file mode 100644 index 0000000..e8a4cc9 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/reverb/src/verb/tuning.h @@ -0,0 +1,62 @@ +// Reverb model tuning values +// +// Written by Jezar at Dreampoint, June 2000 +// http://www.dreampoint.co.uk +// This code is public domain + +#ifndef _tuning_ +#define _tuning_ +#include "AudioEffectsConf.h" + +const int numcombs = 8; +const int numallpasses = 4; +const float muted = 0; +const float fixedgain = 0.015f; +const float scalewet = 3; +const float scaledry = 2; +const float scaledamp = 0.4f; +const float scaleroom = 0.28f; +const float offsetroom = 0.7f; +const float initialroom = 0.5f; +const float initialdamp = 0.5f; +const float initialwet = 1/scalewet; +const float initialdry = 0; +const float initialwidth = 1; +const float initialmode = 0; +const float freezemode = 0.5f; +const int stereospread = 23; + +// These values assume 44.1KHz sample rate +// they will probably be OK for 48KHz sample rate +// but would need scaling for 96KHz (or other) sample rates. +// The values were obtained by listening tests. 
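+//
+// A minimal sketch of such a rescale (scale_tuning() is a hypothetical
+// helper, not part of this library), assuming the delay lengths scale
+// linearly with the sample rate:
+//
+//   static inline int scale_tuning(int samples_at_44k1, float fs)
+//   {
+//       return (int)(samples_at_44k1 * (fs / 44100.0f) + 0.5f);
+//   }
+//
+//   e.g. combtuningL1 at 96 kHz: scale_tuning(1116, 96000.0f) == 2429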
+const int combtuningL1 = 1116;
+const int combtuningR1 = 1116+stereospread;
+const int combtuningL2 = 1188;
+const int combtuningR2 = 1188+stereospread;
+const int combtuningL3 = 1277;
+const int combtuningR3 = 1277+stereospread;
+const int combtuningL4 = 1356;
+const int combtuningR4 = 1356+stereospread;
+const int combtuningL5 = 1422;
+const int combtuningR5 = 1422+stereospread;
+const int combtuningL6 = 1491;
+const int combtuningR6 = 1491+stereospread;
+const int combtuningL7 = 1557;
+const int combtuningR7 = 1557+stereospread;
+const int combtuningL8 = 1617;
+const int combtuningR8 = 1617+stereospread;
+const int allpasstuningL1 = 556;
+const int allpasstuningR1 = 556+stereospread;
+const int allpasstuningL2 = 441;
+const int allpasstuningR2 = 441+stereospread;
+const int allpasstuningL3 = 341;
+const int allpasstuningR3 = 341+stereospread;
+const int allpasstuningL4 = 225;
+const int allpasstuningR4 = 225+stereospread;
+
+#endif//_tuning_
+
+//ends
+
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/CMakeLists.txt
new file mode 100644
index 0000000..34490cf
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/CMakeLists.txt
@@ -0,0 +1,13 @@
+#cmake_minimum_required(VERSION 2.8)
+#project(smule_eq)
+#set(LIBRARY_OUTPUT_PATH ${PROJECT_SOURCE_DIR}/lib)
+
+include_directories(./ inc)
+include_directories(src/all_plat src/audio_effect src/biquad
+        src/buffer src/damper src/delay src/delayi src/envelope_follower
+        src/equalizer src/reverb src/simple_delay_effect src/simple_reverb_effect)
+
+file(GLOB_RECURSE SAUDIO_EFFECTS_SRC_FILES src/*cpp)
+
+add_library(saudio_effects ${SAUDIO_EFFECTS_SRC_FILES})
+#set_target_properties(saudio_effects PROPERTIES CXX_VISIBILITY_PRESET hidden)
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/build_anrdroid.sh b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/build_anrdroid.sh
new file mode 100755
index 0000000..2abd1de
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/build_anrdroid.sh
@@ -0,0 +1,65 @@
+#!/usr/bin/env bash
+
+# @Time    : 2019-06-18 17:50
+# @Author  : AlanWang
+# @FileName: build_android.sh
+
+# MY_NDK and MY_CMAKE must be changed to your own NDK and CMake install paths
+MY_NDK="/Users/wangjianjun/AndroidDev/sdk/ndk-bundle"
+MY_CMAKE="/Users/wangjianjun/AndroidDev/sdk/cmake/3.6.4111459/bin/cmake"
+MY_NDK="/Users/yangjianli/Library/Android/sdk/ndk-bundle"
+MY_CMAKE="/Users/yangjianli/Library/Android/sdk/cmake/3.6.4111459/bin/cmake"
+if [ -z "$MY_NDK" ]; then
+    echo "Please set MY_NDK to the Android NDK folder"
+    exit 1
+fi
+
+if [ -z "$MY_CMAKE" ]; then
+    echo "Please set MY_CMAKE to the Android CMake folder"
+    exit 1
+fi
+
+OUTPUT_LIBS="./build/libs/android"
+ANDROID_NATIVE_API_LEVEL="android-16"
+
+# arme_abis=(armeabi armeabi-v7a arm64-v8a x86 x86_64 mips mips64)
+arme_abis=(armeabi-v7a arm64-v8a x86 x86_64)
+
+function build_with_armeabi() {
+    ARME_ABI=$1
+    echo ${ARME_ABI}
+
+    BUILD_DIR="./build/android/${ARME_ABI}"
+    PRE_EXE_DIR=$(pwd)
+    echo ${PRE_EXE_DIR}
+
+    ${MY_CMAKE} \
+        -H"./" \
+        -B"${BUILD_DIR}" \
+        -DANDROID_ABI="${ARME_ABI}" \
+        -DANDROID_NDK="${MY_NDK}" \
+        -DCMAKE_LIBRARY_OUTPUT_DIRECTORY="./build/android/libs/${ARME_ABI}" \
+        -DCMAKE_BUILD_TYPE="Release" \
+        -DCMAKE_TOOLCHAIN_FILE="${MY_NDK}/build/cmake/android.toolchain.cmake" \
+        -DANDROID_NATIVE_API_LEVEL=${ANDROID_NATIVE_API_LEVEL} \
+        -DANDROID_TOOLCHAIN="clang" \
+        -DCMAKE_C_FLAGS="-fpic -fexceptions -frtti -Wno-narrowing" \
+        -DCMAKE_CXX_FLAGS="-fpic -fexceptions -frtti -Wno-narrowing" \
+        -DANDROID_STL="c++_static" \
+
+    cd ${BUILD_DIR}
+    make
+    make install
+
+    cd ${PRE_EXE_DIR}
+    mkdir -p ${OUTPUT_LIBS}/${ARME_ABI}/
+    mv ${PRE_EXE_DIR}/lib/* ${OUTPUT_LIBS}/${ARME_ABI}/
+    rm -r ./build/android
+    rm -r ${PRE_EXE_DIR}/lib
+}
+
+for i in ${arme_abis[@]}; do
+    build_with_armeabi $i
+done
+
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/inc/SAudioEffectsApi.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/inc/SAudioEffectsApi.h
new file mode 100644
index 0000000..9df2389
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/inc/SAudioEffectsApi.h
@@ -0,0 +1,63 @@
+//
+// Created by yangjianli on 2019-11-21.
+//
+
+#ifndef SMULE_EQ_SAUDIOEFFECTSAPI_H
+#define SMULE_EQ_SAUDIOEFFECTSAPI_H
+
+// Public interface of the audio-effects class.
+// Stereo input is downmixed and processed as mono internally.
+#include "AudioEffectsDef.h"
+
+#define ERROR_CODE_SUCCESS 0
+#define ERROR_CODE_NO_MEMORY -1
+#define ERROR_CODE_EFFECT_ERROR -2 // effect instance is NULL
+
+#define STEREO 2
+#define MONO 1
+
+class Equalizer;
+class SimpleDelayEffect;
+class SimpleReverbEffect;
+
+class SAudioEffectsApi {
+public:
+    SAudioEffectsApi();
+    ~SAudioEffectsApi();
+
+public:
+    int init(int sample_rate, int channel);
+    int set_audio_effect(AE_PARAMS* param);
+    void reset();
+
+    // The output is always stereo, so mind the size of the output buffer.
+    // number_of_samples is the length of the given buffer.
+    int process(float* input, float* output, int number_of_samples);
+    int get_latency();
+    void uninit();
+
+private:
+    int allocate(int sample_rate, int channel);
+    void update();
+
+private:
+    Equalizer * m_eq;
+    SimpleDelayEffect * m_delay;
+    SimpleReverbEffect * m_reverb;
+
+private:
+    // scratch buffer
+    float* m_tmp_buf;
+    int m_tmp_buf_len;
+
+    int m_sample_rate;
+    int m_channel;
+
+    bool m_need_eq;
+    bool m_need_delay;
+    bool m_need_reverb;
+};
+
+#endif //SMULE_EQ_SAUDIOEFFECTSAPI_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/inc/SAudioEffectsConf.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/inc/SAudioEffectsConf.h
new file mode 100644
index 0000000..2f47b15
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/inc/SAudioEffectsConf.h
@@ -0,0 +1,8 @@
+//
+// Created by yangjianli on 2020/10/29.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_SAUDIOEFFECTSCONF_H
+#define AUDIO_EFFECTS_LIB_SAUDIOEFFECTSCONF_H
+#include "AudioEffectsConf.h"
+#endif //AUDIO_EFFECTS_LIB_SAUDIOEFFECTSCONF_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/SAudioEffectsApi.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/SAudioEffectsApi.cpp
new file mode 100644
index 0000000..bfec714
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/SAudioEffectsApi.cpp
@@ -0,0 +1,228 @@
+//
+// Created by yangjianli on 2019-11-21.
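+//
+// Signal flow in process() below: stereo input is downmixed to mono,
+// then run through EQ -> delay -> reverb in series; the reverb stage
+// uses a stereo-sized scratch buffer even for mono data, and the result
+// is re-expanded to interleaved stereo at the end.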
+//
+#include "SAudioEffectsApi.h"
+
+#include "Equalizer.h"
+#include "SimpleDelayEffect.h"
+#include "SimpleReverbEffect.h"
+
+SAudioEffectsApi::SAudioEffectsApi()
+{
+    m_eq = NULL;
+    m_delay = NULL;
+    m_reverb = NULL;
+    m_tmp_buf = NULL;
+    m_tmp_buf_len = 0;
+
+    m_need_eq = false;
+    m_need_delay = false;
+    m_need_reverb = false;
+}
+
+SAudioEffectsApi::~SAudioEffectsApi() {}
+
+int SAudioEffectsApi::init(int sample_rate, int channel)
+{
+    m_sample_rate = sample_rate;
+    m_channel = channel;
+    m_tmp_buf_len = 0;
+
+    m_need_eq = false;
+    m_need_delay = false;
+    m_need_reverb = false;
+    int nRet = allocate(sample_rate, channel);
+    if (ERROR_CODE_SUCCESS != nRet)
+    {
+        uninit();
+        return nRet;
+    }
+    return ERROR_CODE_SUCCESS;
+}
+
+// Allocate the effect instances
+int SAudioEffectsApi::allocate(int sample_rate, int channel)
+{
+    m_eq = new(std::nothrow) Equalizer(sample_rate);
+    if (NULL == m_eq)
+    {
+        return ERROR_CODE_NO_MEMORY;
+    }
+    m_delay = new(std::nothrow) SimpleDelayEffect(sample_rate);
+    if (NULL == m_delay)
+    {
+        return ERROR_CODE_NO_MEMORY;
+    }
+
+    // The reverb gets no buffer at init time; process() sizes it from the input
+    m_reverb = new(std::nothrow) SimpleReverbEffect(MONO, 0);
+    if (NULL == m_reverb)
+    {
+        return ERROR_CODE_NO_MEMORY;
+    }
+    return ERROR_CODE_SUCCESS;
+}
+
+void SAudioEffectsApi::uninit()
+{
+    if(NULL != m_eq)
+    {
+        delete m_eq;
+        m_eq = NULL;
+    }
+
+    if(NULL != m_delay)
+    {
+        delete m_delay;
+        m_delay = NULL;
+    }
+
+    if(NULL != m_reverb)
+    {
+        delete m_reverb;
+        m_reverb = NULL;
+    }
+
+    if(NULL != m_tmp_buf)
+    {
+        delete[] m_tmp_buf;
+        m_tmp_buf = NULL;
+    }
+}
+
+int SAudioEffectsApi::set_audio_effect(AE_PARAMS *param)
+{
+    m_need_eq = false;
+    m_need_delay = false;
+    m_need_reverb = false;
+    if(NULL == param)
+    {
+        return ERROR_CODE_SUCCESS;
+    }
+    AE_PARAMS_SAE* params = (AE_PARAMS_SAE*) param;
+    for(int i = 0; i < params->params_list.size(); i++)
+    {
+        AE_PARAMS_SAE_CONTENT tp = params->params_list[i];
+        if(SAE_CLASS_EQ == tp.class_name)
+        {
+            m_need_eq = true;
+            m_eq->set_parameter_value(tp.function_name, tp.idx, tp.f_value);
+        }else if(SAE_CLASS_DELAY == tp.class_name)
+        {
+            m_need_delay = true;
+            m_delay->set_parameter_value(tp.function_name, tp.f_value);
+        }else if(SAE_CLASS_REVERB == tp.class_name)
+        {
+            m_need_reverb = true;
+            if(SAE_FUNC_IN_CH == tp.function_name || SAE_FUNC_OUT_CH == tp.function_name)
+            {
+                m_reverb->set_parameter_value(tp.function_name, tp.b_value);
+            }else
+            {
+                m_reverb->set_parameter_value(tp.function_name, tp.f_value);
+            }
+        }
+    }
+    return ERROR_CODE_SUCCESS;
+}
+
+void SAudioEffectsApi::reset()
+{
+    m_eq->reset();
+    m_delay->reset();
+    m_reverb->reset();
+}
+
+int SAudioEffectsApi::process(float *input, float *output, int number_of_samples)
+{
+    if(NULL == m_eq || NULL == m_delay || NULL == m_reverb || 0 == m_channel)
+    {
+        return ERROR_CODE_EFFECT_ERROR;
+    }
+
+    // Nothing to do
+    if(!m_need_eq && !m_need_delay && !m_need_reverb)
+    {
+        if(output != input)
+        {
+            memcpy(output, input, sizeof(float) * number_of_samples);
+        }
+        return ERROR_CODE_SUCCESS;
+    }
+
+    number_of_samples /= m_channel; // keep the per-channel convention consistent with the caller
+    bool need_trans = false;
+
+    // Stereo: downmix to mono in place
+    if(STEREO == m_channel)
+    {
+        need_trans = true;
+        for(int i = 0; i < number_of_samples; i++)
+        {
+            input[i] = 0.5f * (input[2 * i] + input[2 * i + 1]);
+        }
+    }
+
+    if(m_need_eq)
+    {
+        m_eq->process_internal(input, output, number_of_samples);
+    }
+    else if(output != input)
+    {
+        // no EQ stage: pass the dry signal through so the later stages
+        // never read uninitialized output samples
+        memcpy(output, input, sizeof(float) * number_of_samples);
+    }
+    if(m_need_delay)
+    {
+        m_delay->process_internal(output, output, number_of_samples);
+    }
+    if(m_need_reverb)
+    {
+        if(MONO == m_channel)
+        {
+            // Mono input: the reverb needs a stereo-sized scratch buffer
+            // internally; the result is put back into the mono buffer afterwards
+            if(m_tmp_buf_len != number_of_samples * STEREO)
+            {
+                if(NULL != m_tmp_buf)
+                {
+                    delete [] m_tmp_buf;
+                    m_tmp_buf = NULL;
+                }
+                m_tmp_buf = new (std::nothrow) float[number_of_samples * STEREO];
+                if(NULL == m_tmp_buf)
+                {
+                    return ERROR_CODE_NO_MEMORY;
+                }
+                m_tmp_buf_len = number_of_samples * STEREO;
+            }
+            m_reverb->process_internal(output, m_tmp_buf, number_of_samples);
+            for(int i = 0; i < number_of_samples; i++)
+            {
+                output[i] = 0.5f * (m_tmp_buf[2 * i] + m_tmp_buf[2 * i + 1]);
+            }
+        }else
+        {
+            m_reverb->process_internal(output, output, number_of_samples);
+        }
+        need_trans = false;
+    }
+
+    if(need_trans)
+    {
+        need_trans = false;
+        for(int i = number_of_samples - 1; i >= 0; i--)
+        {
+            output[2*i] = output[i];
+            output[2*i+1] = output[i];
+        }
+    }
+    return ERROR_CODE_SUCCESS;
+}
+
+int SAudioEffectsApi::get_latency()
+{
+    return 0;
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/all_plat/Allplat.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/all_plat/Allplat.cpp
new file mode 100644
index 0000000..1c364e4
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/all_plat/Allplat.cpp
@@ -0,0 +1,124 @@
+
+/************************************************************
+* author: yangjiang                                         *
+*************************************************************/
+
+//+ ----------------------------------------------------+
+//+                     _oo0oo_                          +
+//+                    o8888888o                         +
+//+                    88" . "88                         +
+//+                    (| -_- |)                         +
+//+                    0\  =  /0                         +
+//+                  ___/`---'\___                       +
+//+                .' \\|     |// '.                     +
+//+               / \\|||  :  |||// \                    +
+//+              / _||||| -:- |||||- \                   +
+//+             |   | \\\  -  /// |   |                  +
+//+             | \_|  ''\---/''  |_/ |                  +
+//+             \  .-\__  '-'  ___/-. /                  +
+//+           ___'. .'  /--.--\  `. .'___                +
+//+        ."" '<  `.___\_<|>_/___.' >' "".              +
+//+       | | :  `- \`.;`\ _ /`;.`/ - ` : | |            +
+//+       \  \ `_.   \_ __\ /__ _/   .-` /  /            +
+//+   =====`-.____`.___ \_____/___.-`___.-'=====         +
+//+                     `=---='                          +
+//+                                                      +
+//+   ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~        +
+//+                                                      +
+//+           佛祖保佑    永无BUG                         +
+//+ ----------------------------------------------------+
+
+#include "Allplat.h"
+#include <string.h>
+
+Allplat::Allplat()
+{
+    m_cache = nullptr;
+}
+
+Allplat::~Allplat()
+{
+    allplat_destroy();
+}
+
+void Allplat::allplat_create(int len, float feedback)
+{
+    m_cache = new float[len];
+    if(len)
+    {
+        memset(m_cache, 0, sizeof(float) * len);
+    }
+    m_current_ptr = m_cache;
+    m_end_ptr = m_cache + len;
+    m_len = len;
+    m_feedback = feedback;
+}
+
+void Allplat::allplat_reset()
+{
+    if(m_len)
+    {
+        memset(m_cache, 0, sizeof(float) * m_len);
+    }
+
+    m_current_ptr = m_cache;
+}
+
+void Allplat::allplat_process(float * data, int len)
+{
+    if(len == 0)
+    {
+        return ;
+    }
+
+    for(int i = 0; i < len; ++i)
+    {
+        data[i] = allplat_tick(data[i]);
+    }
+}
+
+void Allplat::allplat_tap(float * data, int len, int tap, float wet)
+{
+    tap = std::min(tap, m_len - 1);
+    float * ptr = m_current_ptr - tap - len;
+    while(ptr < m_cache)
+    {
+        ptr += m_len;
+    }
+
+    for(int i = 0; i < len; ++i)
+    {
+        data[i] = data[i] + *ptr * wet;
+
+        ++ptr;
+        if(ptr >= m_end_ptr)
+        {
+            ptr = m_cache;
+        }
+    }
+}
+
+float Allplat::allplat_tick(float in)
+{
+    in = in - m_feedback * *m_current_ptr;
+    float out = *m_current_ptr + m_feedback * in;
+
+    *m_current_ptr = in;
+    ++m_current_ptr;
+    if(m_current_ptr >= m_end_ptr)
+    {
+        m_current_ptr = m_cache;
+    }
+
+    return out;
+}
+
+void Allplat::allplat_destroy()
+{
+    if(m_cache)
+    {
+        delete [] m_cache;
+        m_cache = nullptr;
+    }
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/all_plat/Allplat.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/all_plat/Allplat.h
new file mode 100644
index 0000000..bda8596
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/all_plat/Allplat.h
@@ -0,0 +1,60 @@
+
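+// allplat_tick() in Allplat.cpp realizes the classic delay-line allpass
+//   w[n] = x[n] - f * w[n-D],   y[n] = w[n-D] + f * w[n]
+// i.e. H(z) = (f + z^-D) / (1 + f * z^-D): unit magnitude at every
+// frequency, only the phase is smeared.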
+/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_ALLPLAT_H__ +#define __SMULE_ALLPLAT_H__ + +//实现一个简单的全通滤波器,参考了freeverb3代码 +#include "SAudioEffectsConf.h" + +class Allplat +{ +public: + Allplat(); + ~Allplat(); + +public: + void allplat_create(int len, float feedback); + void allplat_reset(); + void allplat_process(float * data, int len); + void allplat_tap(float * data, int len, int tap, float wet); + float allplat_tick(float in); + void allplat_destroy(); + +private: + float * m_cache;//0 + float * m_current_ptr;//4 + float * m_end_ptr;//8 + int m_len;//12 + float m_feedback;//16 +}; + +#endif /* __SMULE_ALLPLAT_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/audio_effect/AudioEffect.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/audio_effect/AudioEffect.cpp new file mode 100644 index 0000000..cce72be --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/audio_effect/AudioEffect.cpp @@ -0,0 +1,60 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "AudioEffect.h" + +//void AudioEffect::reset() +//{ +// +//} +// +//void AudioEffect::set_by_pass(bool bypass) +//{ +// m_bypass = bypass; +//} +// +//int AudioEffect::get_latency_frames() +//{ +// return 0; +//} +// +//void AudioEffect::set_parameter_value(const std::string & key, int idx, float value) +//{ +// +//} +// +//void AudioEffect::set_parameter_value(const std::string & key, bool value) +//{ +// if(key == "Bypass") +// { +// m_bypass = value; +// } +//} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/audio_effect/AudioEffect.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/audio_effect/AudioEffect.h new file mode 100644 index 0000000..001f866 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/audio_effect/AudioEffect.h @@ -0,0 +1,80 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_AUDIOEFFECT_H__ +#define __SMULE_AUDIOEFFECT_H__ + +#include +#include +#include "SAudioEffectsConf.h" + +class Parameter; + +class MidiContext; +class FXConfigInfo; + +//效果器的基类 +class AudioEffect +{ +public: + AudioEffect(unsigned int in_channels, unsigned int out_channels) {m_in_channels = in_channels;m_out_channels=out_channels;}; + virtual ~AudioEffect() {}; + +public: + //重置缓存 + virtual void reset() {}; + virtual void set_by_pass(bool bypass) {}; + virtual void input_channels() {}; + virtual void output_channels() {}; + //返回延迟多少点 + virtual int get_latency_frames() {}; + virtual void set_parameter(const std::shared_ptr &) {}; + virtual void set_render_context(std::shared_ptr) {}; + virtual void set_fX_config(std::shared_ptr) {}; + virtual void process_internal(const float *input, float *output, unsigned int len) {}; + + //下面为设置参数模块 + virtual void set_parameter_value(const std::string &key, float value) {}; + virtual void set_parameter_value(const std::string &key, int idx, float value) {}; + virtual void set_parameter_value(const std::string &, const std::string &, float) {}; + virtual void set_parameter_value(const std::string &, const std::string &, bool) {}; + virtual void set_parameter_value(const std::string &, std::string) {}; + virtual void set_parameter_value(const std::string &key, bool value) {}; + +protected: + bool m_bypass;//4 + int m_in_channels;//8 + int m_out_channels;//12 + int m_16[12];//16 + int m_64;//64 +}; + +#endif /* __SMULE_AUDIOEFFECT_H__ */ diff --git 
a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/biquad/Biquad.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/biquad/Biquad.cpp new file mode 100644 index 0000000..64d481a --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/biquad/Biquad.cpp @@ -0,0 +1,334 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "Biquad.h" +#include +#include + +Biquad::Biquad() +{ + m_param = nullptr; + m_type = BIQUAD_LOP; + m_channels = 0; + m_fc = 0; + m_Q = 0; + m_gain = 0; + m_fs = 0; +} + +Biquad::~Biquad() +{ + biquad_destroy(); +} + +void Biquad::biquad_create_lop(float fc, float Q, float fs, int channels) +{ + biquad_create(BIQUAD_LOP, fc, Q, 0, fs, channels); +} + +void Biquad::biquad_create_hip(float fc, float Q, float fs, int channels) +{ + biquad_create(BIQUAD_HIP, fc, Q, 0, fs, channels); +} + +void Biquad::biquad_create_bp(float fc, float Q, float fs, int channels) +{ + biquad_create(BIQUAD_BP, fc, Q, 0, fs, channels); +} + +void Biquad::biquad_create_notch(float fc, float Q, float fs, int channels) +{ + biquad_create(BIQUAD_NOTCH, fc, Q, 0, fs, channels); +} + +void Biquad::biquad_create_peak(float fc, float Q, float db, float fs, int channels) +{ + biquad_create(BIQUAD_PEAK, fc, Q, 0, fs, channels); +} + +void Biquad::biquad_create_loshelf(float fc, float Q, float db, float fs, int channels) +{ + biquad_create(BIQUAD_LOSHELF, fc, Q, 0, fs, channels); +} + +void Biquad::biquad_create_hishelf(float fc, float Q, float db, float fs, int channels) +{ + biquad_create(BIQUAD_HISHELF, fc, Q, 0, fs, channels); +} + +void Biquad::biquad_create(int type, float fc, float Q, float db, float fs, int channels) +{ + if(type > BIQUAD_MAX) + { + return; + } + + m_param = new BiquadParam[channels]; + m_type = type; + m_channels = channels; + m_fc = fc; + m_Q = Q; + m_gain = db; + m_fs = fs; + + biquad_setcoefs(type, fc, Q, db); +} + +int Biquad::biquad_setFreq(float fc) +{ + return biquad_setcoefs(m_type, fc, m_Q, m_gain); +} + +int Biquad::biquad_setGain(float db) +{ + return biquad_setcoefs(m_type, m_fc, m_Q, db); +} + +int Biquad::biquad_setQ(float Q) +{ + return biquad_setcoefs(m_type, m_fc, Q, m_gain); +} + +int Biquad::biquad_setcoefs(int type, float fc, float Q, float db) +{ + int err_code = 0; + + //检查有没有初始化 + if(m_param == nullptr || m_fs == 0) + { + return 1; + } + + //检查参数合法性 + Q = std::max(Q, 0.01f); + fc = std::max(0.0f, std::min(fc, m_fs / 2)); + + m_type = type; + m_fc = fc; + m_Q = Q; + m_gain = db; + + float w0 = (m_fc / m_fs) * 2 * M_PI; + float sin0 = sin(w0); + float cos0 = cos(w0); + float alpha = sin0 / (2 * m_Q); + float A = pow(10, m_gain / 40); + + float a0, a1, a2, b0, b1, b2; + + switch(m_type) + { + case 
BIQUAD_LOP: + b0 = (1 - cos0) / 2; + b1 = 1 - cos0; + b2 = (1 - cos0) / 2; + a0 = 1 + alpha; + a1 = -2 * cos0; + a2 = 1 - alpha; + break; + case BIQUAD_HIP: + b0 = (1 + cos0) / 2; + b1 = -(1 + cos0); + b2 = (1 + cos0) / 2; + a0 = 1 + alpha; + a1 = -2 * cos0; + a2 = 1 - alpha; + break; + case BIQUAD_BP: + b0 = alpha; + b1 = 0; + b2 = -alpha; + a0 = 1 + alpha; + a1 = -2 * cos0; + a2 = 1 - alpha; + break; + case BIQUAD_NOTCH: + b0 = 1; + b1 = -2 * cos0; + b2 = 1; + a0 = 1 + alpha; + a1 = -2 * cos0; + a2 = 1 - alpha; + break; + case BIQUAD_PEAK: + b0 = 1 + alpha * A; + b1 = -2 * cos0; + b2 = 1 - alpha * A; + a0 = 1 + alpha / A; + a1 = -2 * cos0; + a2 = 1 - alpha / A; + break; + case BIQUAD_LOSHELF: + b0 = A * ((A + 1) - (A - 1) * cos0 + 2 * sqrt(A) * alpha); + b1 = 2 * A * ((A - 1) - (A + 1) * cos0); + b2 = A * ((A + 1) - (A - 1) * cos0 - 2 * sqrt(A) * alpha); + a0 = (A + 1) + (A - 1) * cos0 + 2 * sqrt(A) * alpha; + a1 = -2 * ((A - 1) + (A + 1) * cos0); + a2 = (A + 1) + (A - 1) * cos0 - 2 * sqrt(A) * alpha; + break; + case BIQUAD_HISHELF: + b0 = A * ((A + 1) + (A - 1) * cos0 + 2 * sqrt(A) * alpha); + b1 = -2 * A * ((A - 1) + (A + 1) * cos0); + b2 = A * ((A + 1) + (A - 1) * cos0 - 2 * sqrt(A) * alpha); + a0 = (A + 1) - (A - 1) * cos0 + 2 * sqrt(A) * alpha; + a1 = 2 * ((A - 1) - (A + 1) * cos0); + a2 = (A + 1) - (A - 1) * cos0 - 2 * sqrt(A) * alpha; + break; + default: + b0 = 0; + b1 = 0; + b2 = 0; + a0 = 1; + a1 = 0; + a2 = 0; + err_code = 1; + } + + //防止出现除 0 错误 + if(a0 == 0) + { + a0 = 1e-20; + } + + //每个通道需要一组参数 + if(m_channels) + { + b0 /= a0; + b1 /= a0; + b2 /= a0; + a1 /= a0; + a2 /= a0; + a0 = 1; + + for(int i = 0; i < m_channels; ++i) + { + m_param[i].b0 = b0; + m_param[i].b1 = b1; + m_param[i].b2 = b2; + m_param[i].a1 = a1; + m_param[i].a2 = a2; + } + } + + return err_code; +} + +void Biquad::biquad_reset() +{ + if(m_param && m_channels) + { + //将保存的延迟参数进行清空 + for(int i = 0; i < m_channels; ++i) + { + m_param[i].x1 = 0; + m_param[i].x2 = 0; + m_param[i].y1 = 0; + m_param[i].y2 = 0; + } + } +} + +void Biquad::biquad_process1(float * data, int len) +{ + if(m_channels == 0) + { + return ; + } + + for(int i = 0; i < m_channels; ++i) + { + float b0 = m_param[i].b0; + float b1 = m_param[i].b1; + float b2 = m_param[i].b2; + float a1 = m_param[i].a1; + float a2 = m_param[i].a2; + float x1 = m_param[i].x1; + float x2 = m_param[i].x2; + float y1 = m_param[i].y1; + float y2 = m_param[i].y2; + + for(int j = i; j < len; j += m_channels) + { + float x = data[j]; + data[j] = b0 * x + b1 * x1 + b2 * x2 - a1 * y1 - a2 * y2; + + x2 = x1; + x1 = x; + y2 = y1; + y1 = data[j]; + } + + m_param[i].x1 = x1; + m_param[i].x2 = x2; + m_param[i].y1 = y1; + m_param[i].y2 = y2; + } +} + +void Biquad::biquad_process2(float * data, int len) +{ + if(m_channels == 0) + { + return ; + } + + for(int i = 0; i < m_channels; ++i) + { + float b0 = m_param[i].b0; + float b1 = m_param[i].b1; + float b2 = m_param[i].b2; + float a1 = m_param[i].a1; + float a2 = m_param[i].a2; + float cache1 = m_param[i].x1; + float cache2 = m_param[i].x2; + + for(int j = i; j < len; j += m_channels) + { + float cache = data[j] - a1 * cache1 - a2 * cache2; + data[j] = b0 * cache + b1 * cache1 + b2 * cache2; + + cache2 = cache1; + cache1 = cache; + } + + m_param[i].x1 = cache1; + m_param[i].x2 = cache2; + } +} + +void Biquad::biquad_destroy() +{ + if(m_param) + { + delete [] m_param; + m_param = nullptr; + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/biquad/Biquad.h 
b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/biquad/Biquad.h new file mode 100644 index 0000000..7b51975 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/biquad/Biquad.h @@ -0,0 +1,123 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_BIQUAD_H__ +#define __SMULE_BIQUAD_H__ +#include "SAudioEffectsConf.h" +//这里实际上按照 RBJ 的 cookbook 进行设计的双二阶滤波器 + +//滤波器类型 +#define BIQUAD_LOP 0 +#define BIQUAD_HIP 1 +#define BIQUAD_BP 2 +#define BIQUAD_NOTCH 3 +#define BIQUAD_PEAK 4 +#define BIQUAD_LOSHELF 5 +#define BIQUAD_HISHELF 6 +#define BIQUAD_MAX BIQUAD_HISHELF + +typedef struct _BiquadParam +{ + float b0; + float b1; + float b2; + float a1; + float a2; + float x1; + float x2; + float y1; + float y2; + _BiquadParam() : b0(0), b1(0), b2(0), a1(0), a2(0), x1(0), x2(0), y1(0), y2(0) { } +}BiquadParam; + +class Biquad +{ +public: + Biquad(); + ~Biquad(); + +public: + //初始化低通滤波参数 + void biquad_create_lop(float fc, float Q, float fs, int channels); + //初始化高通滤波参数 + void biquad_create_hip(float fc, float Q, float fs, int channels); + //初始化带通滤波参数 + void biquad_create_bp(float fc, float Q, float fs, int channels); + //初始化陷波滤波参数 + void biquad_create_notch(float fc, float Q, float fs, int channels); + //初始化peak滤波参数 + void biquad_create_peak(float fc, float Q, float db, float fs, int channels); + //初始化低搁置滤波参数 + void biquad_create_loshelf(float fc, float Q, float db, float fs, int channels); + //初始化高搁置滤波参数 + void biquad_create_hishelf(float fc, float Q, float db, float fs, int channels); + //初始化函数 + void biquad_create(int type, float fc, float Q, float db, float fs, int channels); + + //设置中心频率或者截止频率 + int biquad_setFreq(float fc); + //设置增益 + int biquad_setGain(float db); + //设置Q值 + int biquad_setQ(float Q); + //设置参数 + int biquad_setcoefs(int type, float fc, float Q, float db); + + //重置函数 + void biquad_reset(); + + //按照直接一型进行运算,长度为一个声道的长度 + void biquad_process1(float * data, int len); + //按照直接二型进行运算,长度为一个声道的长度 + void biquad_process2(float * data, int len); + +private: + //销毁、释放内存 + void biquad_destroy(); + +private: + //运行参数 + BiquadParam * m_param;//0 + //滤波器类型 + int m_type;//4 + //声道数 + int m_channels;//8 + //截止频率或中心频率 + float m_fc;//12 + //Q值 + float m_Q;//16 + //增益 + float m_gain;//20 + //采样率 + float m_fs;//24 +}; + +#endif /* __SMULE_BIQUAD_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/buffer/Buffer.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/buffer/Buffer.h new file mode 100644 index 0000000..34b4322 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/buffer/Buffer.h @@ -0,0 +1,66 @@ + 
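+// The Buffer template below is a grow-only scratch buffer: ensure(len)
+// is meant to guarantee room for len more elements past the write index,
+// reallocating and copying the first m_write_idx elements when needed,
+// while ptr() returns the current write position.
+// FIXME: ensure() in Buffer.hpp never updates m_len after growing, so a
+// grown buffer keeps reallocating on every subsequent ensure() call.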
+/************************************************************
+* author: yangjiang *
+*************************************************************/
+
+//+ ----------------------------------------------------+
+//+ _oo0oo_ +
+//+ o8888888o +
+//+ 88" . "88 +
+//+ (| -_- |) +
+//+ 0\ = /0 +
+//+ ___/`---'\___ +
+//+ .' \\| |// '. +
+//+ / \\||| : |||// \ +
+//+ / _||||| -:- |||||- \ +
+//+ | | \\\ - /// | | +
+//+ | \_| ''\---/'' |_/ | +
+//+ \ .-\__ '-' ___/-. / +
+//+ ___'. .' /--.--\ `. .'___ +
+//+ ."" '< `.___\_<|>_/___.' >' "". +
+//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | +
+//+ \ \ `_. \_ __\ /__ _/ .-` / / +
+//+ =====`-.____`.___ \_____/___.-`___.-'===== +
+//+ `=---=' +
+//+ +
+//+ +
+//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +
+//+ +
+//+ 佛祖保佑 永无BUG +
+//+ ----------------------------------------------------+
+
+#ifndef __SMULE_BUFFER_H__
+#define __SMULE_BUFFER_H__
+#include "SAudioEffectsConf.h"
+
+namespace Smule
+{
+namespace Audio
+{
+
+//element type T; chsize scales the allocation per unit of len
+template <typename T, int chsize>
+class Buffer
+{
+public:
+    Buffer(unsigned int len);
+    ~Buffer();
+
+public:
+    void ensure(int len);
+    T * ptr();
+
+private:
+    //data pointer
+    std::shared_ptr<T> m_ptr;//0
+    //total length
+    int m_len;//8
+    //current write position
+    int m_write_idx;//12
+};
+
+}
+}
+
+#include "Buffer.hpp"
+
+#endif /* __SMULE_BUFFER_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/buffer/Buffer.hpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/buffer/Buffer.hpp
new file mode 100644
index 0000000..36c27c3
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/buffer/Buffer.hpp
@@ -0,0 +1,74 @@
+
+/************************************************************
+* author: yangjiang *
+*************************************************************/
+
+//+ ----------------------------------------------------+
+//+ _oo0oo_ +
+//+ o8888888o +
+//+ 88" . "88 +
+//+ (| -_- |) +
+//+ 0\ = /0 +
+//+ ___/`---'\___ +
+//+ .' \\| |// '. +
+//+ / \\||| : |||// \ +
+//+ / _||||| -:- |||||- \ +
+//+ | | \\\ - /// | | +
+//+ | \_| ''\---/'' |_/ | +
+//+ \ .-\__ '-' ___/-. / +
+//+ ___'. .' /--.--\ `. .'___ +
+//+ ."" '< `.___\_<|>_/___.' >' "". +
+//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | +
+//+ \ \ `_. \_ __\ /__ _/ .-` / / +
+//+ =====`-.____`.___ \_____/___.-`___.-'===== +
+//+ `=---=' +
+//+ +
+//+ +
+//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +
+//+ +
+//+ 佛祖保佑 永无BUG +
+//+ ----------------------------------------------------+
+
+#ifndef __SMULE_BUFFER_HPP__
+#define __SMULE_BUFFER_HPP__
+
+namespace Smule
+{
+namespace Audio
+{
+
+template <typename T, int chsize>
+Buffer<T, chsize>::Buffer(unsigned int len)
+    : m_ptr(new T[chsize * len], std::default_delete<T[]>())
+{
+    m_len = len;
+    m_write_idx = 0;
+}
+
+template <typename T, int chsize>
+Buffer<T, chsize>::~Buffer()
+{
+
+}
+
+template <typename T, int chsize>
+void Buffer<T, chsize>::ensure(int len)
+{
+    if(m_len - m_write_idx < len)
+    {
+        std::shared_ptr<T> ptr(new T[m_write_idx + chsize * len], std::default_delete<T[]>());
+        memcpy(ptr.get(), m_ptr.get(), sizeof(T) * m_write_idx);
+        m_ptr = ptr;
+    }
+}
+
+template <typename T, int chsize>
+T * Buffer<T, chsize>::ptr()
+{
+    return m_ptr.get() + m_write_idx;
+}
+
+}
+}
+
+#endif /* __SMULE_BUFFER_HPP__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/damper/Damper.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/damper/Damper.cpp
new file mode 100644
index 0000000..6260e83
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/damper/Damper.cpp
@@ -0,0 +1,85 @@
+
+/************************************************************
+* author: yangjiang *
+*************************************************************/
+
+//+ ----------------------------------------------------+
+//+ _oo0oo_ +
+//+ o8888888o +
+//+ 88" . "88 +
+//+ (| -_- |) +
+//+ 0\ = /0 +
+//+ ___/`---'\___ +
+//+ .' \\| |// '. +
+//+ / \\||| : |||// \ +
+//+ / _||||| -:- |||||- \ +
+//+ | | \\\ - /// | | +
+//+ | \_| ''\---/'' |_/ | +
+//+ \ .-\__ '-' ___/-. / +
+//+ ___'. .' /--.--\ `. .'___ +
+//+ ."" '< `.___\_<|>_/___.' >' "". +
+//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | +
+//+ \ \ `_. \_ __\ /__ _/ .-` / / +
+//+ =====`-.____`.___ \_____/___.-`___.-'===== +
+//+ `=---=' +
+//+ +
+//+ +
+//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +
+//+ +
+//+ 佛祖保佑 永无BUG +
+//+ ----------------------------------------------------+
+
+#include "Damper.h"
+
+Damper::Damper()
+{
+    m_coeff = 0;
+    m_y1 = 0;
+}
+
+Damper::~Damper()
+{
+    damper_destroy();
+}
+
+void Damper::damper_create(float coeff)
+{
+    m_coeff = coeff;
+    m_y1 = 0;
+}
+
+void Damper::damper_set(float coeff)
+{
+    m_coeff = coeff;
+}
+
+void Damper::damper_clear()
+{
+    m_y1 = 0;
+}
+
+void Damper::damper_process(float * data, int len)
+{
+    if(len == 0)
+    {
+        return ;
+    }
+
+    for(int i = 0; i < len; ++i)
+    {
+        data[i] = damper_tick(data[i]);
+    }
+}
+
+float Damper::damper_tick(float in)
+{
+    m_y1 = m_coeff * m_y1 + (1 - m_coeff) * in;
+
+    return m_y1;
+}
+
+void Damper::damper_destroy()
+{
+    m_coeff = 0;
+    m_y1 = 0;
+} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/damper/Damper.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/damper/Damper.h
new file mode 100644
index 0000000..07f621b
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/damper/Damper.h
@@ -0,0 +1,59 @@
+
+/************************************************************
+* author: yangjiang *
+*************************************************************/
+
+//+ ----------------------------------------------------+
+//+ _oo0oo_ +
+//+ o8888888o +
+//+ 88" . "88 +
+//+ (| -_- |) +
+//+ 0\ = /0 +
+//+ ___/`---'\___ +
+//+ .' \\| |// '.
+ +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_DAMPER_H__ +#define __SMULE_DAMPER_H__ + +//利用单极点来实现减震器,参考 freeverb3 中的 efilter +#include "SAudioEffectsConf.h" + +class Damper +{ +public: + Damper(); + ~Damper(); + +public: + void damper_create(float coeff); + void damper_set(float coeff); + void damper_clear(); + void damper_process(float * data, int len); + float damper_tick(float in); + void damper_destroy(); + +private: + //低通系数 + float m_coeff;//0 + //历史数据 + float m_y1;//4 +}; + +#endif /* __SMULE_DAMPER_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delay/Delay.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delay/Delay.cpp new file mode 100644 index 0000000..2f0b595 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delay/Delay.cpp @@ -0,0 +1,148 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
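Damper is a one-pole low-pass (exponential smoother): y[n] = coeff * y[n-1] + (1 - coeff) * x[n], so coefficients near 1 damp high frequencies harder. A sketch relating a desired cutoff to the coefficient; the exp mapping is the standard one-pole formula, not taken from this repo:

#include <cmath>

// Standard one-pole coefficient for cutoff fc (Hz) at sample rate fs.
float damper_coeff(float fc, float fs)
{
    return expf(-2.0f * 3.14159265f * fc / fs);
}

// Same recurrence as Damper::damper_tick.
float one_pole_tick(float coeff, float & y1, float x)
{
    y1 = coeff * y1 + (1 - coeff) * x;
    return y1;
}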
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "Delay.h" +#include + +Delay::Delay() +{ + m_start_ptr = nullptr; + m_read_ptr = nullptr; + m_write_ptr = nullptr; + m_end_ptr = nullptr; +} + +Delay::~Delay() +{ + delay_destroy(); +} + +void Delay::delay_create(float delay_time, float fs, float wet, float dry, float feedback) +{ + int frames = (int)(delay_time * fs * 0.001); + if(frames <= 0) + { + frames = 1; + delay_time = 1 / (fs * 0.001); + } + + m_delay_len = frames + 1; + m_start_ptr = new float[m_delay_len]; + memset(m_start_ptr, 0, sizeof(float) * m_delay_len); + + m_read_ptr = m_start_ptr; + m_write_ptr = m_start_ptr + frames; + m_end_ptr = m_start_ptr + m_delay_len; + + m_fs = fs; + m_delay_time = delay_time; + m_delay_frame = frames; + + delay_set_fbk(feedback); + delay_set_levels(wet, dry); +} + +void Delay::delay_set_delframes(int frames) +{ + m_delay_frame = std::max(1, std::min(frames, m_delay_len - 1)); + m_delay_time = m_delay_frame / (m_fs * 0.001); + + //TODO 感觉这里有问题 + m_write_ptr = m_read_ptr + m_delay_frame; + if(m_write_ptr >= m_end_ptr) + { + m_write_ptr = m_read_ptr; + } +} + +void Delay::delay_set_deltime(float time) +{ + int frames = (int)(time * m_fs * 0.001); + delay_set_delframes(frames); +} + +void Delay::delay_set_fbk(float feedback) +{ + m_feedback = feedback; +} + +void Delay::delay_set_levels(float wet, float dry) +{ + m_wet = wet; + m_dry = dry; +} + +float Delay::delay_get_deltime() +{ + return m_delay_time; +} + +void Delay::delay_clear() +{ + memset(m_start_ptr, 0, sizeof(float) * m_delay_frame); +} + +void Delay::delay_process(float * data, int len) +{ + if(len == 0) + { + return ; + } + + for(int i = 0; i < len; ++i) + { + float x = data[i]; + data[i] = m_dry * x + m_wet * *m_read_ptr; + + *m_write_ptr = x + m_feedback * *m_read_ptr; + + ++m_read_ptr; + if(m_read_ptr >= m_end_ptr) + { + m_read_ptr -= m_delay_len; + } + + ++m_write_ptr; + if(m_write_ptr >= m_end_ptr) + { + m_write_ptr -= m_delay_len; + } + } +} + +void Delay::delay_destroy() +{ + if(m_start_ptr) + { + delete [] m_start_ptr; + m_start_ptr = nullptr; + } +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delay/Delay.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delay/Delay.h new file mode 100644 index 0000000..f5d149a --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delay/Delay.h @@ -0,0 +1,71 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
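The TODO in delay_set_delframes above flags a real problem: when the recomputed write pointer runs past the end of the line it is snapped back onto the read pointer, which collapses the requested delay to zero instead of preserving it. A hypothetical fix, wrapping around the same m_delay_len ring that delay_process already uses:

// Hypothetical replacement for the wrap in Delay::delay_set_delframes:
m_write_ptr = m_read_ptr + m_delay_frame;
if(m_write_ptr >= m_end_ptr)
{
    m_write_ptr -= m_delay_len;   // circular wrap keeps read/write spacing = m_delay_frame
}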
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_DELAY_H__ +#define __SMULE_DELAY_H__ +#include "SAudioEffectsConf.h" +//实现简单的延迟器 + +class Delay +{ +public: + Delay(); + ~Delay(); + +public: + void delay_create(float delay_time, float fs, float wet, float dry, float feedback); + void delay_set_delframes(int frames); + void delay_set_deltime(float time); + void delay_set_fbk(float feedback); + void delay_set_levels(float wet, float dry); + float delay_get_deltime(); + void delay_clear(); + void delay_process(float * data, int len); + void delay_destroy(); + +private: + float * m_start_ptr;//0 + float * m_read_ptr;//4 + float * m_write_ptr;//8 + float * m_end_ptr;//12 + //延迟线长度 + int m_delay_len;//16 + float m_fs;//20 + //单位ms + float m_delay_time;//24 + //单位为采样点个数 + int m_delay_frame;//28 + float m_feedback;//32 + float m_dry;//36 + float m_wet;//40 +}; + +#endif /* __SMULE_DELAY_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delayi/DelayI.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delayi/DelayI.cpp new file mode 100644 index 0000000..ecd3959 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delayi/DelayI.cpp @@ -0,0 +1,239 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
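delay_create takes the delay in milliseconds and converts it to whole frames (frames = delay_time * fs / 1000, floored at one frame, with delay_time recomputed to match). A usage sketch; the parameter values are illustrative only:

Delay d;
// (delay_time ms, fs, wet, dry, feedback)
d.delay_create(100.0f, 44100.0f, 0.3f, 0.7f, 0.25f);

float block[512] = { 0 };
d.delay_process(block, 512);   // in-place: dry * x + wet * delayed, feedback into the line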
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "DelayI.h" +#include +#include + +#define LFO_LEN 1024 +static float gs_lfo_waves[LFO_LEN]; +static bool gs_lfo_inited = false; + +//找到比 x 小的、最大的 2 次方数 +inline int small_biggest_pow2(unsigned int x) +{ + int result; + + do + { + result = x; + x &= (x - 1); + } + while(x != 0); + + return result; +} + +DelayI::DelayI() +{ + m_cache = nullptr; +} + +DelayI::~DelayI() +{ + delayi_destroy(); +} + +void DelayI::delayi_create(int depth) +{ + depth = std::max(depth, 0); + + int total_len = std::max(1, 4 * small_biggest_pow2(depth)); + + m_cache = new float[total_len]; + memset(m_cache, 0, sizeof(float) * total_len); + m_delay_len = depth; + m_total_len = total_len; + m_mask = total_len - 1; + m_read_idx = 0; + m_write_idx = depth; + + m_amplitude = 0; + m_rate = 0; + m_inc = 0; + m_phase = 0; + m_feedback = 0; + + if(!gs_lfo_inited) + { + gs_lfo_inited = true; + + for(int i = 0; i < LFO_LEN; ++i) + { + gs_lfo_waves[i] = sinf(2 * M_PI * i / LFO_LEN); + } + } +} + +void DelayI::delayi_set_fbk(float feedback) +{ + m_feedback = feedback; +} + +void DelayI::delayi_set_lfo_amt(float amplitude) +{ + +} + +void DelayI::delayi_set_lfo_inc(float inc) +{ + m_inc = inc; +} + +void DelayI::delayi_set_lfo_phase(float phase) +{ + m_phase = phase - (int)phase; +} + +void DelayI::delayi_set_lfo_rate(float rate) +{ + m_rate = rate; +} + +void DelayI::delayi_reset() +{ + if(m_total_len) + { + memset(m_cache, 0, sizeof(float) * m_total_len); + } +} + +void DelayI::delayi_process(float * data, int len) +{ + if(len == 0) + { + return ; + } + + for(int i = 0; i < len; ++i) + { + //当前相位对应的LFO的采样点位置并更新相位 + float lfo_pos = m_phase * LFO_LEN; + m_phase += m_inc; + m_phase = m_phase - (int)m_phase; + + //存放延迟数据,只是为方便后面 0 延迟时取数据 + float x = data[i]; + m_cache[m_write_idx] = x; + + //计算需要返回的延迟数据的位置,实际为一个线性插值,并更新读取位置 + int s = ((int)lfo_pos) & (LFO_LEN - 1); + int e = (s + 1) & (LFO_LEN - 1); + float delay_pos = m_total_len + m_read_idx + + m_amplitude * (gs_lfo_waves[s] + (lfo_pos - (int)lfo_pos) * (gs_lfo_waves[e] - gs_lfo_waves[s])); + m_read_idx = (m_read_idx + 1) & m_mask; + + //计算延迟结果值,实际为一个线性插值 + s = ((int)delay_pos) & m_mask; + e = (s + 1) & m_mask; + float value = m_cache[s] + (delay_pos - (int)delay_pos) * (m_cache[e] - m_cache[s]); + + //计算输出值,应该按照干湿比进行运算 + if(m_feedback > 0) + { + data[i] = x + value; + } + else + { + data[i] = x - value; + } + + //存放延迟数据,并更新写入位置 + m_cache[m_write_idx] = x + m_feedback * value; + m_write_idx = (m_write_idx + 1) & m_mask; + } +} + +void DelayI::delayi_tap(float * data, int len, int tap, float weight) +{ + //tap位置不超过延迟长度 + tap = std::min(tap, (int)(m_delay_len - 1)); + + //计算开始读取的位置 + int read_idx = m_write_idx - len - tap; + while(read_idx < 0) + { + read_idx += m_total_len; + } + + for(int i = 0; i < len; ++i) + { + data[i] = data[i] + m_cache[read_idx] * weight; + read_idx = (read_idx + 1) & m_mask; + } +} + +float DelayI::delayi_tick(float in) +{ + //这里加不加这个分支结果是一致的 + if(m_amplitude == 0) + { + m_cache[m_write_idx] = in; + m_write_idx = (m_write_idx + 1) & m_mask; + + in = m_cache[m_read_idx]; + m_read_idx = (m_read_idx + 1) & m_mask; + } + else + { + //当前相位对应的LFO的采样点位置并更新相位 + float lfo_pos = m_phase * LFO_LEN; + m_phase += m_inc; + m_phase = m_phase - (int)m_phase; + + //存放延迟数据,并更新写入位置 + m_cache[m_write_idx] = in; + m_write_idx = 
(m_write_idx + 1) & m_mask; + + //计算需要返回的延迟数据的位置,实际为一个线性插值,并更新读取位置 + int s = ((int)lfo_pos) & (LFO_LEN - 1); + int e = (s + 1) & (LFO_LEN - 1); + float delay_pos = m_total_len + m_read_idx + + m_amplitude * (gs_lfo_waves[s] + (lfo_pos - (int)lfo_pos) * (gs_lfo_waves[e] - gs_lfo_waves[s])); + m_read_idx = (m_read_idx + 1) & m_mask; + + //计算延迟结果值,实际为一个线性插值 + s = ((int)delay_pos) & m_mask; + e = (s + 1) & m_mask; + in = m_cache[s] + (delay_pos - (int)delay_pos) * (m_cache[e] - m_cache[s]); + } + + return in; +} + +void DelayI::delayi_destroy() +{ + if(m_cache) + { + delete [] m_cache; + m_cache = nullptr; + } +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delayi/DelayI.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delayi/DelayI.h new file mode 100644 index 0000000..2cd46cc --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/delayi/DelayI.h @@ -0,0 +1,81 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_DELAYI_H__ +#define __SMULE_DELAYI_H__ +#include "SAudioEffectsConf.h" +//实现一个调制延迟效果器 + +class DelayI +{ +public: + DelayI(); + ~DelayI(); + +public: + void delayi_create(int depth); + void delayi_set_fbk(float feedback); + void delayi_set_lfo_amt(float amplitude); + void delayi_set_lfo_inc(float inc); + void delayi_set_lfo_phase(float phase); + void delayi_set_lfo_rate(float rate); + void delayi_reset(); + void delayi_process(float * data, int len); + void delayi_tap(float * data, int len, int tap, float weight); + float delayi_tick(float in); + void delayi_destroy(); + +private: + //循环延迟的缓存数据 + float * m_cache;//0 + //延迟长度 + float m_delay_len;//4 + //循环的延迟缓存长度 + int m_total_len;//8 + //将延迟器长度设置为 2 的次方,然后用与运算加速 idx 的寻址操作 + int m_mask;//12 + //当前取出的位置 + int m_read_idx;//16 + //当前存入的位置 + int m_write_idx;//20 + //LFO的幅度值 + float m_amplitude;//24 + //LFO的频率,由于和"每次对输入信号的相移"有一定重合,这里不使用 + float m_rate;//28 + //LFO对输入信号每次的相移 + float m_inc;//32 + //LFO当前的相位,取值范围 [0, 1),代表了相位偏移 [0, 360) 度 + float m_phase;//36 + //延迟器的反馈比例 + float m_feedback;//40 +}; + +#endif /* __SMULE_DELAYI_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/envelope_follower/EnvelopeFollower.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/envelope_follower/EnvelopeFollower.cpp new file mode 100644 index 0000000..2b9b3af --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/envelope_follower/EnvelopeFollower.cpp @@ -0,0 +1,143 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ 
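delayi_create sizes the ring at four times the largest power of two not exceeding depth (small_biggest_pow2 clears the lowest set bit until one remains), so every index update can be masked instead of taken modulo; reads then interpolate linearly between the two samples around the fractional, LFO-modulated position. The core fractional read as a standalone sketch:

// Linearly interpolated read from a power-of-two ring buffer,
// where mask = total_len - 1 and total_len is a power of two.
float frac_read(const float * ring, int mask, float pos)
{
    int   s    = ((int)pos) & mask;          // sample before the fractional position
    int   e    = (s + 1) & mask;             // sample after it
    float frac = pos - (float)((int)pos);    // fractional part in [0, 1)
    return ring[s] + frac * (ring[e] - ring[s]);
}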
----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "EnvelopeFollower.h" +#include + +#define ANALOG_RATIO 0.368 +#define DIGITAL_RATIO 0.1 + +static inline float get_ratio(EnvelopeFollower * inst, float frames) +{ + float result; + + if(frames == 0) + { + result = 0; + } + else + { + float tc = inst->getTimeConstant(); + result = expf(tc / frames); + } + + return result; +} + +EnvelopeFollower::EnvelopeFollower(float attack, float release, unsigned int in_channels) + : AudioEffect(in_channels, 1) +{ + setAttackTime_frames(attack); + setReleaseTime_frames(release); + setLevel(0); +} + +EnvelopeFollower::~EnvelopeFollower() +{ + +} + +void EnvelopeFollower::process_internal(const float *input, float *output, unsigned int len) +{ + if(m_in_channels == 1) + { + for(int i = 0; i < len; ++i) + { + float in = fabsf(input[i]); + if(m_level < in) + { + m_level = in + m_attack * (m_level - in); + } + else + { + m_level = in + m_release * (m_level - in); + } + } + } + else if(m_in_channels == 2) + { + for(int i = 0; i < len; ++i) + { + float in = std::max(fabsf(input[2 * i + 0]), fabsf(input[2 * i + 1])); + if(m_level < in) + { + m_level = in + m_attack * (m_level - in); + } + else + { + m_level = in + m_release * (m_level - in); + } + } + } +} + +void EnvelopeFollower::setAttackTime_frames(float frames) +{ + m_attack = get_ratio(this, frames); +} + +void EnvelopeFollower::setCircuitType(EnvelopeFollower::CircuitType type) +{ + + float tc = getTimeConstant(); + float attack = tc / logf(m_attack); + float release = tc / logf(m_release); + + m_type = type; + setAttackTime_frames(attack); + setReleaseTime_frames(release); +} + +void EnvelopeFollower::setLevel(float level) +{ + m_level = level; +} + +void EnvelopeFollower::setReleaseTime_frames(float frames) +{ + m_release = get_ratio(this, frames); +} + +EnvelopeFollower::CircuitType EnvelopeFollower::getCircuitType() +{ + return m_type; +} + +float EnvelopeFollower::getLevel() +{ + return m_level; +} + +float EnvelopeFollower::getTimeConstant() +{ + float ratio = m_type == EnvelopeFollower::Analog ? ANALOG_RATIO : DIGITAL_RATIO; + return logf(ratio); +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/envelope_follower/EnvelopeFollower.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/envelope_follower/EnvelopeFollower.h new file mode 100644 index 0000000..c168804 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/envelope_follower/EnvelopeFollower.h @@ -0,0 +1,69 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. 
+ +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_ENVELOPEFOLLOWER_H__ +#define __SMULE_ENVELOPEFOLLOWER_H__ +#include "SAudioEffectsConf.h" +#include "AudioEffect.h" + +class EnvelopeFollower : public AudioEffect +{ +public: + EnvelopeFollower(float attack, float release, unsigned int in_channels); + virtual ~EnvelopeFollower(); + +public: + void process_internal(const float *input, float *output, unsigned int len) override ; + +public: + enum CircuitType + { + Analog, + Digital + }; + +public: + void setAttackTime_frames(float frames); + void setCircuitType(CircuitType type); + void setLevel(float level); + void setReleaseTime_frames(float frames); + CircuitType getCircuitType(); + float getLevel(); + float getTimeConstant(); + +private: + float m_level;//68 + float m_attack;//72 + float m_release;//76 + CircuitType m_type;//80 +}; + +#endif /* __SMULE_ENVELOPEFOLLOWER_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/equalizer/Equalizer.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/equalizer/Equalizer.cpp new file mode 100644 index 0000000..05c23a9 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/equalizer/Equalizer.cpp @@ -0,0 +1,144 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
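get_ratio turns a time in samples into a smoothing coefficient via exp(ln(ratio) / frames), i.e. coeff^frames = ratio: the analog circuit decays to 36.8% (1/e) of a step within `frames` samples, the digital one to 10%. A condensed sketch of the resulting follower:

#include <cmath>

// Peak follower: fast rise, slow fall, analog (1/e) time constants.
struct Follower
{
    float attack, release, level = 0;

    Follower(float attack_frames, float release_frames)
    {
        attack  = expf(logf(0.368f) / attack_frames);
        release = expf(logf(0.368f) / release_frames);
    }

    float tick(float x)
    {
        float in = fabsf(x);
        float c  = (level < in) ? attack : release;
        level = in + c * (level - in);       // same update as process_internal
        return level;
    }
};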
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "Equalizer.h" + +static float gs_fc[EQ_BANDS] = { 25, 2229, 20000 }; + +Equalizer::Equalizer(float fs) + : AudioEffect(1, 1) +{ + memset(m_gain, 0, sizeof(m_gain)); + memset(m_Q, 0, sizeof(m_Q)); + memcpy(m_fc, gs_fc, sizeof(gs_fc)); + + int idx = 0; + m_biquad[idx] = std::make_shared(); + m_biquad[idx]->biquad_create(BIQUAD_LOSHELF, m_fc[idx], m_Q[idx], m_gain[idx], fs, EQ_CHANNEL); + + for(idx = 1; idx < EQ_BANDS - 1; ++idx) + { + m_biquad[idx] = std::make_shared(); + m_biquad[idx]->biquad_create(BIQUAD_PEAK, m_fc[idx], m_Q[idx], m_gain[idx], fs, EQ_CHANNEL); + } + + m_biquad[idx] = std::make_shared(); + m_biquad[idx]->biquad_create(BIQUAD_HISHELF, m_fc[idx], m_Q[idx], m_gain[idx], fs, EQ_CHANNEL); +} + +Equalizer::~Equalizer() +{ + ; +} + +void Equalizer::reset() +{ + for(auto & biquad : m_biquad) + { + biquad->biquad_reset(); + } +} + +void Equalizer::process_internal(const float *input, float *output, unsigned int len) +{ + if(input != output) + { + memcpy(output, input, EQ_CHANNEL * sizeof(float) * len); + } + + + m_biquad[1]->biquad_process2(output, len); + m_biquad[0]->biquad_process2(output, len); + m_biquad[2]->biquad_process2(output, len); +// for(auto & biquad : m_biquad) +// { +// biquad->biquad_process2(output, len); +// } +} + +void Equalizer::set_parameter_value(const std::string &key, int idx, float value) +{ + if(key == "Center Freq.") + { + setFreqForEQBand(value, idx); + } + else if(key == "Gain") + { + setGaindBForEQBand(value, idx); + } + else if(key == "Q") + { + setSlopeForEQBand(value, idx); + } +} + +void Equalizer::setFreqForEQBand(float fc, int idx) +{ + if(idx >= 0 && idx < EQ_BANDS) + { + m_fc[idx] = fc; + } + + updateParameters(); +} + +void Equalizer::setGaindBForEQBand(float db, int idx) +{ + if(idx >= 0 && idx < EQ_BANDS) + { + m_gain[idx] = db; + } + + updateParameters(); +} + +void Equalizer::setSlopeForEQBand(float Q, int idx) +{ + if(idx >= 0 && idx < EQ_BANDS) + { + m_Q[idx] = Q; + } + + updateParameters(); +} + +void Equalizer::updateParameters() +{ + int idx = 0; + m_biquad[idx]->biquad_setcoefs(BIQUAD_LOSHELF, m_fc[idx], m_Q[idx], m_gain[idx]); + + for(idx = 1; idx < EQ_BANDS - 1; ++idx) + { + m_biquad[idx]->biquad_setcoefs(BIQUAD_PEAK, m_fc[idx], m_Q[idx], m_gain[idx]); + } + + m_biquad[idx]->biquad_setcoefs(BIQUAD_HISHELF, m_fc[idx], m_Q[idx], m_gain[idx]); +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/equalizer/Equalizer.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/equalizer/Equalizer.h new file mode 100644 index 0000000..9731b54 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/equalizer/Equalizer.h @@ -0,0 +1,70 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". 
+ +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_EQUALIZER_H__ +#define __SMULE_EQUALIZER_H__ + +#include "AudioEffect.h" +#include "Biquad.h" +#include "SAudioEffectsConf.h" +//这里实现一个三段均衡器,默认处理单声道 +#define EQ_BANDS 3 +#define EQ_CHANNEL 1 + +class Equalizer : public AudioEffect +{ +public: + explicit Equalizer(float fs); + ~Equalizer() override ; + +public: + void reset() override ; + void process_internal(const float *input, float *output, unsigned int len) override ; + void set_parameter_value(const std::string &key, int idx, float value) override ; + +public: + void setFreqForEQBand(float fc, int idx); + void setGaindBForEQBand(float db, int idx); + void setSlopeForEQBand(float Q, int idx); + void updateParameters(); + +private: + //均衡器的增益数组 + float m_gain[EQ_BANDS];//68 + //均衡器的Q值数组 + float m_Q[EQ_BANDS];//80 + //均衡器的中心频率或者截止频率数组 + float m_fc[EQ_BANDS];//92 + //第一个为低搁置滤波、最后一个为高搁置滤波、中间为peak滤波 + std::shared_ptr m_biquad[EQ_BANDS];//104 +}; + +#endif /* __SMULE_EQUALIZER_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/reverb/Reverb.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/reverb/Reverb.cpp new file mode 100644 index 0000000..d17c36b --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/reverb/Reverb.cpp @@ -0,0 +1,393 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
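The equalizer chains a low shelf, a peaking band, and a high shelf (defaults 25 Hz / 2229 Hz / 20 kHz, mono) and addresses them per band through set_parameter_value; process_internal applies the bands in the order 1, 0, 2, which does not change the result for cascaded linear filters (up to rounding). A usage sketch with illustrative settings:

Equalizer eq(44100.0f);
eq.set_parameter_value("Gain", 0, 3.0f);            // +3 dB on the low shelf
eq.set_parameter_value("Center Freq.", 1, 1000.0f); // move the peak band to 1 kHz
eq.set_parameter_value("Q", 1, 1.2f);

float mono[512] = { 0 };
eq.process_internal(mono, mono, 512);               // in-place, one channel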
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "Reverb.h" +#include + +//论文参数对应的采样率 +#define ORIGINAL_FS 29761 +#define BANDWIDTH 0.9995f +#define INPUT_DIFFUSION1 0.75f +#define INPUT_DIFFUSION2 0.625f +#define DECAY_DIFFUSION1 0.7f +#define DECAY_DIFFUSION2 0.5f +#define DAMPING 0.0005f +#define MAX_DAMP_COMP 0.9999999 +#define MAX_DAMP 1 +#define MAX_DECAY 0.999999f +#define MIN_DECAY -MAX_DECAY +//按照论文,湿声比例还需要乘以 WET_RATIO +#define WET_RATIO 0.6 + +#define INPUT_ALLPASS_LEN1 142 +#define INPUT_ALLPASS_LEN2 107 +#define INPUT_ALLPASS_LEN3 379 +#define INPUT_ALLPASS_LEN4 277 + +#define TANK_ALLPASS_LEFT_LEN1 672 +#define TANK_ALLPASS_LEFT_LEN2 1800 +#define TANK_ALLPASS_RIGHT_LEN1 908 +#define TANK_ALLPASS_RIGHT_LEN2 2656 + +#define TANK_DELAYI_LEFT_LEN1 4453 +#define TANK_DELAYI_LEFT_LEN2 3270 +#define TANK_DELAYI_RIGHT_LEN1 4217 +#define TANK_DELAYI_RIGHT_LEN2 3163 + +#define OUTPUT_LEFT_C54_1 266 +#define OUTPUT_LEFT_C54_2 2974 +#define OUTPUT_LEFT_C55_59 1913 +#define OUTPUT_LEFT_C63 1996 +#define OUTPUT_LEFT_C30 1990 +#define OUTPUT_LEFT_C31_33 186 +#define OUTPUT_LEFT_C39 1066 + +#define OUTPUT_RIGHT_C30_1 353 +#define OUTPUT_RIGHT_C30_2 3627 +#define OUTPUT_RIGHT_C31_33 1228 +#define OUTPUT_RIGHT_C39 2673 +#define OUTPUT_RIGHT_C54 2111 +#define OUTPUT_RIGHT_C55_59 335 +#define OUTPUT_RIGHT_C63 121 + +//帧长和延迟长度有一定的制约关系,需要注意 +#define FRAME_LEN 512 + +#define DELETE_PTR(ptr) \ +{ \ + if(ptr) \ + { \ + delete ptr; \ + ptr = nullptr; \ + } \ +} + +#define DELETE_ARRAY(ptr) \ +{ \ + if(ptr) \ + { \ + delete [] ptr; \ + ptr = nullptr; \ + } \ +} + +Reverb::Reverb() +{ + m_damp_in = nullptr; + m_allplat_c_13_14 = nullptr; + m_allplat_c_19_20 = nullptr; + m_allplat_c_15_16 = nullptr; + m_allplat_c_21_22 = nullptr; + m_allplat_c_23_24 = nullptr; + m_allplat_c_31_33 = nullptr; + m_allplat_c_46_48 = nullptr; + m_allplat_c_55_59 = nullptr; + m_delayi_c_30 = nullptr; + m_delayi_c_39 = nullptr; + m_delayi_c_54 = nullptr; + m_delayi_c_63 = nullptr; + m_damp_tank_left = nullptr; + m_damp_tank_right = nullptr; + + m_decay_left_in = 0; + m_decay_left_out = 0; + m_decay_right_in = 0; + m_decay_right_out = 0; + + m_dry = 0; + m_wet = 0; + + m_frame_len = 0; + m_frame_ptr = nullptr; + m_tank_right_out = nullptr; + m_tank_left_out = nullptr; +} + +Reverb::~Reverb() +{ + reverb_destroy(); +} + +void Reverb::reverb_create(float dry, float wet, float decay) +{ + m_damp_in = new Damper(); + //因为原始论文采用的是这个参数方式,但是实现的时候有点变化,因此这里做了下变换 + m_damp_in->damper_create(1 - BANDWIDTH); + + m_allplat_c_13_14 = new Allplat(); + m_allplat_c_13_14->allplat_create(INPUT_ALLPASS_LEN1, INPUT_DIFFUSION1); + m_allplat_c_19_20 = new Allplat(); + m_allplat_c_19_20->allplat_create(INPUT_ALLPASS_LEN2, INPUT_DIFFUSION1); + m_allplat_c_15_16 = new Allplat(); + m_allplat_c_15_16->allplat_create(INPUT_ALLPASS_LEN3, INPUT_DIFFUSION2); + m_allplat_c_21_22 = new Allplat(); + m_allplat_c_21_22->allplat_create(INPUT_ALLPASS_LEN4, INPUT_DIFFUSION2); + + m_allplat_c_23_24 = new Allplat(); + m_allplat_c_23_24->allplat_create(TANK_ALLPASS_LEFT_LEN1, DECAY_DIFFUSION1); + m_allplat_c_31_33 = new Allplat(); + m_allplat_c_31_33->allplat_create(TANK_ALLPASS_LEFT_LEN2, DECAY_DIFFUSION2); + + m_allplat_c_46_48 = new Allplat(); + m_allplat_c_46_48->allplat_create(TANK_ALLPASS_RIGHT_LEN1, DECAY_DIFFUSION1); + m_allplat_c_55_59 = new Allplat(); + 
m_allplat_c_55_59->allplat_create(TANK_ALLPASS_RIGHT_LEN2, DECAY_DIFFUSION2); + + m_delayi_c_30 = new DelayI(); + m_delayi_c_30->delayi_create(TANK_DELAYI_LEFT_LEN1); + m_delayi_c_30->delayi_set_lfo_amt(11.839); + m_delayi_c_30->delayi_set_lfo_inc(0.0000249433106); + m_delayi_c_30->delayi_set_lfo_phase(0); + m_delayi_c_39 = new DelayI(); + m_delayi_c_39->delayi_create(TANK_DELAYI_LEFT_LEN2); + m_delayi_c_39->delayi_set_lfo_amt(2.2); + m_delayi_c_39->delayi_set_lfo_inc(0.0000204081625); + m_delayi_c_39->delayi_set_lfo_phase(0.2); + + m_delayi_c_54 = new DelayI(); + m_delayi_c_54->delayi_create(TANK_DELAYI_RIGHT_LEN1); + m_delayi_c_54->delayi_set_lfo_amt(10); + m_delayi_c_54->delayi_set_lfo_inc(0.0000242630394); + m_delayi_c_54->delayi_set_lfo_phase(0.4); + m_delayi_c_63 = new DelayI(); + m_delayi_c_63->delayi_create(TANK_DELAYI_RIGHT_LEN2); + m_delayi_c_63->delayi_set_lfo_amt(2.11); + m_delayi_c_63->delayi_set_lfo_inc(0.0000199546485); + m_delayi_c_63->delayi_set_lfo_phase(0.6); + + m_damp_tank_left = new Damper(); + m_damp_tank_left->damper_create(DAMPING); + + m_damp_tank_right = new Damper(); + m_damp_tank_right->damper_create(DAMPING); + + reverb_set_decay(decay); + reverb_set_dry(dry); + reverb_set_wet(wet); + + m_frame_len = FRAME_LEN; + m_frame_ptr = new float[m_frame_len * 4]; + memset(m_frame_ptr, 0, sizeof(float) * m_frame_len * 4); + m_tank_right_out = m_frame_ptr + m_frame_len; + m_tank_left_out = m_frame_ptr + 2 * m_frame_len; +} + +void Reverb::reverb_set() +{ + +} + +void Reverb::reverb_set_decay(float decay) +{ + decay = std::max(MIN_DECAY, std::min(decay, MAX_DECAY)); + m_decay_left_in = decay; + m_decay_left_out = decay; + m_decay_right_in = decay; + m_decay_right_out = decay; +} + +void Reverb::reverb_set_dry(float dry) +{ + m_dry = dry; +} + +void Reverb::reverb_set_wet(float wet) +{ + m_wet = wet; +} + +void Reverb::reverb_set_indamp(float damp) +{ + if(damp > MAX_DAMP_COMP) + { + damp = MAX_DAMP; + } + + m_damp_in->damper_set(damp); +} + +void Reverb::reverb_set_tankdamp(float damp) +{ + if(damp > MAX_DAMP_COMP) + { + damp = MAX_DAMP; + } + + m_damp_tank_left->damper_set(damp); + m_damp_tank_right->damper_set(damp); +} + +float Reverb::reverb_get_wet() +{ + return m_wet; +} + +void Reverb::reverb_reset() +{ + m_damp_in->damper_clear(); + + m_allplat_c_13_14->allplat_reset(); + m_allplat_c_19_20->allplat_reset(); + m_allplat_c_15_16->allplat_reset(); + m_allplat_c_21_22->allplat_reset(); + m_allplat_c_23_24->allplat_reset(); + m_allplat_c_31_33->allplat_reset(); + m_allplat_c_46_48->allplat_reset(); + m_allplat_c_55_59->allplat_reset(); + + m_delayi_c_30->delayi_reset(); + m_delayi_c_39->delayi_reset(); + m_delayi_c_54->delayi_reset(); + m_delayi_c_63->delayi_reset(); + + m_damp_tank_left->damper_clear(); + m_damp_tank_right->damper_clear(); + + memset(m_frame_ptr, 0, sizeof(float) * m_frame_len * 4); + m_tank_right_out = m_frame_ptr + m_frame_len; + m_tank_left_out = m_frame_ptr + 2 * m_frame_len; +} + +void Reverb::reverb_process(const float * input, int channel, float * out_l, float * out_r, int len) +{ + //这里按照每帧固定长度进行 + while(len > 0) + { + int proc_len = std::min(len, m_frame_len); + len -= proc_len; + + //只允许输入单声道或者双声道 + if(channel != 2) + { + memcpy(m_frame_ptr, input, sizeof(float) * proc_len); + } + else + { + //该混响是单声道进,双声道出,因此这里需要先对数据进行单声道处理 + for(int i = 0; i < proc_len; ++i) + { + m_frame_ptr[i] = (input[2 * i + 0] + input[2 * i + 1]) / 2; + } + } + + //input diffusion + m_damp_in->damper_process(m_frame_ptr, proc_len); + 
m_allplat_c_13_14->allplat_process(m_frame_ptr, proc_len); + m_allplat_c_19_20->allplat_process(m_frame_ptr, proc_len); + m_allplat_c_15_16->allplat_process(m_frame_ptr, proc_len); + m_allplat_c_21_22->allplat_process(m_frame_ptr, proc_len); + + //tank + for(int i = 0; i < proc_len; ++i) + { + //tank feedback input + float left_in = m_frame_ptr[i] + *m_tank_right_out; + float right_in = m_frame_ptr[i] + *m_tank_left_out; + + //left tank + left_in = m_allplat_c_23_24->allplat_tick(left_in); + left_in = m_delayi_c_30->delayi_tick(left_in); + left_in = m_damp_tank_left->damper_tick(left_in); + left_in = m_allplat_c_31_33->allplat_tick(left_in * m_decay_left_in); + *m_tank_left_out = m_delayi_c_39->delayi_tick(left_in) * m_decay_left_out; + + //right tank + right_in = m_allplat_c_46_48->allplat_tick(right_in); + right_in = m_delayi_c_54->delayi_tick(right_in); + right_in = m_damp_tank_right->damper_tick(right_in); + right_in = m_allplat_c_55_59->allplat_tick(right_in * m_decay_right_in); + *m_tank_right_out = m_delayi_c_63->delayi_tick(right_in) * m_decay_right_out; + } + + //计算干声输出比例 + for(int i = 0; i < proc_len; ++i) + { + out_l[i] = input[channel * i + 0] * m_dry; + out_r[i] = input[channel * i + channel - 1] * m_dry; + } + + //delay network + memset(m_frame_ptr, 0, sizeof(float) * proc_len); + //left reverb out + m_delayi_c_54->delayi_tap(m_frame_ptr, proc_len, OUTPUT_LEFT_C54_1, m_wet * WET_RATIO); + m_delayi_c_54->delayi_tap(m_frame_ptr, proc_len, OUTPUT_LEFT_C54_2, m_wet * WET_RATIO); + m_allplat_c_55_59->allplat_tap(m_frame_ptr, proc_len, OUTPUT_LEFT_C55_59, m_wet * -WET_RATIO); + m_delayi_c_63->delayi_tap(m_frame_ptr, proc_len, OUTPUT_LEFT_C63, m_wet * WET_RATIO); + m_delayi_c_30->delayi_tap(m_frame_ptr, proc_len, OUTPUT_LEFT_C30, m_wet * -WET_RATIO); + m_allplat_c_31_33->allplat_tap(m_frame_ptr, proc_len, OUTPUT_LEFT_C31_33, m_wet * -WET_RATIO); + m_delayi_c_39->delayi_tap(m_frame_ptr, proc_len, OUTPUT_LEFT_C39, m_wet * -WET_RATIO); + //计算左声道最终输出 + for(int i = 0; i < proc_len; ++i) + { + out_l[i] += m_frame_ptr[i]; + } + + //right reverb out + m_delayi_c_30->delayi_tap(m_frame_ptr, proc_len, OUTPUT_RIGHT_C30_1, m_wet * WET_RATIO); + m_delayi_c_30->delayi_tap(m_frame_ptr, proc_len, OUTPUT_RIGHT_C30_2, m_wet * WET_RATIO); + m_allplat_c_31_33->allplat_tap(m_frame_ptr, proc_len, OUTPUT_RIGHT_C31_33, m_wet * -WET_RATIO); + m_delayi_c_39->delayi_tap(m_frame_ptr, proc_len, OUTPUT_RIGHT_C39, m_wet * WET_RATIO); + m_delayi_c_54->delayi_tap(m_frame_ptr, proc_len, OUTPUT_RIGHT_C54, m_wet * -WET_RATIO); + m_allplat_c_55_59->allplat_tap(m_frame_ptr, proc_len, OUTPUT_RIGHT_C55_59, m_wet * -WET_RATIO); + m_delayi_c_63->delayi_tap(m_frame_ptr, proc_len, OUTPUT_RIGHT_C63, m_wet * -WET_RATIO); + //计算右声道最终输出 + for(int i = 0; i < proc_len; ++i) + { + out_r[i] += m_frame_ptr[i]; + } + + //更新指针位置信息 + out_l += proc_len; + out_r += proc_len; + input += proc_len; + } +} + +void Reverb::reverb_destroy() +{ + DELETE_PTR(m_damp_in) + DELETE_PTR(m_allplat_c_13_14) + DELETE_PTR(m_allplat_c_19_20) + DELETE_PTR(m_allplat_c_15_16) + DELETE_PTR(m_allplat_c_21_22) + DELETE_PTR(m_allplat_c_23_24) + DELETE_PTR(m_allplat_c_31_33) + DELETE_PTR(m_allplat_c_46_48) + DELETE_PTR(m_allplat_c_55_59) + DELETE_PTR(m_delayi_c_30) + DELETE_PTR(m_delayi_c_39) + DELETE_PTR(m_delayi_c_54) + DELETE_PTR(m_delayi_c_63) + DELETE_PTR(m_damp_tank_left) + DELETE_PTR(m_damp_tank_right) + + DELETE_ARRAY(m_frame_ptr) +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/reverb/Reverb.h 
b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/reverb/Reverb.h new file mode 100644 index 0000000..f2c99a3 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/reverb/Reverb.h @@ -0,0 +1,91 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_REVERB_H__ +#define __SMULE_REVERB_H__ + +//Dattorro’s Plate Reverb,代码参考了 freeverb3 中的 strev +//论文地址为:https://ccrma.stanford.edu/~dattorro/EffectDesignPart1.pdf + +#include "Allplat.h" +#include "DelayI.h" +#include "Damper.h" +#include "SAudioEffectsConf.h" +class Reverb +{ +public: + Reverb(); + ~Reverb(); + +public: + void reverb_create(float dry, float wet, float decay); + void reverb_set(); + void reverb_set_decay(float decay); + void reverb_set_dry(float dry); + void reverb_set_wet(float wet); + void reverb_set_indamp(float damp); + void reverb_set_tankdamp(float damp); + float reverb_get_wet(); + void reverb_reset(); + void reverb_process(const float * input, int channel, float * out_l, float * out_r, int len); + void reverb_destroy(); + +private: + Damper * m_damp_in;//0 + Allplat * m_allplat_c_13_14;//4 + Allplat * m_allplat_c_19_20;//8 + Allplat * m_allplat_c_15_16;//12 + Allplat * m_allplat_c_21_22;//16 + //原始论文,23_24 和 46_48 应该为调制全通,但是这里简化了 + Allplat * m_allplat_c_23_24;//20 + Allplat * m_allplat_c_31_33;//24 + Allplat * m_allplat_c_46_48;//28 + Allplat * m_allplat_c_55_59;//32 + //原始论文,这里应该都是简单的延迟器,但是这里改成了调制延迟器,单实际还是简单延迟器 + DelayI * m_delayi_c_30;//36 + DelayI * m_delayi_c_39;//40 + DelayI * m_delayi_c_54;//44 + DelayI * m_delayi_c_63;//48 + Damper * m_damp_tank_left;//52 + Damper * m_damp_tank_right;//56 + float m_decay_left_in;//60 + float m_decay_left_out;//64 + float m_decay_right_in;//68 + float m_decay_right_out;//72 + float m_dry;//76 + float m_wet;//80 + int m_frame_len;//84 + float * m_frame_ptr;//88 + float * m_tank_right_out;//92 + float * m_tank_left_out;//96 +}; + +#endif /* __SMULE_REVERB_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_delay_effect/SimpleDelayEffect.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_delay_effect/SimpleDelayEffect.cpp new file mode 100644 index 0000000..3b6fe6b --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_delay_effect/SimpleDelayEffect.cpp @@ -0,0 +1,92 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. 
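Reverb wires up Dattorro's figure-of-eight tank: the band-limited, diffused mono input feeds two cross-coupled halves, and each stereo output is a signed sum of taps off the tank delays scaled by wet * 0.6 per the paper, with work chunked into 512-sample frames internally. A usage sketch, mono in and stereo out, with illustrative parameters:

Reverb rv;
// (dry, wet, decay)
rv.reverb_create(0.7f, 0.3f, 0.5f);

float in[512] = { 0 }, left[512], right[512];
rv.reverb_process(in, 1 /* input channels */, left, right, 512);
rv.reverb_destroy();   // also runs from the destructor; guarded against double free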
+ +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "SimpleDelayEffect.h" + +SimpleDelayEffect::SimpleDelayEffect(unsigned int fs) + : AudioEffect(1, 1) +{ + m_delay = std::make_shared(); + m_delay->delay_create(100, fs, 28, -27, 0); +} + +SimpleDelayEffect::~SimpleDelayEffect() +{ + +} + +void SimpleDelayEffect::reset() +{ + m_delay->delay_clear(); +} + +void SimpleDelayEffect::process_internal(const float *input, float *output, unsigned int len) +{ + if(input != output) + { + memcpy(output, input, sizeof(float) * len); + } + + m_delay->delay_process(output, len); +} + +void SimpleDelayEffect::set_parameter_value(const std::string &key, float value) +{ + if(key == "Mix") + { + setMix(value); + } + else if(key == "Delay") + { + setDelayTimeInMS(value); + } + else if(key == "Feedback") + { + setFeedback(value); + } +} + +void SimpleDelayEffect::setDelayTimeInMS(float time) +{ + m_delay->delay_set_deltime(time); +} + +void SimpleDelayEffect::setFeedback(float feedback) +{ + m_delay->delay_set_fbk(feedback / 100); +} + +void SimpleDelayEffect::setMix(float mix) +{ + float wet = mix / 100; + float dry = 1 - wet; + m_delay->delay_set_levels(wet, dry); +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_delay_effect/SimpleDelayEffect.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_delay_effect/SimpleDelayEffect.h new file mode 100644 index 0000000..49d603c --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_delay_effect/SimpleDelayEffect.h @@ -0,0 +1,58 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
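SimpleDelayEffect maps UI-style percentages onto the Delay: Mix splits into wet = mix / 100 and dry = 1 - wet, and Feedback is divided by 100 before it reaches the line. A usage sketch with illustrative values:

SimpleDelayEffect fx(44100);
fx.set_parameter_value("Delay", 120.0f);     // milliseconds
fx.set_parameter_value("Mix", 35.0f);        // 35% wet / 65% dry
fx.set_parameter_value("Feedback", 20.0f);   // 0.2 into the delay line

float mono[512] = { 0 };
fx.process_internal(mono, mono, 512);        // in-place, one channel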
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_SIMPLEDELAYEFFECT_H__ +#define __SMULE_SIMPLEDELAYEFFECT_H__ + +#include "AudioEffect.h" +#include "Delay.h" +#include "SAudioEffectsConf.h" +class SimpleDelayEffect : public AudioEffect +{ +public: + explicit SimpleDelayEffect(unsigned int fs); + virtual ~SimpleDelayEffect(); + +public: + void reset() override ; + void process_internal(const float *input, float *output, unsigned int len) override ; + void set_parameter_value(const std::string &key, float value) override ; + +public: + void setDelayTimeInMS(float time); + void setFeedback(float feedback); + void setMix(float mix); + +private: + std::shared_ptr m_delay;//68 +}; + +#endif /* __SMULE_SIMPLEDELAYEFFECT_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_reverb_effect/SimpleReverbEffect.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_reverb_effect/SimpleReverbEffect.cpp new file mode 100644 index 0000000..833a2dd --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_reverb_effect/SimpleReverbEffect.cpp @@ -0,0 +1,153 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#include "SimpleReverbEffect.h" + +float SimpleReverbEffect::DEFAULT_DECAY = 0.08; +float SimpleReverbEffect::DEFAULT_DRY = 0.9; +float SimpleReverbEffect::DEFAULT_FBKDMP = 0.5; +float SimpleReverbEffect::DEFAULT_INDAMP = 0.0005; +float SimpleReverbEffect::DEFAULT_WET = 0.0005; + +SimpleReverbEffect::SimpleReverbEffect(unsigned int in_channels, unsigned int frame_len) + : AudioEffect(in_channels, 2) + , m_left(frame_len) + , m_right(frame_len) +{ + m_reverb = std::make_shared(); + m_reverb->reverb_create(DEFAULT_DRY, DEFAULT_WET, DEFAULT_DECAY); + m_reverb->reverb_set_wet(DEFAULT_WET); + m_reverb->reverb_set_dry(DEFAULT_DRY); + m_reverb->reverb_set_decay(DEFAULT_DECAY); + m_reverb->reverb_set_indamp(DEFAULT_INDAMP); + m_reverb->reverb_set_tankdamp(DEFAULT_FBKDMP); +} + +SimpleReverbEffect::~SimpleReverbEffect() +{ + +} + +void SimpleReverbEffect::reset() +{ + m_reverb->reverb_reset(); +} + +void SimpleReverbEffect::process_internal(const float *input, float *output, unsigned int len) +{ + //保证长度满足要求 + m_left.ensure(len); + m_right.ensure(len); + + auto left = m_left.ptr(); + auto right = m_right.ptr(); + + m_reverb->reverb_process(input, m_in_channels, left, right, len); + + if(output != nullptr && len != 0) + { + for(int i = 0; i < len; ++i) + { + output[2 * i + 0] = left[i]; + output[2 * i + 1] = right[i]; + } + } +} + +void SimpleReverbEffect::set_parameter_value(const std::string &key, float value) +{ + if(key == "Wet") + { + m_reverb->reverb_set_wet(value); + } + else if(key == "Dry") + { + m_reverb->reverb_set_dry(value); + } + else if(key == "Decay") + { + m_reverb->reverb_set_decay(value); + } + else if(key == "Input Damping") + { + m_reverb->reverb_set_indamp(value); + } + else if(key == "Feedback Damping") + { + m_reverb->reverb_set_tankdamp(value); + } +} + +void SimpleReverbEffect::set_parameter_value(const std::string &key, bool value) +{ + if(key == "In Ch.") + { + m_in_channels = value ? 2 : 1; + } + else if(key == "Out Ch.") + { + m_out_channels = value ? 
2 : 1; + } + else + { + AudioEffect::set_parameter_value(key, value); + } +} + +void SimpleReverbEffect::setDecay(float decay) +{ + m_reverb->reverb_set_decay(decay); +} + +void SimpleReverbEffect::setDry(float dry) +{ + m_reverb->reverb_set_dry(dry); +} + +void SimpleReverbEffect::setFeedbackDamping(float damp) +{ + m_reverb->reverb_set_tankdamp(damp); +} + +void SimpleReverbEffect::setInputDamping(float damp) +{ + m_reverb->reverb_set_indamp(damp); +} + +void SimpleReverbEffect::setWet(float wet) +{ + m_reverb->reverb_set_wet(wet); +} + +float SimpleReverbEffect::getWet() +{ + return m_reverb->reverb_get_wet(); +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_reverb_effect/SimpleReverbEffect.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_reverb_effect/SimpleReverbEffect.h new file mode 100644 index 0000000..b93291a --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/saudio_effects/src/simple_reverb_effect/SimpleReverbEffect.h @@ -0,0 +1,75 @@ + +/************************************************************ +* author: yangjiang * +*************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SMULE_SIMPLEREVERBEFFECT_H__ +#define __SMULE_SIMPLEREVERBEFFECT_H__ + +//实现简易混响器 + +#include "AudioEffect.h" +#include "Reverb.h" +#include "Buffer.h" +#include "SAudioEffectsConf.h" + +class SimpleReverbEffect : public AudioEffect +{ +public: + explicit SimpleReverbEffect(unsigned int in_channels, unsigned int frame_len); + virtual ~SimpleReverbEffect(); + +public: + void reset() override ; + void process_internal(const float *input, float *output, unsigned int len) override ; + void set_parameter_value(const std::string &key, float value) override ; + void set_parameter_value(const std::string &key, bool value) override ; + +public: + void setDecay(float decay); + void setDry(float dry); + void setFeedbackDamping(float damp); + void setInputDamping(float damp); + void setWet(float wet); + float getWet(); + +private: + static float DEFAULT_DECAY; + static float DEFAULT_DRY; + static float DEFAULT_FBKDMP; + static float DEFAULT_INDAMP; + static float DEFAULT_WET; + +private: + std::shared_ptr m_reverb;//68 + Smule::Audio::Buffer m_left;//76 + Smule::Audio::Buffer m_right;//92 +}; + +#endif /* __SMULE_SIMPLEREVERBEFFECT_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/CMakeLists.txt new file mode 100644 index 0000000..19b6920 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/CMakeLists.txt @@ -0,0 +1,4 @@ +include_directories(./ inc src) +file(GLOB_RECURSE SLOWFLANGING_SRC_FILES src/*cpp) +add_library(slow_flanging ${SLOWFLANGING_SRC_FILES}) 
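SimpleReverbEffect adapts Reverb to the AudioEffect interface: mono or stereo input, always interleaved stereo output, with the two scratch Buffers holding the per-channel tank results before interleaving. A usage sketch; len counts frames, and process_internal is public in the header above:

SimpleReverbEffect rv(2 /* input channels */, 512 /* frame length */);
rv.set_parameter_value("Wet", 0.3f);
rv.set_parameter_value("Dry", 0.7f);

float in[2 * 512] = { 0 };
float out[2 * 512];
rv.process_internal(in, out, 512);   // output interleaved L/R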
+#set_target_properties(slow_flanging PROPERTIES CXX_VISIBILITY_PRESET hidden) \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/inc/CSlowFlanging.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/inc/CSlowFlanging.h new file mode 100644 index 0000000..381dffc --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/inc/CSlowFlanging.h @@ -0,0 +1,40 @@ +#ifndef __SLOW_FLANGING_H_ +#define __SLOW_FLANGING_H_ + +#include + +#include "CSlowFlangingDef.h" +class CSlowFlanging +{ +public: + int init(int channel, int sample_rate); + void reset(); + void uninit(); + int process(const char *in_buffer, char *out_buffer, int size); + int process(const float *in_buffer, float *out_buffer, int size); + + int process_lr_independent(float *in_left, float *in_right, float *out_left, float *out_right, int in_out_size); +private: + int process_sample(const float *in_samples, float *out_samples, int sample_count, unsigned int &samples_processed, + float *circle_buffer, int &iwr, float *circle_buffer_fb, int &iwr_fb); + +private: + unsigned int m_samples_processed_left; + unsigned int m_samples_processed_right; + //float m_oscillation_period; + int m_oscillation_period; + //std::vector m_delayed_samples; + + float * m_circle_buffer_l; + float * m_circle_buffer_fb_l; + int m_iwr_l; + int m_iwr_fb_l; + + float * m_circle_buffer_r; + float * m_circle_buffer_fb_r; + int m_iwr_r; + int m_iwr_fb_r; + int m_channel; + int m_sample_rate; +}; +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/inc/CSlowFlangingDef.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/inc/CSlowFlangingDef.h new file mode 100644 index 0000000..61ae467 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/inc/CSlowFlangingDef.h @@ -0,0 +1,14 @@ +// +// Created by yangjianli on 2020-01-14. 
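CSlowFlanging sweeps a 0 to ~2.53 ms delay along a sine with a roughly 3.787 s period, the right channel offset half a period from the left. A usage sketch against the header above; for the char overload, size is in bytes of 16-bit interleaved PCM (stereo requires size % 4 == 0), per the checks in CSlowFlanging.cpp:

CSlowFlanging fl;
if(fl.init(2 /* channels */, 44100) == SF_ERR_SUCCESS)
{
    short in_pcm[2 * 512]  = { 0 };
    short out_pcm[2 * 512] = { 0 };
    fl.process((const char *)in_pcm, (char *)out_pcm, (int)sizeof(in_pcm));
    fl.uninit();
}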
+// + +#ifndef AUDIO_EFFECTS_LIB_CSLOWFLANGING_DEF_H +#define AUDIO_EFFECTS_LIB_CSLOWFLANGING_DEF_H +#include "AudioEffectsConf.h" +enum SF_ERR { + SF_ERR_SUCCESS = 0, + SF_ERR_PARAM = -1, + SF_ERR_BASE_H_MALLOC_NULL = -2, + SF_ERR_BASE_H_UNKNOWN = -3, +}; +#endif //AUDIO_EFFECTS_LIB_CSLOWFLANGING_DEF_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/src/CSlowFlanging.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/src/CSlowFlanging.cpp new file mode 100644 index 0000000..84c69fc --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/slow_flanging/src/CSlowFlanging.cpp @@ -0,0 +1,520 @@ +#include "CSlowFlangingDef.h" +#define _USE_MATH_DEFINES +#include +#include "CSlowFlanging.h" + +#define MAX_DELAY_SAMPLE (2.53) // +#define MIN_DELAY_SAMPLE (0.0) + +int CSlowFlanging::init(int channel, int sample_rate) +{ + + m_iwr_l = 0; + m_circle_buffer_l = NULL; + m_iwr_fb_l = 0; + m_circle_buffer_fb_l = NULL; + m_iwr_r = 0; + m_circle_buffer_r = NULL; + m_iwr_fb_r = 0; + m_circle_buffer_fb_r = NULL; + m_channel = channel; + if (channel > 2 || channel < 1) + { + return SF_ERR_PARAM; + } + m_sample_rate = sample_rate; + m_oscillation_period = 3787.0f*(float)m_sample_rate/1000.0f; + m_samples_processed_left = 0; + m_samples_processed_right = m_oscillation_period/2; +#define MAX_DELAY_SAMPLE_COUNT (int(MAX_DELAY_SAMPLE*(float)m_sample_rate/1000.0f)+2) + //m_delayed_samples = std::vector(MAX_DELAY_SAMPLE_COUNT,0); + m_circle_buffer_l = new(std::nothrow) float[MAX_DELAY_SAMPLE_COUNT]; + if (m_circle_buffer_l == NULL) + { + uninit(); + return SF_ERR_BASE_H_MALLOC_NULL; + } + //memset(m_circle_buffer,0,MAX_DELAY_SAMPLE_COUNT); + for(int i =0;i 1.0f ? out_samples[i]/fabs(out_samples[i])*32767.0f : out_samples[i]*32767.0f); + } + if (in_samples != NULL) + { + delete[] in_samples; + in_samples = NULL; + } + if (out_samples != NULL) + { + delete[] out_samples; + out_samples = NULL; + } + } + else if (m_channel == 2) + { + if (size % 4 != 0) + { + return SF_ERR_PARAM; + } + float *in_samples_l = new(std::nothrow) float[size/4]; + if (in_samples_l == NULL) + { + return SF_ERR_BASE_H_MALLOC_NULL; + } + float *in_samples_r = new(std::nothrow) float[size/4]; + if (in_samples_r == NULL) + { + if (in_samples_l != NULL) + { + delete[] in_samples_l; + in_samples_l = NULL; + } + return SF_ERR_BASE_H_MALLOC_NULL; + } + + + for (int i = 0; i < size/4; i++) + { + in_samples_l[i] = *(((short*)in_buffer+i*2))/32767.0f; + in_samples_r[i] = *(((short*)in_buffer+i*2+1))/32767.0f; + } + + float *out_samples_l = new(std::nothrow) float[size/4]; + if (out_samples_l == NULL) + { + if (in_samples_l != NULL) + { + delete[] in_samples_l; + in_samples_l = NULL; + } + if (in_samples_r != NULL) + { + delete[] in_samples_r; + in_samples_r = NULL; + } + return SF_ERR_BASE_H_MALLOC_NULL; + } + float *out_samples_r = new(std::nothrow) float[size/4]; + if (out_samples_r == NULL) + { + if (in_samples_l != NULL) + { + delete[] in_samples_l; + in_samples_l = NULL; + } + if (in_samples_r != NULL) + { + delete[] in_samples_r; + in_samples_r = NULL; + } + if (out_samples_l != NULL) + { + delete[] out_samples_l; + out_samples_l = NULL; + } + return SF_ERR_BASE_H_MALLOC_NULL; + } + + int sample_count_l = process_sample(in_samples_l, out_samples_l, size / 4, m_samples_processed_left, + m_circle_buffer_l, m_iwr_l, m_circle_buffer_fb_l, m_iwr_fb_l); + int sample_count_r = process_sample(in_samples_r, out_samples_r, size / 4, m_samples_processed_right, + m_circle_buffer_r, m_iwr_r, 
m_circle_buffer_fb_r, m_iwr_fb_r); + if (sample_count_l != size/4 || sample_count_r != size/4) + { + if (in_samples_l != NULL) + { + delete[] in_samples_l; + in_samples_l = NULL; + } + if (in_samples_r != NULL) + { + delete[] in_samples_r; + in_samples_r = NULL; + } + if (out_samples_l != NULL) + { + delete[] out_samples_l; + out_samples_l = NULL; + + } + if (out_samples_r != NULL) + { + delete[] out_samples_r; + out_samples_r = NULL; + } + return SF_ERR_BASE_H_UNKNOWN; + } + + for (int i = 0; i < size/4; i++) + { + *((short*)out_buffer+2*i) = (short)(fabs(out_samples_l[i]) > 1.0f ? out_samples_l[i]/fabs(out_samples_l[i])*32767.0f : out_samples_l[i]*32767.0f); + *((short*)out_buffer+2*i+1) = (short)(fabs(out_samples_r[i]) > 1.0f ? out_samples_r[i]/fabs(out_samples_r[i])*32767.0f : out_samples_r[i]*32767.0f); + } + + if (in_samples_l != NULL) + { + delete[] in_samples_l; + in_samples_l = NULL; + } + if (in_samples_r != NULL) + { + delete[] in_samples_r; + in_samples_r = NULL; + } + if (out_samples_l != NULL) + { + delete[] out_samples_l; + out_samples_l = NULL; + + } + if (out_samples_r != NULL) + { + delete[] out_samples_r; + out_samples_r = NULL; + } + } + else + ; + return size; +} + +int CSlowFlanging::process_sample(const float *in_samples, float *out_samples, int sample_count, + unsigned int &samples_processed, + float *circle_buffer, int &iwr, float *circle_buffer_fb, int &iwr_fb) +{ + //float r = (float)(MAX_DELAY_SAMPLE_COUNT - MIN_DELAY_SAMPLE_COUNT)*2.0f/(float)OSCILLATION_PERIOD; +#define MAX_DELAY_SAMPLE_COUNT (int(MAX_DELAY_SAMPLE*(float)m_sample_rate/1000.0f)+2) +#define AVE_DELAY_SAMPLE (((MAX_DELAY_SAMPLE) - (MIN_DELAY_SAMPLE))*(float)m_sample_rate/1000.0f/2) + + float gfb = 0.2f; + float gff = 1.0f; + for (int i = 0; i < sample_count; i++) + { + //int delay_index = (m_samples_processed % OSCILLATION_PERIOD) <= OSCILLATION_PERIOD / 2 ? + // (float)(m_samples_processed % OSCILLATION_PERIOD) * r + MIN_DELAY_SAMPLE_COUNT + // : - (float)(m_samples_processed % OSCILLATION_PERIOD) * r + 2 * MAX_DELAY_SAMPLE_COUNT - MIN_DELAY_SAMPLE_COUNT; + // if (m_samples_processed > OSCILLATION_PERIOD) + // { + // break; + // } + float delay_t = (float)(AVE_DELAY_SAMPLE+MIN_DELAY_SAMPLE) + (AVE_DELAY_SAMPLE*sin(((float)(samples_processed)*2*M_PI)/(float)m_oscillation_period)); + //float delay_t_1 = (float)(MAX_DELAY_SAMPLE_COUNT/2) + (MAX_DELAY_SAMPLE_COUNT/2*sin(((float)(m_samples_processed+m_start_delay+1)*M_PI)/(float)OSCILLATION_PERIOD)); + //printf("%f\n",delay_t); + + int delay_n = int(delay_t); + int delay_n_1 = delay_n + 1;//= delay_t_1 > delay_t ? delay_n+1 : delay_n-1; + + int delay_n_fb = delay_n; + int delay_n_fb_1 = delay_n_fb + 1; + float ita = delay_t - (float)delay_n; + //int delay_n_1 = delay_n+1; + + delay_n = delay_n <= iwr ? iwr - delay_n : MAX_DELAY_SAMPLE_COUNT + iwr - delay_n; + delay_n_1 = delay_n_1 <= iwr ? iwr - delay_n_1 : MAX_DELAY_SAMPLE_COUNT + iwr - delay_n_1; + delay_n_fb = delay_n_fb <= iwr_fb ? iwr_fb - delay_n_fb : MAX_DELAY_SAMPLE_COUNT + iwr_fb - delay_n_fb; + delay_n_fb_1 = delay_n_fb_1 <= iwr_fb ? iwr_fb - delay_n_fb_1 : MAX_DELAY_SAMPLE_COUNT + iwr_fb - delay_n_fb_1; + //delay_n_1 = delay_n_1 <= m_iwr ? 
m_iwr - delay_n_1 : MAX_DELAY_SAMPLE_COUNT+1 + m_iwr - delay_n_1; + //out_samples[i] = in_samples[i] + ((float)delay_n + 1.0f - delay_t)*m_circle_buffer[delay_n]+(delay_t-(float)delay_n)*m_circle_buffer[delay_n_1]; + //m_circle_buffer_fb[m_iwr_fb] = (m_circle_buffer[delay_n] + ita*(m_circle_buffer[delay_n_1]-m_circle_buffer[delay_n])) + // + gfb*(m_circle_buffer_fb[delay_n_fb]+ita*(m_circle_buffer_fb[delay_n_fb_1]-m_circle_buffer_fb[delay_n_fb])); + + //out_samples[i] = in_samples[i] + gff * m_circle_buffer_fb[m_iwr_fb]; + out_samples[i] = in_samples[i] + gff*(circle_buffer[delay_n] + ita*(circle_buffer[delay_n_1]-circle_buffer[delay_n])) + gfb*(circle_buffer_fb[delay_n_fb]+ita*(circle_buffer_fb[delay_n_fb_1]-circle_buffer_fb[delay_n_fb])); + out_samples[i] = 0.6f*out_samples[i]; + samples_processed++; + circle_buffer[iwr] = in_samples[i]; + iwr++; + circle_buffer_fb[iwr_fb] = out_samples[i]; + iwr_fb++; + iwr = iwr >= MAX_DELAY_SAMPLE_COUNT ? 0 : iwr; + iwr_fb = iwr_fb >= MAX_DELAY_SAMPLE_COUNT ? 0 : iwr_fb; + + } + return sample_count; +} + +void CSlowFlanging::uninit() +{ + //m_delayed_samples.clear(); + if (m_circle_buffer_l != NULL) + { + delete[] m_circle_buffer_l; + m_circle_buffer_l = NULL; + } + if (m_circle_buffer_fb_l != NULL) + { + delete[] m_circle_buffer_fb_l; + m_circle_buffer_fb_l = NULL; + } + if (m_circle_buffer_r != NULL) + { + delete[] m_circle_buffer_r; + m_circle_buffer_r = NULL; + } + if (m_circle_buffer_fb_r != NULL) + { + delete[] m_circle_buffer_fb_r; + m_circle_buffer_fb_r = NULL; + } +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/CMakeLists.txt new file mode 100644 index 0000000..7a39e15 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/CMakeLists.txt @@ -0,0 +1,4 @@ +include_directories(./ inc ref src src/common ref ref/kiss_fft) +file(GLOB_RECURSE SUPERSOUND_SRC_FILES src/*cpp ref/*cpp) +add_library(supersound ${SUPERSOUND_SRC_FILES}) + diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/impulse_types.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/impulse_types.h new file mode 100755 index 0000000..0f54d5a --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/impulse_types.h @@ -0,0 +1,59 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//在 impulse 工程中使用到的常量和结构 + +#ifndef __IMPULSE_TYPES_H__ +#define __IMPULSE_TYPES_H__ + +#include +#include "CImEffectParams.h" +//typedef struct _Impulse_Param +//{ +// //采样率,单位 hz +// int32_t fs; +// //输入声道数 +// int32_t in_channels; +// //输出声道数,需和输入通道相同 +// int32_t out_channels; +// //FIR 窗 bit 长度,最小为 10 +// int32_t window_bits; +// //im 响应,外围需要保证其采样率和输入的采样率一致 +// float * im_response; +// //响应的长度 +// int32_t response_len; +// //响应的通道数,该通道数必须与输入通道数相同或为1,为1时表示输入的所有通道使用相同的响应 +// int32_t response_channels; +// // 每次处理时输入的音频的长度(单声道的长度),用于计算延迟 +// int32_t process_buffer_len; +//} Impulse_Param; + +#endif /* __IMPULSE_TYPES_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/supersound_err.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/supersound_err.h new file mode 100755 index 0000000..8f9de9c --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/supersound_err.h @@ -0,0 +1,45 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SUPERSOUND_ERR_H__ +#define __SUPERSOUND_ERR_H__ + +//成功 +#define ERROR_SUPERSOUND_SUCCESS 0 + +//输入参数有误 +#define ERROR_SUPERSOUND_PARAM 2000 +//内存不够 +#define ERROR_SUPERSOUND_MEMORY 2001 + +#define ERROR_SUPERSOUND_INPUT_NOT_SAME_OUT 2002 + +#endif /* __SUPERSOUND_ERR_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/supersound_types.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/supersound_types.h new file mode 100755 index 0000000..1043f7c --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/inc/supersound_types.h @@ -0,0 +1,74 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//在 super sound 工程中使用到的常量和结构 + +#ifndef __SUPERSOUND_TYPES_H__ +#define __SUPERSOUND_TYPES_H__ + +#include + +//+ ---------------------------------------------------- +//+ 版本定义,实际含义是 N 位 2 位 2 位:3.10.01 版本 +//+ ---------------------------------------------------- +#define SUPERSOUND_VERSION 31001 + +//+ ---------------------------------------------------- +//+ 实例定义 +//+ ---------------------------------------------------- +typedef void* SUPERSOUND_INST; + +//+ ---------------------------------------------------- +//+ 音效类型定义 +//+ ---------------------------------------------------- +enum SUPERSOUND_EFFECT_TYPE +{ + SUPERSOUND_MIN_TYPE = -1, //类型最小值,限制输入 + + SUPERSOUND_IMPULSE_TYPE, //IM 效果 + + SUPERSOUND_MAX_TYPE, //类型最大值,限制输入 +}; + +//声道的宏定义,方便在数组中表示 +#define CHANNEL_FL 0 +#define CHANNEL_FC 1 +#define CHANNEL_FR 2 +#define CHANNEL_SL 3 +#define CHANNEL_SR 4 +#define CHANNEL_LFE 5 +//后环绕 +#define CHANNEL_BSUR 6 +#define CHANNEL_BL 6 +#define CHANNEL_BR 7 +#define CHANNEL_MAX 8 + +#endif /* __SUPERSOUND_TYPES_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/_kiss_fft_guts.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/_kiss_fft_guts.h new file mode 100755 index 0000000..62951be --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/_kiss_fft_guts.h @@ -0,0 +1,132 @@ +/* +Copyright (c) 2003-2004, Mark Borgerding + +All rights reserved. + +Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. + * Neither the author nor the names of any contributors may be used to endorse or promote products derived from this software without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +*/ + +/* kiss_fft.h + defines kiss_fft_scalar as either short or a float type + and defines + typedef struct { kiss_fft_scalar r; kiss_fft_scalar i; }kiss_fft_cpx; */ +#include "kiss_fft.h" + + +#define MAXFACTORS 32 +/* e.g. 
an fft of length 128 has 4 factors + as far as kissfft is concerned + 4*4*4*2 + */ + +struct kiss_fft_state{ + int nfft; + int inverse; + int factors[2*MAXFACTORS]; + kiss_fft_cpx twiddles[1]; +}; + +/* + Explanation of macros dealing with complex math: + + C_MUL(m,a,b) : m = a*b + C_FIXDIV( c , div ) : if a fixed point impl., c /= div. noop otherwise + C_SUB( res, a,b) : res = a - b + C_SUBFROM( res , a) : res -= a + C_ADDTO( res , a) : res += a + * */ +#ifdef FIXED_POINT + +#if defined(CHECK_OVERFLOW) +# define CHECK_OVERFLOW_OP(a,op,b) \ + if ( (long)(a) op (long)(b) > 32767 || (long)(a) op (long)(b) < -32768 ) { \ + fprintf(stderr,"WARNING:overflow @ " __FILE__ "(%d): (%d " #op" %d) = %ld\n",__LINE__,(a),(b),(long)(a) op (long)(b) ); } +#endif + + +# define smul(a,b) ( (long)(a)*(b) ) +# define sround( x ) (short)( ( (x) + (1<<14) ) >>15 ) + +# define S_MUL(a,b) sround( smul(a,b) ) + +# define C_MUL(m,a,b) \ + do{ (m).r = sround( smul((a).r,(b).r) - smul((a).i,(b).i) ); \ + (m).i = sround( smul((a).r,(b).i) + smul((a).i,(b).r) ); }while(0) + +# define DIVSCALAR(x,k) \ + (x) = sround( smul( x, 32767/k ) ) + +# define C_FIXDIV(c,div) \ + do { DIVSCALAR( (c).r , div); \ + DIVSCALAR( (c).i , div); }while (0) + +# define C_MULBYSCALAR( c, s ) \ + do{ (c).r = sround( smul( (c).r , s ) ) ;\ + (c).i = sround( smul( (c).i , s ) ) ; }while(0) + +#else /* not FIXED_POINT*/ + +# define S_MUL(a,b) ( (a)*(b) ) +#define C_MUL(m,a,b) \ + do{ (m).r = (a).r*(b).r - (a).i*(b).i;\ + (m).i = (a).r*(b).i + (a).i*(b).r; }while(0) +# define C_FIXDIV(c,div) /* NOOP */ +# define C_MULBYSCALAR( c, s ) \ + do{ (c).r *= (s);\ + (c).i *= (s); }while(0) +#endif + +#ifndef CHECK_OVERFLOW_OP +# define CHECK_OVERFLOW_OP(a,op,b) /* noop */ +#endif + +#define C_ADD( res, a,b)\ + do { \ + CHECK_OVERFLOW_OP((a).r,+,(b).r)\ + CHECK_OVERFLOW_OP((a).i,+,(b).i)\ + (res).r=(a).r+(b).r; (res).i=(a).i+(b).i; \ + }while(0) +#define C_SUB( res, a,b)\ + do { \ + CHECK_OVERFLOW_OP((a).r,-,(b).r)\ + CHECK_OVERFLOW_OP((a).i,-,(b).i)\ + (res).r=(a).r-(b).r; (res).i=(a).i-(b).i; \ + }while(0) +#define C_ADDTO( res , a)\ + do { \ + CHECK_OVERFLOW_OP((res).r,+,(a).r)\ + CHECK_OVERFLOW_OP((res).i,+,(a).i)\ + (res).r += (a).r; (res).i += (a).i;\ + }while(0) + +#define C_SUBFROM( res , a)\ + do {\ + CHECK_OVERFLOW_OP((res).r,-,(a).r)\ + CHECK_OVERFLOW_OP((res).i,-,(a).i)\ + (res).r -= (a).r; (res).i -= (a).i; \ + }while(0) + + + + +static +void kf_cexp(kiss_fft_cpx * x,double phase) /* returns e ** (j*phase) */ +{ +#ifdef FIXED_POINT + x->r = (kiss_fft_scalar) (32767 * cos (phase)); + x->i = (kiss_fft_scalar) (32767 * sin (phase)); +#else + x->r = (kiss_fft_scalar) cos (phase); + x->i = (kiss_fft_scalar) sin (phase); +#endif +} + +/* a debugging function */ +#define pcpx(c)\ + fprintf(stderr,"%g + %gi\n",(double)((c)->r),(double)((c)->i) ) diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fft.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fft.cpp new file mode 100755 index 0000000..62c787f --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fft.cpp @@ -0,0 +1,369 @@ +/* +Copyright (c) 2003-2004, Mark Borgerding + +All rights reserved. + +Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. 
+ * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. + * Neither the author nor the names of any contributors may be used to endorse or promote products derived from this software without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +*/ +#include "_kiss_fft_guts.h" +/* The guts header contains all the multiplication and addition macros that are defined for + fixed or floating point complex numbers. It also delares the kf_ internal functions. + */ + +static kiss_fft_cpx *scratchbuf=NULL; +static size_t nscratchbuf=0; +static kiss_fft_cpx *tmpbuf=NULL; +static size_t ntmpbuf=0; + +#define CHECKBUF(buf,nbuf,n) \ + do { \ + if ( nbuf < (size_t)(n) ) {\ + buf = (kiss_fft_cpx*)realloc(buf,sizeof(kiss_fft_cpx)*(n)); \ + nbuf = (size_t)(n); \ + } \ + }while(0) + + +static void kf_bfly2( + kiss_fft_cpx * Fout, + const size_t fstride, + const kiss_fft_cfg st, + int m + ) +{ + kiss_fft_cpx * Fout2; + kiss_fft_cpx * tw1 = st->twiddles; + kiss_fft_cpx t; + Fout2 = Fout + m; + do{ + C_FIXDIV(*Fout,2); C_FIXDIV(*Fout2,2); + + C_MUL (t, *Fout2 , *tw1); + tw1 += fstride; + C_SUB( *Fout2 , *Fout , t ); + C_ADDTO( *Fout , t ); + ++Fout2; + ++Fout; + }while (--m); +} + +static void kf_bfly4( + kiss_fft_cpx * Fout, + const size_t fstride, + const kiss_fft_cfg st, + const size_t m + ) +{ + kiss_fft_cpx *tw1,*tw2,*tw3; + kiss_fft_cpx scratch[6]; + size_t k=m; + const size_t m2=2*m; + const size_t m3=3*m; + + tw3 = tw2 = tw1 = st->twiddles; + + do { + C_FIXDIV(*Fout,4); C_FIXDIV(Fout[m],4); C_FIXDIV(Fout[m2],4); C_FIXDIV(Fout[m3],4); + + C_MUL(scratch[0],Fout[m] , *tw1 ); + C_MUL(scratch[1],Fout[m2] , *tw2 ); + C_MUL(scratch[2],Fout[m3] , *tw3 ); + + C_SUB( scratch[5] , *Fout, scratch[1] ); + C_ADDTO(*Fout, scratch[1]); + C_ADD( scratch[3] , scratch[0] , scratch[2] ); + C_SUB( scratch[4] , scratch[0] , scratch[2] ); + C_SUB( Fout[m2], *Fout, scratch[3] ); + tw1 += fstride; + tw2 += fstride*2; + tw3 += fstride*3; + C_ADDTO( *Fout , scratch[3] ); + + if(st->inverse) { + Fout[m].r = scratch[5].r - scratch[4].i; + Fout[m].i = scratch[5].i + scratch[4].r; + Fout[m3].r = scratch[5].r + scratch[4].i; + Fout[m3].i = scratch[5].i - scratch[4].r; + }else{ + Fout[m].r = scratch[5].r + scratch[4].i; + Fout[m].i = scratch[5].i - scratch[4].r; + Fout[m3].r = scratch[5].r - scratch[4].i; + Fout[m3].i = scratch[5].i + scratch[4].r; + } + ++Fout; + }while(--k); +} + +static void kf_bfly3( + kiss_fft_cpx * Fout, + const size_t fstride, + const kiss_fft_cfg st, + size_t m + ) +{ + size_t k=m; + const size_t m2 = 2*m; + kiss_fft_cpx *tw1,*tw2; + kiss_fft_cpx scratch[5]; + kiss_fft_cpx epi3; + epi3 = st->twiddles[fstride*m]; + + 
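/* Note on the radix-3 butterfly below: at a radix-3 stage fstride*m == nfft/3,
   so epi3 is the twiddle exp(-j*2*pi/3) and epi3.i == -sin(2*pi/3) for a
   forward transform. scratch[3] holds the sum and scratch[0] the difference
   of the two twiddled inputs; the three outputs are Fout + sum, and
   (Fout - sum/2) +/- j*(difference * epi3.i). */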
tw1=tw2=st->twiddles; + + do{ + C_FIXDIV(*Fout,3); C_FIXDIV(Fout[m],3); C_FIXDIV(Fout[m2],3); + + C_MUL(scratch[1],Fout[m] , *tw1); + C_MUL(scratch[2],Fout[m2] , *tw2); + + C_ADD(scratch[3],scratch[1],scratch[2]); + C_SUB(scratch[0],scratch[1],scratch[2]); + tw1 += fstride; + tw2 += fstride*2; + + Fout[m].r = Fout->r - scratch[3].r/2; + Fout[m].i = Fout->i - scratch[3].i/2; + + C_MULBYSCALAR( scratch[0] , epi3.i ); + + C_ADDTO(*Fout,scratch[3]); + + Fout[m2].r = Fout[m].r + scratch[0].i; + Fout[m2].i = Fout[m].i - scratch[0].r; + + Fout[m].r -= scratch[0].i; + Fout[m].i += scratch[0].r; + + ++Fout; + }while(--k); +} + +static void kf_bfly5( + kiss_fft_cpx * Fout, + const size_t fstride, + const kiss_fft_cfg st, + int m + ) +{ + kiss_fft_cpx *Fout0,*Fout1,*Fout2,*Fout3,*Fout4; + int u; + kiss_fft_cpx scratch[13]; + kiss_fft_cpx * twiddles = st->twiddles; + kiss_fft_cpx *tw; + kiss_fft_cpx ya,yb; + ya = twiddles[fstride*m]; + yb = twiddles[fstride*2*m]; + + Fout0=Fout; + Fout1=Fout0+m; + Fout2=Fout0+2*m; + Fout3=Fout0+3*m; + Fout4=Fout0+4*m; + + tw=st->twiddles; + for ( u=0; u<m; ++u ) { + C_FIXDIV( *Fout0,5); C_FIXDIV( *Fout1,5); C_FIXDIV( *Fout2,5); C_FIXDIV( *Fout3,5); C_FIXDIV( *Fout4,5); + scratch[0] = *Fout0; + + C_MUL(scratch[1] ,*Fout1, tw[u*fstride]); + C_MUL(scratch[2] ,*Fout2, tw[2*u*fstride]); + C_MUL(scratch[3] ,*Fout3, tw[3*u*fstride]); + C_MUL(scratch[4] ,*Fout4, tw[4*u*fstride]); + + C_ADD( scratch[7],scratch[1],scratch[4]); + C_SUB( scratch[10],scratch[1],scratch[4]); + C_ADD( scratch[8],scratch[2],scratch[3]); + C_SUB( scratch[9],scratch[2],scratch[3]); + + Fout0->r += scratch[7].r + scratch[8].r; + Fout0->i += scratch[7].i + scratch[8].i; + + scratch[5].r = scratch[0].r + S_MUL(scratch[7].r,ya.r) + S_MUL(scratch[8].r,yb.r); + scratch[5].i = scratch[0].i + S_MUL(scratch[7].i,ya.r) + S_MUL(scratch[8].i,yb.r); + + scratch[6].r = S_MUL(scratch[10].i,ya.i) + S_MUL(scratch[9].i,yb.i); + scratch[6].i = -S_MUL(scratch[10].r,ya.i) - S_MUL(scratch[9].r,yb.i); + + C_SUB(*Fout1,scratch[5],scratch[6]); + C_ADD(*Fout4,scratch[5],scratch[6]); + + scratch[11].r = scratch[0].r + S_MUL(scratch[7].r,yb.r) + S_MUL(scratch[8].r,ya.r); + scratch[11].i = scratch[0].i + S_MUL(scratch[7].i,yb.r) + S_MUL(scratch[8].i,ya.r); + scratch[12].r = - S_MUL(scratch[10].i,yb.i) + S_MUL(scratch[9].i,ya.i); + scratch[12].i = S_MUL(scratch[10].r,yb.i) - S_MUL(scratch[9].r,ya.i); + + C_ADD(*Fout2,scratch[11],scratch[12]); + C_SUB(*Fout3,scratch[11],scratch[12]); + + ++Fout0;++Fout1;++Fout2;++Fout3;++Fout4; + } +} + +/* perform the butterfly for one stage of a mixed radix FFT */ +static void kf_bfly_generic( + kiss_fft_cpx * Fout, + const size_t fstride, + const kiss_fft_cfg st, + int m, + int p + ) +{ + int u,k,q1,q; + kiss_fft_cpx * twiddles = st->twiddles; + kiss_fft_cpx t; + int Norig = st->nfft; + + CHECKBUF(scratchbuf,nscratchbuf,p); + + for ( u=0; u<m; ++u ) { + k=u; + for ( q1=0 ; q1<p ; ++q1 ) { + scratchbuf[q1] = Fout[ k ]; + C_FIXDIV(scratchbuf[q1],p); + k += m; + } + + k=u; + for ( q1=0 ; q1<p ; ++q1 ) { + int twidx=0; + Fout[ k ] = scratchbuf[0]; + for (q=1;q<p;++q ) { + twidx += fstride * k; + if (twidx>=Norig) twidx-=Norig; + C_MUL(t,scratchbuf[q] , twiddles[twidx] ); + C_ADDTO( Fout[ k ] ,t); + } + k += m; + } + } +} + +static +void kf_work( + kiss_fft_cpx * Fout, + const kiss_fft_cpx * f, + const size_t fstride, + int in_stride, + int * factors, + const kiss_fft_cfg st + ) +{ + kiss_fft_cpx * Fout_beg=Fout; + const int p=*factors++; /* the radix */ + const int m=*factors++; /* stage's fft length/p */ + const kiss_fft_cpx * Fout_end = Fout + p*m; + + if (m==1) { + do{ + *Fout = *f; + f += fstride*in_stride; + }while(++Fout != Fout_end ); + }else{ + do{ + kf_work( Fout , f, fstride*p, in_stride, factors,st); + f += fstride*in_stride; + }while( (Fout += m) != Fout_end ); + } + + Fout=Fout_beg; + + switch (p) { + case 2: kf_bfly2(Fout,fstride,st,m); break; + case 3: kf_bfly3(Fout,fstride,st,m); break; + case 4: kf_bfly4(Fout,fstride,st,m); break; + case 5: kf_bfly5(Fout,fstride,st,m); break; + default: kf_bfly_generic(Fout,fstride,st,m,p); break; + } +}
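kf_work() above walks the factor list that kf_factor() below produces, recursing on the sub-FFTs and then applying the butterfly that matches each radix. From the caller's side all of this stays behind the small C API declared in kiss_fft.h; here is a minimal forward-transform sketch (the input signal is illustrative):

#include "kiss_fft.h"

void kiss_fft_example(void)
{
    const int nfft = 1024;
    kiss_fft_cpx in[1024];
    kiss_fft_cpx out[1024];
    kiss_fft_cfg cfg = kiss_fft_alloc(nfft, 0 /* forward */, NULL, NULL);
    if (cfg == NULL)
        return;
    for (int i = 0; i < nfft; ++i) {
        in[i].r = (i % 16 == 0) ? 1.0f : 0.0f;  // sparse impulse train
        in[i].i = 0.0f;
    }
    kiss_fft(cfg, in, out);  // out[k] now holds the complex spectrum
    kiss_fft_free(cfg);      // the cfg is a single malloc'd block
}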
+ +/* facbuf is populated by p1,m1,p2,m2, ... +where +p[i] * m[i] = m[i-1] +m0 = n */ +static +void kf_factor(int n,int * facbuf) +{ + int p=4; + double floor_sqrt; + floor_sqrt = floor( sqrt((double)n) ); + + /*factor out powers of 4, powers of 2, then any remaining primes */ + do { + while (n % p) { + switch (p) { + case 4: p = 2; break; + case 2: p = 3; break; + default: p += 2; break; + } + if (p > floor_sqrt) + p = n; /* no more factors, skip to end */ + } + n /= p; + *facbuf++ = p; + *facbuf++ = n; + } while (n > 1); +} + +/* +* +* User-callable function to allocate all necessary storage space for the fft. +* +* The return value is a contiguous block of memory, allocated with malloc. As such, +* It can be freed with free(), rather than a kiss_fft-specific function. +* */ +kiss_fft_cfg kiss_fft_alloc(int nfft,int inverse_fft,void * mem,size_t * lenmem ) +{ + kiss_fft_cfg st=NULL; + size_t memneeded = sizeof(struct kiss_fft_state) + + sizeof(kiss_fft_cpx)*(nfft-1); /* twiddle factors*/ + + if ( lenmem==NULL ) { + st = ( kiss_fft_cfg)malloc( memneeded ); + }else{ + if (*lenmem >= memneeded) + st = (kiss_fft_cfg)mem; + *lenmem = memneeded; + } + if (st) { + int i; + st->nfft=nfft; + st->inverse = inverse_fft; + + for (i=0;i<nfft;++i) { + const double pi=3.141592653589793238462643383279502884197169399375105820974944; + double phase = -2*pi*i / nfft; + if (st->inverse) + phase *= -1; + kf_cexp(st->twiddles+i, phase ); + } + + kf_factor(nfft,st->factors); + } + return st; +} + + + + +void kiss_fft_stride(kiss_fft_cfg st,const kiss_fft_cpx *fin,kiss_fft_cpx *fout,int in_stride) +{ + if (fin == fout) { + CHECKBUF(tmpbuf,ntmpbuf,st->nfft); + kf_work(tmpbuf,fin,1,in_stride, st->factors,st); + memcpy(fout,tmpbuf,sizeof(kiss_fft_cpx)*st->nfft); + }else{ + kf_work( fout, fin, 1,in_stride, st->factors,st ); + } +} + +void kiss_fft(kiss_fft_cfg cfg,const kiss_fft_cpx *fin,kiss_fft_cpx *fout) +{ + kiss_fft_stride(cfg,fin,fout,1); +} + diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fft.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fft.h new file mode 100755 index 0000000..1e9f023 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fft.h @@ -0,0 +1,92 @@ +#ifndef KISS_FFT_H +#define KISS_FFT_H + +#include <stdlib.h> +#include <stdio.h> +#include <math.h> +#include <string.h> + +#ifdef __cplusplus +extern "C" { +#endif + +/* + ATTENTION! + If you would like a : + -- a utility that will handle the caching of fft objects + -- real-only (no imaginary time component ) FFT + -- a multi-dimensional FFT + -- a command-line utility to perform ffts + -- a command-line utility to perform fast-convolution filtering + + Then see kfc.h kiss_fftr.h kiss_fftnd.h fftutil.c kiss_fastfir.c + in the tools/ directory. +*/ + +#ifdef FIXED_POINT +# define kiss_fft_scalar short +#else +# ifndef kiss_fft_scalar +/* default is float */ +# define kiss_fft_scalar float +# endif +#endif + +typedef struct { + kiss_fft_scalar r; + kiss_fft_scalar i; +}kiss_fft_cpx; + +typedef struct kiss_fft_state* kiss_fft_cfg; + +/* + * kiss_fft_alloc + * + * Initialize a FFT (or IFFT) algorithm's cfg/state buffer. + * + * typical usage: kiss_fft_cfg mycfg=kiss_fft_alloc(1024,0,NULL,NULL); + * + * The return value from fft_alloc is a cfg buffer used internally + * by the fft routine or NULL. + * + * If lenmem is NULL, then kiss_fft_alloc will allocate a cfg buffer using malloc. + * The returned value should be free()d when done to avoid memory leaks.
+ * + * The state can be placed in a user supplied buffer 'mem': + * If lenmem is not NULL and mem is not NULL and *lenmem is large enough, + * then the function places the cfg in mem and the size used in *lenmem + * and returns mem. + * + * If lenmem is not NULL and ( mem is NULL or *lenmem is not large enough), + * then the function returns NULL and places the minimum cfg + * buffer size in *lenmem. + * */ + +kiss_fft_cfg kiss_fft_alloc(int nfft,int inverse_fft,void * mem,size_t * lenmem); + +/* + * kiss_fft(cfg,in_out_buf) + * + * Perform an FFT on a complex input buffer. + * for a forward FFT, + * fin should be f[0] , f[1] , ... ,f[nfft-1] + * fout will be F[0] , F[1] , ... ,F[nfft-1] + * Note that each element is complex and can be accessed like + f[k].r and f[k].i + * */ +void kiss_fft(kiss_fft_cfg cfg,const kiss_fft_cpx *fin,kiss_fft_cpx *fout); + +/* + A more generic version of the above function. It reads its input from every Nth sample. + * */ +void kiss_fft_stride(kiss_fft_cfg cfg,const kiss_fft_cpx *fin,kiss_fft_cpx *fout,int fin_stride); + +/* If kiss_fft_alloc allocated a buffer, it is one contiguous + buffer and can be simply free()d when no longer needed*/ +#define kiss_fft_free free + +#ifdef __cplusplus +} +#endif + +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftnd.c b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftnd.c new file mode 100755 index 0000000..45be848 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftnd.c @@ -0,0 +1,173 @@ + + +/* +Copyright (c) 2003-2004, Mark Borgerding + +All rights reserved. + +Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. + * Neither the author nor the names of any contributors may be used to endorse or promote products derived from this software without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
+*/ + +#include "kiss_fftnd.h" +#include "_kiss_fft_guts.h" + +struct kiss_fftnd_state{ + int dimprod; /* dimsum would be mighty tasty right now */ + int ndims; + int *dims; + kiss_fft_cfg *states; /* cfg states for each dimension */ + kiss_fft_cpx * tmpbuf; /*buffer capable of hold the entire buffer */ +}; + +kiss_fftnd_cfg kiss_fftnd_alloc(int *dims,int ndims,int inverse_fft,void*mem,size_t*lenmem) +{ + kiss_fftnd_cfg st = NULL; + int i; + int dimprod=1; + size_t memneeded = sizeof(struct kiss_fftnd_state); + char * ptr; + + for (i=0;istates[i] */ + dimprod *= dims[i]; + } + memneeded += sizeof(int) * ndims;/* st->dims */ + memneeded += sizeof(void*) * ndims;/* st->states */ + memneeded += sizeof(kiss_fft_cpx) * dimprod; /* st->tmpbuf */ + + if (lenmem == NULL) {/* allocate for the caller*/ + st = (kiss_fftnd_cfg) malloc (memneeded); + } else { /* initialize supplied buffer if big enough */ + if (*lenmem >= memneeded) + st = (kiss_fftnd_cfg) mem; + *lenmem = memneeded; /*tell caller how big struct is (or would be) */ + } + if (!st) + return NULL; /*malloc failed or buffer too small */ + + st->dimprod = dimprod; + st->ndims = ndims; + ptr=(char*)(st+1); + + st->states = (kiss_fft_cfg *)ptr; + ptr += sizeof(void*) * ndims; + + st->dims = (int*)ptr; + ptr += sizeof(int) * ndims; + + st->tmpbuf = (kiss_fft_cpx*)ptr; + ptr += sizeof(kiss_fft_cpx) * dimprod; + + for (i=0;idims[i] = dims[i]; + kiss_fft_alloc (st->dims[i], inverse_fft, NULL, &len); + st->states[i] = kiss_fft_alloc (st->dims[i], inverse_fft, ptr,&len); + ptr += len; + } + return st; +} + +/* + This works by tackling one dimension at a time. + + In effect, + Each stage starts out by reshaping the matrix into a DixSi 2d matrix. + A Di-sized fft is taken of each column, transposing the matrix as it goes. + +Here's a 3-d example: +Take a 2x3x4 matrix, laid out in memory as a contiguous buffer + [ [ [ a b c d ] [ e f g h ] [ i j k l ] ] + [ [ m n o p ] [ q r s t ] [ u v w x ] ] ] + +Stage 0 ( D=2): treat the buffer as a 2x12 matrix + [ [a b ... k l] + [m n ... w x] ] + + FFT each column with size 2. + Transpose the matrix at the same time using kiss_fft_stride. + + [ [ a+m a-m ] + [ b+n b-n] + ... + [ k+w k-w ] + [ l+x l-x ] ] + + Note fft([x y]) == [x+y x-y] + +Stage 1 ( D=3) treats the buffer (the output of stage D=2) as an 3x8 matrix, + [ [ a+m a-m b+n b-n c+o c-o d+p d-p ] + [ e+q e-q f+r f-r g+s g-s h+t h-t ] + [ i+u i-u j+v j-v k+w k-w l+x l-x ] ] + + And perform FFTs (size=3) on each of the columns as above, transposing + the matrix as it goes. The output of stage 1 is + (Legend: ap = [ a+m e+q i+u ] + am = [ a-m e-q i-u ] ) + + [ [ sum(ap) fft(ap)[0] fft(ap)[1] ] + [ sum(am) fft(am)[0] fft(am)[1] ] + [ sum(bp) fft(bp)[0] fft(bp)[1] ] + [ sum(bm) fft(bm)[0] fft(bm)[1] ] + [ sum(cp) fft(cp)[0] fft(cp)[1] ] + [ sum(cm) fft(cm)[0] fft(cm)[1] ] + [ sum(dp) fft(dp)[0] fft(dp)[1] ] + [ sum(dm) fft(dm)[0] fft(dm)[1] ] ] + +Stage 2 ( D=4) treats this buffer as a 4*6 matrix, + [ [ sum(ap) fft(ap)[0] fft(ap)[1] sum(am) fft(am)[0] fft(am)[1] ] + [ sum(bp) fft(bp)[0] fft(bp)[1] sum(bm) fft(bm)[0] fft(bm)[1] ] + [ sum(cp) fft(cp)[0] fft(cp)[1] sum(cm) fft(cm)[0] fft(cm)[1] ] + [ sum(dp) fft(dp)[0] fft(dp)[1] sum(dm) fft(dm)[0] fft(dm)[1] ] ] + + Then FFTs each column, transposing as it goes. + + The resulting matrix is the 3d FFT of the 2x3x4 input matrix. + + Note as a sanity check that the first element of the final + stage's output (DC term) is + sum( [ sum(ap) sum(bp) sum(cp) sum(dp) ] ) + , i.e. the summation of all 24 input elements. 
+ + */ +void kiss_fftnd(kiss_fftnd_cfg st,const kiss_fft_cpx *fin,kiss_fft_cpx *fout) +{ + int i,k; + const kiss_fft_cpx * bufin=fin; + kiss_fft_cpx * bufout; + + /*arrange it so the last bufout == fout*/ + if ( st->ndims & 1 ) { + bufout = fout; + if (fin==fout) { + memcpy( st->tmpbuf, fin, sizeof(kiss_fft_cpx) * st->dimprod ); + bufin = st->tmpbuf; + } + }else + bufout = st->tmpbuf; + + for ( k=0; k < st->ndims; ++k) { + int curdim = st->dims[k]; + int stride = st->dimprod / curdim; + + for ( i=0 ; istates[k], bufin+i , bufout+i*curdim, stride ); + + /*toggle back and forth between the two buffers*/ + if (bufout == st->tmpbuf){ + bufout = fout; + bufin = st->tmpbuf; + }else{ + bufout = st->tmpbuf; + bufin = fout; + } + } +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftnd.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftnd.h new file mode 100755 index 0000000..1404674 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftnd.h @@ -0,0 +1,18 @@ +#ifndef KISS_FFTND_H +#define KISS_FFTND_H + +#include "kiss_fft.h" + +#ifdef __cplusplus +extern "C" { +#endif + +typedef struct kiss_fftnd_state * kiss_fftnd_cfg; + +kiss_fftnd_cfg kiss_fftnd_alloc(int *dims,int ndims,int inverse_fft,void*mem,size_t*lenmem); +void kiss_fftnd(kiss_fftnd_cfg cfg,const kiss_fft_cpx *fin,kiss_fft_cpx *fout); + +#ifdef __cplusplus +} +#endif +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftr.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftr.cpp new file mode 100755 index 0000000..416ede8 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftr.cpp @@ -0,0 +1,141 @@ +/* +Copyright (c) 2003-2004, Mark Borgerding + +All rights reserved. + +Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. + * Neither the author nor the names of any contributors may be used to endorse or promote products derived from this software without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
+*/ +#include "kiss_fftr.h" +#include "_kiss_fft_guts.h" + +struct kiss_fftr_state{ + kiss_fft_cfg substate; + kiss_fft_cpx * tmpbuf; + kiss_fft_cpx * super_twiddles; +}; + +kiss_fftr_cfg kiss_fftr_alloc(int nfft,int inverse_fft,void * mem,size_t * lenmem) +{ + int i; + kiss_fftr_cfg st = NULL; + size_t subsize, memneeded; + + if (nfft & 1) { + // fprintf(stderr,"Real FFT optimization must be even.\n"); + return NULL; + } + nfft >>= 1; + + kiss_fft_alloc (nfft, inverse_fft, NULL, &subsize); + memneeded = sizeof(struct kiss_fftr_state) + subsize + sizeof(kiss_fft_cpx) * ( nfft * 2); + + if (lenmem == NULL) { + st = (kiss_fftr_cfg) malloc (memneeded); + } else { + if (*lenmem >= memneeded) + st = (kiss_fftr_cfg) mem; + *lenmem = memneeded; + } + if (!st) + return NULL; + + st->substate = (kiss_fft_cfg) (st + 1); /*just beyond kiss_fftr_state struct */ + st->tmpbuf = (kiss_fft_cpx *) (((char *) st->substate) + subsize); + st->super_twiddles = st->tmpbuf + nfft; + kiss_fft_alloc(nfft, inverse_fft, st->substate, &subsize); + + for (i = 0; i < nfft; ++i) { + double phase = -3.14159265358979323846264338327 * ((double) i / nfft + .5); + if (inverse_fft) + phase *= -1; + kf_cexp (st->super_twiddles+i,phase); + } + return st; +} + +void kiss_fftr(kiss_fftr_cfg st,const kiss_fft_scalar *timedata,kiss_fft_cpx *freqdata) +{ + /* input buffer timedata is stored row-wise */ + int k,N; + kiss_fft_cpx fpnk,fpk,f1k,f2k,tw,tdc; + + if ( st->substate->inverse) { + // fprintf(stderr,"kiss fft usage error: improper alloc\n"); + return; + } + + N = st->substate->nfft; + + /*perform the parallel fft of two real signals packed in real,imag*/ + kiss_fft( st->substate , (const kiss_fft_cpx*)timedata, st->tmpbuf ); + + tdc.r = st->tmpbuf[0].r; + tdc.i = st->tmpbuf[0].i; + C_FIXDIV(tdc,2); + + CHECK_OVERFLOW_OP(tdc.r ,+, tdc.i); + freqdata[0].r = tdc.r + tdc.i; + freqdata[0].i = 0; + + for (k=1;k <= N/2 ; ++k ) { + + fpk = st->tmpbuf[k]; + fpnk.r = st->tmpbuf[N-k].r; + fpnk.i = -st->tmpbuf[N-k].i; + C_FIXDIV(fpk,2); + C_FIXDIV(fpnk,2); + + C_ADD( f1k, fpk , fpnk ); + C_SUB( f2k, fpk , fpnk ); + C_MUL( tw , f2k , st->super_twiddles[k]); + + C_ADD( freqdata[k] , f1k ,tw); + freqdata[k].r = (f1k.r + tw.r) / 2; + freqdata[k].i = (f1k.i + tw.i) / 2; + + freqdata[N-k].r = (f1k.r - tw.r)/2; + freqdata[N-k].i = - (f1k.i - tw.i)/2; + } + CHECK_OVERFLOW_OP(tdc.r ,-, tdc.i); + freqdata[N].r = tdc.r - tdc.i; + freqdata[N].i = 0; +} + +void kiss_fftri(kiss_fftr_cfg st,const kiss_fft_cpx *freqdata,kiss_fft_scalar *timedata) +{ + /* input buffer timedata is stored row-wise */ + int k, N; + + if (st->substate->inverse == 0) { + // fprintf (stderr, "kiss fft usage error: improper alloc\n"); + return; + } + + N = st->substate->nfft; + + st->tmpbuf[0].r = freqdata[0].r + freqdata[N].r; + st->tmpbuf[0].i = freqdata[0].r - freqdata[N].r; + + for (k = 1; k <= N / 2; ++k) { + kiss_fft_cpx fk, fnkc, fek, fok, tmpbuf; + fk = freqdata[k]; + fnkc.r = freqdata[N - k].r; + fnkc.i = -freqdata[N - k].i; + C_FIXDIV( fk , 2 ); + C_FIXDIV( fnkc , 2 ); + + C_ADD (fek, fk, fnkc); + C_SUB (tmpbuf, fk, fnkc); + C_MUL (fok, tmpbuf, st->super_twiddles[k]); + C_ADD (st->tmpbuf[k], fek, fok); + C_SUB (st->tmpbuf[N - k], fek, fok); + st->tmpbuf[N - k].i *= -1; + } + kiss_fft (st->substate, st->tmpbuf, (kiss_fft_cpx *) timedata); +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftr.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftr.h new file mode 100755 index 
0000000..0d50858 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/ref/kiss_fft/kiss_fftr.h @@ -0,0 +1,46 @@ +#ifndef KISS_FTR_H +#define KISS_FTR_H + +#include "kiss_fft.h" +#ifdef __cplusplus +extern "C" { +#endif + + +/* + + Real optimized version can save about 45% cpu time vs. complex fft of a real seq. + + + + */ + +typedef struct kiss_fftr_state *kiss_fftr_cfg; + + +kiss_fftr_cfg kiss_fftr_alloc(int nfft,int inverse_fft,void * mem, size_t * lenmem); +/* + nfft must be even + + If you don't care to allocate space, use mem = lenmem = NULL +*/ + + +void kiss_fftr(kiss_fftr_cfg cfg,const kiss_fft_scalar *timedata,kiss_fft_cpx *freqdata); +/* + input timedata has nfft scalar points + output freqdata has nfft/2+1 complex points +*/ + +void kiss_fftri(kiss_fftr_cfg cfg,const kiss_fft_cpx *freqdata,kiss_fft_scalar *timedata); +/* + input freqdata has nfft/2+1 complex points + output timedata has nfft scalar points +*/ + +#define kiss_fftr_free free + +#ifdef __cplusplus +} +#endif +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/isupersound_convolution.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/isupersound_convolution.h new file mode 100755 index 0000000..45bdec1 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/isupersound_convolution.h @@ -0,0 +1,67 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//封装卷积,目前有快速卷积和定义卷积做法 + +#ifndef __I_SUPERSOUND_CONVOLUTION_H__ +#define __I_SUPERSOUND_CONVOLUTION_H__ + +#include + +namespace SUPERSOUND +{ + + +class ISuperSoundConvolution +{ +public: + ISuperSoundConvolution() { } + virtual ~ISuperSoundConvolution() { } + +public: + //清空所有缓存数据 + virtual void Flush() = 0; + //这个东西该实例只让调用一次,因为多次调用,还不如让外面重新弄个实例 + //设置处理帧长和交叠 0 的长度 + //也就是说 FFT 的长度为这两个长度的总和,FFT 的帧移为 frame_len + virtual int32_t SetFrameLenZeroLen(int32_t frame_len, int32_t zero_len) = 0; + //设置、更新脉冲响应 + virtual int32_t SetImpulseResponse(float * imres, int32_t len) = 0; + //处理,每次处理一,外面保证输入长度为一长,输出的长度放在 out_num 中 + virtual int32_t ProcessFrame(float * buf, int32_t & out_num) = 0; + //获取延迟单元长度 + virtual int32_t GetLatecy() = 0; +}; + + +} + +#endif /* __I_SUPERSOUND_CONVOLUTION_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_fast_convolution.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_fast_convolution.cpp new file mode 100755 index 0000000..47dd5e6 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_fast_convolution.cpp @@ -0,0 +1,286 @@ + +#include "supersound_fast_convolution.h" +#include "supersound_err.h" +#include "fft/supersound_kiss_fft.h" +#include "supersound_common.h" +#include +#include + +namespace SUPERSOUND +{ + + +SuperSoundFastConvolution::SuperSoundFastConvolution() +{ + m_frame_len = 0; + m_frame_step = 0; + m_zero_len = 0; + m_imres_len = 0; + m_kiss_fft = NULL; + m_filter_num = 0; + m_filter_buf_array = NULL; + m_mix_buf_array = NULL; + m_mix_buf_idx = 0; + m_history_buf = NULL; + m_process_buf = NULL; + m_b_reduce_delay = false; // 一开始不需要考虑延迟 +} + +SuperSoundFastConvolution::~SuperSoundFastConvolution() +{ + DestoryAll(); +} + +void SuperSoundFastConvolution::DestoryAll() +{ + SAFE_DELETE_PTR(m_history_buf); + SAFE_DELETE_OBJ(m_kiss_fft); + SAFE_DELETE_PTR(m_process_buf); + DestoryFilterBuf(); + DestoryMixBuf(); +} + +void SuperSoundFastConvolution::DestoryFilterBuf() +{ + if(m_filter_buf_array) + { + for(int32_t i = 0; i < m_filter_num; i++) + { + SAFE_DELETE_PTR(m_filter_buf_array[i]) + } + SAFE_DELETE_PTR(m_filter_buf_array); + } +} + +void SuperSoundFastConvolution::DestoryMixBuf() +{ + if(m_mix_buf_array) + { + for(int32_t i = 0; i < m_filter_num; i++) + { + SAFE_DELETE_PTR(m_mix_buf_array[i]); + } + SAFE_DELETE_PTR(m_mix_buf_array); + } +} + +int32_t SuperSoundFastConvolution::SetFrameLenZeroLen( int32_t frame_len, int32_t zero_len ) +{ + int nRet = ERROR_SUPERSOUND_SUCCESS; + + //更新帧长和帧移 + m_frame_step = frame_len; + m_zero_len = zero_len; + m_frame_len = frame_len + zero_len; + + m_kiss_fft = new(std::nothrow) SuperSoundKissFFT(); + if(m_kiss_fft == NULL) + return ERROR_SUPERSOUND_MEMORY; + + m_history_buf = new(std::nothrow) float[m_frame_step]; + if(m_history_buf == NULL) + return ERROR_SUPERSOUND_MEMORY; + memset(m_history_buf, 0, sizeof(float) * m_frame_step); + + m_process_buf = new(std::nothrow) float[m_frame_len]; + if(m_process_buf == NULL) + return ERROR_SUPERSOUND_MEMORY; + + nRet = m_kiss_fft->Init(m_frame_len); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + return nRet; +} + +int32_t 
SuperSoundFastConvolution::SetImpulseResponse( float * imres, int32_t len ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + //更新脉冲响应长度 + m_imres_len = len; + + nRet = AllocFilterAndMixBuf(); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + nRet = CalFilterBuf(imres); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + return nRet; +} + +int32_t SuperSoundFastConvolution::ProcessFrame( float * buf, int32_t & out_num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + memcpy(m_process_buf, buf, sizeof(float) * m_frame_step); + memset(m_process_buf + m_frame_step, 0, sizeof(float) * m_zero_len); + + //先对该帧做 FFT 变换 + nRet = m_kiss_fft->FFT(m_process_buf); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + //相乘混合 + CalMixBuf(m_process_buf); + + //最后 IFFT 变换 + nRet = m_kiss_fft->IFFT(m_mix_buf_array[m_mix_buf_idx]); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + //和上一次的输出进行交叠相加获取输出 + for(int32_t i = 0; i < m_frame_step; i++) + { + buf[i] = (m_mix_buf_array[m_mix_buf_idx][i] + m_history_buf[i]) / m_frame_len; + } + + //重置历史帧数据 + int32_t copynum = MIN(m_frame_step, m_zero_len); + memcpy(m_history_buf, m_mix_buf_array[m_mix_buf_idx] + m_frame_step, sizeof(float) * copynum); + memset(m_history_buf + copynum, 0, sizeof(float) * MAX(0, m_frame_step - copynum)); + + //清空输出混合帧 + memset(m_mix_buf_array[m_mix_buf_idx], 0, sizeof(float) * m_frame_len); + m_mix_buf_idx = (m_mix_buf_idx + 1) % m_filter_num; + + //计算应该输出的长度 + if(m_b_reduce_delay) + { + out_num = m_frame_step - m_frame_step / 2; + memmove(buf, buf + m_frame_step / 2, sizeof(float) * out_num); + m_b_reduce_delay = false; + } + else + { + out_num = m_frame_step; + } + + return nRet; +} + +void SuperSoundFastConvolution::Flush() +{ + m_b_reduce_delay = false; // 默认完整输出 + + if(m_history_buf) + { + memset(m_history_buf, 0, sizeof(float) * m_frame_step); + } + + if(m_mix_buf_array) + { + for(int32_t i = 0; i < m_filter_num; i++) + { + memset(m_mix_buf_array[i], 0, sizeof(float) * m_frame_len); + } + } + m_mix_buf_idx = 0; +} + +int32_t SuperSoundFastConvolution::GetLatecy() +{ + // 默认不需要考虑延迟 + return 0; +// return m_frame_step / 2; +} + +int32_t SuperSoundFastConvolution::AllocFilterAndMixBuf() +{ + //向上取整 + int32_t filter_num = (m_imres_len + m_frame_step - 1) / m_frame_step; + + if(filter_num == m_filter_num) + return ERROR_SUPERSOUND_SUCCESS; + + //将老的 Filter 内存释放掉 + DestoryFilterBuf(); + + //将老的 Mix 内存释放掉 + DestoryMixBuf(); + + m_filter_num = filter_num; + + m_filter_buf_array = new(std::nothrow) float *[m_filter_num]; + if(m_filter_buf_array == NULL) + return ERROR_SUPERSOUND_MEMORY; + + for(int32_t i = 0; i < m_filter_num; i++) + { + m_filter_buf_array[i] = new(std::nothrow) float[m_frame_len]; + if(m_filter_buf_array[i] == NULL) + return ERROR_SUPERSOUND_MEMORY; + } + + + + m_mix_buf_array = new(std::nothrow) float *[m_filter_num]; + if(m_mix_buf_array == NULL) + return ERROR_SUPERSOUND_MEMORY; + + for(int32_t i = 0; i < m_filter_num; i++) + { + m_mix_buf_array[i] = new(std::nothrow) float[m_frame_len]; + if(m_mix_buf_array[i] == NULL) + return ERROR_SUPERSOUND_MEMORY; + memset(m_mix_buf_array[i], 0, sizeof(float) * m_frame_len); + } + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t SuperSoundFastConvolution::CalFilterBuf( float * imres ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + int32_t lastframe = m_filter_num - 1; + + //考虑下这里需不需要进行增益先 + + for(int32_t i = 0; i < lastframe; i++) + { + memcpy(m_filter_buf_array[i], imres + i * m_frame_step, sizeof(float) * m_frame_step); + memset(m_filter_buf_array[i] 
+ m_frame_step, 0, sizeof(float) * m_zero_len); + nRet = m_kiss_fft->FFT(m_filter_buf_array[i]); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + } + + //最后一帧不够的话,进行补 0 操作 + int32_t copylen = m_imres_len - lastframe * m_frame_step; + memcpy(m_filter_buf_array[lastframe], imres + lastframe * m_frame_step, sizeof(float) * copylen); + memset(m_filter_buf_array[lastframe] + copylen, 0, sizeof(float) * (m_frame_len - copylen)); + nRet = m_kiss_fft->FFT(m_filter_buf_array[lastframe]); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + + return nRet; +} + +void SuperSoundFastConvolution::CalMixBuf( float * freq ) +{ + //指示当前混合的位置 + int32_t idx; + + for(int32_t i = 0; i < m_filter_num; i++) + { + idx = (m_mix_buf_idx + i) % m_filter_num; + + //将两个特殊的点先进行计算 + m_mix_buf_array[idx][0] += freq[0] * m_filter_buf_array[i][0]; + m_mix_buf_array[idx][1] += freq[1] * m_filter_buf_array[i][1]; + + for(int32_t j = 2; j < m_frame_len; j += 2) + { + //两个复数相乘 + m_mix_buf_array[idx][j] += freq[j] * m_filter_buf_array[i][j] - + freq[j + 1] * m_filter_buf_array[i][j + 1]; + m_mix_buf_array[idx][j + 1] += freq[j + 1] * m_filter_buf_array[i][j] + + freq[j] * m_filter_buf_array[i][j + 1]; + } + } +} + + +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_fast_convolution.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_fast_convolution.h new file mode 100755 index 0000000..7532c6f --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_fast_convolution.h @@ -0,0 +1,93 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//实现快速卷积,分段卷积 + +#ifndef __SUPERSOUND_FAST_CONVOLUTION_H__ +#define __SUPERSOUND_FAST_CONVOLUTION_H__ + +#include "isupersound_convolution.h" +#include "fft/isupersound_fft.h" + +namespace SUPERSOUND +{ + + +class SuperSoundFastConvolution : public ISuperSoundConvolution +{ +public: + SuperSoundFastConvolution(); + virtual ~SuperSoundFastConvolution(); + +public: + virtual void Flush(); + virtual int32_t SetFrameLenZeroLen(int32_t frame_len, int32_t zero_len); + virtual int32_t SetImpulseResponse(float * imres, int32_t len); + virtual int32_t ProcessFrame(float * buf, int32_t & out_num); + virtual int32_t GetLatecy(); + +private: + int32_t AllocFilterAndMixBuf(); + int32_t CalFilterBuf(float * imres); + void DestoryFilterBuf(); + void DestoryMixBuf(); + void DestoryAll(); + void CalMixBuf(float * freq); + +private: + //类内部的实际帧长,为 m_frame_len = m_frame_step + m_zero_len + int32_t m_frame_len; + //类内部实际为帧移,对外部而言是帧长,每帧的数据长度 + int32_t m_frame_step; + //补 0 的长度,交叠的长度 + int32_t m_zero_len; + int32_t m_imres_len; + ISuperSoundFFT * m_kiss_fft; + //将 im 分成这么多段,降低延迟 + int32_t m_filter_num; + //每个段对应的频谱 + float ** m_filter_buf_array; + //每段的混合频谱 + float ** m_mix_buf_array; + //使用循环的方式来找到当前的输出 mix_buf 位置 + int32_t m_mix_buf_idx; + //历史交叠部分 + float * m_history_buf; + //对输入的临时处理的 buf + float * m_process_buf; + //是否需要考虑延迟 + bool m_b_reduce_delay; +}; + + +} + +#endif /* __SUPERSOUND_FAST_CONVOLUTION_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_simple_convolution.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_simple_convolution.cpp new file mode 100644 index 0000000..673de12 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_simple_convolution.cpp @@ -0,0 +1,202 @@ +// +// Created by yangjianli on 2019-11-19. 
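Both the fast convolution above and the simple (time-segmented) variant that follows implement the ISuperSoundConvolution interface shown earlier, so callers drive them identically: fix the frame/zero-padding split once, install the impulse response, then push one frame at a time. Below is a hedged sketch against the fast (FFT overlap-add) variant with illustrative sizes; for example, frame_len = 1024 and a 48000-sample response give ceil(48000/1024) = 47 cached segment spectra.

#include "supersound_fast_convolution.h"
#include "supersound_err.h"

// Hypothetical driver; all sizes are illustrative.
int32_t convolve_frame(float *ir, int32_t ir_len, float *frame /* 1024 samples */)
{
    SUPERSOUND::SuperSoundFastConvolution conv;
    int32_t ret = conv.SetFrameLenZeroLen(1024 /* frame_len */, 1024 /* zero_len */);
    if (ret != ERROR_SUPERSOUND_SUCCESS)
        return ret;
    ret = conv.SetImpulseResponse(ir, ir_len);  // segment spectra are cached here
    if (ret != ERROR_SUPERSOUND_SUCCESS)
        return ret;
    int32_t out_num = 0;
    // frame is processed in place; out_num reports how many samples are valid
    return conv.ProcessFrame(frame, out_num);
}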
+// + +#include "supersound_simple_convolution.h" +#include "string" +#include "supersound_err.h" +#include "supersound_common.h" +namespace SUPERSOUND { + SupersoundSimpleConvolution::SupersoundSimpleConvolution() { + m_kiss_fft = NULL; + // 历史数据 + m_history_buf = NULL; + // 分段数据 + m_segmentation_buf = NULL; + // 脉冲响应的频谱 + m_filter_buf_array = NULL; + // 输入数据 + m_frame_buf = NULL; + // 脉冲响应分段数量 + m_filter_num = 0; + // 一帧长度 + m_frame_len = 0; + // 输入长度 + m_input_len = 0; + //补零长度 + m_zero_len = 0; + // history当前的下标 + m_history_idx = 0; + // 历史buf长度 + m_history_len = 0; + } + + SupersoundSimpleConvolution::~SupersoundSimpleConvolution() { + DestoryAll(); + } + +// 分段卷积 + void SupersoundSimpleConvolution::CalcSegmentation(float *input) { + memset(m_segmentation_buf, 0, sizeof(float) * m_history_len); + memset(m_frame_buf, 0, sizeof(float) * m_frame_len); + memcpy(m_frame_buf, input, sizeof(float) * m_input_len); + + // 获取频谱 + m_kiss_fft->FFT(m_frame_buf); + // 分段乘法 + for (int i = 0; i < m_filter_num; i++) { + //将两个特殊的点先进行计算 + m_tmp_buf[0] = m_frame_buf[0] * m_filter_buf_array[i][0]; + m_tmp_buf[1] = m_frame_buf[1] * m_filter_buf_array[i][1]; + + for (int j = 2; j < m_frame_len; j+=2) { + //两个复数相乘 + m_tmp_buf[j] = m_frame_buf[j] * m_filter_buf_array[i][j] - + m_frame_buf[j + 1] * m_filter_buf_array[i][j + 1]; + m_tmp_buf[j + 1] = m_frame_buf[j + 1] * m_filter_buf_array[i][j] + + m_frame_buf[j] * m_filter_buf_array[i][j + 1]; + } + + // ifft + for (int j = 0; j < m_frame_len; j++) { + m_tmp_buf[j] /= m_frame_len; + } + + m_kiss_fft->IFFT(m_tmp_buf); + + // 叠加 + for (int j = 0; j < m_frame_len; j++) { + m_segmentation_buf[i * (m_zero_len + 1) + j] += m_tmp_buf[j]; + } + } + } + +// 主处理函数 + int32_t SupersoundSimpleConvolution::ProcessFrame(float *buf, int32_t &out_num) { + CalcSegmentation(buf); + //外部叠加 + for (int i = 0; i < m_history_len; i++) { + int now_index = (m_history_idx + i) % m_history_len; + m_history_buf[now_index] += m_segmentation_buf[i]; + } + // 将数据输出 + for (int i = 0; i < m_input_len; i++) { + buf[i] = m_history_buf[m_history_idx]; + + // 恢复设置 + m_history_buf[m_history_idx] = 0; + m_history_idx = (m_history_idx + 1) % m_history_len; + } + out_num = m_input_len; + return ERROR_SUPERSOUND_SUCCESS; + } + +// 设置参数 + int32_t SupersoundSimpleConvolution::SetFrameLenZeroLen(int32_t frame_len, int32_t zero_len) { + // 外部每次输入的数据长度 + m_input_len = frame_len; + // 补零长度,用来达到和线性卷积相同的长度输出 + m_zero_len = zero_len; + // 做fft变换的长度 + m_frame_len = m_input_len + m_zero_len; + + // 长度必须是偶数 + if (m_frame_len & 1) { + return ERROR_SUPERSOUND_PARAM; + } + + // 创建补零后的数据长度 + m_frame_buf = new(std::nothrow) float[m_frame_len]; + if (NULL == m_frame_buf) { + return ERROR_SUPERSOUND_MEMORY; + } + m_tmp_buf = new(std::nothrow) float[m_frame_len]; + if (NULL == m_tmp_buf) { + return ERROR_SUPERSOUND_MEMORY; + } + // 初始化fft + m_kiss_fft = new (std::nothrow) SuperSoundKissFFT(); + if (NULL == m_kiss_fft) { + return ERROR_SUPERSOUND_MEMORY; + } + m_kiss_fft->Init(m_frame_len); + return ERROR_SUPERSOUND_SUCCESS; + } + + int32_t SupersoundSimpleConvolution::SetImpulseResponse(float *imres, int32_t len) { + int n_hlen = (m_zero_len + 1); + m_history_idx = 0; + m_filter_num = len / n_hlen; + int tp = len % n_hlen; + if (tp > 0) { + m_filter_num += 1; + } + m_history_len = n_hlen * m_filter_num + m_input_len - 1; + + // 历史数据 + m_history_buf = new(std::nothrow) float[m_history_len]; + if (NULL == m_history_buf) { + return ERROR_SUPERSOUND_MEMORY; + } + memset(m_history_buf, 0, sizeof(float) * m_history_len); + + // 
Segmented convolution of the input with the impulse-response blocks
+        m_segmentation_buf = new(std::nothrow) float[m_history_len];
+        if (NULL == m_segmentation_buf) {
+            return ERROR_SUPERSOUND_MEMORY;
+        }
+        memset(m_segmentation_buf, 0, sizeof(float) * m_history_len);
+
+        // Spectra of the impulse-response segments
+        m_filter_buf_array = new(std::nothrow) float *[m_filter_num];
+        if (m_filter_buf_array == NULL)
+            return ERROR_SUPERSOUND_MEMORY;
+
+        for (int32_t i = 0; i < m_filter_num; i++) {
+            m_filter_buf_array[i] = new(std::nothrow) float[m_frame_len];
+            if (m_filter_buf_array[i] == NULL)
+                return ERROR_SUPERSOUND_MEMORY;
+        }
+
+        // Compute the spectrum of each impulse-response segment
+        int n_step = n_hlen;
+        for (int i = 0; i < m_filter_num; i++) {
+            // the last segment may be shorter than a full block
+            if (len - n_step * i < n_step)
+            {
+                n_step = len - n_hlen * i;
+            }
+            memset(m_filter_buf_array[i], 0, sizeof(float) * m_frame_len);
+            memcpy(m_filter_buf_array[i], imres + (i * n_hlen), sizeof(float) * n_step);
+
+            // compute the spectrum
+            m_kiss_fft->FFT(m_filter_buf_array[i]);
+        }
+        return ERROR_SUPERSOUND_SUCCESS;
+    }
+
+    int32_t SupersoundSimpleConvolution::GetLatecy() {
+        return 0;
+    }
+
+    // Reset internal state
+    void SupersoundSimpleConvolution::Flush() {
+        m_history_idx = 0;
+        memset(m_history_buf, 0, sizeof(float) * m_history_len);
+    }
+
+    // Free all allocations
+    void SupersoundSimpleConvolution::DestoryAll() {
+        SAFE_DELETE_PTR(m_history_buf);
+        SAFE_DELETE_PTR(m_frame_buf);
+        SAFE_DELETE_PTR(m_tmp_buf);
+        SAFE_DELETE_PTR(m_segmentation_buf);
+        SAFE_DELETE_OBJ(m_kiss_fft);
+
+        if (m_filter_buf_array) {
+            for (int32_t i = 0; i < m_filter_num; i++) {
+                SAFE_DELETE_PTR(m_filter_buf_array[i]);
+            }
+            SAFE_DELETE_PTR(m_filter_buf_array);
+        }
+    }
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_simple_convolution.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_simple_convolution.h
new file mode 100644
index 0000000..7ace608
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/convolution/supersound_simple_convolution.h
@@ -0,0 +1,62 @@
+//
+// Created by yangjianli on 2019-11-19.
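The pattern in SupersoundSimpleConvolution::ProcessFrame above is partitioned convolution with overlap-add: the impulse response is cut into m_filter_num blocks of (m_zero_len + 1) samples, each input frame's spectrum is multiplied against every block spectrum (applying the missing 1/N normalization by hand, since the kiss_fftri-based IFFT is unscaled), and the per-block results are accumulated into a circular history buffer from which exactly m_input_len finished samples are emitted per call. A stand-alone sketch of that accumulator (hypothetical names; assumes ring_len >= result_len and a zero-initialized acc):

// Circular overlap-add accumulator: add one full convolution result per call,
// emit block_len finished samples, and zero each slot as it is consumed so the
// tail of the current frame folds into the frames that follow.
struct OverlapAddRing
{
    float * acc;   // circular accumulator, ring_len floats
    int ring_len;
    int read_idx;  // next finished sample to emit

    void Process(const float * conv_result, int result_len, float * out, int block_len)
    {
        for (int i = 0; i < result_len; i++)
            acc[(read_idx + i) % ring_len] += conv_result[i];

        for (int i = 0; i < block_len; i++)
        {
            out[i] = acc[read_idx];
            acc[read_idx] = 0.0f;  // slot is free for future accumulation
            read_idx = (read_idx + 1) % ring_len;
        }
    }
};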
+// + +#ifndef IMPLUSEEFFECLIBS_SUPERSOUND_SIMPLE_CONVOLUTION_H +#define IMPLUSEEFFECLIBS_SUPERSOUND_SIMPLE_CONVOLUTION_H + +#include "fft/isupersound_fft.h" +#include "fft/supersound_kiss_fft.h" +#include "isupersound_convolution.h" + +namespace SUPERSOUND { + + class SupersoundSimpleConvolution : public ISuperSoundConvolution { + public: + SupersoundSimpleConvolution(); + + virtual ~SupersoundSimpleConvolution(); + + public: + virtual void Flush(); + + virtual int32_t SetFrameLenZeroLen(int32_t frame_len, int32_t zero_len); + + virtual int32_t SetImpulseResponse(float *imres, int32_t len); + + virtual int32_t ProcessFrame(float *buf, int32_t &out_num); + + virtual int32_t GetLatecy(); + + private: + // 历史数据 + float *m_history_buf; + // 分段数据 + float *m_segmentation_buf; + // 脉冲响应的频谱 + float ** m_filter_buf_array; + // 输入数据 + float *m_frame_buf; + // 临时数据 + float *m_tmp_buf; + // 脉冲响应分段数量 + int m_filter_num; + // 一帧长度 + int m_frame_len; + // 输入长度 + int m_input_len; + //补零长度 + int m_zero_len; + // history当前的下标 + int m_history_idx; + // 历史buf总长度 + int m_history_len; + SUPERSOUND::SuperSoundKissFFT *m_kiss_fft; + private: + void CalcSegmentation(float *input); + + void DestoryAll(); + }; + +} +#endif //IMPLUSEEFFECLIBS_SUPERSOUND_SIMPLE_CONVOLUTION_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/isupersound_fft.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/isupersound_fft.h new file mode 100755 index 0000000..e5b5d09 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/isupersound_fft.h @@ -0,0 +1,66 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//封装 fft 接口 + +#ifndef __I_SUPERSOUND_FFT_H__ +#define __I_SUPERSOUND_FFT_H__ + +#include + +namespace SUPERSOUND +{ + + +//利用对称性将长度进行复数部分的长度缩放成实数长度 +class ISuperSoundFFT +{ +public: + ISuperSoundFFT() { }; + virtual ~ISuperSoundFFT() { }; + +public: + //初始化,传入进行FFT的长度 + virtual int32_t Init(int32_t size) = 0; + //外围保证输入输出的长度,长度为原始设置的 size + virtual int32_t FFT(float * in_out) = 0; + //外围保证输入输出的长度,长度为原始设置的 size + virtual int32_t IFFT(float * in_out) = 0; + //外围保证输入输出的长度,输入长度为原始设置的 size,输出为 2 * size + virtual int32_t FFT(float * in, float * out) = 0; + //外围保证输入输出的长度,输入长度为 2 * size,输出长度为 size + virtual int32_t IFFT(float * in, float * out) = 0; +}; + + +} + +#endif /* __I_SUPERSOUND_FFT_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/supersound_kiss_fft.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/supersound_kiss_fft.cpp new file mode 100755 index 0000000..f5d8647 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/supersound_kiss_fft.cpp @@ -0,0 +1,122 @@ + +#include "supersound_kiss_fft.h" +#include "supersound_err.h" + +namespace SUPERSOUND +{ + + +SuperSoundKissFFT::SuperSoundKissFFT() +{ + m_fft = NULL; + m_ifft = NULL; + m_freq = NULL; + m_len = 0; +} + +SuperSoundKissFFT::~SuperSoundKissFFT() +{ + Destory(); +} + +int32_t SuperSoundKissFFT::Init( int32_t size ) +{ + m_fft = kiss_fftr_alloc(size, 0, NULL, NULL); + if(m_fft == NULL) + return ERROR_SUPERSOUND_MEMORY; + + m_ifft = kiss_fftr_alloc(size, 1, NULL, NULL); + if(m_ifft == NULL) + return ERROR_SUPERSOUND_MEMORY; + + m_freq = (kiss_fft_cpx *)malloc(sizeof(kiss_fft_cpx) * (size / 2 + 1)); + if(m_freq == NULL) + return ERROR_SUPERSOUND_MEMORY; + + m_len = size; + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t SuperSoundKissFFT::FFT( float * in_out ) +{ + kiss_fftr(m_fft, in_out, m_freq); + + in_out[0] = m_freq[0].r; + in_out[1] = m_freq[m_len / 2].r; + + for(int32_t i = 2, j = 1; i < m_len; i += 2, j++) + { + in_out[i] = m_freq[j].r; + in_out[i + 1] = m_freq[j].i; + } + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t SuperSoundKissFFT::FFT( float * in, float * out ) +{ + kiss_fftr(m_fft, in, m_freq); + + for(int32_t i = 0, j = 0; i < m_len; i += 2, j++) + { + out[i] = m_freq[j].r; + out[i + 1] = m_freq[j].i; + } + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t SuperSoundKissFFT::IFFT( float * in_out ) +{ + m_freq[0].r = in_out[0]; + m_freq[0].i = 0; + m_freq[m_len / 2].r = in_out[1]; + m_freq[m_len / 2].i = 0; + + for(int32_t i = 2, j = 1; i < m_len; i += 2, j++) + { + m_freq[j].r = in_out[i]; + m_freq[j].i = in_out[i + 1]; + } + + kiss_fftri(m_ifft, m_freq, in_out); + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t SuperSoundKissFFT::IFFT( float * in, float * out ) +{ + for(int32_t i = 0, j = 0; i < m_len; i += 2, j++) + { + m_freq[j].r = in[i]; + m_freq[j].i = in[i + 1]; + } + + kiss_fftri(m_ifft, m_freq, out); + + return ERROR_SUPERSOUND_SUCCESS; +} + +void SuperSoundKissFFT::Destory() +{ + if(m_fft) + { + kiss_fftr_free(m_fft); + m_fft = NULL; + } + if(m_ifft) + { + kiss_fftr_free(m_ifft); + m_ifft = NULL; + } + if(m_freq) + { + free(m_freq); + m_freq = NULL; + } + m_len = 0; +} + + +} \ No newline at end of file diff --git 
a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/supersound_kiss_fft.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/supersound_kiss_fft.h new file mode 100755 index 0000000..328a3b4 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/fft/supersound_kiss_fft.h @@ -0,0 +1,74 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. \_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//对 kissfft 进行调用封装 + +#ifndef __SUPERSOUND_KISS_FFT_H__ +#define __SUPERSOUND_KISS_FFT_H__ + +#include "kiss_fft/kiss_fftr.h" +#include "isupersound_fft.h" + +namespace SUPERSOUND +{ + + +class SuperSoundKissFFT : public ISuperSoundFFT +{ +public: + SuperSoundKissFFT(); + virtual ~SuperSoundKissFFT(); + +public: + virtual int32_t Init(int32_t size); + virtual int32_t FFT(float * in_out); + virtual int32_t IFFT(float * in_out); + virtual int32_t FFT(float * in, float * out); + virtual int32_t IFFT(float * in, float * out); + +private: + void Destory(); + +private: + //进行 fft 的实例 + kiss_fftr_cfg m_fft; + //进行 ifft 的实例 + kiss_fftr_cfg m_ifft; + //频域中间结果,包含了全结果 + kiss_fft_cpx * m_freq; + // fft 的计算长度 + int32_t m_len; +}; + + +} + +#endif /* __SUPERSOUND_KISS_FFT_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_common.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_common.h new file mode 100755 index 0000000..1e6d858 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_common.h @@ -0,0 +1,91 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __SUPERSOUND_COMMON_H__ +#define __SUPERSOUND_COMMON_H__ +#include +namespace SUPERSOUND +{ + + +//安全删除指针 +#ifndef SAFE_DELETE_PTR +#define SAFE_DELETE_PTR(a) \ +{ \ + if(a) \ + { \ + delete [] a; \ + a = NULL; \ + } \ +} +#endif /* SAFE_DELETE_PTR */ + +#ifndef SAFE_DELETE_OBJ +#define SAFE_DELETE_OBJ(a) \ +{ \ + if(a) \ + { \ + delete a; \ + a = NULL; \ + } \ +} +#endif /* SAFE_DELETE_OBJ */ + +#ifndef MIN +#define MIN(a,b) (((a) < (b)) ? (a) : (b)) +#endif /* MIN */ + +#ifndef MAX +#define MAX(a,b) (((a) > (b)) ? (a) : (b)) +#endif /* MAX */ + +//将 a 规范到 [b, c] 之间 +#ifndef MIDDLE +#define MIDDLE(a, b, c) (MIN(c, MAX(a, b))) +#endif /* MIDDLE */ + +#ifndef M_PI +#define M_PI 3.14159265358979323846 +#endif /* M_PI */ + +#ifndef FLOAT_EQUAL +#define FLOAT_EQUAL(a, b) (fabs((a) - (b)) <= 1E-5) +#endif /* FLOAT_EQUAL */ + +//必须是 2 的幂次,这样方便计算一些 +#define SUPERSOUND_WAV_BUF_STEP_LEN 1024 +#define SUPERSOUND_DEFAULT_FFT_LEN SUPERSOUND_WAV_BUF_STEP_LEN +#define SUPERSOUND_CHANNEL_PROC_LEN SUPERSOUND_DEFAULT_FFT_LEN + + +} + +#endif /* __SUPERSOUND_COMMON_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_wav_buf.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_wav_buf.cpp new file mode 100755 index 0000000..9d8a974 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_wav_buf.cpp @@ -0,0 +1,484 @@ + +#include "supersound_err.h" +#include "supersound_wav_buf.h" +#include "supersound_common.h" +#include +#include + +namespace SUPERSOUND +{ + + +SuperSoundWavBuf::SuperSoundWavBuf() +{ + m_nChannels = 0; + m_nStart = 0; + m_nEnd = 0; + m_nSize = 0; + + memset(m_ppBuf, 0, sizeof(m_ppBuf)); +} + +SuperSoundWavBuf::~SuperSoundWavBuf() +{ + Destory(); +} + +void SuperSoundWavBuf::Short2Float( short * src, float * dst, int32_t num ) +{ + for(int32_t i = 0; i < num; i++) + { + Short2Float(src[i], dst[i]); + } +} + +void SuperSoundWavBuf::Short2Float( short in, float & out ) +{ + out = in * 1.0f / 32768; +} + +void SuperSoundWavBuf::Float2Short( float * src, short * dst, int32_t num ) +{ + for(int32_t i = 0; i < num; i++) + { + Float2Short(src[i], dst[i]); + } +} + +void SuperSoundWavBuf::Float2Short( float in, short & out ) +{ + float tmp; + tmp = in * 32767; + + if(tmp > 0) + out = short(tmp + 0.5); + else + out = short(tmp - 0.5); +} + +int32_t SuperSoundWavBuf::SetChannels( int32_t channels ) +{ + if(channels > CHANNEL_MAX) + return ERROR_SUPERSOUND_PARAM; + + if(channels > m_nChannels) + { + if(0 == m_nSize) + m_nSize = SUPERSOUND_WAV_BUF_STEP_LEN; + + for(int32_t i = m_nChannels; i < channels; i++) + { + if(NULL == m_ppBuf[i]) + { + m_ppBuf[i] = new(std::nothrow) float[m_nSize]; + if(m_ppBuf[i] == NULL) + return ERROR_SUPERSOUND_MEMORY; + + memset(m_ppBuf[i], 0, sizeof(float) * m_nSize); + } + } + + m_nChannels = channels; + } + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t SuperSoundWavBuf::GuaranteBufferSize( int32_t size ) +{ + //因为是循环队列,用一个单元来进行保护 + ++size; + + if(size > m_nSize) + { + float * buf; + int32_t new_size = size + SUPERSOUND_WAV_BUF_STEP_LEN - (size & (SUPERSOUND_WAV_BUF_STEP_LEN - 1)); + + for(int32_t i = 0; i < m_nChannels; i++) + { + buf = new(std::nothrow) float[new_size]; + if(buf == NULL) 
+ return ERROR_SUPERSOUND_MEMORY; + + memset(buf, 0, sizeof(float) * new_size); + + if(m_nEnd >= m_nStart) + { + memcpy(buf, m_ppBuf[i] + m_nStart, sizeof(float) * (m_nEnd - m_nStart)); + } + else + { + memcpy(buf, m_ppBuf[i] + m_nStart, sizeof(float) * (m_nSize - m_nStart)); + memcpy(buf + m_nSize - m_nStart, m_ppBuf[i], sizeof(float) * m_nEnd); + } + + SAFE_DELETE_PTR(m_ppBuf[i]); + + m_ppBuf[i] = buf; + } + + for(int32_t i = m_nChannels; i < CHANNEL_MAX; i++) + { + SAFE_DELETE_PTR(m_ppBuf[i]); + } + + //更新开始位置和结束位置 + if(m_nEnd >= m_nStart) + m_nEnd = m_nEnd - m_nStart; + else + m_nEnd = m_nEnd + m_nSize - m_nStart; + m_nStart = 0; + //更新长度信息 + m_nSize = new_size; + } + + return ERROR_SUPERSOUND_SUCCESS; +} + +void SuperSoundWavBuf::Destory() +{ + for(int32_t i = 0; i < CHANNEL_MAX; i++) + { + SAFE_DELETE_PTR(m_ppBuf[i]); + } +} + +int32_t SuperSoundWavBuf::PushSamples( int32_t num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if((num % m_nChannels) != 0) + return ERROR_SUPERSOUND_PARAM; + + int32_t new_len = m_nEnd - m_nStart + num / m_nChannels; + if(m_nEnd < m_nStart) + new_len += m_nSize; + nRet = GuaranteBufferSize(new_len); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + + for(int32_t i = 0; i < num; i += m_nChannels) + { + for(int32_t j = 0; j < m_nChannels; j++) + { + m_ppBuf[j][m_nEnd] = 0; + } + ++m_nEnd; + if(m_nEnd == m_nSize) + m_nEnd = 0; + } + + return nRet; +} + +int32_t SuperSoundWavBuf::PushSamples( short * pdata, int32_t num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if((num % m_nChannels) != 0) + return ERROR_SUPERSOUND_PARAM; + + int32_t new_len = m_nEnd - m_nStart + num / m_nChannels; + if(m_nEnd < m_nStart) + new_len += m_nSize; + nRet = GuaranteBufferSize(new_len); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + + for(int32_t i = 0; i < num; i += m_nChannels) + { + for(int32_t j = 0; j < m_nChannels; j++) + { + Short2Float(pdata[i + j], m_ppBuf[j][m_nEnd]); + } + ++m_nEnd; + if(m_nEnd == m_nSize) + m_nEnd = 0; + } + + return nRet; +} + +int32_t SuperSoundWavBuf::PushSamples( float * pdata, int32_t num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(m_nChannels == 0 || (num % m_nChannels) != 0) + return ERROR_SUPERSOUND_PARAM; + + int32_t new_len = m_nEnd - m_nStart + num / m_nChannels; + if(m_nEnd < m_nStart) + new_len += m_nSize; + nRet = GuaranteBufferSize(new_len); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + + for(int32_t i = 0; i < num; i += m_nChannels) + { + for(int32_t j = 0; j < m_nChannels; j++) + { + m_ppBuf[j][m_nEnd] = pdata[i + j]; + } + ++m_nEnd; + if(m_nEnd == m_nSize) + m_nEnd = 0; + } + + return nRet; +} + +int32_t SuperSoundWavBuf::PushSamples( std::vector &ppdata, int32_t num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(int32_t(ppdata.size()) < m_nChannels) + return ERROR_SUPERSOUND_PARAM; + + int32_t new_len = m_nEnd - m_nStart + num; + if(m_nEnd < m_nStart) + new_len += m_nSize; + nRet = GuaranteBufferSize(new_len); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + + for(int32_t i = 0; i < m_nChannels; i++) + { + //因为已经保证了缓存 buf 足够长,所以不会存在 end 覆盖 start 的情况 + if((m_nEnd + num) >= m_nSize) + { + Short2Float(ppdata[i], m_ppBuf[i] + m_nEnd, m_nSize - m_nEnd); + Short2Float(ppdata[i] + (m_nSize - m_nEnd), m_ppBuf[i], num + m_nEnd - m_nSize); + } + else + { + Short2Float(ppdata[i], m_ppBuf[i] + m_nEnd, num); + } + } + + //更新结束位置变量 + if((m_nEnd + num) >= m_nSize) + m_nEnd = num + m_nEnd - m_nSize; + else + m_nEnd = m_nEnd + num; + + return nRet; +} + +int32_t 
SuperSoundWavBuf::PushSamples( std::vector &ppdata, int32_t num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(int32_t(ppdata.size()) < m_nChannels) + return ERROR_SUPERSOUND_PARAM; + + int32_t new_len = m_nEnd - m_nStart + num; + if(m_nEnd < m_nStart) + new_len += m_nSize; + nRet = GuaranteBufferSize(new_len); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + + for(int32_t i = 0; i < m_nChannels; i++) + { + //因为已经保证了缓存 buf 足够长,所以不会存在 end 覆盖 start 的情况 + if((m_nEnd + num) >= m_nSize) + { + memcpy(m_ppBuf[i] + m_nEnd, ppdata[i], sizeof(float) * (m_nSize - m_nEnd)); + memcpy(m_ppBuf[i], ppdata[i] + (m_nSize - m_nEnd), sizeof(float) * (num + m_nEnd - m_nSize)); + } + else + { + memcpy(m_ppBuf[i] + m_nEnd, ppdata[i], sizeof(float) * num); + } + } + + //更新结束位置变量 + if((m_nEnd + num) >= m_nSize) + m_nEnd = num + m_nEnd - m_nSize; + else + m_nEnd = m_nEnd + num; + + return nRet; +} + +int32_t SuperSoundWavBuf::PopSamples( int32_t num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + int32_t out_num = 0; + + if(m_nEnd >= m_nStart) + out_num = m_nEnd - m_nStart; + else + out_num = m_nEnd + m_nSize - m_nStart; + + out_num = MIN(num / m_nChannels, out_num); + + //更新开始位置 + if((m_nStart + out_num) >= m_nSize) + m_nStart = out_num + m_nStart - m_nSize; + else + m_nStart = m_nStart + out_num; + + return nRet; +} + +int32_t SuperSoundWavBuf::PopSamples( short * pdata, int32_t max_num, int32_t & out_num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(m_nEnd >= m_nStart) + out_num = m_nEnd - m_nStart; + else + out_num = m_nEnd + m_nSize - m_nStart; + + out_num = MIN(max_num / m_nChannels, out_num); + + for(int32_t i = 0; i < out_num; i++) + { + for(int32_t j = 0; j < m_nChannels; j++) + { + Float2Short(m_ppBuf[j][m_nStart], pdata[i * m_nChannels + j]); + } + ++m_nStart; + if(m_nStart == m_nSize) + m_nStart = 0; + } + + out_num = out_num * m_nChannels; + + return nRet; +} + +int32_t SuperSoundWavBuf::PopSamples( float * pdata, int32_t max_num, int32_t & out_num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(m_nEnd >= m_nStart) + out_num = m_nEnd - m_nStart; + else + out_num = m_nEnd + m_nSize - m_nStart; + + out_num = MIN(max_num / m_nChannels, out_num); + + for(int32_t i = 0; i < out_num; i++) + { + for(int32_t j = 0; j < m_nChannels; j++) + { + pdata[i * m_nChannels + j] = m_ppBuf[j][m_nStart]; + } + ++m_nStart; + if(m_nStart == m_nSize) + m_nStart = 0; + } + + out_num = out_num * m_nChannels; + + return nRet; +} + +int32_t SuperSoundWavBuf::PopSamples( std::vector &ppdata, int32_t max_num, int32_t & out_num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(int32_t(ppdata.size()) < m_nChannels) + return ERROR_SUPERSOUND_PARAM; + + if(m_nEnd >= m_nStart) + out_num = m_nEnd - m_nStart; + else + out_num = m_nEnd + m_nSize - m_nStart; + + out_num = MIN(max_num, out_num); + + for(int32_t i = 0; i < m_nChannels; i++) + { + if((m_nStart + out_num) >= m_nSize) + { + Float2Short(m_ppBuf[i] + m_nStart, ppdata[i], (m_nSize - m_nStart)); + Float2Short(m_ppBuf[i], ppdata[i] + m_nSize - m_nStart, out_num + m_nStart - m_nSize); + } + else + { + Float2Short(m_ppBuf[i] + m_nStart, ppdata[i], out_num); + } + } + + //更新开始位置 + if((m_nStart + out_num) >= m_nSize) + m_nStart = out_num + m_nStart - m_nSize; + else + m_nStart = m_nStart + out_num; + + return nRet; +} + +int32_t SuperSoundWavBuf::PopSamples( std::vector &ppdata, int32_t max_num, int32_t & out_num ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(int32_t(ppdata.size()) < m_nChannels) + return ERROR_SUPERSOUND_PARAM; + + 
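+        // Readable samples per channel = (m_nEnd - m_nStart) mod m_nSize; one ring
+        // cell is always left unused (see GuaranteBufferSize) so a full buffer is
+        // never confused with an empty one. The wrapped branch below copies in two
+        // pieces: [m_nStart, m_nSize) followed by [0, m_nEnd).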
if(m_nEnd >= m_nStart) + out_num = m_nEnd - m_nStart; + else + out_num = m_nEnd + m_nSize - m_nStart; + + out_num = MIN(max_num, out_num); + + for(int32_t i = 0; i < m_nChannels; i++) + { + if((m_nStart + out_num) >= m_nSize) + { + memcpy(ppdata[i], m_ppBuf[i] + m_nStart, sizeof(float) * (m_nSize - m_nStart)); + memcpy(ppdata[i] + m_nSize - m_nStart, m_ppBuf[i], sizeof(float) * (out_num + m_nStart - m_nSize)); + } + else + { + memcpy(ppdata[i], m_ppBuf[i] + m_nStart, sizeof(float) * out_num); + } + } + + //更新开始位置 + if((m_nStart + out_num) >= m_nSize) + m_nStart = out_num + m_nStart - m_nSize; + else + m_nStart = m_nStart + out_num; + + return nRet; +} + +int32_t SuperSoundWavBuf::ShadeSamples( int32_t num ) +{ + if(m_nEnd >= m_nStart) + { + num = MIN(m_nEnd - m_nStart, num); + m_nEnd = m_nEnd - num; + } + else + { + num = MIN(m_nSize + m_nEnd - m_nStart, num); + m_nEnd = m_nEnd - num; + if(m_nEnd < 0) + m_nEnd += m_nSize; + } + return ERROR_SUPERSOUND_SUCCESS; +} + +void SuperSoundWavBuf::Flush() +{ + m_nStart = 0; + m_nEnd = 0; +} + +int32_t SuperSoundWavBuf::DataSizeInCache() +{ + if(m_nEnd >= m_nStart) + return m_nEnd - m_nStart; + else + return (m_nEnd + m_nSize - m_nStart); +} + + +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_wav_buf.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_wav_buf.h new file mode 100755 index 0000000..f389837 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/common/supersound_wav_buf.h @@ -0,0 +1,95 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//实现一个循环 buf + +#ifndef __SUPERSOUND_WAV_BUF_H__ +#define __SUPERSOUND_WAV_BUF_H__ + +#include "supersound_types.h" +#include +#include + +namespace SUPERSOUND +{ + + +class SuperSoundWavBuf +{ +public: + SuperSoundWavBuf(); + ~SuperSoundWavBuf(); + +public: + static void Short2Float(short in, float & out); + static void Short2Float(short * src, float * dst, int32_t num); + static void Float2Short(float in, short & out); + static void Float2Short(float * src, short * dst, int32_t num); + +public: + int32_t SetChannels(int32_t channels); + + void Flush(); + + int32_t DataSizeInCache(); + + int32_t PushSamples(int32_t num); + int32_t PushSamples(short * pdata, int32_t num); + int32_t PushSamples(float * pdata, int32_t num); + int32_t PushSamples(std::vector &ppdata, int32_t num); + int32_t PushSamples(std::vector &ppdata, int32_t num); + + int32_t PopSamples(int32_t num); + int32_t PopSamples(short * pdata, int32_t max_num, int32_t & out_num); + int32_t PopSamples(float * pdata, int32_t max_num, int32_t & out_num); + int32_t PopSamples(std::vector &ppdata, int32_t max_num, int32_t & out_num); + int32_t PopSamples(std::vector &ppdata, int32_t max_num, int32_t & out_num); + + //从后面删除 + int32_t ShadeSamples(int32_t num); + +private: + int32_t GuaranteBufferSize(int32_t size); + void Destory(); + +private: + int32_t m_nChannels; + float * m_ppBuf[CHANNEL_MAX]; + int32_t m_nStart; + int32_t m_nEnd; + //当前一个声道 buf 的长度 + int32_t m_nSize; +}; + + +} + +#endif /* __SUPERSOUND_WAV_BUF_H__ */ \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse.cpp new file mode 100755 index 0000000..4b087bc --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse.cpp @@ -0,0 +1,258 @@ + +#include "impulse.h" +#include "supersound_err.h" +#include "supersound_common.h" + +namespace SUPERSOUND +{ +namespace IMPULSE +{ + +//#define SIMPLE_CONV + +Impulse::Impulse() +{ + memset(&m_current_param, 0, sizeof(m_current_param)); + m_new_param.fs = 44100; + m_new_param.channels = 2; + m_new_param.window_bits = 10; + m_new_param.frame_len = 511; + + m_b_change = true; + m_b_update = true; + + m_im_response_array = NULL; + m_im_res_len = 0; + m_response_channels = 0; + + m_convolution_array = NULL; +} + +Impulse::~Impulse() +{ + Destory(); +} + +void Impulse::Destory() +{ + if(m_convolution_array) + { + for(int32_t i = 0; i < m_current_param.channels; i++) + { + SAFE_DELETE_OBJ(m_convolution_array[i]); + } + SAFE_DELETE_PTR(m_convolution_array); + } + + if (m_im_response_array) + { + for(int32_t i = 0; i < m_response_channels; i++) + { + SAFE_DELETE_PTR(m_im_response_array[i]); + } + SAFE_DELETE_PTR(m_im_response_array); + } +} + +void Impulse::Flush() +{ + if(m_convolution_array) + { + for(int32_t i = 0; i < m_current_param.channels; i++) + { + if(m_convolution_array[i]) + { + m_convolution_array[i]->Flush(); + } + } + } +} + +int32_t Impulse::GetLatecy() +{ + int32_t latecy = 0; + + //因为每个通道的卷积延迟长度相同,所以直接返回一个 + if(m_convolution_array) + { + if(m_convolution_array[0]) + latecy += m_convolution_array[0]->GetLatecy(); + } + + return latecy; +} + +int32_t Impulse::GetFrameLen() +{ + return 
m_new_param.frame_len;
+}
+
+int32_t Impulse::SetSampleRate(int32_t fs)
+{
+    m_new_param.fs = fs;
+    m_b_change = true;
+
+    return ERROR_SUPERSOUND_SUCCESS;
+}
+
+int32_t Impulse::SetChannels(int32_t channels)
+{
+    m_new_param.channels = channels;
+    m_b_change = true;
+
+    return ERROR_SUPERSOUND_SUCCESS;
+}
+
+int32_t Impulse::SetWindowBit(int32_t bits, int32_t frame_len)
+{
+    m_new_param.window_bits = bits;
+    m_new_param.frame_len = (1 << (bits - 1)); // half the FFT window, so an integer number of input samples yields an integer number of output samples
+    if (frame_len > 0)
+    {
+        m_new_param.frame_len = frame_len;
+    }
+
+    m_b_change = true;
+
+    return ERROR_SUPERSOUND_SUCCESS;
+}
+
+int32_t Impulse::SetImpulseResponse(float * im_response, int32_t response_len, int32_t response_channels)
+{
+    if(m_response_channels != response_channels || m_im_res_len != response_len)
+    {
+        if (m_im_response_array)
+        {
+            for(int32_t i = 0; i < m_response_channels; i++)
+            {
+                SAFE_DELETE_PTR(m_im_response_array[i]);
+            }
+            if(m_response_channels != response_channels)
+            {
+                SAFE_DELETE_PTR(m_im_response_array);
+            }
+        }
+        m_response_channels = response_channels;
+
+        if(m_im_response_array == NULL)
+        {
+            m_im_response_array = new (std::nothrow) float *[response_channels];
+            if(m_im_response_array == NULL)
+                return ERROR_SUPERSOUND_MEMORY;
+        }
+
+        for (int32_t i = 0; i < response_channels; i++)
+        {
+            m_im_response_array[i] = new(std::nothrow) float[response_len];
+            if(m_im_response_array[i] == NULL)
+                return ERROR_SUPERSOUND_MEMORY;
+        }
+        m_im_res_len = response_len;
+    }
+
+    // Copy the data: de-interleave the response into per-channel arrays
+//    int momo_response_len = response_len / m_response_channels; // needs a second look
+    int momo_response_len = response_len;
+    for(int32_t i = 0; i < m_response_channels; i++)
+    {
+        for (int32_t j = 0; j < momo_response_len; j++)
+        {
+            m_im_response_array[i][j] = im_response[i + m_response_channels * j];
+        }
+    }
+    m_b_change = true;
+    return ERROR_SUPERSOUND_SUCCESS;
+}
+
+int32_t Impulse::Update()
+{
+    int32_t nRet = ERROR_SUPERSOUND_SUCCESS;
+
+    if (m_im_response_array == NULL) {
+        return ERROR_SUPERSOUND_PARAM;
+    }
+
+    // Window length handed to the FFT
+    int32_t window_len = 1 << m_new_param.window_bits;
+    // Window step (hop size)
+    int32_t window_step = m_new_param.frame_len;
+
+    // Update the channel count
+    if(m_new_param.channels != m_current_param.channels)
+    {
+        if(m_convolution_array)
+        {
+            for(int32_t i = 0; i < m_current_param.channels; i++)
+            {
+                SAFE_DELETE_OBJ(m_convolution_array[i]);
+            }
+            SAFE_DELETE_PTR(m_convolution_array);
+        }
+
+        m_convolution_array = new(std::nothrow) ISuperSoundConvolution * [m_new_param.channels];
+        if(m_convolution_array == NULL)
+            return ERROR_SUPERSOUND_MEMORY;
+        for(int32_t i = 0; i < m_new_param.channels; i++)
+        {
+            #ifdef SIMPLE_CONV
+            m_convolution_array[i] = new(std::nothrow) SupersoundSimpleConvolution();
+            #else
+            m_convolution_array[i] = new(std::nothrow) SuperSoundFastConvolution();
+            #endif
+            if(m_convolution_array[i] == NULL)
+                return ERROR_SUPERSOUND_MEMORY;
+            nRet = m_convolution_array[i]->SetFrameLenZeroLen(window_step, window_len - window_step);
+            if(nRet != ERROR_SUPERSOUND_SUCCESS)
+                return nRet;
+        }
+    }
+    // In theory the case of an unchanged channel count but a changed window_step should be handled too; the caller never produces it, so it is not handled here
+
+    // If the input channel count equals the response channel count, each channel uses its own response; otherwise the response must be mono (response_channels == 1) and all channels share it
+    int32_t flag = (m_new_param.channels == m_response_channels) ?
1 : 0; + for(int32_t i = 0; i < m_new_param.channels; i++) + { + nRet = m_convolution_array[i]->SetImpulseResponse(m_im_response_array[i * flag], m_im_res_len); + if(nRet != ERROR_SUPERSOUND_SUCCESS) + return nRet; + // 清空内部缓存数据,重新计算数据 + m_convolution_array[i]->Flush(); + } + + m_current_param = m_new_param; + m_b_change = false; + + return nRet; +} + +int32_t Impulse::Process(std::vector & buf_vector, int32_t & out_num) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(m_b_change && m_b_update) + { + m_b_change = false; + nRet = Update(); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + } + //外部控制更新必须得到立马的响应 + if(m_b_update) + m_b_update = false; + + for(int32_t i = 0; i < m_current_param.channels; i++) + { + nRet = m_convolution_array[i]->ProcessFrame(buf_vector[i], out_num); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + } + return nRet; +} + +void Impulse::ControlUpdate() +{ + m_b_update = true; +} + +} +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse.h new file mode 100755 index 0000000..41a62bf --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse.h @@ -0,0 +1,114 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +#ifndef __IMPULSE_H__ +#define __IMPULSE_H__ + +#include "convolution/supersound_fast_convolution.h" +#include "convolution/supersound_simple_convolution.h" + +#include + +namespace SUPERSOUND +{ +namespace IMPULSE +{ + +class Impulse +{ +public: + Impulse(); + ~Impulse(); + +public: + //清空所有缓存 + void Flush(); + + //获取延迟长度 + int32_t GetLatecy(); + + //获取外界一次传入多少数据,也就是一帧的长度(单声道) + int32_t GetFrameLen(); + + //设置、更新采样率 + int32_t SetSampleRate(int32_t fs); + + //设置、更新声道数 + int32_t SetChannels(int32_t channels); + + //设置、更新窗的 bit 长度,也就是 FFT 运算的帧长,不是外界传入数据帧长 + int32_t SetWindowBit(int32_t bits, int32_t frame_len = 0); + + //设置冲击响应 + int32_t SetImpulseResponse(float * im_response, int32_t response_len, int32_t response_channels); + + //处理函数,每次输入一数据,同时输出一数据,这样常规的 DSP 操作 + int32_t Process(std::vector & buf_vector, int32_t & out_num); + + //控制更新的时机 + void ControlUpdate(); + + int32_t Update(); + +private: + void Destory(); + +private: + //定义参数结构体 + typedef struct _ParamInfo + { + int32_t fs; + int32_t channels; + int32_t window_bits; + int32_t frame_len; + }ParamInfo; + + ParamInfo m_new_param; + ParamInfo m_current_param; + + //参数上的改动 + bool m_b_change; + //外部开始要求要用新参数进行处理 + bool m_b_update; + + //脉冲响应数据及长度 + float ** m_im_response_array; + int32_t m_im_res_len; + int32_t m_response_channels; + + ISuperSoundConvolution ** m_convolution_array; +}; + + +} +} + +#endif /* __IMPULSE_H__ */ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse_effect.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse_effect.cpp new file mode 100755 index 0000000..d647c8f --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse_effect.cpp @@ -0,0 +1,280 @@ +#include "impulse_effect.h" +#include "supersound_err.h" +#include "supersound_common.h" + +namespace SUPERSOUND +{ +namespace IMPULSE +{ + +ImpulseEffect::ImpulseEffect() +{ + //保持和底层相同的默认值 + m_param.fs = 44100; + m_param.in_channels = 2; + m_param.out_channels = 2; + m_param.window_bits = 10; + m_param.im_response = NULL; + m_param.response_len = 0; + m_param.response_channels = 1; + + m_frame_len = 0; + + m_channel_buf = NULL; + m_max_buf_num = 0; + m_empty_buf = NULL; + m_pre_fill_num = 0; + + m_bInit = false; +} + +ImpulseEffect::~ImpulseEffect() +{ + Destory(); +} + +SUPERSOUND_EFFECT_TYPE ImpulseEffect::GetEffectId() +{ + return SUPERSOUND_IMPULSE_TYPE; +} + +ISuperSound * ImpulseEffect::GetEffectInst() +{ + return new(std::nothrow) ImpulseEffect(); +} + +int32_t ImpulseEffect::SetParam( void * param ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(param == NULL) + return ERROR_SUPERSOUND_PARAM; + + Impulse_Param * new_param = (Impulse_Param *)param; + + //输入输出的声道数必须相同 + if(new_param->in_channels != new_param->out_channels) + return ERROR_SUPERSOUND_PARAM; + + if(new_param->in_channels > CHANNEL_MAX) + return ERROR_SUPERSOUND_PARAM; + + if(new_param->im_response == NULL || new_param->response_len <= 0) + return ERROR_SUPERSOUND_PARAM; + + if((new_param->response_channels != 1) && new_param->response_channels != new_param->in_channels) + return ERROR_SUPERSOUND_PARAM; + + nRet = m_impulse.SetSampleRate(new_param->fs); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + nRet = 
m_impulse.SetChannels(new_param->response_channels); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + //更新输入输出缓冲区 + nRet = m_in_buf.SetChannels(new_param->in_channels); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + nRet = m_out_buf.SetChannels(new_param->out_channels); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + nRet = m_impulse.SetWindowBit(new_param->window_bits, new_param->process_buffer_len); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + m_param.fs = new_param->fs; + m_param.in_channels = new_param->in_channels; + m_param.out_channels = new_param->out_channels; + m_param.window_bits = new_param->window_bits; + m_param.response_channels = new_param->response_channels; + + m_param.response_len = new_param->response_len; + m_param.response_channels = new_param->response_channels; + + nRet = m_impulse.SetImpulseResponse(new_param->im_response, new_param->response_len, new_param->response_channels); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + nRet = m_impulse.Update(); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + //主要是为了防止不断压栈 + int32_t new_frame_len = m_impulse.GetFrameLen(); + int32_t new_buf_num = new_param->in_channels * new_frame_len; + if(m_max_buf_num < new_buf_num) + { + m_max_buf_num = new_buf_num; + SAFE_DELETE_PTR(m_channel_buf); + m_channel_buf = new(std::nothrow) float[m_max_buf_num]; + if(m_channel_buf == NULL) + return ERROR_SUPERSOUND_MEMORY; + } + if((m_buf_vector.size() != new_param->in_channels) || (m_frame_len != new_frame_len)) + { + m_buf_vector.clear(); + m_frame_len = new_frame_len; + for(int32_t i = 0; i < new_param->in_channels; i++) + { + m_buf_vector.push_back(m_channel_buf + i * m_frame_len); + } + } +// 不需要延迟 +// m_pre_fill_num = (m_frame_len + m_impulse.GetLatecy()) * new_param->in_channels; +// SAFE_DELETE_PTR(m_empty_buf); +// m_empty_buf = new(std::nothrow) float[m_pre_fill_num]; +// if(m_empty_buf == NULL) +// return ERROR_SUPERSOUND_MEMORY; +// memset(m_empty_buf, 0, sizeof(float) * m_pre_fill_num); +// +// m_in_buf.PushSamples(m_empty_buf, m_pre_fill_num); + + m_bInit = true; + + return nRet; +} + +void ImpulseEffect::Update() +{ + m_impulse.ControlUpdate(); +} + +int32_t ImpulseEffect::GetParam( void * param ) +{ + Impulse_Param * new_param = (Impulse_Param *)param; + new_param->fs = m_param.fs; + new_param->in_channels = m_param.in_channels; + new_param->out_channels = m_param.out_channels; + + return ERROR_SUPERSOUND_SUCCESS; +} + +int32_t ImpulseEffect::GetSampleRate() +{ + return m_param.fs; +} + +int32_t ImpulseEffect::GetInputChannels() +{ + return m_param.in_channels; +} + +int32_t ImpulseEffect::GetOutputChannels() +{ + return m_param.out_channels; +} + +int32_t ImpulseEffect::GetLatency() +{ +// int32_t latency = (int32_t)(1000.0f * m_pre_fill_num / m_param.fs + 0.5f); +// return latency; + return 0; +} + +int32_t ImpulseEffect::GetFrameLen() +{ + return m_impulse.GetFrameLen(); +} + +void ImpulseEffect::FlushOut() +{ + m_in_buf.Flush(); + m_out_buf.Flush(); + m_impulse.Flush(); + + m_in_buf.PushSamples(m_empty_buf, m_pre_fill_num); +} + +int32_t ImpulseEffect::FlushToBuf( int32_t & canOutputSamples ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + if(!m_bInit) + { + canOutputSamples = 0; + return nRet; + } + + //每个通道的延迟长度以及剩余长度 + int32_t len = m_impulse.GetLatecy() + m_in_buf.DataSizeInCache() + m_out_buf.DataSizeInCache(); + int32_t pro_len = m_param.in_channels * m_frame_len; + + while(1) + { + memset(m_channel_buf, 0, sizeof(float) * pro_len); + nRet = 
ProcessfInput(m_channel_buf, pro_len, canOutputSamples); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + if((canOutputSamples / m_param.out_channels) >= len) + { + m_out_buf.ShadeSamples(canOutputSamples / m_param.out_channels - len); + break; + } + } + + canOutputSamples = m_out_buf.DataSizeInCache() * m_param.out_channels; + + //将需要清空的清空 + m_in_buf.Flush(); + m_impulse.Flush(); + + return nRet; +} + +int32_t ImpulseEffect::ProcessfInput( float * in, int32_t nSamples, int32_t & canOutputSamples ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + int32_t out_num; + + if(!m_bInit) + { + nRet = SetParam((void *)(&m_param)); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + } + + nRet = m_in_buf.PushSamples(in, nSamples); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + while(m_in_buf.DataSizeInCache() >= m_frame_len) + { + nRet = m_in_buf.PopSamples(m_buf_vector, m_frame_len, out_num); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + nRet = m_impulse.Process(m_buf_vector, out_num); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + + nRet = m_out_buf.PushSamples(m_buf_vector, out_num); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + } + + canOutputSamples = m_out_buf.DataSizeInCache() * m_param.out_channels; + + return nRet; +} + +int32_t ImpulseEffect::ProcessfOutput( float * out, int32_t nSamples, int32_t & outSamples ) +{ + int32_t nRet = ERROR_SUPERSOUND_SUCCESS; + + nRet = m_out_buf.PopSamples(out, nSamples, outSamples); + if(ERROR_SUPERSOUND_SUCCESS != nRet) + return nRet; + return nRet; +} + +void ImpulseEffect::Destory() +{ + SAFE_DELETE_PTR(m_channel_buf); +// SAFE_DELETE_PTR(m_param.im_response) + SAFE_DELETE_PTR(m_empty_buf) + m_pre_fill_num = 0; +} + +} +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse_effect.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse_effect.h new file mode 100755 index 0000000..20534c3 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/impulse/impulse_effect.h @@ -0,0 +1,95 @@ + +/*************************************************************************** +* email : yijiangyang@tencent.com * +***************************************************************************/ + +//+ ----------------------------------------------------+ +//+ _oo0oo_ + +//+ o8888888o + +//+ 88" . "88 + +//+ (| -_- |) + +//+ 0\ = /0 + +//+ ___/`---'\___ + +//+ .' \\| |// '. + +//+ / \\||| : |||// \ + +//+ / _||||| -:- |||||- \ + +//+ | | \\\ - /// | | + +//+ | \_| ''\---/'' |_/ | + +//+ \ .-\__ '-' ___/-. / + +//+ ___'. .' /--.--\ `. .'___ + +//+ ."" '< `.___\_<|>_/___.' >' "". + +//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | + +//+ \ \ `_. 
\_ __\ /__ _/ .-` / / +
+//+ =====`-.____`.___ \_____/___.-`___.-'===== +
+//+ `=---=' +
+//+ +
+//+ +
+//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +
+//+ +
+//+ 佛祖保佑 永无BUG +
+//+ ----------------------------------------------------+ +
+
+#ifndef __IMPULSE_EFFECT_H__
+#define __IMPULSE_EFFECT_H__
+
+#include "impulse_types.h"
+#include "impulse.h"
+#include "isupersound.h"
+#include "supersound_wav_buf.h"
+
+namespace SUPERSOUND
+{
+namespace IMPULSE
+{
+
+
+class ImpulseEffect : public ISuperSound
+{
+public:
+    ImpulseEffect();
+    virtual ~ImpulseEffect();
+
+public:
+    virtual SUPERSOUND_EFFECT_TYPE GetEffectId();
+    virtual ISuperSound * GetEffectInst();
+    virtual int32_t SetParam(void * param);
+    virtual void Update();
+    virtual int32_t GetParam(void * param);
+    virtual int32_t GetSampleRate();
+    virtual int32_t GetInputChannels();
+    virtual int32_t GetOutputChannels();
+    virtual void FlushOut();
+    virtual int32_t FlushToBuf(int32_t & canOutputSamples);
+    virtual int32_t ProcessfInput(float * in, int32_t nSamples, int32_t & canOutputSamples);
+    virtual int32_t ProcessfOutput(float * out, int32_t nSamples, int32_t & outSamples);
+    virtual int32_t GetLatency();
+    virtual int32_t GetFrameLen();
+
+private:
+    void Destory();
+
+private:
+    Impulse_Param m_param;
+
+    Impulse m_impulse;
+
+    SuperSoundWavBuf m_in_buf;
+    SuperSoundWavBuf m_out_buf;
+
+    // Frame length per call (mono samples)
+    int32_t m_frame_len;
+    // Heap scratch space, to avoid repeatedly pushing large buffers onto the stack
+    float * m_channel_buf;
+    int32_t m_max_buf_num;
+    std::vector<float *> m_buf_vector;
+    float * m_empty_buf;
+    int m_pre_fill_num;
+    // Whether initialization (SetParam) has completed
+    bool m_bInit;
+};
+
+
+}
+}
+
+#endif /* __IMPULSE_EFFECT_H__ */
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/isupersound.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/isupersound.h
new file mode 100755
index 0000000..d8251ab
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/supersound/src/isupersound.h
@@ -0,0 +1,144 @@
+
+/***************************************************************************
+* email : yijiangyang@tencent.com *
+***************************************************************************/
+
+//+ ----------------------------------------------------+
+//+ _oo0oo_ +
+//+ o8888888o +
+//+ 88" . "88 +
+//+ (| -_- |) +
+//+ 0\ = /0 +
+//+ ___/`---'\___ +
+//+ .' \\| |// '. +
+//+ / \\||| : |||// \ +
+//+ / _||||| -:- |||||- \ +
+//+ | | \\\ - /// | | +
+//+ | \_| ''\---/'' |_/ | +
+//+ \ .-\__ '-' ___/-. / +
+//+ ___'. .' /--.--\ `. .'___ +
+//+ ."" '< `.___\_<|>_/___.' >' "". +
+//+ | | : `- \`.;`\ _ /`;.`/ - ` : | | +
+//+ \ \ `_. 
\_ __\ /__ _/ .-` / / + +//+ =====`-.____`.___ \_____/___.-`___.-'===== + +//+ `=---=' + +//+ + +//+ + +//+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +//+ + +//+ 佛祖保佑 永无BUG + +//+ ----------------------------------------------------+ + +//定义效果器的基类,这样统一所有接口 + +#ifndef __I_SUPERSOUND_H__ +#define __I_SUPERSOUND_H__ + +#include "supersound_types.h" +#include + +namespace SUPERSOUND +{ + + +class ISuperSound +{ +public: + ISuperSound() { }; + virtual ~ISuperSound() { }; + +public: + //+ ---------------------------------------------------- + //+ 获取效果器 Id + //+ 返回值为 SUPERSOUND_EFFECT_TYPE + //+ ---------------------------------------------------- + virtual SUPERSOUND_EFFECT_TYPE GetEffectId() = 0; + + //+ ---------------------------------------------------- + //+ 获取效果器实例 + //+ 返回值为效果器实例 + //+ ---------------------------------------------------- + virtual ISuperSound * GetEffectInst() = 0; + + //+ ---------------------------------------------------- + //+ 设置、更新参数 + //+ 返回值为errCode + //+ ---------------------------------------------------- + virtual int32_t SetParam(void * param) = 0; + + //+ ---------------------------------------------------- + //+ 更新设置,主要是为了做存在参数设置变动比较大的情况下的破音问题 + //+ 返回值为errCode + //+ ---------------------------------------------------- + virtual void Update() = 0; + + //+ ---------------------------------------------------- + //+ 获取参数 + //+ 返回值为errCode + //+ ---------------------------------------------------- + virtual int32_t GetParam(void * param) = 0; + + //+ ---------------------------------------------------- + //+ 获取采样率 + //+ 返回值为采样率 + //+ ---------------------------------------------------- + virtual int32_t GetSampleRate() = 0; + + //+ ---------------------------------------------------- + //+ 获取输入声道数 + //+ 返回值为输入声道数 + //+ ---------------------------------------------------- + virtual int32_t GetInputChannels() = 0; + + //+ ---------------------------------------------------- + //+ 获取输出声道数 + //+ 返回值为输出声道数 + //+ ---------------------------------------------------- + virtual int32_t GetOutputChannels() = 0; + + //+ ---------------------------------------------------- + //+ 清空缓存数据,在外围有进行跳转操作时要调用的操作 + //+ ---------------------------------------------------- + virtual void FlushOut() = 0; + + //+ ---------------------------------------------------- + //+ 获取最后的缓存数据到输出缓存中 + //+ 返回值为errCode + //+ ---------------------------------------------------- + virtual int32_t FlushToBuf(int32_t & canOutputSamples) = 0; + + //+ ---------------------------------------------------- + //+ 对浮点数据进行处理 + //+ in:输入音频数据指针 + //+ nSamples:输入音频数据指针长度 + //+ canOutputSamples:能够输出的数据长度 + //+ 返回值为errCode + //+ ---------------------------------------------------- + virtual int32_t ProcessfInput(float * in, int32_t nSamples, int32_t & canOutputSamples) = 0; + + //+ ---------------------------------------------------- + //+ 对浮点数据进行处理 + //+ out:输出音频数据指针 + //+ nSamples:输出音频数据指针长度 + //+ outSamples:实际获取到的数据长度 + //+ 返回值为errCode + //+ ---------------------------------------------------- + virtual int32_t ProcessfOutput(float * out, int32_t nSamples, int32_t & outSamples) = 0; + + //+ ---------------------------------------------------- + //+ 获取效果器延迟时间 + //+ 返回值为延迟时间,单位:ms + //+ ---------------------------------------------------- + virtual int32_t GetLatency() = 0; + //+ ---------------------------------------------------- + //+ 获取效果器内部一帧的长度[单声道] + //+ 返回值为单声道采样点数量 + //+ ---------------------------------------------------- + virtual int32_t GetFrameLen() = 0; + +}; + + +} + +#endif /* __I_SUPERSOUND_H__ */ 
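Taken together, ISuperSound is a push/pull pipeline: the caller keeps feeding interleaved float blocks through ProcessfInput, drains whatever is ready with ProcessfOutput, and calls FlushToBuf once at end of stream to recover the tail still buffered inside the effect (for the impulse effect, the reverb decay). A hypothetical driver loop under those assumptions (RunEffect is illustrative, not part of the library, and ERROR_SUPERSOUND_SUCCESS is assumed to be 0):

#include <cstdint>
#include <algorithm>
#include <vector>
#include "isupersound.h"

// Push one interleaved clip through an effect and collect all of its output.
int32_t RunEffect(SUPERSOUND::ISuperSound * fx, const std::vector<float> & in, std::vector<float> & out)
{
    const int32_t frame = fx->GetFrameLen() * fx->GetInputChannels();
    std::vector<float> block((size_t)frame), ready;
    int32_t canOut = 0, got = 0;

    for (size_t pos = 0; pos + (size_t)frame <= in.size(); pos += (size_t)frame)
    {
        std::copy(in.begin() + pos, in.begin() + pos + frame, block.begin());
        if (fx->ProcessfInput(block.data(), frame, canOut) != 0)  // 0 == success assumed
            return -1;
        ready.resize((size_t)canOut);
        fx->ProcessfOutput(ready.data(), canOut, got);
        out.insert(out.end(), ready.begin(), ready.begin() + got);
    }

    // End of stream: pull whatever tail the effect still holds internally.
    fx->FlushToBuf(canOut);
    ready.resize((size_t)canOut);
    fx->ProcessfOutput(ready.data(), canOut, got);
    out.insert(out.end(), ready.begin(), ready.begin() + got);
    return 0;
}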
\ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/CMakeLists.txt new file mode 100644 index 0000000..e1f7f34 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/CMakeLists.txt @@ -0,0 +1,15 @@ +include_directories(./ inc src) + +include_directories(src/aa_filter) +include_directories(src/bpm_detect) +include_directories(src/cpu_detect) +include_directories(src/fifo_sample_buffer) +include_directories(src/fir_filter) +include_directories(src/peak_finder) +include_directories(src/rate_transposer) +include_directories(src/sound_touch) +include_directories(src/td_stretch) + +file(GLOB_RECURSE TONESHIFT_SRC_FILES src/*cpp) +add_library(tone_shift ${TONESHIFT_SRC_FILES}) +#set_target_properties(tone_shift PROPERTIES CXX_VISIBILITY_PRESET hidden) \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CSoundTouchDef.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CSoundTouchDef.h new file mode 100644 index 0000000..c7f1455 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CSoundTouchDef.h @@ -0,0 +1,15 @@ +// +// Created by yangjianli on 2020-01-15. +// + +#ifndef AUDIO_EFFECTS_LIB_SOUNDTOUCHDEF_H +#define AUDIO_EFFECTS_LIB_SOUNDTOUCHDEF_H +#include "AudioEffectsConf.h" +enum ST_ERR { + ST_ERR_SUCCESS = 0, + ST_ERR_PARAM = -1, + ST_ERR_BASE_H_MALLOC_NULL = -2, + ST_ERR_BASE_H_UNKNOWN = -3, +}; + +#endif //AUDIO_EFFECTS_LIB_SOUNDTOUCHDEF_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CSpeedShift.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CSpeedShift.h new file mode 100644 index 0000000..de269f4 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CSpeedShift.h @@ -0,0 +1,35 @@ +// +// Created by wangjianjun on 18/11/1. +// + +#ifndef CAUDIODECODER_CSPEEDSHIFT_H +#define CAUDIODECODER_CSPEEDSHIFT_H + +#include "SpeedShiftInterface.h" + +class CSpeedShift : public SpeedShiftInterface { +public: + CSpeedShift(); + ~CSpeedShift(); + +public: + int init(int sampleRate, int channel); + void uninit(); + + int set_speed_value(float speedVal); + float get_speed_value(); + + int get_latence(); + void reset(); + + int process(float *inBuffer, int inSize, float *outBuffer, int outSize); + +private: + float m_speed_value; // speed value. + int m_channel; // sample channel, 1 for mono, 2 for stereo. 
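+    // Opaque soundtouch::SoundTouch instance; stored as void* so this header does
+    // not have to include SoundTouch.h (CSpeedShift.cpp performs the casts).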
+
+    void* pTone;
+};
+
+
+#endif //CAUDIODECODER_CSPEEDSHIFT_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CToneShift.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CToneShift.h
new file mode 100644
index 0000000..4acc707
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/CToneShift.h
@@ -0,0 +1,42 @@
+/************************************************************************/
+/* tone shift                                                           */
+/* written by ethanzhao, 6-16,2014                                      */
+/************************************************************************/
+#ifndef C_TONE_SHIFT_H
+#define C_TONE_SHIFT_H
+
+#include "ToneShiftInterfaces.h"
+#define MAX_TONE_SHIFT_VALUE 12     // tone shift max value
+#define MIN_TONE_SHIFT_VALUE -12    // tone shift min value
+
+/* change tone style */
+class CToneShift : public ToneShiftInterface
+{
+public:
+    CToneShift();
+    ~CToneShift();
+
+    int init(int sample_rate, int channel);
+    void uninit();
+
+    int get_shift_range(int *max_val, int *min_val);  // get shift range, [-12, +12]
+    int get_shift_default();                          // get default shift value, usually 0
+    int set_shift_value(int shift_val);               // set the current shift value
+    int get_shift_value();                            // get the current shift value
+    int get_latence();                                // latency in ms
+    void reset();
+
+    /* process; returns the real output size after processing. */
+    int process(float *in_buffer, int in_size, float *out_buffer, int out_size);
+
+private:
+    int m_shift_value;    // shift value.
+    int m_iChannel;       // sample channel, 1 for mono, 2 for stereo.
+    int m_i_sample_rate;  // sample rate.
+
+    void* pTone;
+};
+
+
+#endif
+
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/SpeedShiftInterface.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/SpeedShiftInterface.h
new file mode 100644
index 0000000..baf1890
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/SpeedShiftInterface.h
@@ -0,0 +1,30 @@
+//
+// Created by wangjianjun on 18/11/1.
+//
+
+#ifndef CAUDIODECODER_SPEEDSHIFTINTERFACE_H
+#define CAUDIODECODER_SPEEDSHIFTINTERFACE_H
+
+#define MAX_SPEED_SHIFT_VALUE 5.0f  // fastest: 5x speed-up
+#define MIN_SPEED_SHIFT_VALUE 0.2f  // slowest: 5x slow-down (1 / 0.2f)
+#include "CSoundTouchDef.h"
+class SpeedShiftInterface
+{
+public:
+    /* Create and destroy instances. */
+    static SpeedShiftInterface* CreateObject();
+    static void DestroyObject(SpeedShiftInterface** pObject);
+public:
+    virtual int init(int sample_rate, int channel) = 0;
+    virtual void uninit() = 0;
+
+    virtual int set_speed_value(float speed_val) = 0;
+    virtual float get_speed_value() = 0;
+
+    virtual int get_latence() = 0;
+    virtual void reset() = 0;
+
+    virtual int process(float *in_buffer, int in_size, float *out_buffer, int out_size) = 0;
+};
+
+#endif //CAUDIODECODER_SPEEDSHIFTINTERFACE_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/ToneShiftInterfaces.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/ToneShiftInterfaces.h
new file mode 100644
index 0000000..e311485
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/inc/ToneShiftInterfaces.h
@@ -0,0 +1,30 @@
+/************************************************************************/
+/* karaoke audio base module interface.                                 */
+/************************************************************************/
+
+#ifndef TONE_SHIFT_INTERFACE_H
+#define TONE_SHIFT_INTERFACE_H
+#include "CSoundTouchDef.h"
+/* change tone style */
+class ToneShiftInterface
+{
+public:
+    /* Create and destroy instances. */
+    static ToneShiftInterface* create_object();
+    static void destroy_object(ToneShiftInterface **pObject);
+public:
+    virtual int init(int sample_rate, int channel) = 0;
+    virtual void uninit() = 0;
+
+    virtual int get_shift_range(int *max_val, int *min_val) = 0;
+    virtual int get_shift_default() = 0;
+    virtual int set_shift_value(int shift_val) = 0;
+    virtual int get_shift_value() = 0;
+
+    virtual int get_latence() = 0;
+    virtual void reset() = 0;
+
+    virtual int process(float *in_buffer, int in_size, float *out_buffer, int out_size) = 0;
+};
+
+#endif //TONE_SHIFT_INTERFACE_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/CSpeedShift.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/CSpeedShift.cpp
new file mode 100644
index 0000000..a448817
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/CSpeedShift.cpp
@@ -0,0 +1,144 @@
+//
+// Created by wangjianjun on 18/11/1.
+//
+
+#include <math.h>      // fabsf
+#include "CSpeedShift.h"
+#include "SoundTouch.h"
+#include "CSoundTouchDef.h"
+#include <string.h>    // memcpy/memset
+
+using namespace soundtouch;
+
+// priming buffer: 3837 zero frames are pushed at init/reset to pre-fill SoundTouch's pipeline
+static float gs_buf[3837 * 2] = { 0.0f };
+
+SpeedShiftInterface* SpeedShiftInterface::CreateObject()
+{
+    CSpeedShift * pSpeedShift = new CSpeedShift();
+    return pSpeedShift;
+}
+
+void SpeedShiftInterface::DestroyObject(SpeedShiftInterface** pObject)
+{
+    delete (*pObject);
+    (*pObject) = NULL;
+}
+
+CSpeedShift::CSpeedShift()
+{
+    pTone = NULL;
+    m_speed_value = 1.0f;
+}
+
+CSpeedShift::~CSpeedShift()
+{
+    uninit();
+}
+
+void CSpeedShift::uninit()
+{
+    SoundTouch* stchTone = (SoundTouch*)pTone;
+    if (stchTone != NULL)
+    {
+        stchTone->flush();
+        delete stchTone;
+
+        pTone = NULL;
+    }
+}
+
+int CSpeedShift::init(int sampleRate, int channel) {
+    SoundTouch* stchTone = new SoundTouch;
+    pTone = stchTone;
+
+    stchTone->setChannels(channel);
+    stchTone->setSampleRate(sampleRate);
+
+    //stchTone->setSetting(SETTING_USE_AA_FILTER, 1);
+    stchTone->setSetting(SETTING_USE_AA_FILTER, 0);
+    stchTone->setSetting(SETTING_USE_QUICKSEEK, 1);
+    stchTone->setSetting(SETTING_SEQUENCE_MS, 40);
+    stchTone->setSetting(SETTING_SEEKWINDOW_MS, 15);
+    stchTone->setSetting(SETTING_OVERLAP_MS, 8);
+
+    stchTone->setTempo(1.0f);
+
+    stchTone->putSamples(gs_buf, 3837);
+
+    m_channel = channel;
+    return 0;
+}
+
+int CSpeedShift::set_speed_value(float speedVal)
+{
+    SoundTouch* stchTone = (SoundTouch*)pTone;
+    if (stchTone == NULL)
+    {
+        return ST_ERR_BASE_H_MALLOC_NULL;
+    }
+
+    if (speedVal > MAX_SPEED_SHIFT_VALUE)
+    {
+        speedVal = MAX_SPEED_SHIFT_VALUE;
+    }
+    else if (speedVal < MIN_SPEED_SHIFT_VALUE)
+    {
+        speedVal = MIN_SPEED_SHIFT_VALUE;
+    }
+
+    m_speed_value = speedVal;
+    stchTone->setTempo(m_speed_value);
+
+    return 0;
+}
+
+float CSpeedShift::get_speed_value()
+{
+    return m_speed_value;
+}
+
+void CSpeedShift::reset()
+{
+    SoundTouch* stchTone = (SoundTouch*)pTone;
+    if (stchTone == NULL)
+    {
+        return;
+    }
+    stchTone->clear();
+
+    stchTone->putSamples(gs_buf, 3837);
+}
+
+int CSpeedShift::get_latence()
+{
+    return 80;
+}
+
+int CSpeedShift::process(float *inBuffer, int inSize, float *outBuffer, int outSize)
+{
+    int inNum;
+    int outNum;
+
+    SoundTouch* stchTone = (SoundTouch*)pTone;
+    if (stchTone == NULL)
+    {
+        return ST_ERR_BASE_H_MALLOC_NULL;
+    }
+
+    if (fabsf(m_speed_value - 1.0f) <= 0.001f)
+    {
+        outSize = outSize > inSize ? inSize : outSize;
+        // speed is effectively 1.0: pass the input straight through.
+        memcpy(outBuffer, inBuffer, outSize * sizeof(float));
+        return outSize;
+    }
+
+    inNum = inSize / m_channel;
+    stchTone->putSamples((SAMPLETYPE*)inBuffer, inNum);
+
+    // clear after putSamples so the call also works when inBuffer and outBuffer alias
+    memset(outBuffer, 0, outSize * sizeof(float));
+
+    outNum = stchTone->receiveSamples((SAMPLETYPE*)outBuffer, outSize / m_channel);
+
+    return outNum * m_channel;
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/CToneShift.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/CToneShift.cpp
new file mode 100644
index 0000000..bb23c10
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/CToneShift.cpp
@@ -0,0 +1,164 @@
+#include "CToneShift.h"
+#include "SoundTouch.h"
+#include "CSoundTouchDef.h"
+#include <string.h>    // memcpy/memset
+
+using namespace soundtouch;
+
+//static SoundTouch stchTone; // for tone shift.
+static float gs_blk[3837 * 2] = { 0.0f };
+
+ToneShiftInterface* ToneShiftInterface::create_object()
+{
+    ToneShiftInterface* pObject = new CToneShift;
+    return pObject;
+}
+
+void ToneShiftInterface::destroy_object(ToneShiftInterface **pObject)
+{
+    delete (*pObject);
+    (*pObject) = NULL;
+}
+
+CToneShift::CToneShift()
+{
+}
+
+CToneShift::~CToneShift()
+{
+    uninit();
+}
+
+///////////////////////////// functions for tone shift below ///////////////////////////////////
+int CToneShift::process(float *in_buffer, int in_size, float *out_buffer, int out_size)
+{
+    int inNum;
+    int outNum;
+
+    SoundTouch* stchTone = (SoundTouch*)pTone;
+    if (stchTone == NULL)
+    {
+        return ST_ERR_BASE_H_MALLOC_NULL;
+    }
+
+    out_size = out_size > in_size ? in_size : out_size;
+    if (m_shift_value == 0)
+    {
+        // no shift requested: pass the input straight through.
+        memcpy(out_buffer, in_buffer, out_size * sizeof(float));
+        return out_size;
+    }
+
+    inNum = in_size / m_iChannel;
+    stchTone->putSamples((SAMPLETYPE*)in_buffer, inNum);
+
+    // clearing after putSamples keeps this correct even when in_buffer and out_buffer are the same buffer
+    memset(out_buffer, 0, out_size * sizeof(float));
+
+    outNum = stchTone->receiveSamples((SAMPLETYPE*)out_buffer, out_size / m_iChannel);
+    //return outNum * m_iChannel * sizeof(short);
+    return outNum * m_iChannel;
+}
+
+int CToneShift::get_latence()
+{
+    return 84;
+}
+
+void CToneShift::reset()
+{
+    SoundTouch* stchTone = (SoundTouch*)pTone;
+    if (stchTone == NULL)
+    {
+        return;
+    }
+    stchTone->clear();
+
+    stchTone->putSamples(gs_blk, 3837);
+}
+
+int CToneShift::get_shift_value()
+{
+    return m_shift_value;
+}
+
+int CToneShift::set_shift_value(int shift_val)
+{
+    SoundTouch* stchTone = (SoundTouch*)pTone;
+    if (stchTone == NULL)
+    {
+        return ST_ERR_BASE_H_MALLOC_NULL;
+    }
+
+    if (shift_val > MAX_TONE_SHIFT_VALUE)
+    {
+        shift_val = MAX_TONE_SHIFT_VALUE;
+    }
+    else if (shift_val < MIN_TONE_SHIFT_VALUE)
+    {
+        shift_val = MIN_TONE_SHIFT_VALUE;
+    }
+
+    m_shift_value = shift_val;
+    stchTone->setPitchSemiTones(m_shift_value);
+
+    return 0;
+}
+
+int CToneShift::get_shift_default()
+{
+    return 0;
+}
+
+int CToneShift::get_shift_range(int *max_val, int *min_val)
+{
+    *max_val = MAX_TONE_SHIFT_VALUE;
+    *min_val = MIN_TONE_SHIFT_VALUE;
+
+    return 0;
+}
+
+
+void CToneShift::uninit()
+{
+    SoundTouch* stchTone = (SoundTouch*)pTone;
+    if (stchTone != NULL)
+    {
+        stchTone->flush();
+
+        //delete pTone;
+        delete stchTone;
+
+        pTone = NULL;
+    }
+}
+
+int CToneShift::init(int sample_rate, int channel)
+{
+    pTone = NULL;
+
+    SoundTouch* stchTone = new SoundTouch;
+    pTone = stchTone;
+
+    stchTone->setChannels(channel);
+    stchTone->setSampleRate(sample_rate);
+
+    //stchTone->setSetting(SETTING_USE_AA_FILTER, 1);
+    stchTone->setSetting(SETTING_USE_AA_FILTER, 0);
+    stchTone->setSetting(SETTING_USE_QUICKSEEK, 1);
+    stchTone->setSetting(SETTING_SEQUENCE_MS, 40);
+    stchTone->setSetting(SETTING_SEEKWINDOW_MS, 15);
+    stchTone->setSetting(SETTING_OVERLAP_MS, 8);
+
+    stchTone->setPitchSemiTones(0);
+
+    stchTone->putSamples(gs_blk, 3837);
+
+    m_shift_value = 0;
+    m_i_sample_rate = sample_rate;
+    m_iChannel = channel;
+    return 0;
+}
+
+///////////////////////////// end of tone shift functions ///////////////////////////////////
+
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/FIFOSamplePipe.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/FIFOSamplePipe.h
new file mode 100644
index 0000000..f26c57b
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/FIFOSamplePipe.h
@@ -0,0 +1,234 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// 'FIFOSamplePipe' : An abstract base class for classes that manipulate sound
+/// samples by operating like a first-in-first-out pipe: New samples are fed
+/// into one end of the pipe with the 'putSamples' function, and the processed
+/// samples are received from the other end with the 'receiveSamples' function.
+///
+/// 'FIFOProcessor' : A base class for classes that do signal processing with
+/// the samples while operating like a first-in-first-out pipe. When samples
+/// are input with the 'putSamples' function, the class processes them
+/// and moves the processed samples to the given 'output' pipe object, which
+/// may be either another processing stage, or a fifo sample buffer object.
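//
// A minimal sketch of the pipe contract described above (hypothetical driver
// code; it uses the concrete FIFOSampleBuffer that appears later in this diff,
// and consume() is a placeholder): input and output counts need not match per
// call, so callers drain in a loop.
//
//     soundtouch::FIFOSampleBuffer fifo(2);       // 2 = stereo
//     fifo.putSamples(interleaved, nFrames);      // feed one end
//     while (!fifo.isEmpty()) {
//         uint got = fifo.receiveSamples(outBuf, kMaxFrames);  // drain the other
//         consume(outBuf, got);
//     }
//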
+/// +/// Author : Copyright (c) Olli Parviainen +/// Author e-mail : oparviai 'at' iki.fi +/// SoundTouch WWW: http://www.surina.net/soundtouch +/// +//////////////////////////////////////////////////////////////////////////////// +// +// Last changed : $Date: 2012-06-13 22:29:53 +0300 (Wed, 13 Jun 2012) $ +// File revision : $Revision: 4 $ +// +// $Id: FIFOSamplePipe.h 143 2012-06-13 19:29:53Z oparviai $ +// +//////////////////////////////////////////////////////////////////////////////// +// +// License : +// +// SoundTouch audio processing library +// Copyright (c) Olli Parviainen +// +// This library is free software; you can redistribute it and/or +// modify it under the terms of the GNU Lesser General Public +// License as published by the Free Software Foundation; either +// version 2.1 of the License, or (at your option) any later version. +// +// This library is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +// Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public +// License along with this library; if not, write to the Free Software +// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +// +//////////////////////////////////////////////////////////////////////////////// + +#ifndef FIFOSamplePipe_H +#define FIFOSamplePipe_H + +#include +#include +#include "STTypes.h" + +namespace soundtouch +{ + +/// Abstract base class for FIFO (first-in-first-out) sample processing classes. +class FIFOSamplePipe +{ +public: + // virtual default destructor + virtual ~FIFOSamplePipe() {} + + + /// Returns a pointer to the beginning of the output samples. + /// This function is provided for accessing the output samples directly. + /// Please be careful for not to corrupt the book-keeping! + /// + /// When using this function to output samples, also remember to 'remove' the + /// output samples from the buffer by calling the + /// 'receiveSamples(numSamples)' function + virtual SAMPLETYPE *ptrBegin() = 0; + + /// Adds 'numSamples' pcs of samples from the 'samples' memory position to + /// the sample buffer. + virtual void putSamples(const SAMPLETYPE *samples, ///< Pointer to samples. + uint numSamples ///< Number of samples to insert. + ) = 0; + + + // Moves samples from the 'other' pipe instance to this instance. + void moveSamples(FIFOSamplePipe &other ///< Other pipe instance where from the receive the data. + ) + { + int oNumSamples = other.numSamples(); + + putSamples(other.ptrBegin(), oNumSamples); + other.receiveSamples(oNumSamples); + }; + + /// Output samples from beginning of the sample buffer. Copies requested samples to + /// output buffer and removes them from the sample buffer. If there are less than + /// 'numsample' samples in the buffer, returns all that available. + /// + /// \return Number of samples returned. + virtual uint receiveSamples(SAMPLETYPE *output, ///< Buffer where to copy output samples. + uint maxSamples ///< How many samples to receive at max. + ) = 0; + + /// Adjusts book-keeping so that given number of samples are removed from beginning of the + /// sample buffer without copying them anywhere. + /// + /// Used to reduce the number of samples in the buffer when accessing the sample buffer directly + /// with 'ptrBegin' function. + virtual uint receiveSamples(uint maxSamples ///< Remove this many samples from the beginning of pipe. 
+ ) = 0; + + /// Returns number of samples currently available. + virtual uint numSamples() const = 0; + + // Returns nonzero if there aren't any samples available for outputting. + virtual int isEmpty() const = 0; + + /// Clears all the samples. + virtual void clear() = 0; + + /// allow trimming (downwards) amount of samples in pipeline. + /// Returns adjusted amount of samples + virtual uint adjustAmountOfSamples(uint numSamples) = 0; + +}; + + + +/// Base-class for sound processing routines working in FIFO principle. With this base +/// class it's easy to implement sound processing stages that can be chained together, +/// so that samples that are fed into beginning of the pipe automatically go through +/// all the processing stages. +/// +/// When samples are input to this class, they're first processed and then put to +/// the FIFO pipe that's defined as output of this class. This output pipe can be +/// either other processing stage or a FIFO sample buffer. +class FIFOProcessor :public FIFOSamplePipe +{ +protected: + /// Internal pipe where processed samples are put. + FIFOSamplePipe *output; + + /// Sets output pipe. + void setOutPipe(FIFOSamplePipe *pOutput) + { + assert(output == NULL); + assert(pOutput != NULL); + output = pOutput; + } + + + /// Constructor. Doesn't define output pipe; it has to be set be + /// 'setOutPipe' function. + FIFOProcessor() + { + output = NULL; + } + + + /// Constructor. Configures output pipe. + FIFOProcessor(FIFOSamplePipe *pOutput ///< Output pipe. + ) + { + output = pOutput; + } + + + /// Destructor. + virtual ~FIFOProcessor() + { + } + + + /// Returns a pointer to the beginning of the output samples. + /// This function is provided for accessing the output samples directly. + /// Please be careful for not to corrupt the book-keeping! + /// + /// When using this function to output samples, also remember to 'remove' the + /// output samples from the buffer by calling the + /// 'receiveSamples(numSamples)' function + virtual SAMPLETYPE *ptrBegin() + { + return output->ptrBegin(); + } + +public: + + /// Output samples from beginning of the sample buffer. Copies requested samples to + /// output buffer and removes them from the sample buffer. If there are less than + /// 'numsample' samples in the buffer, returns all that available. + /// + /// \return Number of samples returned. + virtual uint receiveSamples(SAMPLETYPE *outBuffer, ///< Buffer where to copy output samples. + uint maxSamples ///< How many samples to receive at max. + ) + { + return output->receiveSamples(outBuffer, maxSamples); + } + + + /// Adjusts book-keeping so that given number of samples are removed from beginning of the + /// sample buffer without copying them anywhere. + /// + /// Used to reduce the number of samples in the buffer when accessing the sample buffer directly + /// with 'ptrBegin' function. + virtual uint receiveSamples(uint maxSamples ///< Remove this many samples from the beginning of pipe. + ) + { + return output->receiveSamples(maxSamples); + } + + + /// Returns number of samples currently available. + virtual uint numSamples() const + { + return output->numSamples(); + } + + + /// Returns nonzero if there aren't any samples available for outputting. + virtual int isEmpty() const + { + return output->isEmpty(); + } + + /// allow trimming (downwards) amount of samples in pipeline. 
+ /// Returns adjusted amount of samples + virtual uint adjustAmountOfSamples(uint numSamples) + { + return output->adjustAmountOfSamples(numSamples); + } + +}; + +} + +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/STTypes.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/STTypes.h new file mode 100644 index 0000000..7af6bb9 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/STTypes.h @@ -0,0 +1,188 @@ +//////////////////////////////////////////////////////////////////////////////// +/// +/// Common type definitions for SoundTouch audio processing library. +/// +/// Author : Copyright (c) Olli Parviainen +/// Author e-mail : oparviai 'at' iki.fi +/// SoundTouch WWW: http://www.surina.net/soundtouch +/// +//////////////////////////////////////////////////////////////////////////////// +// +// Last changed : $Date: 2012-12-28 16:53:56 +0200 (Fri, 28 Dec 2012) $ +// File revision : $Revision: 3 $ +// +// $Id: STTypes.h 162 2012-12-28 14:53:56Z oparviai $ +// +//////////////////////////////////////////////////////////////////////////////// +// +// License : +// +// SoundTouch audio processing library +// Copyright (c) Olli Parviainen +// +// This library is free software; you can redistribute it and/or +// modify it under the terms of the GNU Lesser General Public +// License as published by the Free Software Foundation; either +// version 2.1 of the License, or (at your option) any later version. +// +// This library is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +// Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public +// License along with this library; if not, write to the Free Software +// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +// +//////////////////////////////////////////////////////////////////////////////// + +#ifndef STTypes_H +#define STTypes_H + +typedef unsigned int uint; +typedef unsigned long ulong; + +// Patch for MinGW: on Win64 long is 32-bit +#ifdef _WIN64 + typedef unsigned long long ulongptr; +#else + typedef ulong ulongptr; +#endif + +// Helper macro for aligning pointer up to next 16-byte boundary +#define SOUNDTOUCH_ALIGN_POINTER_16(x) ( ( (ulongptr)(x) + 15 ) & ~(ulongptr)15 ) + +//#if (defined(__GNUC__) && !defined(ANDROID)) +// // In GCC, include soundtouch_config.h made by config scritps. +// // Skip this in Android compilation that uses GCC but without configure scripts. 
+// #include "soundtouch_config.h" +//#endif + +#ifndef _WINDEF_ + // if these aren't defined already by Windows headers, define now + + //typedef int BOOL; +#ifndef BOOL +#define BOOL int +#endif + + #define FALSE 0 + #define TRUE 1 + +#endif // _WINDEF_ + + +namespace soundtouch +{ + /// Activate these undef's to overrule the possible sampletype + /// setting inherited from some other header file: + //#undef SOUNDTOUCH_INTEGER_SAMPLES + //#undef SOUNDTOUCH_FLOAT_SAMPLES + + #if (defined(__SOFTFP__)) + // For Android compilation: Force use of Integer samples in case that + // compilation uses soft-floating point emulation - soft-fp is way too slow + #undef SOUNDTOUCH_FLOAT_SAMPLES + #define SOUNDTOUCH_INTEGER_SAMPLES 1 + #endif + + #if !(SOUNDTOUCH_INTEGER_SAMPLES || SOUNDTOUCH_FLOAT_SAMPLES) + + /// Choose either 32bit floating point or 16bit integer sampletype + /// by choosing one of the following defines, unless this selection + /// has already been done in some other file. + //// + /// Notes: + /// - In Windows environment, choose the sample format with the + /// following defines. + /// - In GNU environment, the floating point samples are used by + /// default, but integer samples can be chosen by giving the + /// following switch to the configure script: + /// ./configure --enable-integer-samples + /// However, if you still prefer to select the sample format here + /// also in GNU environment, then please #undef the INTEGER_SAMPLE + /// and FLOAT_SAMPLE defines first as in comments above. + //#define SOUNDTOUCH_INTEGER_SAMPLES 1 //< 16bit integer samples + #define SOUNDTOUCH_FLOAT_SAMPLES 1 //< 32bit float samples + + #endif + + #if (_M_IX86 || __i386__ || __x86_64__ || _M_X64) + /// Define this to allow X86-specific assembler/intrinsic optimizations. + /// Notice that library contains also usual C++ versions of each of these + /// these routines, so if you're having difficulties getting the optimized + /// routines compiled for whatever reason, you may disable these optimizations + /// to make the library compile. + + //#define SOUNDTOUCH_ALLOW_X86_OPTIMIZATIONS 0 + + /// In GNU environment, allow the user to override this setting by + /// giving the following switch to the configure script: + /// ./configure --disable-x86-optimizations + /// ./configure --enable-x86-optimizations=no + #ifdef SOUNDTOUCH_DISABLE_X86_OPTIMIZATIONS + #undef SOUNDTOUCH_ALLOW_X86_OPTIMIZATIONS + #endif + #else + /// Always disable optimizations when not using a x86 systems. + #undef SOUNDTOUCH_ALLOW_X86_OPTIMIZATIONS + + #endif + + // If defined, allows the SIMD-optimized routines to take minor shortcuts + // for improved performance. Undefine to require faithfully similar SIMD + // calculations as in normal C implementation. + #define SOUNDTOUCH_ALLOW_NONEXACT_SIMD_OPTIMIZATION 1 + + + #ifdef SOUNDTOUCH_INTEGER_SAMPLES + // 16bit integer sample type + typedef short SAMPLETYPE; + // data type for sample accumulation: Use 32bit integer to prevent overflows + typedef long LONG_SAMPLETYPE; + + #ifdef SOUNDTOUCH_FLOAT_SAMPLES + // check that only one sample type is defined + #error "conflicting sample types defined" + #endif // SOUNDTOUCH_FLOAT_SAMPLES + + #ifdef SOUNDTOUCH_ALLOW_X86_OPTIMIZATIONS + // Allow MMX optimizations + #define SOUNDTOUCH_ALLOW_MMX 1 + #endif + + #else + + // floating point samples + typedef float SAMPLETYPE; + // data type for sample accumulation: Use double to utilize full precision. 
+ typedef double LONG_SAMPLETYPE; + + #ifdef SOUNDTOUCH_ALLOW_X86_OPTIMIZATIONS + // Allow SSE optimizations + #define SOUNDTOUCH_ALLOW_SSE 1 + #endif + + #endif // SOUNDTOUCH_INTEGER_SAMPLES + +}; + +// define ST_NO_EXCEPTION_HANDLING switch to disable throwing std exceptions: +#define ST_NO_EXCEPTION_HANDLING 1 +#ifdef ST_NO_EXCEPTION_HANDLING + // Exceptions disabled. Throw asserts instead if enabled. + #include + #define ST_THROW_RT_ERROR(x) {assert((const char *)x);} +#else + // use c++ standard exceptions + #include + #define ST_THROW_RT_ERROR(x) {throw std::runtime_error(x);} +#endif + +// When this #define is active, eliminates a clicking sound when the "rate" or "pitch" +// parameter setting crosses from value <1 to >=1 or vice versa during processing. +// Default is off as such crossover is untypical case and involves a slight sound +// quality compromise. +//#define SOUNDTOUCH_PREVENT_CLICK_AT_RATE_CROSSOVER 1 + +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/aa_filter/AAFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/aa_filter/AAFilter.cpp new file mode 100644 index 0000000..f099bce --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/aa_filter/AAFilter.cpp @@ -0,0 +1,184 @@ +//////////////////////////////////////////////////////////////////////////////// +/// +/// FIR low-pass (anti-alias) filter with filter coefficient design routine and +/// MMX optimization. +/// +/// Anti-alias filter is used to prevent folding of high frequencies when +/// transposing the sample rate with interpolation. +/// +/// Author : Copyright (c) Olli Parviainen +/// Author e-mail : oparviai 'at' iki.fi +/// SoundTouch WWW: http://www.surina.net/soundtouch +/// +//////////////////////////////////////////////////////////////////////////////// +// +// Last changed : $Date: 2009-01-11 13:34:24 +0200 (Sun, 11 Jan 2009) $ +// File revision : $Revision: 4 $ +// +// $Id: AAFilter.cpp 45 2009-01-11 11:34:24Z oparviai $ +// +//////////////////////////////////////////////////////////////////////////////// +// +// License : +// +// SoundTouch audio processing library +// Copyright (c) Olli Parviainen +// +// This library is free software; you can redistribute it and/or +// modify it under the terms of the GNU Lesser General Public +// License as published by the Free Software Foundation; either +// version 2.1 of the License, or (at your option) any later version. +// +// This library is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +// Lesser General Public License for more details. 
+// +// You should have received a copy of the GNU Lesser General Public +// License along with this library; if not, write to the Free Software +// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +// +//////////////////////////////////////////////////////////////////////////////// + +#include +#include +#include +#include +#include "AAFilter.h" +#include "FIRFilter.h" + +using namespace soundtouch; + +#define PI 3.141592655357989 +#define TWOPI (2 * PI) + +/***************************************************************************** + * + * Implementation of the class 'AAFilter' + * + *****************************************************************************/ + +AAFilter::AAFilter(uint len) +{ + pFIR = FIRFilter::newInstance(); + cutoffFreq = 0.5; + setLength(len); +} + + + +AAFilter::~AAFilter() +{ + delete pFIR; +} + + + +// Sets new anti-alias filter cut-off edge frequency, scaled to +// sampling frequency (nyquist frequency = 0.5). +// The filter will cut frequencies higher than the given frequency. +void AAFilter::setCutoffFreq(double newCutoffFreq) +{ + cutoffFreq = newCutoffFreq; + calculateCoeffs(); +} + + + +// Sets number of FIR filter taps +void AAFilter::setLength(uint newLength) +{ + length = newLength; + calculateCoeffs(); +} + + + +// Calculates coefficients for a low-pass FIR filter using Hamming window +void AAFilter::calculateCoeffs() +{ + uint i; + double cntTemp, temp, tempCoeff,h, w; + double fc2, wc; + double scaleCoeff, sum; + double *work; + SAMPLETYPE *coeffs; + + assert(length >= 2); + assert(length % 4 == 0); + assert(cutoffFreq >= 0); + assert(cutoffFreq <= 0.5); + + work = new double[length]; + coeffs = new SAMPLETYPE[length]; + + fc2 = 2.0 * cutoffFreq; + wc = PI * fc2; + tempCoeff = TWOPI / (double)length; + + sum = 0; + for (i = 0; i < length; i ++) + { + cntTemp = (double)i - (double)(length / 2); + + temp = cntTemp * wc; + if (temp != 0) + { + h = fc2 * sin(temp) / temp; // sinc function + } + else + { + h = 1.0; + } + w = 0.54 + 0.46 * cos(tempCoeff * cntTemp); // hamming window + + temp = w * h; + work[i] = temp; + + // calc net sum of coefficients + sum += temp; + } + + // ensure the sum of coefficients is larger than zero + assert(sum > 0); + + // ensure we've really designed a lowpass filter... + assert(work[length/2] > 0); + assert(work[length/2 + 1] > -1e-6); + assert(work[length/2 - 1] > -1e-6); + + // Calculate a scaling coefficient in such a way that the result can be + // divided by 16384 + scaleCoeff = 16384.0f / sum; + + for (i = 0; i < length; i ++) + { + // scale & round to nearest integer + temp = work[i] * scaleCoeff; + temp += (temp >= 0) ? 0.5 : -0.5; + // ensure no overfloods + assert(temp >= -32768 && temp <= 32767); + coeffs[i] = (SAMPLETYPE)temp; + } + + // Set coefficients. Use divide factor 14 => divide result by 2^14 = 16384 + pFIR->setCoefficients(coeffs, length, 14); + + delete[] work; + delete[] coeffs; +} + + +// Applies the filter to the given sequence of samples. +// Note : The amount of outputted samples is by value of 'filter length' +// smaller than the amount of input samples. 
+uint AAFilter::evaluate(SAMPLETYPE *dest, const SAMPLETYPE *src, uint numSamples, uint numChannels) const +{ + return pFIR->evaluate(dest, src, numSamples, numChannels); +} + + +uint AAFilter::getLength() const +{ + return pFIR->getLength(); +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/aa_filter/AAFilter.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/aa_filter/AAFilter.h new file mode 100644 index 0000000..d099757 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/aa_filter/AAFilter.h @@ -0,0 +1,91 @@ +//////////////////////////////////////////////////////////////////////////////// +/// +/// Sampled sound tempo changer/time stretch algorithm. Changes the sound tempo +/// while maintaining the original pitch by using a time domain WSOLA-like method +/// with several performance-increasing tweaks. +/// +/// Anti-alias filter is used to prevent folding of high frequencies when +/// transposing the sample rate with interpolation. +/// +/// Author : Copyright (c) Olli Parviainen +/// Author e-mail : oparviai 'at' iki.fi +/// SoundTouch WWW: http://www.surina.net/soundtouch +/// +//////////////////////////////////////////////////////////////////////////////// +// +// Last changed : $Date: 2008-02-10 18:26:55 +0200 (Sun, 10 Feb 2008) $ +// File revision : $Revision: 4 $ +// +// $Id: AAFilter.h 11 2008-02-10 16:26:55Z oparviai $ +// +//////////////////////////////////////////////////////////////////////////////// +// +// License : +// +// SoundTouch audio processing library +// Copyright (c) Olli Parviainen +// +// This library is free software; you can redistribute it and/or +// modify it under the terms of the GNU Lesser General Public +// License as published by the Free Software Foundation; either +// version 2.1 of the License, or (at your option) any later version. +// +// This library is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +// Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public +// License along with this library; if not, write to the Free Software +// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +// +//////////////////////////////////////////////////////////////////////////////// + +#ifndef AAFilter_H +#define AAFilter_H + +#include "STTypes.h" + +namespace soundtouch +{ + +class AAFilter +{ +protected: + class FIRFilter *pFIR; + + /// Low-pass filter cut-off frequency, negative = invalid + double cutoffFreq; + + /// num of filter taps + uint length; + + /// Calculate the FIR coefficients realizing the given cutoff-frequency + void calculateCoeffs(); +public: + AAFilter(uint length); + + ~AAFilter(); + + /// Sets new anti-alias filter cut-off edge frequency, scaled to sampling + /// frequency (nyquist frequency = 0.5). The filter will cut off the + /// frequencies than that. + void setCutoffFreq(double newCutoffFreq); + + /// Sets number of FIR filter taps, i.e. ~filter complexity + void setLength(uint newLength); + + uint getLength() const; + + /// Applies the filter to the given sequence of samples. + /// Note : The amount of outputted samples is by value of 'filter length' + /// smaller than the amount of input samples. 
+ uint evaluate(SAMPLETYPE *dest, + const SAMPLETYPE *src, + uint numSamples, + uint numChannels) const; +}; + +} + +#endif diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/bpm_detect/BPMDetect.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/bpm_detect/BPMDetect.cpp new file mode 100644 index 0000000..a48cbd9 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/bpm_detect/BPMDetect.cpp @@ -0,0 +1,370 @@ +//////////////////////////////////////////////////////////////////////////////// +/// +/// Beats-per-minute (BPM) detection routine. +/// +/// The beat detection algorithm works as follows: +/// - Use function 'inputSamples' to input a chunks of samples to the class for +/// analysis. It's a good idea to enter a large sound file or stream in smallish +/// chunks of around few kilosamples in order not to extinguish too much RAM memory. +/// - Inputted sound data is decimated to approx 500 Hz to reduce calculation burden, +/// which is basically ok as low (bass) frequencies mostly determine the beat rate. +/// Simple averaging is used for anti-alias filtering because the resulting signal +/// quality isn't of that high importance. +/// - Decimated sound data is enveloped, i.e. the amplitude shape is detected by +/// taking absolute value that's smoothed by sliding average. Signal levels that +/// are below a couple of times the general RMS amplitude level are cut away to +/// leave only notable peaks there. +/// - Repeating sound patterns (e.g. beats) are detected by calculating short-term +/// autocorrelation function of the enveloped signal. +/// - After whole sound data file has been analyzed as above, the bpm level is +/// detected by function 'getBpm' that finds the highest peak of the autocorrelation +/// function, calculates it's precise location and converts this reading to bpm's. +/// +/// Author : Copyright (c) Olli Parviainen +/// Author e-mail : oparviai 'at' iki.fi +/// SoundTouch WWW: http://www.surina.net/soundtouch +/// +//////////////////////////////////////////////////////////////////////////////// +// +// Last changed : $Date: 2012-08-30 22:45:25 +0300 (Thu, 30 Aug 2012) $ +// File revision : $Revision: 4 $ +// +// $Id: BPMDetect.cpp 149 2012-08-30 19:45:25Z oparviai $ +// +//////////////////////////////////////////////////////////////////////////////// +// +// License : +// +// SoundTouch audio processing library +// Copyright (c) Olli Parviainen +// +// This library is free software; you can redistribute it and/or +// modify it under the terms of the GNU Lesser General Public +// License as published by the Free Software Foundation; either +// version 2.1 of the License, or (at your option) any later version. +// +// This library is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +// Lesser General Public License for more details. 
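//
// Sketch of driving the AAFilter declared above (tap count, cutoff and buffer
// names are hypothetical): note the documented contract that the output is
// 'filter length' samples shorter than the input.
//
//     soundtouch::AAFilter aa(32);      // 32 taps; length must be a multiple of 4
//     aa.setCutoffFreq(0.25);           // scaled frequency, 0.5 == Nyquist
//     uint outFrames = aa.evaluate(dst, src, nFrames, 2);   // 2 = stereo
//     // expect roughly nFrames - 32 frames in dst
//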
+// +// You should have received a copy of the GNU Lesser General Public +// License along with this library; if not, write to the Free Software +// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +// +//////////////////////////////////////////////////////////////////////////////// + +#include +#include +#include +#include +#include "FIFOSampleBuffer.h" +#include "PeakFinder.h" +#include "BPMDetect.h" + +using namespace soundtouch; + +#define INPUT_BLOCK_SAMPLES 2048 +#define DECIMATED_BLOCK_SAMPLES 256 + +/// decay constant for calculating RMS volume sliding average approximation +/// (time constant is about 10 sec) +const float avgdecay = 0.99986f; + +/// Normalization coefficient for calculating RMS sliding average approximation. +const float avgnorm = (1 - avgdecay); + + +//////////////////////////////////////////////////////////////////////////////// + +// Enable following define to create bpm analysis file: + +// #define _CREATE_BPM_DEBUG_FILE + +#ifdef _CREATE_BPM_DEBUG_FILE + + #define DEBUGFILE_NAME "c:\\temp\\soundtouch-bpm-debug.txt" + + static void _SaveDebugData(const float *data, int minpos, int maxpos, double coeff) + { + FILE *fptr = fopen(DEBUGFILE_NAME, "wt"); + int i; + + if (fptr) + { + printf("\n\nWriting BPM debug data into file " DEBUGFILE_NAME "\n\n"); + for (i = minpos; i < maxpos; i ++) + { + fprintf(fptr, "%d\t%.1lf\t%f\n", i, coeff / (double)i, data[i]); + } + fclose(fptr); + } + } +#else + #define _SaveDebugData(a,b,c,d) +#endif + +//////////////////////////////////////////////////////////////////////////////// + + +BPMDetect::BPMDetect(int numChannels, int aSampleRate) +{ + this->sampleRate = aSampleRate; + this->channels = numChannels; + + decimateSum = 0; + decimateCount = 0; + + envelopeAccu = 0; + + // Initialize RMS volume accumulator to RMS level of 1500 (out of 32768) that's + // safe initial RMS signal level value for song data. This value is then adapted + // to the actual level during processing. +#ifdef SOUNDTOUCH_INTEGER_SAMPLES + // integer samples + RMSVolumeAccu = (1500 * 1500) / avgnorm; +#else + // float samples, scaled to range [-1..+1[ + RMSVolumeAccu = (0.045f * 0.045f) / avgnorm; +#endif + + // choose decimation factor so that result is approx. 1000 Hz + decimateBy = sampleRate / 1000; + assert(decimateBy > 0); + assert(INPUT_BLOCK_SAMPLES < decimateBy * DECIMATED_BLOCK_SAMPLES); + + // Calculate window length & starting item according to desired min & max bpms + windowLen = (60 * sampleRate) / (decimateBy * MIN_BPM); + windowStart = (60 * sampleRate) / (decimateBy * MAX_BPM); + + assert(windowLen > windowStart); + + // allocate new working objects + xcorr = new float[windowLen]; + memset(xcorr, 0, windowLen * sizeof(float)); + + // allocate processing buffer + buffer = new FIFOSampleBuffer(); + // we do processing in mono mode + buffer->setChannels(1); + buffer->clear(); +} + + + +BPMDetect::~BPMDetect() +{ + delete[] xcorr; + delete buffer; +} + + + +/// convert to mono, low-pass filter & decimate to about 500 Hz. +/// return number of outputted samples. +/// +/// Decimation is used to remove the unnecessary frequencies and thus to reduce +/// the amount of data needed to be processed as calculating autocorrelation +/// function is a very-very heavy operation. +/// +/// Anti-alias filtering is done simply by averaging the samples. 
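//
// A minimal sketch of "decimate by averaging" as used below (hypothetical
// helper, not in the library): sum decimateBy consecutive mono samples and
// emit their mean.
//
//     // emits one output per N inputs; acc/count persist across calls,
//     // like decimateSum/decimateCount in BPMDetect::decimate
//     bool decimate_step(float s, float &acc, int &count, int N, float &out) {
//         acc += s;
//         if (++count < N) return false;
//         out = acc / (float)N;   // averaged (crude lowpass) sample
//         acc = 0.0f; count = 0;
//         return true;
//     }
//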
This is really a +/// poor-man's anti-alias filtering, but it's not so critical in this kind of application +/// (it'd also be difficult to design a high-quality filter with steep cut-off at very +/// narrow band) +int BPMDetect::decimate(SAMPLETYPE *dest, const SAMPLETYPE *src, int numsamples) +{ + int count, outcount; + LONG_SAMPLETYPE out; + + assert(channels > 0); + assert(decimateBy > 0); + outcount = 0; + for (count = 0; count < numsamples; count ++) + { + int j; + + // convert to mono and accumulate + for (j = 0; j < channels; j ++) + { + decimateSum += src[j]; + } + src += j; + + decimateCount ++; + if (decimateCount >= decimateBy) + { + // Store every Nth sample only + out = (LONG_SAMPLETYPE)(decimateSum / (decimateBy * channels)); + decimateSum = 0; + decimateCount = 0; +#ifdef SOUNDTOUCH_INTEGER_SAMPLES + // check ranges for sure (shouldn't actually be necessary) + if (out > 32767) + { + out = 32767; + } + else if (out < -32768) + { + out = -32768; + } +#endif // SOUNDTOUCH_INTEGER_SAMPLES + dest[outcount] = (SAMPLETYPE)out; + outcount ++; + } + } + return outcount; +} + + + +// Calculates autocorrelation function of the sample history buffer +void BPMDetect::updateXCorr(int process_samples) +{ + int offs; + SAMPLETYPE *pBuffer; + + assert(buffer->numSamples() >= (uint)(process_samples + windowLen)); + + pBuffer = buffer->ptrBegin(); + for (offs = windowStart; offs < windowLen; offs ++) + { + LONG_SAMPLETYPE sum; + int i; + + sum = 0; + for (i = 0; i < process_samples; i ++) + { + sum += pBuffer[i] * pBuffer[i + offs]; // scaling the sub-result shouldn't be necessary + } +// xcorr[offs] *= xcorr_decay; // decay 'xcorr' here with suitable coefficients + // if it's desired that the system adapts automatically to + // various bpms, e.g. in processing continouos music stream. + // The 'xcorr_decay' should be a value that's smaller than but + // close to one, and should also depend on 'process_samples' value. + + xcorr[offs] += (float)sum; + } +} + + +// Calculates envelope of the sample data +void BPMDetect::calcEnvelope(SAMPLETYPE *samples, int numsamples) +{ + const static double decay = 0.7f; // decay constant for smoothing the envelope + const static double norm = (1 - decay); + + int i; + LONG_SAMPLETYPE out; + double val; + + for (i = 0; i < numsamples; i ++) + { + // calc average RMS volume + RMSVolumeAccu *= avgdecay; + val = (float)fabs((float)samples[i]); + RMSVolumeAccu += val * val; + + // cut amplitudes that are below cutoff ~2 times RMS volume + // (we're interested in peak values, not the silent moments) + if (val < 0.5 * sqrt(RMSVolumeAccu * avgnorm)) + { + val = 0; + } + + // smooth amplitude envelope + envelopeAccu *= decay; + envelopeAccu += val; + out = (LONG_SAMPLETYPE)(envelopeAccu * norm); + +#ifdef SOUNDTOUCH_INTEGER_SAMPLES + // cut peaks (shouldn't be necessary though) + if (out > 32767) out = 32767; +#endif // SOUNDTOUCH_INTEGER_SAMPLES + samples[i] = (SAMPLETYPE)out; + } +} + + + +void BPMDetect::inputSamples(const SAMPLETYPE *samples, int numSamples) +{ + SAMPLETYPE decimated[DECIMATED_BLOCK_SAMPLES]; + + // iterate so that max INPUT_BLOCK_SAMPLES processed per iteration + while (numSamples > 0) + { + int block; + int decSamples; + + block = (numSamples > INPUT_BLOCK_SAMPLES) ? INPUT_BLOCK_SAMPLES : numSamples; + + // decimate. 
note that converts to mono at the same time + decSamples = decimate(decimated, samples, block); + samples += block * channels; + numSamples -= block; + + // envelope new samples and add them to buffer + calcEnvelope(decimated, decSamples); + buffer->putSamples(decimated, decSamples); + } + + // when the buffer has enought samples for processing... + if ((int)buffer->numSamples() > windowLen) + { + int processLength; + + // how many samples are processed + processLength = (int)buffer->numSamples() - windowLen; + + // ... calculate autocorrelations for oldest samples... + updateXCorr(processLength); + // ... and remove them from the buffer + buffer->receiveSamples(processLength); + } +} + + + +void BPMDetect::removeBias() +{ + int i; + float minval = 1e12f; // arbitrary large number + + for (i = windowStart; i < windowLen; i ++) + { + if (xcorr[i] < minval) + { + minval = xcorr[i]; + } + } + + for (i = windowStart; i < windowLen; i ++) + { + xcorr[i] -= minval; + } +} + + +float BPMDetect::getBpm() +{ + double peakPos; + double coeff; + PeakFinder peakFinder; + + coeff = 60.0 * ((double)sampleRate / (double)decimateBy); + + // save bpm debug analysis data if debug data enabled + _SaveDebugData(xcorr, windowStart, windowLen, coeff); + + // remove bias from xcorr data + removeBias(); + + // find peak position + peakPos = peakFinder.detectPeak(xcorr, windowStart, windowLen); + + assert(decimateBy != 0); + if (peakPos < 1e-9) return 0.0; // detection failed. + + // calculate BPM + return (float) (coeff / peakPos); +} diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/bpm_detect/BPMDetect.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/bpm_detect/BPMDetect.h new file mode 100644 index 0000000..7248989 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/bpm_detect/BPMDetect.h @@ -0,0 +1,164 @@ +//////////////////////////////////////////////////////////////////////////////// +/// +/// Beats-per-minute (BPM) detection routine. +/// +/// The beat detection algorithm works as follows: +/// - Use function 'inputSamples' to input a chunks of samples to the class for +/// analysis. It's a good idea to enter a large sound file or stream in smallish +/// chunks of around few kilosamples in order not to extinguish too much RAM memory. +/// - Input sound data is decimated to approx 500 Hz to reduce calculation burden, +/// which is basically ok as low (bass) frequencies mostly determine the beat rate. +/// Simple averaging is used for anti-alias filtering because the resulting signal +/// quality isn't of that high importance. +/// - Decimated sound data is enveloped, i.e. the amplitude shape is detected by +/// taking absolute value that's smoothed by sliding average. Signal levels that +/// are below a couple of times the general RMS amplitude level are cut away to +/// leave only notable peaks there. +/// - Repeating sound patterns (e.g. beats) are detected by calculating short-term +/// autocorrelation function of the enveloped signal. +/// - After whole sound data file has been analyzed as above, the bpm level is +/// detected by function 'getBpm' that finds the highest peak of the autocorrelation +/// function, calculates it's precise location and converts this reading to bpm's. 
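//
// Sketch of the usage documented in this header (the 4096-frame chunking and
// the read_frames() reader are hypothetical): feed the whole song through
// inputSamples in modest blocks, then ask for the tempo once at the end.
//
//     soundtouch::BPMDetect bpm(2, 44100);              // stereo, 44.1 kHz
//     while (int n = read_frames(file, buf, 4096))      // n = frames per channel
//         bpm.inputSamples(buf, n);
//     float tempo = bpm.getBpm();                       // 0.0f if detection failed
//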
+/// +/// Author : Copyright (c) Olli Parviainen +/// Author e-mail : oparviai 'at' iki.fi +/// SoundTouch WWW: http://www.surina.net/soundtouch +/// +//////////////////////////////////////////////////////////////////////////////// +// +// Last changed : $Date: 2012-08-30 22:53:44 +0300 (Thu, 30 Aug 2012) $ +// File revision : $Revision: 4 $ +// +// $Id: BPMDetect.h 150 2012-08-30 19:53:44Z oparviai $ +// +//////////////////////////////////////////////////////////////////////////////// +// +// License : +// +// SoundTouch audio processing library +// Copyright (c) Olli Parviainen +// +// This library is free software; you can redistribute it and/or +// modify it under the terms of the GNU Lesser General Public +// License as published by the Free Software Foundation; either +// version 2.1 of the License, or (at your option) any later version. +// +// This library is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +// Lesser General Public License for more details. +// +// You should have received a copy of the GNU Lesser General Public +// License along with this library; if not, write to the Free Software +// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +// +//////////////////////////////////////////////////////////////////////////////// + +#ifndef _BPMDetect_H_ +#define _BPMDetect_H_ + +#include "STTypes.h" +#include "FIFOSampleBuffer.h" + +namespace soundtouch +{ + +/// Minimum allowed BPM rate. Used to restrict accepted result above a reasonable limit. +#define MIN_BPM 29 + +/// Maximum allowed BPM rate. Used to restrict accepted result below a reasonable limit. +#define MAX_BPM 200 + + +/// Class for calculating BPM rate for audio data. +class BPMDetect +{ +protected: + /// Auto-correlation accumulator bins. + float *xcorr; + + /// Amplitude envelope sliding average approximation level accumulator + double envelopeAccu; + + /// RMS volume sliding average approximation level accumulator + double RMSVolumeAccu; + + /// Sample average counter. + int decimateCount; + + /// Sample average accumulator for FIFO-like decimation. + soundtouch::LONG_SAMPLETYPE decimateSum; + + /// Decimate sound by this coefficient to reach approx. 500 Hz. + int decimateBy; + + /// Auto-correlation window length + int windowLen; + + /// Number of channels (1 = mono, 2 = stereo) + int channels; + + /// sample rate + int sampleRate; + + /// Beginning of auto-correlation window: Autocorrelation isn't being updated for + /// the first these many correlation bins. + int windowStart; + + /// FIFO-buffer for decimated processing samples. + soundtouch::FIFOSampleBuffer *buffer; + + /// Updates auto-correlation function for given number of decimated samples that + /// are read from the internal 'buffer' pipe (samples aren't removed from the pipe + /// though). + void updateXCorr(int process_samples /// How many samples are processed. + ); + + /// Decimates samples to approx. 500 Hz. + /// + /// \return Number of output samples. + int decimate(soundtouch::SAMPLETYPE *dest, ///< Destination buffer + const soundtouch::SAMPLETYPE *src, ///< Source sample buffer + int numsamples ///< Number of source samples. + ); + + /// Calculates amplitude envelope for the buffer of samples. + /// Result is output to 'samples'. 
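//
// Worked example of the lag-to-BPM conversion done by getBpm() (numbers are
// illustrative): with sampleRate = 44100, decimateBy = 44100 / 1000 = 44, so
// one autocorrelation lag covers 44 / 44100 s, and
//
//     coeff = 60.0 * (44100.0 / 44.0);   // ~60136
//     bpm   = coeff / peakPos;           // peakPos ~501 lags  ->  ~120 BPM
//
// i.e. a beat repeating every ~0.5 s of decimated signal reads as 120 BPM.
//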
+ void calcEnvelope(soundtouch::SAMPLETYPE *samples, ///< Pointer to input/output data buffer + int numsamples ///< Number of samples in buffer + ); + + /// remove constant bias from xcorr data + void removeBias(); + +public: + /// Constructor. + BPMDetect(int numChannels, ///< Number of channels in sample data. + int sampleRate ///< Sample rate in Hz. + ); + + /// Destructor. + virtual ~BPMDetect(); + + /// Inputs a block of samples for analyzing: Envelopes the samples and then + /// updates the autocorrelation estimation. When whole song data has been input + /// in smaller blocks using this function, read the resulting bpm with 'getBpm' + /// function. + /// + /// Notice that data in 'samples' array can be disrupted in processing. + void inputSamples(const soundtouch::SAMPLETYPE *samples, ///< Pointer to input/working data buffer + int numSamples ///< Number of samples in buffer + ); + + + /// Analyzes the results and returns the BPM rate. Use this function to read result + /// after whole song data has been input to the class by consecutive calls of + /// 'inputSamples' function. + /// + /// \return Beats-per-minute rate, or zero if detection failed. + float getBpm(); +}; + +} + +#endif // _BPMDetect_H_ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/cpu_detect/cpu_detect.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/cpu_detect/cpu_detect.h new file mode 100644 index 0000000..7859ffb --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/cpu_detect/cpu_detect.h @@ -0,0 +1,62 @@ +//////////////////////////////////////////////////////////////////////////////// +/// +/// A header file for detecting the Intel MMX instructions set extension. +/// +/// Please see 'mmx_win.cpp', 'mmx_cpp.cpp' and 'mmx_non_x86.cpp' for the +/// routine implementations for x86 Windows, x86 gnu version and non-x86 +/// platforms, respectively. +/// +/// Author : Copyright (c) Olli Parviainen +/// Author e-mail : oparviai 'at' iki.fi +/// SoundTouch WWW: http://www.surina.net/soundtouch +/// +//////////////////////////////////////////////////////////////////////////////// +// +// Last changed : $Date: 2008-02-10 18:26:55 +0200 (Sun, 10 Feb 2008) $ +// File revision : $Revision: 4 $ +// +// $Id: cpu_detect.h 11 2008-02-10 16:26:55Z oparviai $ +// +//////////////////////////////////////////////////////////////////////////////// +// +// License : +// +// SoundTouch audio processing library +// Copyright (c) Olli Parviainen +// +// This library is free software; you can redistribute it and/or +// modify it under the terms of the GNU Lesser General Public +// License as published by the Free Software Foundation; either +// version 2.1 of the License, or (at your option) any later version. +// +// This library is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +// Lesser General Public License for more details. 
+// +// You should have received a copy of the GNU Lesser General Public +// License along with this library; if not, write to the Free Software +// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +// +//////////////////////////////////////////////////////////////////////////////// + +#ifndef _CPU_DETECT_H_ +#define _CPU_DETECT_H_ + +#include "STTypes.h" + +#define SUPPORT_MMX 0x0001 +#define SUPPORT_3DNOW 0x0002 +#define SUPPORT_ALTIVEC 0x0004 +#define SUPPORT_SSE 0x0008 +#define SUPPORT_SSE2 0x0010 + +/// Checks which instruction set extensions are supported by the CPU. +/// +/// \return A bitmask of supported extensions, see SUPPORT_... defines. +uint detectCPUextensions(void); + +/// Disables given set of instruction extensions. See SUPPORT_... defines. +void disableExtensions(uint wDisableMask); + +#endif // _CPU_DETECT_H_ diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/cpu_detect/cpu_detect_x86.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/cpu_detect/cpu_detect_x86.cpp new file mode 100644 index 0000000..fff3240 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/cpu_detect/cpu_detect_x86.cpp @@ -0,0 +1,137 @@ +//////////////////////////////////////////////////////////////////////////////// +/// +/// Generic version of the x86 CPU extension detection routine. +/// +/// This file is for GNU & other non-Windows compilers, see 'cpu_detect_x86_win.cpp' +/// for the Microsoft compiler version. +/// +/// Author : Copyright (c) Olli Parviainen +/// Author e-mail : oparviai 'at' iki.fi +/// SoundTouch WWW: http://www.surina.net/soundtouch +/// +//////////////////////////////////////////////////////////////////////////////// +// +// Last changed : $Date: 2012-11-08 20:44:37 +0200 (Thu, 08 Nov 2012) $ +// File revision : $Revision: 4 $ +// +// $Id: cpu_detect_x86.cpp 159 2012-11-08 18:44:37Z oparviai $ +// +//////////////////////////////////////////////////////////////////////////////// +// +// License : +// +// SoundTouch audio processing library +// Copyright (c) Olli Parviainen +// +// This library is free software; you can redistribute it and/or +// modify it under the terms of the GNU Lesser General Public +// License as published by the Free Software Foundation; either +// version 2.1 of the License, or (at your option) any later version. +// +// This library is distributed in the hope that it will be useful, +// but WITHOUT ANY WARRANTY; without even the implied warranty of +// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +// Lesser General Public License for more details. 
+// +// You should have received a copy of the GNU Lesser General Public +// License along with this library; if not, write to the Free Software +// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +// +//////////////////////////////////////////////////////////////////////////////// + +#include "cpu_detect.h" +#include "STTypes.h" + +#if defined(SOUNDTOUCH_ALLOW_X86_OPTIMIZATIONS) + + #if defined(__GNUC__) && defined(__i386__) + // gcc + #include "cpuid.h" + #elif defined(_M_IX86) + // windows non-gcc + #include + #define bit_MMX (1 << 23) + #define bit_SSE (1 << 25) + #define bit_SSE2 (1 << 26) + #endif + +#endif + + +////////////////////////////////////////////////////////////////////////////// +// +// processor instructions extension detection routines +// +////////////////////////////////////////////////////////////////////////////// + +// Flag variable indicating whick ISA extensions are disabled (for debugging) +static uint _dwDisabledISA = 0x00; // 0xffffffff; //<- use this to disable all extensions + +// Disables given set of instruction extensions. See SUPPORT_... defines. +void disableExtensions(uint dwDisableMask) +{ + _dwDisabledISA = dwDisableMask; +} + + + +/// Checks which instruction set extensions are supported by the CPU. +uint detectCPUextensions(void) +{ +/// If building for a 64bit system (no Itanium) and the user wants optimizations. +/// Return the OR of SUPPORT_{MMX,SSE,SSE2}. 11001 or 0x19. +/// Keep the _dwDisabledISA test (2 more operations, could be eliminated). +#if ((defined(__GNUC__) && defined(__x86_64__)) \ + || defined(_M_X64)) \ + && defined(SOUNDTOUCH_ALLOW_X86_OPTIMIZATIONS) + return 0x19 & ~_dwDisabledISA; + +/// If building for a 32bit system and the user wants optimizations. +/// Keep the _dwDisabledISA test (2 more operations, could be eliminated). +#elif ((defined(__GNUC__) && defined(__i386__)) \ + || defined(_M_IX86)) \ + && defined(SOUNDTOUCH_ALLOW_X86_OPTIMIZATIONS) + + if (_dwDisabledISA == 0xffffffff) return 0; + + uint res = 0; + +#if defined(__GNUC__) + // GCC version of cpuid. Requires GCC 4.3.0 or later for __cpuid intrinsic support. + uint eax, ebx, ecx, edx; // unsigned int is the standard type. uint is defined by the compiler and not guaranteed to be portable. + + // Check if no cpuid support. + if (!__get_cpuid (1, &eax, &ebx, &ecx, &edx)) return 0; // always disable extensions. + + if (edx & bit_MMX) res = res | SUPPORT_MMX; + if (edx & bit_SSE) res = res | SUPPORT_SSE; + if (edx & bit_SSE2) res = res | SUPPORT_SSE2; + +#else + // Window / VS version of cpuid. Notice that Visual Studio 2005 or later required + // for __cpuid intrinsic support. + int reg[4] = {-1}; + + // Check if no cpuid support. + __cpuid(reg,0); + if ((unsigned int)reg[0] == 0) return 0; // always disable extensions. + + __cpuid(reg,1); + if ((unsigned int)reg[3] & bit_MMX) res = res | SUPPORT_MMX; + if ((unsigned int)reg[3] & bit_SSE) res = res | SUPPORT_SSE; + if ((unsigned int)reg[3] & bit_SSE2) res = res | SUPPORT_SSE2; + +#endif + + return res & ~_dwDisabledISA; + +#else + +/// One of these is true: +/// 1) We don't want optimizations. +/// 2) Using an unsupported compiler. +/// 3) Running on a non-x86 platform. 
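//
// Hypothetical caller sketch: the returned mask is ANDed against the
// SUPPORT_* bits from cpu_detect.h.
//
//     uint ext = detectCPUextensions();
//     if (ext & SUPPORT_SSE) { /* select the SSE build of a routine */ }
//     disableExtensions(SUPPORT_MMX);    // e.g. force the plain C path for MMX
//
// On x86-64 the branch above short-circuits to 0x19, i.e.
// SUPPORT_MMX | SUPPORT_SSE | SUPPORT_SSE2 (0x01 | 0x08 | 0x10), minus
// whatever has been disabled.
//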
+    return 0;
+
+#endif
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fifo_sample_buffer/FIFOSampleBuffer.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fifo_sample_buffer/FIFOSampleBuffer.cpp
new file mode 100644
index 0000000..4d9740a
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fifo_sample_buffer/FIFOSampleBuffer.cpp
@@ -0,0 +1,274 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// A buffer class for temporarily storing sound samples; operates as a
+/// first-in-first-out pipe.
+///
+/// Samples are added to the end of the sample buffer with the 'putSamples'
+/// function, and are received from the beginning of the buffer by calling
+/// the 'receiveSamples' function. The class automatically removes the
+/// outputted samples from the buffer, as well as grows the buffer size
+/// whenever necessary.
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-11-08 20:53:01 +0200 (Thu, 08 Nov 2012) $
+// File revision : $Revision: 4 $
+//
+// $Id: FIFOSampleBuffer.cpp 160 2012-11-08 18:53:01Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#include <stdlib.h>
+#include <memory.h>
+#include <string.h>
+#include <assert.h>
+
+#include "FIFOSampleBuffer.h"
+
+using namespace soundtouch;
+
+// Constructor
+FIFOSampleBuffer::FIFOSampleBuffer(int numChannels)
+{
+    assert(numChannels > 0);
+    sizeInBytes = 0; // reasonable initial value
+    buffer = NULL;
+    bufferUnaligned = NULL;
+    samplesInBuffer = 0;
+    bufferPos = 0;
+    channels = (uint)numChannels;
+    ensureCapacity(32);     // allocate initial capacity
+}
+
+
+// destructor
+FIFOSampleBuffer::~FIFOSampleBuffer()
+{
+    delete[] bufferUnaligned;
+    bufferUnaligned = NULL;
+    buffer = NULL;
+}
+
+
+// Sets number of channels, 1 = mono, 2 = stereo
+void FIFOSampleBuffer::setChannels(int numChannels)
+{
+    uint usedBytes;
+
+    assert(numChannels > 0);
+    usedBytes = channels * samplesInBuffer;
+    channels = (uint)numChannels;
+    samplesInBuffer = usedBytes / channels;
+}
+
+
+// if output location pointer 'bufferPos' isn't zero, 'rewinds' the buffer and
+// zeroes this pointer by copying samples from the 'bufferPos' pointer
+// location on to the beginning of the buffer.
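//
// Note on the design (sketch with hypothetical values): receiveSamples(n)
// below is O(1) -- it only advances bufferPos and shrinks samplesInBuffer --
// and the memmove cost is deferred to rewind(), which ensureCapacity() runs
// when more room is needed.
//
//     fifo.putSamples(buf, 1000);   // samplesInBuffer = 1000, bufferPos = 0
//     fifo.receiveSamples(400);     // samplesInBuffer = 600,  bufferPos = 400
//     // the next growth/rewind memmoves the 600 live samples to the front
//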
+void FIFOSampleBuffer::rewind()
+{
+    if (buffer && bufferPos)
+    {
+        memmove(buffer, ptrBegin(), sizeof(SAMPLETYPE) * channels * samplesInBuffer);
+        bufferPos = 0;
+    }
+}
+
+
+// Adds 'numSamples' pcs of samples from the 'samples' memory position to
+// the sample buffer.
+void FIFOSampleBuffer::putSamples(const SAMPLETYPE *samples, uint nSamples)
+{
+    memcpy(ptrEnd(nSamples), samples, sizeof(SAMPLETYPE) * nSamples * channels);
+    samplesInBuffer += nSamples;
+}
+
+
+// Increases the number of samples in the buffer without copying any actual
+// samples.
+//
+// This function is used to update the number of samples in the sample buffer
+// when accessing the buffer directly with 'ptrEnd' function. Please be
+// careful though!
+void FIFOSampleBuffer::putSamples(uint nSamples)
+{
+    uint req;
+
+    req = samplesInBuffer + nSamples;
+    ensureCapacity(req);
+    samplesInBuffer += nSamples;
+}
+
+
+// Returns a pointer to the end of the used part of the sample buffer (i.e.
+// where the new samples are to be inserted). This function may be used for
+// inserting new samples into the sample buffer directly. Please be careful!
+//
+// Parameter 'slackCapacity' tells the function how much free capacity (in
+// terms of samples) there _at least_ should be, so that the caller can
+// successfully insert all the required samples into the buffer. When necessary,
+// the function grows the buffer size to comply with this requirement.
+//
+// When using this function as means for inserting new samples, also remember
+// to increase the sample count afterwards, by calling the
+// 'putSamples(numSamples)' function.
+SAMPLETYPE *FIFOSampleBuffer::ptrEnd(uint slackCapacity)
+{
+    ensureCapacity(samplesInBuffer + slackCapacity);
+    return buffer + samplesInBuffer * channels;
+}
+
+
+// Returns a pointer to the beginning of the currently non-outputted samples.
+// This function is provided for accessing the output samples directly.
+// Please be careful!
+//
+// When using this function to output samples, also remember to 'remove' the
+// outputted samples from the buffer by calling the
+// 'receiveSamples(numSamples)' function
+SAMPLETYPE *FIFOSampleBuffer::ptrBegin()
+{
+    assert(buffer);
+    return buffer + bufferPos * channels;
+}
+
+
+// Ensures that the buffer has enough capacity, i.e. space for _at least_
+// 'capacityRequirement' number of samples. The buffer is grown in steps of
+// 4 kilobytes to eliminate the need for frequently growing the buffer,
+// as well as to round the buffer size up to the virtual memory page size.
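+// E.g. a request for 1000 stereo 16-bit samples needs 4000 bytes, which is
+// rounded up to 4096; 1100 samples (4400 bytes) round up to 8192. (Worked
+// figures only, assuming sizeof(SAMPLETYPE) == 2 and channels == 2.)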
+void FIFOSampleBuffer::ensureCapacity(uint capacityRequirement)
+{
+    SAMPLETYPE *tempUnaligned, *temp;
+
+    if (capacityRequirement > getCapacity())
+    {
+        // enlarge the buffer in 4kbyte steps (round up to next 4k boundary)
+        sizeInBytes = (capacityRequirement * channels * sizeof(SAMPLETYPE) + 4095) & (uint)-4096;
+        assert(sizeInBytes % 2 == 0);
+        tempUnaligned = new SAMPLETYPE[sizeInBytes / sizeof(SAMPLETYPE) + 16 / sizeof(SAMPLETYPE)];
+        if (tempUnaligned == NULL)
+        {
+            ST_THROW_RT_ERROR("Couldn't allocate memory!\n");
+        }
+        // Align the buffer to begin at 16byte cache line boundary for optimal performance
+        temp = (SAMPLETYPE *)SOUNDTOUCH_ALIGN_POINTER_16(tempUnaligned);
+        if (samplesInBuffer)
+        {
+            memcpy(temp, ptrBegin(), samplesInBuffer * channels * sizeof(SAMPLETYPE));
+        }
+        delete[] bufferUnaligned;
+        buffer = temp;
+        bufferUnaligned = tempUnaligned;
+        bufferPos = 0;
+    }
+    else
+    {
+        // simply rewind the buffer (if necessary)
+        rewind();
+    }
+}
+
+
+// Returns the current buffer capacity in terms of samples
+uint FIFOSampleBuffer::getCapacity() const
+{
+    return sizeInBytes / (channels * sizeof(SAMPLETYPE));
+}
+
+
+// Returns the number of samples currently in the buffer
+uint FIFOSampleBuffer::numSamples() const
+{
+    return samplesInBuffer;
+}
+
+
+// Output samples from beginning of the sample buffer. Copies demanded number
+// of samples to output and removes them from the sample buffer. If there
+// are fewer than 'numSamples' samples in the buffer, returns all available.
+//
+// Returns number of samples copied.
+uint FIFOSampleBuffer::receiveSamples(SAMPLETYPE *output, uint maxSamples)
+{
+    uint num;
+
+    num = (maxSamples > samplesInBuffer) ? samplesInBuffer : maxSamples;
+
+    memcpy(output, ptrBegin(), channels * sizeof(SAMPLETYPE) * num);
+    return receiveSamples(num);
+}
+
+
+// Removes samples from the beginning of the sample buffer without copying them
+// anywhere. Used to reduce the number of samples in the buffer, when accessing
+// the sample buffer with the 'ptrBegin' function.
+uint FIFOSampleBuffer::receiveSamples(uint maxSamples)
+{
+    if (maxSamples >= samplesInBuffer)
+    {
+        uint temp;
+
+        temp = samplesInBuffer;
+        samplesInBuffer = 0;
+        return temp;
+    }
+
+    samplesInBuffer -= maxSamples;
+    bufferPos += maxSamples;
+
+    return maxSamples;
+}
+
+
+// Returns nonzero if the sample buffer is empty
+int FIFOSampleBuffer::isEmpty() const
+{
+    return (samplesInBuffer == 0) ? 1 : 0;
+}
+
+
+// Clears the sample buffer
+void FIFOSampleBuffer::clear()
+{
+    samplesInBuffer = 0;
+    bufferPos = 0;
+}
+
+
+/// allow trimming (downwards) amount of samples in pipeline.
+/// Returns adjusted amount of samples
+uint FIFOSampleBuffer::adjustAmountOfSamples(uint numSamples)
+{
+    if (numSamples < samplesInBuffer)
+    {
+        samplesInBuffer = numSamples;
+    }
+    return samplesInBuffer;
+}
+
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fifo_sample_buffer/FIFOSampleBuffer.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fifo_sample_buffer/FIFOSampleBuffer.h
new file mode 100644
index 0000000..3789b4d
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fifo_sample_buffer/FIFOSampleBuffer.h
@@ -0,0 +1,178 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// A buffer class for temporarily storing sound samples, operates as a
+/// first-in-first-out pipe.
+///
+/// Samples are added to the end of the sample buffer with the 'putSamples'
+/// function, and are received from the beginning of the buffer by calling
+/// the 'receiveSamples' function. The class automatically removes the
+/// output samples from the buffer as well as grows the storage size
+/// whenever necessary.
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-06-13 22:29:53 +0300 (Wed, 13 Jun 2012) $
+// File revision : $Revision: 4 $
+//
+// $Id: FIFOSampleBuffer.h 143 2012-06-13 19:29:53Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#ifndef FIFOSampleBuffer_H
+#define FIFOSampleBuffer_H
+
+#include "FIFOSamplePipe.h"
+
+namespace soundtouch
+{
+
+/// Sample buffer working in FIFO (first-in-first-out) principle. The class takes
+/// care of storage size adjustment and data moving during input/output operations.
+///
+/// Notice that in case of stereo audio, one sample is considered to consist of
+/// both channel data.
+class FIFOSampleBuffer : public FIFOSamplePipe
+{
+private:
+    /// Sample buffer.
+    SAMPLETYPE *buffer;
+
+    // Raw unaligned buffer memory. 'buffer' is made aligned by pointing it to first
+    // 16-byte aligned location of this buffer
+    SAMPLETYPE *bufferUnaligned;
+
+    /// Sample buffer size in bytes
+    uint sizeInBytes;
+
+    /// How many samples are currently in buffer.
+    uint samplesInBuffer;
+
+    /// Channels, 1=mono, 2=stereo.
+    uint channels;
+
+    /// Current position pointer to the buffer. This pointer is increased when samples are
+    /// removed from the pipe, so that the buffer needs to be actually rewound (data moved)
+    /// only when new data is put into the pipe.
+    uint bufferPos;
+
+    /// Rewind the buffer by moving data from position pointed by 'bufferPos' to real
+    /// beginning of the buffer.
+    void rewind();
+
+    /// Ensures that the buffer has capacity for at least this many samples.
+    void ensureCapacity(uint capacityRequirement);
+
+    /// Returns current capacity.
+    uint getCapacity() const;
+
+public:
+
+    /// Constructor
+    FIFOSampleBuffer(int numChannels = 2     ///< Number of channels, 1=mono, 2=stereo.
+                                             ///< Default is stereo.
+                     );
+
+    /// destructor
+    ~FIFOSampleBuffer();
+
+    /// Returns a pointer to the beginning of the output samples.
+    /// This function is provided for accessing the output samples directly.
+    /// Please be careful not to corrupt the book-keeping!
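+    ///
+    /// A minimal direct-access sketch (with a hypothetical consume() helper):
+    ///     uint n = buf.numSamples();
+    ///     consume(buf.ptrBegin(), n * channels);  // read samples in place
+    ///     buf.receiveSamples(n);                  // then drop what was read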
+    ///
+    /// When using this function to output samples, also remember to 'remove' the
+    /// output samples from the buffer by calling the
+    /// 'receiveSamples(numSamples)' function
+    virtual SAMPLETYPE *ptrBegin();
+
+    /// Returns a pointer to the end of the used part of the sample buffer (i.e.
+    /// where the new samples are to be inserted). This function may be used for
+    /// inserting new samples into the sample buffer directly. Please be careful
+    /// not to corrupt the book-keeping!
+    ///
+    /// When using this function as means for inserting new samples, also remember
+    /// to increase the sample count afterwards, by calling the
+    /// 'putSamples(numSamples)' function.
+    SAMPLETYPE *ptrEnd(
+                uint slackCapacity   ///< How much free capacity (in samples) there _at least_
+                                     ///< should be so that the caller can successfully insert the
+                                     ///< desired samples to the buffer. If necessary, the function
+                                     ///< grows the buffer size to comply with this requirement.
+                );
+
+    /// Adds 'numSamples' pcs of samples from the 'samples' memory position to
+    /// the sample buffer.
+    virtual void putSamples(const SAMPLETYPE *samples,  ///< Pointer to samples.
+                            uint numSamples             ///< Number of samples to insert.
+                            );
+
+    /// Adjusts the book-keeping to increase number of samples in the buffer without
+    /// copying any actual samples.
+    ///
+    /// This function is used to update the number of samples in the sample buffer
+    /// when accessing the buffer directly with 'ptrEnd' function. Please be
+    /// careful though!
+    virtual void putSamples(uint numSamples   ///< Number of samples that have been inserted.
+                            );
+
+    /// Output samples from beginning of the sample buffer. Copies requested samples to
+    /// output buffer and removes them from the sample buffer. If there are fewer than
+    /// 'numSamples' samples in the buffer, returns all that are available.
+    ///
+    /// \return Number of samples returned.
+    virtual uint receiveSamples(SAMPLETYPE *output, ///< Buffer where to copy output samples.
+                                uint maxSamples     ///< How many samples to receive at max.
+                                );
+
+    /// Adjusts book-keeping so that given number of samples are removed from beginning of the
+    /// sample buffer without copying them anywhere.
+    ///
+    /// Used to reduce the number of samples in the buffer when accessing the sample buffer directly
+    /// with 'ptrBegin' function.
+    virtual uint receiveSamples(uint maxSamples   ///< Remove this many samples from the beginning of pipe.
+                                );
+
+    /// Returns number of samples currently available.
+    virtual uint numSamples() const;
+
+    /// Sets number of channels, 1 = mono, 2 = stereo.
+    void setChannels(int numChannels);
+
+    /// Returns nonzero if there aren't any samples available for outputting.
+    virtual int isEmpty() const;
+
+    /// Clears all the samples.
+    virtual void clear();
+
+    /// allow trimming (downwards) amount of samples in pipeline.
+    /// Returns adjusted amount of samples
+    uint adjustAmountOfSamples(uint numSamples);
+};
+
+}
+
+#endif
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fir_filter/FIRFilter.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fir_filter/FIRFilter.cpp
new file mode 100644
index 0000000..1570516
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fir_filter/FIRFilter.cpp
@@ -0,0 +1,259 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// General FIR digital filter routines with MMX optimization.
+///
+/// Note : MMX optimized functions reside in a separate, platform-specific file,
+/// e.g. 'mmx_win.cpp' or 'mmx_gcc.cpp'
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2011-09-02 21:56:11 +0300 (Fri, 02 Sep 2011) $
+// File revision : $Revision: 4 $
+//
+// $Id: FIRFilter.cpp 131 2011-09-02 18:56:11Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#include <memory.h>
+#include <assert.h>
+#include <math.h>
+#include <stdlib.h>
+#include "FIRFilter.h"
+#include "cpu_detect.h"
+
+using namespace soundtouch;
+
+/*****************************************************************************
+ *
+ * Implementation of the class 'FIRFilter'
+ *
+ *****************************************************************************/
+
+FIRFilter::FIRFilter()
+{
+    resultDivFactor = 0;
+    resultDivider = 0;
+    length = 0;
+    lengthDiv8 = 0;
+    filterCoeffs = NULL;
+}
+
+
+FIRFilter::~FIRFilter()
+{
+    delete[] filterCoeffs;
+}
+
+// Usual C-version of the filter routine for stereo sound
+uint FIRFilter::evaluateFilterStereo(SAMPLETYPE *dest, const SAMPLETYPE *src, uint numSamples) const
+{
+    uint i, j, end;
+    LONG_SAMPLETYPE suml, sumr;
+#ifdef SOUNDTOUCH_FLOAT_SAMPLES
+    // when using floating point samples, use a scaler instead of a divider
+    // because division is a much slower operation than multiplication.
+    double dScaler = 1.0 / (double)resultDivider;
+#endif
+
+    assert(length != 0);
+    assert(src != NULL);
+    assert(dest != NULL);
+    assert(filterCoeffs != NULL);
+
+    end = 2 * (numSamples - length);
+
+    for (j = 0; j < end; j += 2)
+    {
+        const SAMPLETYPE *ptr;
+
+        suml = sumr = 0;
+        ptr = src + j;
+
+        for (i = 0; i < length; i += 4)
+        {
+            // loop is unrolled by factor of 4 here for efficiency
+            suml += ptr[2 * i + 0] * filterCoeffs[i + 0] +
+                    ptr[2 * i + 2] * filterCoeffs[i + 1] +
+                    ptr[2 * i + 4] * filterCoeffs[i + 2] +
+                    ptr[2 * i + 6] * filterCoeffs[i + 3];
+            sumr += ptr[2 * i + 1] * filterCoeffs[i + 0] +
+                    ptr[2 * i + 3] * filterCoeffs[i + 1] +
+                    ptr[2 * i + 5] * filterCoeffs[i + 2] +
+                    ptr[2 * i + 7] * filterCoeffs[i + 3];
+        }
+
+#ifdef SOUNDTOUCH_INTEGER_SAMPLES
+        suml >>= resultDivFactor;
+        sumr >>= resultDivFactor;
+        // saturate to 16 bit integer limits
+        suml = (suml < -32768) ? -32768 : (suml > 32767) ? 32767 : suml;
+        // saturate to 16 bit integer limits
+        sumr = (sumr < -32768) ? -32768 : (sumr > 32767) ? 32767 : sumr;
+#else
+        suml *= dScaler;
+        sumr *= dScaler;
+#endif // SOUNDTOUCH_INTEGER_SAMPLES
+        dest[j] = (SAMPLETYPE)suml;
+        dest[j + 1] = (SAMPLETYPE)sumr;
+    }
+    return numSamples - length;
+}
+
+
+
+
+// Usual C-version of the filter routine for mono sound
+uint FIRFilter::evaluateFilterMono(SAMPLETYPE *dest, const SAMPLETYPE *src, uint numSamples) const
+{
+    uint i, j, end;
+    LONG_SAMPLETYPE sum;
+#ifdef SOUNDTOUCH_FLOAT_SAMPLES
+    // when using floating point samples, use a scaler instead of a divider
+    // because division is a much slower operation than multiplication.
+    double dScaler = 1.0 / (double)resultDivider;
+#endif
+
+
+    assert(length != 0);
+
+    end = numSamples - length;
+    for (j = 0; j < end; j ++)
+    {
+        sum = 0;
+        for (i = 0; i < length; i += 4)
+        {
+            // loop is unrolled by factor of 4 here for efficiency
+            sum += src[i + 0] * filterCoeffs[i + 0] +
+                   src[i + 1] * filterCoeffs[i + 1] +
+                   src[i + 2] * filterCoeffs[i + 2] +
+                   src[i + 3] * filterCoeffs[i + 3];
+        }
+#ifdef SOUNDTOUCH_INTEGER_SAMPLES
+        sum >>= resultDivFactor;
+        // saturate to 16 bit integer limits
+        sum = (sum < -32768) ? -32768 : (sum > 32767) ? 32767 : sum;
+#else
+        sum *= dScaler;
+#endif // SOUNDTOUCH_INTEGER_SAMPLES
+        dest[j] = (SAMPLETYPE)sum;
+        src ++;
+    }
+    return end;
+}
+
+
+// Set filter coefficients and length.
+//
+// Throws an exception if filter length isn't divisible by 8
+void FIRFilter::setCoefficients(const SAMPLETYPE *coeffs, uint newLength, uint uResultDivFactor)
+{
+    assert(newLength > 0);
+    if (newLength % 8) ST_THROW_RT_ERROR("FIR filter length not divisible by 8");
+
+    lengthDiv8 = newLength / 8;
+    length = lengthDiv8 * 8;
+    assert(length == newLength);
+
+    resultDivFactor = uResultDivFactor;
+    resultDivider = (SAMPLETYPE)::pow(2.0, (int)resultDivFactor);
+
+    delete[] filterCoeffs;
+    filterCoeffs = new SAMPLETYPE[length];
+    memcpy(filterCoeffs, coeffs, length * sizeof(SAMPLETYPE));
+}
+
+
+uint FIRFilter::getLength() const
+{
+    return length;
+}
+
+
+
+// Applies the filter to the given sequence of samples.
+//
+// Note : The amount of output samples is smaller than the amount of input
+// samples by the value of 'filter_length'.
+uint FIRFilter::evaluate(SAMPLETYPE *dest, const SAMPLETYPE *src, uint numSamples, uint numChannels) const
+{
+    assert(numChannels == 1 || numChannels == 2);
+
+    assert(length > 0);
+    assert(lengthDiv8 * 8 == length);
+    if (numSamples < length) return 0;
+    if (numChannels == 2)
+    {
+        return evaluateFilterStereo(dest, src, numSamples);
+    } else {
+        return evaluateFilterMono(dest, src, numSamples);
+    }
+}
+
+
+
+// Operator 'new' is overloaded so that it automatically creates a suitable instance
+// depending on whether an MMX-capable CPU is available or not.
+void * FIRFilter::operator new(size_t s)
+{
+    // Notice! don't use "new FIRFilter" directly, use "newInstance" to create a new instance instead!
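+    // (The overload throws on purpose: allocation is expected to go through
+    // newInstance() below, which picks an MMX-, SSE- or plain-C FIRFilter at
+    // runtime based on detectCPUextensions().)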
+    ST_THROW_RT_ERROR("Error in FIRFilter::new: Don't use 'new FIRFilter', use 'newInstance' member instead!");
+    return newInstance();
+}
+
+
+FIRFilter * FIRFilter::newInstance()
+{
+    uint uExtensions;
+
+    uExtensions = detectCPUextensions();
+
+    // Check if MMX/SSE instruction set extensions supported by CPU
+
+#ifdef SOUNDTOUCH_ALLOW_MMX
+    // MMX routines available only with integer sample types
+    if (uExtensions & SUPPORT_MMX)
+    {
+        return ::new FIRFilterMMX;
+    }
+    else
+#endif // SOUNDTOUCH_ALLOW_MMX
+
+#ifdef SOUNDTOUCH_ALLOW_SSE
+    if (uExtensions & SUPPORT_SSE)
+    {
+        // SSE support
+        return ::new FIRFilterSSE;
+    }
+    else
+#endif // SOUNDTOUCH_ALLOW_SSE
+
+    {
+        // ISA optimizations not supported, use plain C version
+        return ::new FIRFilter;
+    }
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fir_filter/FIRFilter.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fir_filter/FIRFilter.h
new file mode 100644
index 0000000..e156309
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/fir_filter/FIRFilter.h
@@ -0,0 +1,145 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// General FIR digital filter routines with MMX optimization.
+///
+/// Note : MMX optimized functions reside in a separate, platform-specific file,
+/// e.g. 'mmx_win.cpp' or 'mmx_gcc.cpp'
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2011-02-13 21:13:57 +0200 (Sun, 13 Feb 2011) $
+// File revision : $Revision: 4 $
+//
+// $Id: FIRFilter.h 104 2011-02-13 19:13:57Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#ifndef FIRFilter_H
+#define FIRFilter_H
+
+#include <stddef.h>
+#include "STTypes.h"
+
+namespace soundtouch
+{
+
+class FIRFilter
+{
+protected:
+    // Number of FIR filter taps
+    uint length;
+    // Number of FIR filter taps divided by 8
+    uint lengthDiv8;
+
+    // Result divider factor in 2^k format
+    uint resultDivFactor;
+
+    // Result divider value.
+    SAMPLETYPE resultDivider;
+
+    // Memory for filter coefficients
+    SAMPLETYPE *filterCoeffs;
+
+    virtual uint evaluateFilterStereo(SAMPLETYPE *dest,
+                                      const SAMPLETYPE *src,
+                                      uint numSamples) const;
+    virtual uint evaluateFilterMono(SAMPLETYPE *dest,
+                                    const SAMPLETYPE *src,
+                                    uint numSamples) const;
+
+public:
+    FIRFilter();
+    virtual ~FIRFilter();
+
+    /// Operator 'new' is overloaded so that it automatically creates a suitable instance
+    /// depending on whether an MMX-capable CPU is available or not.
+    static void * operator new(size_t s);
+
+    static FIRFilter *newInstance();
+
+    /// Applies the filter to the given sequence of samples.
+    /// Note : The amount of output samples is smaller than the amount of input
+    /// samples by the value of 'filter_length'.
+    ///
+    /// \return Number of samples copied to 'dest'.
+    uint evaluate(SAMPLETYPE *dest,
+                  const SAMPLETYPE *src,
+                  uint numSamples,
+                  uint numChannels) const;
+
+    uint getLength() const;
+
+    virtual void setCoefficients(const SAMPLETYPE *coeffs,
+                                 uint newLength,
+                                 uint uResultDivFactor);
+};
+
+
+// Optional subclasses that implement CPU-specific optimizations:
+
+#ifdef SOUNDTOUCH_ALLOW_MMX
+
+/// Class that implements MMX optimized functions exclusively for the 16-bit integer sample type.
+    class FIRFilterMMX : public FIRFilter
+    {
+    protected:
+        short *filterCoeffsUnalign;
+        short *filterCoeffsAlign;
+
+        virtual uint evaluateFilterStereo(short *dest, const short *src, uint numSamples) const;
+    public:
+        FIRFilterMMX();
+        ~FIRFilterMMX();
+
+        virtual void setCoefficients(const short *coeffs, uint newLength, uint uResultDivFactor);
+    };
+
+#endif // SOUNDTOUCH_ALLOW_MMX
+
+
+#ifdef SOUNDTOUCH_ALLOW_SSE
+    /// Class that implements SSE optimized functions exclusively for the floating point sample type.
+    class FIRFilterSSE : public FIRFilter
+    {
+    protected:
+        float *filterCoeffsUnalign;
+        float *filterCoeffsAlign;
+
+        virtual uint evaluateFilterStereo(float *dest, const float *src, uint numSamples) const;
+    public:
+        FIRFilterSSE();
+        ~FIRFilterSSE();
+
+        virtual void setCoefficients(const float *coeffs, uint newLength, uint uResultDivFactor);
+    };
+
+#endif // SOUNDTOUCH_ALLOW_SSE
+
+}
+
+#endif  // FIRFilter_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/mmx_optimized.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/mmx_optimized.cpp
new file mode 100644
index 0000000..c3e251a
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/mmx_optimized.cpp
@@ -0,0 +1,317 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// MMX optimized routines. All MMX optimized functions have been gathered into
+/// this single source code file, regardless of their class or original source
+/// code file, in order to ease porting the library to other compiler and
+/// processor platforms.
+///
+/// The MMX-optimizations are programmed using MMX compiler intrinsics that
+/// are supported both by Microsoft Visual C++ and GCC compilers, so this file
+/// should compile with both toolsets.
+///
+/// NOTICE: If using Visual Studio 6.0, you'll need to install the "Visual C++
+/// 6.0 processor pack" update to support compiler intrinsic syntax. The update
+/// is available for download at Microsoft Developers Network, see here:
+/// http://msdn.microsoft.com/en-us/vstudio/aa718349.aspx
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-11-08 20:53:01 +0200 (Thu, 08 Nov 2012) $
+// File revision : $Revision: 4 $
+//
+// $Id: mmx_optimized.cpp 160 2012-11-08 18:53:01Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#include "STTypes.h"
+
+#ifdef SOUNDTOUCH_ALLOW_MMX
+// MMX routines available only with integer sample type
+
+using namespace soundtouch;
+
+//////////////////////////////////////////////////////////////////////////////
+//
+// implementation of MMX optimized functions of class 'TDStretchMMX'
+//
+//////////////////////////////////////////////////////////////////////////////
+
+#include "TDStretch.h"
+#include <mmintrin.h>
+#include <limits.h>
+#include <math.h>
+
+
+// Calculates cross correlation of two buffers
+double TDStretchMMX::calcCrossCorr(const short *pV1, const short *pV2) const
+{
+    const __m64 *pVec1, *pVec2;
+    __m64 shifter;
+    __m64 accu, normaccu;
+    long corr, norm;
+    int i;
+
+    pVec1 = (__m64*)pV1;
+    pVec2 = (__m64*)pV2;
+
+    shifter = _m_from_int(overlapDividerBits);
+    normaccu = accu = _mm_setzero_si64();
+
+    // process 4 parallel sets of 2 * stereo samples or 4 * mono samples
+    // during each round for improved CPU-level parallelization.
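+    // For example, with stereo data (channels == 2) and overlapLength == 64
+    // the loop below runs 2 * 64 / 16 = 8 rounds, each round consuming 16
+    // short samples from both input vectors. (Illustrative values only.)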
+    for (i = 0; i < channels * overlapLength / 16; i ++)
+    {
+        __m64 temp, temp2;
+
+        // dictionary of instructions:
+        // _m_pmaddwd   : 4*16bit multiply-add, resulting two 32bits = [a0*b0+a1*b1 ; a2*b2+a3*b3]
+        // _mm_add_pi32 : 2*32bit add
+        // _m_psrad     : 32bit right-shift
+
+        temp = _mm_add_pi32(_mm_madd_pi16(pVec1[0], pVec2[0]),
+                            _mm_madd_pi16(pVec1[1], pVec2[1]));
+        temp2 = _mm_add_pi32(_mm_madd_pi16(pVec1[0], pVec1[0]),
+                             _mm_madd_pi16(pVec1[1], pVec1[1]));
+        accu = _mm_add_pi32(accu, _mm_sra_pi32(temp, shifter));
+        normaccu = _mm_add_pi32(normaccu, _mm_sra_pi32(temp2, shifter));
+
+        temp = _mm_add_pi32(_mm_madd_pi16(pVec1[2], pVec2[2]),
+                            _mm_madd_pi16(pVec1[3], pVec2[3]));
+        temp2 = _mm_add_pi32(_mm_madd_pi16(pVec1[2], pVec1[2]),
+                             _mm_madd_pi16(pVec1[3], pVec1[3]));
+        accu = _mm_add_pi32(accu, _mm_sra_pi32(temp, shifter));
+        normaccu = _mm_add_pi32(normaccu, _mm_sra_pi32(temp2, shifter));
+
+        pVec1 += 4;
+        pVec2 += 4;
+    }
+
+    // copy hi-dword of mm0 to lo-dword of mm1, then sum mm0+mm1
+    // and finally store the result into the variable "corr"
+
+    accu = _mm_add_pi32(accu, _mm_srli_si64(accu, 32));
+    corr = _m_to_int(accu);
+
+    normaccu = _mm_add_pi32(normaccu, _mm_srli_si64(normaccu, 32));
+    norm = _m_to_int(normaccu);
+
+    // Clear MMX state
+    _m_empty();
+
+    // Normalize result by dividing by sqrt(norm) - this step is easiest
+    // done using floating point operation
+    if (norm == 0) norm = 1;    // to avoid div by zero
+
+    return (double)corr / sqrt((double)norm);
+    // Note: Warning about the missing EMMS instruction is harmless
+    // as it'll be called elsewhere.
+}
+
+
+
+void TDStretchMMX::clearCrossCorrState()
+{
+    // Clear MMX state
+    _m_empty();
+    //_asm EMMS;
+}
+
+
+
+// MMX-optimized version of the function overlapStereo
+void TDStretchMMX::overlapStereo(short *output, const short *input) const
+{
+    const __m64 *pVinput, *pVMidBuf;
+    __m64 *pVdest;
+    __m64 mix1, mix2, adder, shifter;
+    int i;
+
+    pVinput = (const __m64*)input;
+    pVMidBuf = (const __m64*)pMidBuffer;
+    pVdest = (__m64*)output;
+
+    // mix1  = mixer values for 1st stereo sample
+    // mix2  = mixer values for 2nd stereo sample
+    // adder = adder for updating mixer values after each round
+
+    mix1  = _mm_set_pi16(0, overlapLength,   0, overlapLength);
+    adder = _mm_set_pi16(1, -1, 1, -1);
+    mix2  = _mm_add_pi16(mix1, adder);
+    adder = _mm_add_pi16(adder, adder);
+
+    // Overlaplength-division by shifter. "+1" is to account for "-1" deduced in
+    // overlapDividerBits calculation earlier.
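+    // In effect each output frame i is the linear crossfade
+    //   out[i] = (midBuffer[i] * (overlapLength - i) + input[i] * i)
+    //            >> (overlapDividerBits + 1)
+    // computed four 16-bit samples at a time. (Sketch of the arithmetic only,
+    // not additional code.)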
+    shifter = _m_from_int(overlapDividerBits + 1);
+
+    for (i = 0; i < overlapLength / 4; i ++)
+    {
+        __m64 temp1, temp2;
+
+        // load & shuffle data so that input & mixbuffer data samples are paired
+        temp1 = _mm_unpacklo_pi16(pVMidBuf[0], pVinput[0]);     // = i0l m0l i0r m0r
+        temp2 = _mm_unpackhi_pi16(pVMidBuf[0], pVinput[0]);     // = i1l m1l i1r m1r
+
+        // temp = (temp .* mix) >> shifter
+        temp1 = _mm_sra_pi32(_mm_madd_pi16(temp1, mix1), shifter);
+        temp2 = _mm_sra_pi32(_mm_madd_pi16(temp2, mix2), shifter);
+        pVdest[0] = _mm_packs_pi32(temp1, temp2); // pack 2*2*32bit => 4*16bit
+
+        // update mix += adder
+        mix1 = _mm_add_pi16(mix1, adder);
+        mix2 = _mm_add_pi16(mix2, adder);
+
+        // --- second round begins here ---
+
+        // load & shuffle data so that input & mixbuffer data samples are paired
+        temp1 = _mm_unpacklo_pi16(pVMidBuf[1], pVinput[1]);       // = i2l m2l i2r m2r
+        temp2 = _mm_unpackhi_pi16(pVMidBuf[1], pVinput[1]);       // = i3l m3l i3r m3r
+
+        // temp = (temp .* mix) >> shifter
+        temp1 = _mm_sra_pi32(_mm_madd_pi16(temp1, mix1), shifter);
+        temp2 = _mm_sra_pi32(_mm_madd_pi16(temp2, mix2), shifter);
+        pVdest[1] = _mm_packs_pi32(temp1, temp2); // pack 2*2*32bit => 4*16bit
+
+        // update mix += adder
+        mix1 = _mm_add_pi16(mix1, adder);
+        mix2 = _mm_add_pi16(mix2, adder);
+
+        pVinput += 2;
+        pVMidBuf += 2;
+        pVdest += 2;
+    }
+
+    _m_empty(); // clear MMX state
+}
+
+
+//////////////////////////////////////////////////////////////////////////////
+//
+// implementation of MMX optimized functions of class 'FIRFilter'
+//
+//////////////////////////////////////////////////////////////////////////////
+
+#include "FIRFilter.h"
+
+
+FIRFilterMMX::FIRFilterMMX() : FIRFilter()
+{
+    filterCoeffsUnalign = NULL;
+}
+
+
+FIRFilterMMX::~FIRFilterMMX()
+{
+    delete[] filterCoeffsUnalign;
+}
+
+
+// (overloaded) Calculates filter coefficients for MMX routine
+void FIRFilterMMX::setCoefficients(const short *coeffs, uint newLength, uint uResultDivFactor)
+{
+    uint i;
+    FIRFilter::setCoefficients(coeffs, newLength, uResultDivFactor);
+
+    // Ensure that filter coeffs array is aligned to 16-byte boundary
+    delete[] filterCoeffsUnalign;
+    filterCoeffsUnalign = new short[2 * newLength + 8];
+    filterCoeffsAlign = (short *)SOUNDTOUCH_ALIGN_POINTER_16(filterCoeffsUnalign);
+
+    // rearrange the filter coefficients for mmx routines
+    for (i = 0;i < length; i += 4)
+    {
+        filterCoeffsAlign[2 * i + 0] = coeffs[i + 0];
+        filterCoeffsAlign[2 * i + 1] = coeffs[i + 2];
+        filterCoeffsAlign[2 * i + 2] = coeffs[i + 0];
+        filterCoeffsAlign[2 * i + 3] = coeffs[i + 2];
+
+        filterCoeffsAlign[2 * i + 4] = coeffs[i + 1];
+        filterCoeffsAlign[2 * i + 5] = coeffs[i + 3];
+        filterCoeffsAlign[2 * i + 6] = coeffs[i + 1];
+        filterCoeffsAlign[2 * i + 7] = coeffs[i + 3];
+    }
+}
+
+
+
+// mmx-optimized version of the filter routine for stereo sound
+uint FIRFilterMMX::evaluateFilterStereo(short *dest, const short *src, uint numSamples) const
+{
+    // Create stack copies of the needed member variables for asm routines :
+    uint i, j;
+    __m64 *pVdest = (__m64*)dest;
+
+    if (length < 2) return 0;
+
+    for (i = 0; i < (numSamples - length) / 2; i ++)
+    {
+        __m64 accu1;
+        __m64 accu2;
+        const __m64 *pVsrc = (const __m64*)src;
+        const __m64 *pVfilter = (const __m64*)filterCoeffsAlign;
+
+        accu1 = accu2 = _mm_setzero_si64();
+        for (j = 0; j < lengthDiv8 * 2; j ++)
+        {
+            __m64 temp1, temp2;
+
+            temp1 = _mm_unpacklo_pi16(pVsrc[0], pVsrc[1]);  // = l2 l0 r2 r0
+            temp2 = _mm_unpackhi_pi16(pVsrc[0], pVsrc[1]);  // = l3 l1 r3 r1
+
+            accu1 = _mm_add_pi32(accu1, _mm_madd_pi16(temp1, pVfilter[0]));  // += l2*f2+l0*f0 r2*f2+r0*f0
+            accu1 = _mm_add_pi32(accu1, _mm_madd_pi16(temp2, pVfilter[1]));  // += l3*f3+l1*f1 r3*f3+r1*f1
+
+            temp1 = _mm_unpacklo_pi16(pVsrc[1], pVsrc[2]);  // = l4 l2 r4 r2
+
+            accu2 = _mm_add_pi32(accu2, _mm_madd_pi16(temp2, pVfilter[0]));  // += l3*f2+l1*f0 r3*f2+r1*f0
+            accu2 = _mm_add_pi32(accu2, _mm_madd_pi16(temp1, pVfilter[1]));  // += l4*f3+l2*f1 r4*f3+r2*f1
+
+            // accu1 += l2*f2+l0*f0 r2*f2+r0*f0
+            //       += l3*f3+l1*f1 r3*f3+r1*f1
+
+            // accu2 += l3*f2+l1*f0 r3*f2+r1*f0
+            //          l4*f3+l2*f1 r4*f3+r2*f1
+
+            pVfilter += 2;
+            pVsrc += 2;
+        }
+        // accu >>= resultDivFactor
+        accu1 = _mm_srai_pi32(accu1, resultDivFactor);
+        accu2 = _mm_srai_pi32(accu2, resultDivFactor);
+
+        // pack 2*2*32bits => 4*16 bits
+        pVdest[0] = _mm_packs_pi32(accu1, accu2);
+        src += 4;
+        pVdest ++;
+    }
+
+    _m_empty();    // clear MMX state
+
+    return (numSamples & 0xfffffffe) - length;
+}
+
+#endif  // SOUNDTOUCH_ALLOW_MMX
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/peak_finder/PeakFinder.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/peak_finder/PeakFinder.cpp
new file mode 100644
index 0000000..6dbf1d8
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/peak_finder/PeakFinder.cpp
@@ -0,0 +1,276 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// Peak detection routine.
+///
+/// The routine detects highest value on an array of values and calculates the
+/// precise peak location as a mass-center of the 'hump' around the peak value.
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-12-28 21:52:47 +0200 (Fri, 28 Dec 2012) $
+// File revision : $Revision: 4 $
+//
+// $Id: PeakFinder.cpp 164 2012-12-28 19:52:47Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#include <math.h>
+#include <assert.h>
+
+#include "PeakFinder.h"
+
+using namespace soundtouch;
+
+#define max(x, y) (((x) > (y)) ? (x) : (y))
+
+
+PeakFinder::PeakFinder()
+{
+    minPos = maxPos = 0;
+}
+
+
+// Finds real 'top' of a peak hump from the neighbourhood of the given 'peakpos'.
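+// The search is confined to roughly peakpos ± 10 bins; if the maximum lands
+// on an edge of that window it is rejected as a slope rather than a peak.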
+int PeakFinder::findTop(const float *data, int peakpos) const
+{
+    int i;
+    int start, end;
+    float refvalue;
+
+    refvalue = data[peakpos];
+
+    // seek within ±10 points
+    start = peakpos - 10;
+    if (start < minPos) start = minPos;
+    end = peakpos + 10;
+    if (end > maxPos) end = maxPos;
+
+    for (i = start; i <= end; i ++)
+    {
+        if (data[i] > refvalue)
+        {
+            peakpos = i;
+            refvalue = data[i];
+        }
+    }
+
+    // failure if max value is at edges of seek range => it's not peak, it's at slope.
+    if ((peakpos == start) || (peakpos == end)) return 0;
+
+    return peakpos;
+}
+
+
+// Finds 'ground level' of a peak hump by starting from 'peakpos' and proceeding
+// to direction defined by 'direction' until next 'hump' after minimum value will
+// begin
+int PeakFinder::findGround(const float *data, int peakpos, int direction) const
+{
+    int lowpos;
+    int pos;
+    int climb_count;
+    float refvalue;
+    float delta;
+
+    climb_count = 0;
+    refvalue = data[peakpos];
+    lowpos = peakpos;
+
+    pos = peakpos;
+
+    while ((pos > minPos+1) && (pos < maxPos-1))
+    {
+        int prevpos;
+
+        prevpos = pos;
+        pos += direction;
+
+        // calculate derivative
+        delta = data[pos] - data[prevpos];
+        if (delta <= 0)
+        {
+            // going downhill, ok
+            if (climb_count)
+            {
+                climb_count --;  // decrease climb count
+            }
+
+            // check if new minimum found
+            if (data[pos] < refvalue)
+            {
+                // new minimum found
+                lowpos = pos;
+                refvalue = data[pos];
+            }
+        }
+        else
+        {
+            // going uphill, increase climbing counter
+            climb_count ++;
+            if (climb_count > 5) break;    // we've been climbing too long => it's next uphill => quit
+        }
+    }
+    return lowpos;
+}
+
+
+// Find offset where the value crosses the given level, when starting from 'peakpos' and
+// proceeds to direction defined in 'direction'
+int PeakFinder::findCrossingLevel(const float *data, float level, int peakpos, int direction) const
+{
+    float peaklevel;
+    int pos;
+
+    peaklevel = data[peakpos];
+    assert(peaklevel >= level);
+    pos = peakpos;
+    while ((pos >= minPos) && (pos < maxPos))
+    {
+        if (data[pos + direction] < level) return pos;   // crossing found
+        pos += direction;
+    }
+    return -1;  // not found
+}
+
+
+// Calculates the center of mass location of 'data' array items between 'firstPos' and 'lastPos'
+double PeakFinder::calcMassCenter(const float *data, int firstPos, int lastPos) const
+{
+    int i;
+    float sum;
+    float wsum;
+
+    sum = 0;
+    wsum = 0;
+    for (i = firstPos; i <= lastPos; i ++)
+    {
+        sum += (float)i * data[i];
+        wsum += data[i];
+    }
+
+    if (wsum < 1e-6) return 0;
+    return sum / wsum;
+}
+
+
+
+/// get exact center of peak near given position by calculating local mass of center
+double PeakFinder::getPeakCenter(const float *data, int peakpos) const
+{
+    float peakLevel;            // peak level
+    int crosspos1, crosspos2;   // position where the peak 'hump' crosses cutting level
+    float cutLevel;             // cutting value
+    float groundLevel;          // ground level of the peak
+    int gp1, gp2;               // bottom positions of the peak 'hump'
+
+    // find ground positions.
+    gp1 = findGround(data, peakpos, -1);
+    gp2 = findGround(data, peakpos, 1);
+
+    groundLevel = 0.5f * (data[gp1] + data[gp2]);
+    peakLevel = data[peakpos];
+
+    // calculate 70%-level of the peak
+    cutLevel = 0.70f * peakLevel + 0.30f * groundLevel;
+    // find mid-level crossings
+    crosspos1 = findCrossingLevel(data, cutLevel, peakpos, -1);
+    crosspos2 = findCrossingLevel(data, cutLevel, peakpos, 1);
+
+    if ((crosspos1 < 0) || (crosspos2 < 0)) return 0;   // no crossing, no peak..
+
+    // calculate mass center of the peak surroundings
+    return calcMassCenter(data, crosspos1, crosspos2);
+}
+
+
+
+double PeakFinder::detectPeak(const float *data, int aminPos, int amaxPos)
+{
+
+    int i;
+    int peakpos;                // position of peak level
+    double highPeak, peak;
+
+    this->minPos = aminPos;
+    this->maxPos = amaxPos;
+
+    // find absolute peak
+    peakpos = minPos;
+    peak = data[minPos];
+    for (i = minPos + 1; i < maxPos; i ++)
+    {
+        if (data[i] > peak)
+        {
+            peak = data[i];
+            peakpos = i;
+        }
+    }
+
+    // Calculate exact location of the highest peak mass center
+    highPeak = getPeakCenter(data, peakpos);
+    peak = highPeak;
+
+    // Now check if the highest peak was in fact a harmonic of the true base beat peak
+    // - sometimes the highest peak can be Nth harmonic of the true base peak yet
+    // just slightly higher than the true base
+
+    for (i = 3; i < 10; i ++)
+    {
+        double peaktmp, harmonic;
+        int i1,i2;
+
+        harmonic = (double)i * 0.5;
+        peakpos = (int)(highPeak / harmonic + 0.5f);
+        if (peakpos < minPos) break;
+        peakpos = findTop(data, peakpos);   // seek true local maximum index
+        if (peakpos == 0) continue;         // no local max here
+
+        // calculate mass-center of possible harmonic peak
+        peaktmp = getPeakCenter(data, peakpos);
+
+        // accept harmonic peak if
+        // (a) it is found
+        // (b) it is within ±4% of the expected harmonic interval
+        // (c) it has at least half the x-corr value of the max. peak
+
+        double diff = harmonic * peaktmp / highPeak;
+        if ((diff < 0.96) || (diff > 1.04)) continue;   // peak too far from expected
+
+        // now compare to highest detected peak
+        i1 = (int)(highPeak + 0.5);
+        i2 = (int)(peaktmp + 0.5);
+        if (data[i2] >= 0.4*data[i1])
+        {
+            // The harmonic is at least half as high as the primary peak,
+            // thus use the harmonic peak instead
+            peak = peaktmp;
+        }
+    }
+
+    return peak;
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/peak_finder/PeakFinder.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/peak_finder/PeakFinder.h
new file mode 100644
index 0000000..d170b1c
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/peak_finder/PeakFinder.h
@@ -0,0 +1,97 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// The routine detects highest value on an array of values and calculates the
+/// precise peak location as a mass-center of the 'hump' around the peak value.
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2011-12-30 22:33:46 +0200 (Fri, 30 Dec 2011) $
+// File revision : $Revision: 4 $
+//
+// $Id: PeakFinder.h 132 2011-12-30 20:33:46Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#ifndef _PeakFinder_H_
+#define _PeakFinder_H_
+
+namespace soundtouch
+{
+
+class PeakFinder
+{
+protected:
+    /// Min, max allowed peak positions within the data vector
+    int minPos, maxPos;
+
+    /// Calculates the mass center between given vector items.
+    double calcMassCenter(const float *data, ///< Data vector.
+                          int firstPos,      ///< Index of first vector item belonging to the peak.
+                          int lastPos        ///< Index of last vector item belonging to the peak.
+                          ) const;
+
+    /// Finds the data vector index where the monotonously decreasing signal crosses the
+    /// given level.
+    int findCrossingLevel(const float *data,  ///< Data vector.
+                          float level,        ///< Goal crossing level.
+                          int peakpos,        ///< Peak position index within the data vector.
+                          int direction       /// Direction where to proceed from the peak: 1 = right, -1 = left.
+                          ) const;
+
+    // Finds real 'top' of a peak hump from the neighbourhood of the given 'peakpos'.
+    int findTop(const float *data, int peakpos) const;
+
+
+    /// Finds the 'ground' level, i.e. smallest level between two neighbouring peaks, to right-
+    /// or left-hand side of the given peak position.
+    int findGround(const float *data,     /// Data vector.
+                   int peakpos,           /// Peak position index within the data vector.
+                   int direction          /// Direction where to proceed from the peak: 1 = right, -1 = left.
+                   ) const;
+
+    /// get exact center of peak near given position by calculating local mass of center
+    double getPeakCenter(const float *data, int peakpos) const;
+
+public:
+    /// Constructor.
+    PeakFinder();
+
+    /// Detect exact peak position of the data vector by finding the largest peak 'hump'
+    /// and calculating the mass-center location of the peak hump.
+    ///
+    /// \return The location of the largest base harmonic peak hump.
+    double detectPeak(const float *data, /// Data vector to be analyzed. The data vector has
+                                         /// to be at least 'maxPos' items long.
+                      int minPos,        ///< Min allowed peak location within the vector data.
+                      int maxPos         ///< Max allowed peak location within the vector data.
+                      );
+};
+
+}
+
+#endif // _PeakFinder_H_
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/rate_transposer/RateTransposer.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/rate_transposer/RateTransposer.cpp
new file mode 100644
index 0000000..0ccb1cc
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/rate_transposer/RateTransposer.cpp
@@ -0,0 +1,626 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// Sample rate transposer. Changes sample rate by using linear interpolation
+/// together with anti-alias filtering (first order interpolation with anti-
+/// alias filtering should be quite adequate for this application)
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2011-09-02 21:56:11 +0300 (Fri, 02 Sep 2011) $
+// File revision : $Revision: 4 $
+//
+// $Id: RateTransposer.cpp 131 2011-09-02 18:56:11Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#include <memory.h>
+#include <assert.h>
+#include <stdlib.h>
+#include <stdio.h>
+#include "RateTransposer.h"
+#include "AAFilter.h"
+
+using namespace soundtouch;
+
+
+/// A linear samplerate transposer class that uses integer arithmetic
+/// for the transposing.
+class RateTransposerInteger : public RateTransposer
+{
+protected:
+    int iSlopeCount;
+    int iRate;
+    SAMPLETYPE sPrevSampleL, sPrevSampleR;
+
+    virtual void resetRegisters();
+
+    virtual uint transposeStereo(SAMPLETYPE *dest,
+                                 const SAMPLETYPE *src,
+                                 uint numSamples);
+    virtual uint transposeMono(SAMPLETYPE *dest,
+                               const SAMPLETYPE *src,
+                               uint numSamples);
+
+public:
+    RateTransposerInteger();
+    virtual ~RateTransposerInteger();
+
+    /// Sets new target rate. Normal rate = 1.0, smaller values represent slower
+    /// rates, larger values faster rates.
+    virtual void setRate(float newRate);
+
+};
+
+
+/// A linear samplerate transposer class that uses floating point arithmetic
+/// for the transposing.
+class RateTransposerFloat : public RateTransposer
+{
+protected:
+    float fSlopeCount;
+    SAMPLETYPE sPrevSampleL, sPrevSampleR;
+
+    virtual void resetRegisters();
+
+    virtual uint transposeStereo(SAMPLETYPE *dest,
+                                 const SAMPLETYPE *src,
+                                 uint numSamples);
+    virtual uint transposeMono(SAMPLETYPE *dest,
+                               const SAMPLETYPE *src,
+                               uint numSamples);
+
+public:
+    RateTransposerFloat();
+    virtual ~RateTransposerFloat();
+};
+
+
+
+
+// Operator 'new' is overloaded so that it automatically creates a suitable instance
+// depending on if we've a MMX/SSE/etc-capable CPU available or not.
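+// (As with FIRFilter, direct "new RateTransposer" throws; newInstance() below
+// returns a RateTransposerInteger or RateTransposerFloat depending on the
+// SOUNDTOUCH_INTEGER_SAMPLES compile-time setting.)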
+void * RateTransposer::operator new(size_t s)
+{
+    ST_THROW_RT_ERROR("Error in RateTransposer::new: don't use \"new RateTransposer\" directly, use \"newInstance\" to create a new instance instead!");
+    return newInstance();
+}
+
+
+RateTransposer *RateTransposer::newInstance()
+{
+#ifdef SOUNDTOUCH_INTEGER_SAMPLES
+    return ::new RateTransposerInteger;
+#else
+    return ::new RateTransposerFloat;
+#endif
+}
+
+
+// Constructor
+RateTransposer::RateTransposer() : FIFOProcessor(&outputBuffer)
+{
+    numChannels = 2;
+    bUseAAFilter = TRUE;
+    fRate = 0;
+
+    // Instantiates the anti-alias filter with default tap length
+    // of 32
+    pAAFilter = new AAFilter(32);
+}
+
+
+
+RateTransposer::~RateTransposer()
+{
+    delete pAAFilter;
+}
+
+
+
+/// Enables/disables the anti-alias filter. Zero to disable, nonzero to enable
+void RateTransposer::enableAAFilter(BOOL newMode)
+{
+    bUseAAFilter = newMode;
+}
+
+
+/// Returns nonzero if anti-alias filter is enabled.
+BOOL RateTransposer::isAAFilterEnabled() const
+{
+    return bUseAAFilter;
+}
+
+
+AAFilter *RateTransposer::getAAFilter()
+{
+    return pAAFilter;
+}
+
+
+
+// Sets new target iRate. Normal iRate = 1.0, smaller values represent slower
+// rates, larger values faster rates.
+void RateTransposer::setRate(float newRate)
+{
+    double fCutoff;
+
+    fRate = newRate;
+
+    // design a new anti-alias filter
+    if (newRate > 1.0f)
+    {
+        fCutoff = 0.5f / newRate;
+    }
+    else
+    {
+        fCutoff = 0.5f * newRate;
+    }
+    pAAFilter->setCutoffFreq(fCutoff);
+}
+
+
+// Outputs as many samples of the 'outputBuffer' as possible, and if there's
+// any room left, outputs also as many of the incoming samples as possible.
+// The goal is to drive the outputBuffer empty.
+//
+// It's allowed for 'output' and 'input' parameters to point to the same
+// memory position.
+/*
+void RateTransposer::flushStoreBuffer()
+{
+    if (storeBuffer.isEmpty()) return;
+
+    outputBuffer.moveSamples(storeBuffer);
+}
+*/
+
+
+// Adds 'nSamples' pcs of samples from the 'samples' memory position into
+// the input of the object.
+void RateTransposer::putSamples(const SAMPLETYPE *samples, uint nSamples)
+{
+    processSamples(samples, nSamples);
+}
+
+
+
+// Transposes up the sample rate, causing the observed playback 'rate' of the
+// sound to decrease
+void RateTransposer::upsample(const SAMPLETYPE *src, uint nSamples)
+{
+    uint count, sizeTemp, num;
+
+    // If the parameter 'uRate' value is smaller than 'SCALE', first transpose
+    // the samples and then apply the anti-alias filter to remove aliasing.
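+    // (Rationale: with rate < 1.0 the output is longer than the input, so
+    // transposing first and filtering afterwards runs the anti-alias filter
+    // at the higher post-transpose rate where the interpolation images lie.)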
+
+    // First check that there's enough room in 'storeBuffer'
+    // (+16 is to reserve some slack in the destination buffer)
+    sizeTemp = (uint)((float)nSamples / fRate + 16.0f);
+
+    // Transpose the samples, store the result into the end of "storeBuffer"
+    count = transpose(storeBuffer.ptrEnd(sizeTemp), src, nSamples);
+    storeBuffer.putSamples(count);
+
+    // Apply the anti-alias filter to the samples in 'storeBuffer', output the
+    // result to 'outputBuffer'
+    num = storeBuffer.numSamples();
+    count = pAAFilter->evaluate(outputBuffer.ptrEnd(num),
+        storeBuffer.ptrBegin(), num, (uint)numChannels);
+    outputBuffer.putSamples(count);
+
+    // Remove the processed samples from "storeBuffer"
+    storeBuffer.receiveSamples(count);
+}
+
+
+// Transposes down the sample rate, causing the observed playback 'rate' of the
+// sound to increase
+void RateTransposer::downsample(const SAMPLETYPE *src, uint nSamples)
+{
+    uint count, sizeTemp;
+
+    // If the parameter 'uRate' value is larger than 'SCALE', first apply the
+    // anti-alias filter to remove high frequencies (prevent them from folding
+    // over the lower frequencies), then transpose.
+
+    // Add the new samples to the end of the storeBuffer
+    storeBuffer.putSamples(src, nSamples);
+
+    // Anti-alias filter the samples to prevent folding and output the filtered
+    // data to tempBuffer. Note : because of the FIR filter length, the
+    // filtering routine takes in 'filter_length' more samples than it outputs.
+    assert(tempBuffer.isEmpty());
+    sizeTemp = storeBuffer.numSamples();
+
+    count = pAAFilter->evaluate(tempBuffer.ptrEnd(sizeTemp),
+        storeBuffer.ptrBegin(), sizeTemp, (uint)numChannels);
+
+    if (count == 0) return;
+
+    // Remove the filtered samples from 'storeBuffer'
+    storeBuffer.receiveSamples(count);
+
+    // Transpose the samples (+16 is to reserve some slack in the destination buffer)
+    sizeTemp = (uint)((float)nSamples / fRate + 16.0f);
+    count = transpose(outputBuffer.ptrEnd(sizeTemp), tempBuffer.ptrBegin(), count);
+    outputBuffer.putSamples(count);
+}
+
+
+// Transposes sample rate by applying anti-alias filter to prevent folding.
+// Returns amount of samples returned in the "dest" buffer.
+// The maximum amount of samples that can be returned at a time is set by
+// the 'set_returnBuffer_size' function.
+void RateTransposer::processSamples(const SAMPLETYPE *src, uint nSamples)
+{
+    uint count;
+    uint sizeReq;
+
+    if (nSamples == 0) return;
+    assert(pAAFilter);
+
+    // If anti-alias filter is turned off, simply transpose without applying
+    // the filter
+    if (bUseAAFilter == FALSE)
+    {
+        sizeReq = (uint)((float)nSamples / fRate + 1.0f);
+        count = transpose(outputBuffer.ptrEnd(sizeReq), src, nSamples);
+        outputBuffer.putSamples(count);
+        return;
+    }
+
+    // Transpose with anti-alias filter
+    if (fRate < 1.0f)
+    {
+        upsample(src, nSamples);
+    }
+    else
+    {
+        downsample(src, nSamples);
+    }
+}
+
+
+// Transposes the sample rate of the given samples using linear interpolation.
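+// For a fractional read position p between input samples x[k] and x[k+1],
+// each output sample is (1 - frac(p)) * x[k] + frac(p) * x[k+1]; the integer
+// implementation below keeps frac(p) scaled by SCALE (65536) in 'iSlopeCount'.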
+// Returns the number of samples returned in the "dest" buffer
+inline uint RateTransposer::transpose(SAMPLETYPE *dest, const SAMPLETYPE *src, uint nSamples)
+{
+    if (numChannels == 2)
+    {
+        return transposeStereo(dest, src, nSamples);
+    }
+    else
+    {
+        return transposeMono(dest, src, nSamples);
+    }
+}
+
+
+// Sets the number of channels, 1 = mono, 2 = stereo
+void RateTransposer::setChannels(int nChannels)
+{
+    assert(nChannels > 0);
+    if (numChannels == nChannels) return;
+
+    assert(nChannels == 1 || nChannels == 2);
+    numChannels = nChannels;
+
+    storeBuffer.setChannels(numChannels);
+    tempBuffer.setChannels(numChannels);
+    outputBuffer.setChannels(numChannels);
+
+    // Inits the linear interpolation registers
+    resetRegisters();
+}
+
+
+// Clears all the samples in the object
+void RateTransposer::clear()
+{
+    outputBuffer.clear();
+    storeBuffer.clear();
+}
+
+
+// Returns nonzero if there aren't any samples available for outputting.
+int RateTransposer::isEmpty() const
+{
+    int res;
+
+    res = FIFOProcessor::isEmpty();
+    if (res == 0) return 0;
+    return storeBuffer.isEmpty();
+}
+
+
+//////////////////////////////////////////////////////////////////////////////
+//
+// RateTransposerInteger - integer arithmetic implementation
+//
+
+/// fixed-point interpolation routine precision
+#define SCALE 65536
+
+// Constructor
+RateTransposerInteger::RateTransposerInteger() : RateTransposer()
+{
+    // Notice: use local function calling syntax for sake of clarity,
+    // to indicate the fact that C++ constructor can't call virtual functions.
+    RateTransposerInteger::resetRegisters();
+    RateTransposerInteger::setRate(1.0f);
+}
+
+
+RateTransposerInteger::~RateTransposerInteger()
+{
+}
+
+
+void RateTransposerInteger::resetRegisters()
+{
+    iSlopeCount = 0;
+    sPrevSampleL =
+    sPrevSampleR = 0;
+}
+
+
+
+// Transposes the sample rate of the given samples using linear interpolation.
+// 'Mono' version of the routine. Returns the number of samples returned in
+// the "dest" buffer
+uint RateTransposerInteger::transposeMono(SAMPLETYPE *dest, const SAMPLETYPE *src, uint nSamples)
+{
+    unsigned int i, used;
+    LONG_SAMPLETYPE temp, vol1;
+
+    if (nSamples == 0) return 0;  // no samples, no work
+
+    used = 0;
+    i = 0;
+
+    // process the last sample saved from the previous call first...
+    while (iSlopeCount <= SCALE)
+    {
+        vol1 = (LONG_SAMPLETYPE)(SCALE - iSlopeCount);
+        temp = vol1 * sPrevSampleL + iSlopeCount * src[0];
+        dest[i] = (SAMPLETYPE)(temp / SCALE);
+        i++;
+        iSlopeCount += iRate;
+    }
+    // now always (iSlopeCount > SCALE)
+    iSlopeCount -= SCALE;
+
+    while (1)
+    {
+        while (iSlopeCount > SCALE)
+        {
+            iSlopeCount -= SCALE;
+            used ++;
+            if (used >= nSamples - 1) goto end;
+        }
+        vol1 = (LONG_SAMPLETYPE)(SCALE - iSlopeCount);
+        temp = src[used] * vol1 + iSlopeCount * src[used + 1];
+        dest[i] = (SAMPLETYPE)(temp / SCALE);
+
+        i++;
+        iSlopeCount += iRate;
+    }
+end:
+    // Store the last sample for the next round
+    sPrevSampleL = src[nSamples - 1];
+
+    return i;
+}
+
+
+// Transposes the sample rate of the given samples using linear interpolation.
+// 'Stereo' version of the routine. Returns the number of samples returned in
+// the "dest" buffer
+uint RateTransposerInteger::transposeStereo(SAMPLETYPE *dest, const SAMPLETYPE *src, uint nSamples)
+{
+    unsigned int srcPos, i, used;
+    LONG_SAMPLETYPE temp, vol1;
+
+    if (nSamples == 0) return 0;  // no samples, no work
+
+    used = 0;
+    i = 0;
+
+    // process the last sample saved from the previous call first...
+    while (iSlopeCount <= SCALE)
+    {
+        vol1 = (LONG_SAMPLETYPE)(SCALE - iSlopeCount);
+        temp = vol1 * sPrevSampleL + iSlopeCount * src[0];
+        dest[2 * i] = (SAMPLETYPE)(temp / SCALE);
+        temp = vol1 * sPrevSampleR + iSlopeCount * src[1];
+        dest[2 * i + 1] = (SAMPLETYPE)(temp / SCALE);
+        i++;
+        iSlopeCount += iRate;
+    }
+    // now always (iSlopeCount > SCALE)
+    iSlopeCount -= SCALE;
+
+    while (1)
+    {
+        while (iSlopeCount > SCALE)
+        {
+            iSlopeCount -= SCALE;
+            used ++;
+            if (used >= nSamples - 1) goto end;
+        }
+        srcPos = 2 * used;
+        vol1 = (LONG_SAMPLETYPE)(SCALE - iSlopeCount);
+        temp = src[srcPos] * vol1 + iSlopeCount * src[srcPos + 2];
+        dest[2 * i] = (SAMPLETYPE)(temp / SCALE);
+        temp = src[srcPos + 1] * vol1 + iSlopeCount * src[srcPos + 3];
+        dest[2 * i + 1] = (SAMPLETYPE)(temp / SCALE);
+
+        i++;
+        iSlopeCount += iRate;
+    }
+end:
+    // Store the last sample for the next round
+    sPrevSampleL = src[2 * nSamples - 2];
+    sPrevSampleR = src[2 * nSamples - 1];
+
+    return i;
+}
+
+
+// Sets new target rate. Normal rate = 1.0, smaller values represent slower
+// rates, larger values faster rates.
+void RateTransposerInteger::setRate(float newRate)
+{
+    iRate = (int)(newRate * SCALE + 0.5f);
+    RateTransposer::setRate(newRate);
+}
+
+
+//////////////////////////////////////////////////////////////////////////////
+//
+// RateTransposerFloat - floating point arithmetic implementation
+//
+//////////////////////////////////////////////////////////////////////////////
+
+// Constructor
+RateTransposerFloat::RateTransposerFloat() : RateTransposer()
+{
+    // Notice: use local function calling syntax for sake of clarity,
+    // to indicate the fact that C++ constructor can't call virtual functions.
+    RateTransposerFloat::resetRegisters();
+    RateTransposerFloat::setRate(1.0f);
+}
+
+
+RateTransposerFloat::~RateTransposerFloat()
+{
+}
+
+
+void RateTransposerFloat::resetRegisters()
+{
+    fSlopeCount = 0;
+    sPrevSampleL =
+    sPrevSampleR = 0;
+}
+
+
+
+// Transposes the sample rate of the given samples using linear interpolation.
+// 'Mono' version of the routine. Returns the number of samples returned in
+// the "dest" buffer
+uint RateTransposerFloat::transposeMono(SAMPLETYPE *dest, const SAMPLETYPE *src, uint nSamples)
+{
+    unsigned int i, used;
+
+    if (nSamples == 0) return 0;  // no samples, no work
+
+    used = 0;
+    i = 0;
+
+    // process the last sample saved from the previous call first...
+    while (fSlopeCount <= 1.0f)
+    {
+        dest[i] = (SAMPLETYPE)((1.0f - fSlopeCount) * sPrevSampleL + fSlopeCount * src[0]);
+        i++;
+        fSlopeCount += fRate;
+    }
+    fSlopeCount -= 1.0f;
+
+    if (nSamples > 1)
+    {
+        while (1)
+        {
+            while (fSlopeCount > 1.0f)
+            {
+                fSlopeCount -= 1.0f;
+                used ++;
+                if (used >= nSamples - 1) goto end;
+            }
+            dest[i] = (SAMPLETYPE)((1.0f - fSlopeCount) * src[used] + fSlopeCount * src[used + 1]);
+            i++;
+            fSlopeCount += fRate;
+        }
+    }
+end:
+    // Store the last sample for the next round
+    sPrevSampleL = src[nSamples - 1];
+
+    return i;
+}
+
+
+// Transposes the sample rate of the given samples using linear interpolation.
+// 'Stereo' version of the routine. Returns the number of samples returned in
+// the "dest" buffer
+uint RateTransposerFloat::transposeStereo(SAMPLETYPE *dest, const SAMPLETYPE *src, uint nSamples)
+{
+    unsigned int srcPos, i, used;
+
+    if (nSamples == 0) return 0;  // no samples, no work
+
+    used = 0;
+    i = 0;
+
+    // process the last sample saved from the previous call first...
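+    /* Editorial note (not part of the original sources): the float version
+       keeps the read-position fraction directly in fSlopeCount. On average
+       one output frame is produced per fRate of input, each one the blend
+
+           out = (1.0f - frac) * prev + frac * next;   // frac in [0, 1)
+
+       so fRate = 0.5f roughly doubles the frame count and fRate = 2.0f
+       roughly halves it. */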
+    while (fSlopeCount <= 1.0f)
+    {
+        dest[2 * i] = (SAMPLETYPE)((1.0f - fSlopeCount) * sPrevSampleL + fSlopeCount * src[0]);
+        dest[2 * i + 1] = (SAMPLETYPE)((1.0f - fSlopeCount) * sPrevSampleR + fSlopeCount * src[1]);
+        i++;
+        fSlopeCount += fRate;
+    }
+    // now always (fSlopeCount > 1.0f)
+    fSlopeCount -= 1.0f;
+
+    if (nSamples > 1)
+    {
+        while (1)
+        {
+            while (fSlopeCount > 1.0f)
+            {
+                fSlopeCount -= 1.0f;
+                used ++;
+                if (used >= nSamples - 1) goto end;
+            }
+            srcPos = 2 * used;
+
+            dest[2 * i] = (SAMPLETYPE)((1.0f - fSlopeCount) * src[srcPos]
+                + fSlopeCount * src[srcPos + 2]);
+            dest[2 * i + 1] = (SAMPLETYPE)((1.0f - fSlopeCount) * src[srcPos + 1]
+                + fSlopeCount * src[srcPos + 3]);
+
+            i++;
+            fSlopeCount += fRate;
+        }
+    }
+end:
+    // Store the last sample for the next round
+    sPrevSampleL = src[2 * nSamples - 2];
+    sPrevSampleR = src[2 * nSamples - 1];
+
+    return i;
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/rate_transposer/RateTransposer.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/rate_transposer/RateTransposer.h
new file mode 100644
index 0000000..48f7bed
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/rate_transposer/RateTransposer.h
@@ -0,0 +1,159 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// Sample rate transposer. Changes sample rate by using linear interpolation
+/// together with anti-alias filtering (first order interpolation with anti-
+/// alias filtering should be quite adequate for this application).
+///
+/// Use either of the derived classes of 'RateTransposerInteger' or
+/// 'RateTransposerFloat' for corresponding integer/floating point transposing
+/// algorithm implementation.
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2009-02-21 18:00:14 +0200 (Sat, 21 Feb 2009) $
+// File revision : $Revision: 4 $
+//
+// $Id: RateTransposer.h 63 2009-02-21 16:00:14Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#ifndef RateTransposer_H
+#define RateTransposer_H
+
+#include <stddef.h>
+#include "AAFilter.h"
+#include "FIFOSamplePipe.h"
+#include "FIFOSampleBuffer.h"
+
+#include "STTypes.h"
+
+namespace soundtouch
+{
+
+/// A common linear samplerate transposer class.
+///
+/// Note: Use function "RateTransposer::newInstance()" to create a new class
+/// instance instead of the "new" operator; that function automatically
+/// chooses a correct implementation depending on whether integer or floating
+/// point arithmetic is to be used.
+class RateTransposer : public FIFOProcessor
+{
+protected:
+    /// Anti-alias filter object
+    AAFilter *pAAFilter;
+
+    float fRate;
+
+    int numChannels;
+
+    /// Buffer for collecting samples to feed the anti-alias filter between
+    /// two batches
+    FIFOSampleBuffer storeBuffer;
+
+    /// Buffer for keeping samples between transposing & anti-alias filter
+    FIFOSampleBuffer tempBuffer;
+
+    /// Output sample buffer
+    FIFOSampleBuffer outputBuffer;
+
+    BOOL bUseAAFilter;
+
+    virtual void resetRegisters() = 0;
+
+    virtual uint transposeStereo(SAMPLETYPE *dest,
+                                 const SAMPLETYPE *src,
+                                 uint numSamples) = 0;
+    virtual uint transposeMono(SAMPLETYPE *dest,
+                               const SAMPLETYPE *src,
+                               uint numSamples) = 0;
+    inline uint transpose(SAMPLETYPE *dest,
+                          const SAMPLETYPE *src,
+                          uint numSamples);
+
+    void downsample(const SAMPLETYPE *src,
+                    uint numSamples);
+    void upsample(const SAMPLETYPE *src,
+                  uint numSamples);
+
+    /// Transposes sample rate by applying anti-alias filter to prevent folding.
+    /// Returns amount of samples returned in the "dest" buffer.
+    /// The maximum amount of samples that can be returned at a time is set by
+    /// the 'set_returnBuffer_size' function.
+    void processSamples(const SAMPLETYPE *src,
+                        uint numSamples);
+
+
+public:
+    RateTransposer();
+    virtual ~RateTransposer();
+
+    /// Operator 'new' is overloaded so that it automatically creates a suitable instance
+    /// depending on if we're to use integer or floating point arithmetics.
+    static void *operator new(size_t s);
+
+    /// Use this function instead of "new" operator to create a new instance of this class.
+    /// This function automatically chooses a correct implementation, depending on whether
+    /// integer or floating point arithmetic is to be used.
+    static RateTransposer *newInstance();
+
+    /// Returns the output buffer object
+    FIFOSamplePipe *getOutput() { return &outputBuffer; };
+
+    /// Returns the store buffer object
+    FIFOSamplePipe *getStore() { return &storeBuffer; };
+
+    /// Return anti-alias filter object
+    AAFilter *getAAFilter();
+
+    /// Enables/disables the anti-alias filter. Zero to disable, nonzero to enable
+    void enableAAFilter(BOOL newMode);
+
+    /// Returns nonzero if anti-alias filter is enabled.
+    BOOL isAAFilterEnabled() const;
+
+    /// Sets new target rate. Normal rate = 1.0, smaller values represent slower
+    /// rate, larger faster rates.
+    virtual void setRate(float newRate);
+
+    /// Sets the number of channels, 1 = mono, 2 = stereo
+    void setChannels(int channels);
+
+    /// Adds 'numSamples' pcs of samples from the 'samples' memory position into
+    /// the input of the object.
+    void putSamples(const SAMPLETYPE *samples, uint numSamples);
+
+    /// Clears all the samples in the object
+    void clear();
+
+    /// Returns nonzero if there aren't any samples available for outputting.
+    int isEmpty() const;
+};
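+
+/* Usage illustration (editorial sketch, not part of the original header;
+   buffer names are hypothetical):
+
+       soundtouch::RateTransposer *pRT = soundtouch::RateTransposer::newInstance();
+       pRT->setChannels(2);
+       pRT->setRate(1.2f);                      // 20 % faster and higher
+       pRT->putSamples(inBuf, nInFrames);       // feed input...
+       uint n = pRT->receiveSamples(outBuf, maxOutFrames);  // ...drain output
+       delete pRT;
+
+   receiveSamples() and numSamples() come from the FIFOProcessor /
+   FIFOSamplePipe ancestors. */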
+
+}
+
+#endif
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sound_touch/SoundTouch.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sound_touch/SoundTouch.cpp
new file mode 100644
index 0000000..f9160ed
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sound_touch/SoundTouch.cpp
@@ -0,0 +1,501 @@
+//////////////////////////////////////////////////////////////////////////////
+///
+/// SoundTouch - main class for tempo/pitch/rate adjusting routines.
+///
+/// Notes:
+/// - Initialize the SoundTouch object instance by setting up the sound stream
+///   parameters with functions 'setSampleRate' and 'setChannels', then set
+///   desired tempo/pitch/rate settings with the corresponding functions.
+///
+/// - The SoundTouch class behaves like a first-in-first-out pipeline: The
+///   samples that are to be processed are fed into one end of the pipe by
+///   calling function 'putSamples', while the ready processed samples can be
+///   read from the other end of the pipeline with function 'receiveSamples'.
+///
+/// - The SoundTouch processing classes require certain sized 'batches' of
+///   samples in order to process the sound. For this reason the classes buffer
+///   incoming samples until there are enough samples available for
+///   processing, then they carry out the processing step and consequently
+///   make the processed samples available for outputting.
+///
+/// - For the above reason, the processing routines introduce a certain
+///   'latency' between the input and output, so that the samples input to
+///   SoundTouch may not be immediately available in the output, nor is the
+///   amount of outputtable samples necessarily in direct relationship with
+///   the amount of previously input samples.
+///
+/// - The tempo/pitch/rate control parameters can be altered during processing.
+///   Please notice though that they aren't currently protected by semaphores,
+///   so in multi-threaded applications external semaphore protection may be
+///   required.
+///
+/// - This class utilizes classes 'TDStretch' for tempo change (without modifying
+///   pitch) and 'RateTransposer' for changing the playback rate (that is, both
+///   tempo and pitch in the same ratio) of the sound. The third available control
+///   'pitch' (change pitch but maintain tempo) is produced by combining the two
+///   other controls.
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-06-13 22:29:53 +0300 (Wed, 13 Jun 2012) $
+// File revision : $Revision: 4 $
+//
+// $Id: SoundTouch.cpp 143 2012-06-13 19:29:53Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#include <assert.h>
+#include <stdlib.h>
+#include <memory.h>
+#include <math.h>
+#include <stdio.h>
+
+#include "SoundTouch.h"
+#include "TDStretch.h"
+#include "RateTransposer.h"
+#include "cpu_detect.h"
+
+using namespace soundtouch;
+
+/// test if two floating point numbers are equal
+#define TEST_FLOAT_EQUAL(a, b)  (fabs(a - b) < 1e-10)
+
+
+/// Print library version string for autoconf
+extern "C" void soundtouch_ac_test()
+{
+    printf("SoundTouch Version: %s\n", SOUNDTOUCH_VERSION);
+}
+
+
+SoundTouch::SoundTouch()
+{
+    // Initialize rate transposer and tempo changer instances
+
+    pRateTransposer = RateTransposer::newInstance();
+    pTDStretch = TDStretch::newInstance();
+
+    setOutPipe(pTDStretch);
+
+    rate = tempo = 0;
+
+    virtualPitch =
+    virtualRate =
+    virtualTempo = 1.0;
+
+    calcEffectiveRateAndTempo();
+
+    channels = 0;
+    bSrateSet = FALSE;
+}
+
+
+
+SoundTouch::~SoundTouch()
+{
+    delete pRateTransposer;
+    delete pTDStretch;
+}
+
+
+
+/// Get SoundTouch library version string
+const char *SoundTouch::getVersionString()
+{
+    static const char *_version = SOUNDTOUCH_VERSION;
+
+    return _version;
+}
+
+
+/// Get SoundTouch library version Id
+uint SoundTouch::getVersionId()
+{
+    return SOUNDTOUCH_VERSION_ID;
+}
+
+
+// Sets the number of channels, 1 = mono, 2 = stereo
+void SoundTouch::setChannels(uint numChannels)
+{
+    if (numChannels != 1 && numChannels != 2)
+    {
+        ST_THROW_RT_ERROR("Illegal number of channels");
+    }
+    channels = numChannels;
+    pRateTransposer->setChannels((int)numChannels);
+    pTDStretch->setChannels((int)numChannels);
+}
+
+
+
+// Sets new rate control value. Normal rate = 1.0, smaller values
+// represent slower rate, larger faster rates.
+void SoundTouch::setRate(float newRate)
+{
+    virtualRate = newRate;
+    calcEffectiveRateAndTempo();
+}
+
+
+
+// Sets new rate control value as a difference in percents compared
+// to the original rate (-50 .. +100 %)
+void SoundTouch::setRateChange(float newRate)
+{
+    virtualRate = 1.0f + 0.01f * newRate;
+    calcEffectiveRateAndTempo();
+}
+
+
+
+// Sets new tempo control value. Normal tempo = 1.0, smaller values
+// represent slower tempo, larger faster tempo.
+void SoundTouch::setTempo(float newTempo)
+{
+    virtualTempo = newTempo;
+    calcEffectiveRateAndTempo();
+}
+
+
+
+// Sets new tempo control value as a difference in percents compared
+// to the original tempo (-50 .. +100 %)
+void SoundTouch::setTempoChange(float newTempo)
+{
+    virtualTempo = 1.0f + 0.01f * newTempo;
+    calcEffectiveRateAndTempo();
+}
+
+
+
+// Sets new pitch control value. Original pitch = 1.0, smaller values
+// represent lower pitches, larger values higher pitch.
+void SoundTouch::setPitch(float newPitch)
+{
+    virtualPitch = newPitch;
+    calcEffectiveRateAndTempo();
+}
+
+
+
+// Sets pitch change in octaves compared to the original pitch
+// (-1.00 .. +1.00)
+void SoundTouch::setPitchOctaves(float newPitch)
+{
+    virtualPitch = (float)exp(0.69314718056f * newPitch);
+    calcEffectiveRateAndTempo();
+}
+
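+
+/* Editorial note: 0.69314718056 is ln(2), so exp(0.69314718056f * x) == 2^x,
+   i.e. one octave doubles the pitch ratio. A semitone step is therefore
+   (sketch, not part of the original sources):
+
+       float semitoneRatio(float semiTones)
+       {
+           return (float)pow(2.0, semiTones / 12.0);   // +1 semitone -> ~1.05946
+       }
+*/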
+
+// Sets pitch change in semi-tones compared to the original pitch
+// (-12 .. +12)
+void SoundTouch::setPitchSemiTones(int newPitch)
+{
+    setPitchOctaves((float)newPitch / 12.0f);
+}
+
+
+
+void SoundTouch::setPitchSemiTones(float newPitch)
+{
+    setPitchOctaves(newPitch / 12.0f);
+}
+
+
+// Calculates 'effective' rate and tempo values from the
+// nominal control values.
+void SoundTouch::calcEffectiveRateAndTempo()
+{
+    float oldTempo = tempo;
+    float oldRate = rate;
+
+    tempo = virtualTempo / virtualPitch;
+    rate = virtualPitch * virtualRate;
+
+    if (!TEST_FLOAT_EQUAL(rate, oldRate)) pRateTransposer->setRate(rate);
+    if (!TEST_FLOAT_EQUAL(tempo, oldTempo)) pTDStretch->setTempo(tempo);
+
+#ifndef SOUNDTOUCH_PREVENT_CLICK_AT_RATE_CROSSOVER
+    if (rate <= 1.0f)
+    {
+        if (output != pTDStretch)
+        {
+            FIFOSamplePipe *tempoOut;
+
+            assert(output == pRateTransposer);
+            // move samples in the current output buffer to the output of pTDStretch
+            tempoOut = pTDStretch->getOutput();
+            tempoOut->moveSamples(*output);
+            // move samples in pitch transposer's store buffer to tempo changer's input
+            pTDStretch->moveSamples(*pRateTransposer->getStore());
+
+            output = pTDStretch;
+        }
+    }
+    else
+#endif
+    {
+        if (output != pRateTransposer)
+        {
+            FIFOSamplePipe *transOut;
+
+            assert(output == pTDStretch);
+            // move samples in the current output buffer to the output of pRateTransposer
+            transOut = pRateTransposer->getOutput();
+            transOut->moveSamples(*output);
+            // move samples in tempo changer's input to pitch transposer's input
+            pRateTransposer->moveSamples(*pTDStretch->getInput());
+
+            output = pRateTransposer;
+        }
+    }
+}
+
+
+// Sets sample rate.
+void SoundTouch::setSampleRate(uint srate)
+{
+    bSrateSet = TRUE;
+    // set sample rate, leave other tempo changer parameters as they are.
+    pTDStretch->setParameters((int)srate);
+}
+
+
+// Adds 'numSamples' pcs of samples from the 'samples' memory position into
+// the input of the object.
+void SoundTouch::putSamples(const SAMPLETYPE *samples, uint nSamples)
+{
+    if (bSrateSet == FALSE)
+    {
+        ST_THROW_RT_ERROR("SoundTouch : Sample rate not defined");
+    }
+    else if (channels == 0)
+    {
+        ST_THROW_RT_ERROR("SoundTouch : Number of channels not defined");
+    }
+
+    // Transpose the rate of the new samples if necessary
+    /* Bypass the nominal setting - can introduce a click in sound when tempo/pitch control crosses the nominal value...
+    if (rate == 1.0f)
+    {
+        // The rate value is same as the original, simply evaluate the tempo changer.
+        assert(output == pTDStretch);
+        if (pRateTransposer->isEmpty() == 0)
+        {
+            // yet flush the last samples in the pitch transposer buffer
+            // (may happen if 'rate' changes from a non-zero value to zero)
+            pTDStretch->moveSamples(*pRateTransposer);
+        }
+        pTDStretch->putSamples(samples, nSamples);
+    }
+    */
+#ifndef SOUNDTOUCH_PREVENT_CLICK_AT_RATE_CROSSOVER
+    if (rate <= 1.0f)
+    {
+        // transpose the rate down, output the transposed sound to tempo changer buffer
+        assert(output == pTDStretch);
+        pRateTransposer->putSamples(samples, nSamples);
+        pTDStretch->moveSamples(*pRateTransposer);
+    }
+    else
+#endif
+    {
+        // evaluate the tempo changer, then transpose the rate up,
+        assert(output == pRateTransposer);
+        pTDStretch->putSamples(samples, nSamples);
+        pRateTransposer->moveSamples(*pTDStretch);
+    }
+}
+
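+
+/* Editorial note on the control model of calcEffectiveRateAndTempo() above
+   (sketch, not part of the original sources): the net playback speed is
+
+       tempo * rate = (virtualTempo / virtualPitch) * (virtualPitch * virtualRate)
+                    = virtualTempo * virtualRate
+
+   so the pitch factor cancels out of the overall duration: the rate
+   transposer shifts pitch (and speed) by virtualPitch, and TDStretch
+   compensates by running at virtualTempo / virtualPitch. For example:
+
+       float p = 1.0594631f;               // +1 semitone
+       float tempo = 1.0f / p, rate = p;   // virtualTempo = virtualRate = 1
+       // tempo * rate == 1.0f -> duration unchanged, pitch raised by p
+*/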
+
+// Flushes the last samples from the processing pipeline to the output.
+// Also clears the internal processing buffers.
+//
+// Note: This function is meant for extracting the last samples of a sound
+// stream. This function may introduce additional blank samples in the end
+// of the sound stream, and thus it's not recommended to call this function
+// in the middle of a sound stream.
+void SoundTouch::flush()
+{
+    int i;
+    int nUnprocessed;
+    int nOut;
+    SAMPLETYPE buff[64 * 2];   // note: allocate 2*64 to cater for 64 sample frames of stereo sound
+
+    // check how many samples still await processing, and scale
+    // that by tempo & rate to get expected output sample count
+    nUnprocessed = numUnprocessedSamples();
+    nUnprocessed = (int)((double)nUnprocessed / (tempo * rate) + 0.5);
+
+    nOut = numSamples();        // ready samples currently in buffer ...
+    nOut += nUnprocessed;       // ... and how many we expect there to be in the end
+
+    memset(buff, 0, 64 * channels * sizeof(SAMPLETYPE));
+    // "Push" the last active samples out from the processing pipeline by
+    // feeding blank samples into the processing pipeline until new,
+    // processed samples appear in the output (though not more than
+    // 8k samples in any case)
+    for (i = 0; i < 128; i ++)
+    {
+        putSamples(buff, 64);
+        if ((int)numSamples() >= nOut)
+        {
+            // Enough new samples have appeared into the output!
+            // As samples come from processing with bigger chunks, now truncate it
+            // back to maximum "nOut" samples to improve duration accuracy
+            adjustAmountOfSamples(nOut);
+
+            // finish
+            break;
+        }
+    }
+
+    // Clear working buffers
+    pRateTransposer->clear();
+    pTDStretch->clearInput();
+    // yet leave the 'tempoChanger' output untouched as that's where the
+    // flushed samples are!
+}
+
+
+// Changes a setting controlling the processing system behaviour. See the
+// 'SETTING_...' defines for available setting ID's.
+BOOL SoundTouch::setSetting(int settingId, int value)
+{
+    int sampleRate, sequenceMs, seekWindowMs, overlapMs;
+
+    // read current tdstretch routine parameters
+    pTDStretch->getParameters(&sampleRate, &sequenceMs, &seekWindowMs, &overlapMs);
+
+    switch (settingId)
+    {
+        case SETTING_USE_AA_FILTER :
+            // enables / disables anti-alias filter
+            pRateTransposer->enableAAFilter((value != 0) ? TRUE : FALSE);
+            return TRUE;
+
+        case SETTING_AA_FILTER_LENGTH :
+            // sets anti-alias filter length
+            pRateTransposer->getAAFilter()->setLength(value);
+            return TRUE;
+
+        case SETTING_USE_QUICKSEEK :
+            // enables / disables tempo routine quick seeking algorithm
+            pTDStretch->enableQuickSeek((value != 0) ? TRUE : FALSE);
+            return TRUE;
+
+        case SETTING_SEQUENCE_MS:
+            // change time-stretch sequence duration parameter
+            pTDStretch->setParameters(sampleRate, value, seekWindowMs, overlapMs);
+            return TRUE;
+
+        case SETTING_SEEKWINDOW_MS:
+            // change time-stretch seek window length parameter
+            pTDStretch->setParameters(sampleRate, sequenceMs, value, overlapMs);
+            return TRUE;
+
+        case SETTING_OVERLAP_MS:
+            // change time-stretch overlap length parameter
+            pTDStretch->setParameters(sampleRate, sequenceMs, seekWindowMs, value);
+            return TRUE;
+
+        default :
+            return FALSE;
+    }
+}
+
+
+// Reads a setting controlling the processing system behaviour. See the
+// 'SETTING_...' defines for available setting ID's.
+//
+// Returns the setting value.
+int SoundTouch::getSetting(int settingId) const
+{
+    int temp;
+
+    switch (settingId)
+    {
+        case SETTING_USE_AA_FILTER :
+            return (uint)pRateTransposer->isAAFilterEnabled();
+
+        case SETTING_AA_FILTER_LENGTH :
+            return pRateTransposer->getAAFilter()->getLength();
+
+        case SETTING_USE_QUICKSEEK :
+            return (uint)pTDStretch->isQuickSeekEnabled();
+
+        case SETTING_SEQUENCE_MS:
+            pTDStretch->getParameters(NULL, &temp, NULL, NULL);
+            return temp;
+
+        case SETTING_SEEKWINDOW_MS:
+            pTDStretch->getParameters(NULL, NULL, &temp, NULL);
+            return temp;
+
+        case SETTING_OVERLAP_MS:
+            pTDStretch->getParameters(NULL, NULL, NULL, &temp);
+            return temp;
+
+        case SETTING_NOMINAL_INPUT_SEQUENCE :
+            return pTDStretch->getInputSampleReq();
+
+        case SETTING_NOMINAL_OUTPUT_SEQUENCE :
+            return pTDStretch->getOutputBatchSize();
+
+        default :
+            return 0;
+    }
+}
+
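+
+/* Query illustration (editorial sketch, not part of the original sources):
+
+       SoundTouch st;
+       st.setSampleRate(44100);
+       st.setChannels(2);
+       st.setTempo(1.1f);
+       int inSeq  = st.getSetting(SETTING_NOMINAL_INPUT_SEQUENCE);
+       int outSeq = st.getSetting(SETTING_NOMINAL_OUTPUT_SEQUENCE);
+       // approximate per-batch input/output sizes in sample frames,
+       // useful for estimating the pipeline latency
+*/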
+
+// Clears all the samples in the object's output and internal processing
+// buffers.
+void SoundTouch::clear()
+{
+    pRateTransposer->clear();
+    pTDStretch->clear();
+}
+
+
+
+/// Returns number of samples currently unprocessed.
+uint SoundTouch::numUnprocessedSamples() const
+{
+    FIFOSamplePipe *psp;
+    if (pTDStretch)
+    {
+        psp = pTDStretch->getInput();
+        if (psp)
+        {
+            return psp->numSamples();
+        }
+    }
+    return 0;
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sound_touch/SoundTouch.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sound_touch/SoundTouch.h
new file mode 100644
index 0000000..c6af895
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sound_touch/SoundTouch.h
@@ -0,0 +1,277 @@
+//////////////////////////////////////////////////////////////////////////////
+///
+/// SoundTouch - main class for tempo/pitch/rate adjusting routines.
+///
+/// Notes:
+/// - Initialize the SoundTouch object instance by setting up the sound stream
+///   parameters with functions 'setSampleRate' and 'setChannels', then set
+///   desired tempo/pitch/rate settings with the corresponding functions.
+///
+/// - The SoundTouch class behaves like a first-in-first-out pipeline: The
+///   samples that are to be processed are fed into one end of the pipe by
+///   calling function 'putSamples', while the ready processed samples can be
+///   read from the other end of the pipeline with function 'receiveSamples'.
+///
+/// - The SoundTouch processing classes require certain sized 'batches' of
+///   samples in order to process the sound. For this reason the classes buffer
+///   incoming samples until there are enough samples available for
+///   processing, then they carry out the processing step and consequently
+///   make the processed samples available for outputting.
+///
+/// - For the above reason, the processing routines introduce a certain
+///   'latency' between the input and output, so that the samples input to
+///   SoundTouch may not be immediately available in the output, nor is the
+///   amount of outputtable samples necessarily in direct relationship with
+///   the amount of previously input samples.
+///
+/// - The tempo/pitch/rate control parameters can be altered during processing.
+///   Please notice though that they aren't currently protected by semaphores,
+///   so in multi-threaded applications external semaphore protection may be
+///   required.
+///
+/// - This class utilizes classes 'TDStretch' for tempo change (without modifying
+///   pitch) and 'RateTransposer' for changing the playback rate (that is, both
+///   tempo and pitch in the same ratio) of the sound.
+///   The third available control 'pitch' (change pitch but maintain tempo) is
+///   produced by combining the two other controls.
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-12-28 21:32:59 +0200 (Fri, 28 Dec 2012) $
+// File revision : $Revision: 4 $
+//
+// $Id: SoundTouch.h 163 2012-12-28 19:32:59Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#ifndef SoundTouch_H
+#define SoundTouch_H
+
+#include "FIFOSamplePipe.h"
+#include "STTypes.h"
+
+namespace soundtouch
+{
+
+/// Soundtouch library version string
+#define SOUNDTOUCH_VERSION          "1.7.1"
+
+/// SoundTouch library version id
+#define SOUNDTOUCH_VERSION_ID       (10701)
+
+//
+// Available setting IDs for the 'setSetting' & 'get_setting' functions:
+
+/// Enable/disable anti-alias filter in pitch transposer (0 = disable)
+#define SETTING_USE_AA_FILTER       0
+
+/// Pitch transposer anti-alias filter length (8 .. 128 taps, default = 32)
+#define SETTING_AA_FILTER_LENGTH    1
+
+/// Enable/disable quick seeking algorithm in tempo changer routine
+/// (enabling quick seeking lowers CPU utilization but slightly compromises
+/// sound quality)
+#define SETTING_USE_QUICKSEEK       2
+
+/// Time-stretch algorithm single processing sequence length in milliseconds. This determines
+/// how long the sequences are that the original sound is chopped into in the time-stretch algorithm.
+/// See "STTypes.h" or README for more information.
+#define SETTING_SEQUENCE_MS         3
+
+/// Time-stretch algorithm seeking window length in milliseconds for algorithm that finds the
+/// best possible overlapping location. This determines how wide a window the algorithm
+/// may scan for an optimal joining location when mixing the sound sequences back together.
+/// See "STTypes.h" or README for more information.
+#define SETTING_SEEKWINDOW_MS       4
+
+/// Time-stretch algorithm overlap length in milliseconds. When the chopped sound sequences
+/// are mixed back together, to form a continuous sound stream, this parameter defines over
+/// how long a period the two consecutive sequences are allowed to overlap each other.
+/// See "STTypes.h" or README for more information.
+#define SETTING_OVERLAP_MS          5
+
+
+/// Call "getSetting" with this ID to query nominal average processing sequence
+/// size in samples. This value gives the approximate number of input samples
+/// SoundTouch needs to gather before it does a DSP processing run for the sample batch.
+///
+/// Notices:
+/// - This is a read-only parameter, i.e. setSetting ignores this parameter
+/// - Returned value is approximate average value, exact processing batch
+///   size may vary from time to time
+/// - This parameter value is not constant but may change depending on
+///   tempo/pitch/rate/samplerate settings.
+#define SETTING_NOMINAL_INPUT_SEQUENCE      6
+
+
+/// Call "getSetting" with this ID to query nominal average processing output
+/// size in samples. This value gives the approximate number of output samples
+/// SoundTouch outputs once it does a DSP processing run for a batch of input samples.
+///
+/// Notices:
+/// - This is a read-only parameter, i.e. setSetting ignores this parameter
+/// - Returned value is approximate average value, exact processing batch
+///   size may vary from time to time
+/// - This parameter value is not constant but may change depending on
+///   tempo/pitch/rate/samplerate settings.
+#define SETTING_NOMINAL_OUTPUT_SEQUENCE     7
+
+class SoundTouch : public FIFOProcessor
+{
+private:
+    /// Rate transposer class instance
+    class RateTransposer *pRateTransposer;
+
+    /// Time-stretch class instance
+    class TDStretch *pTDStretch;
+
+    /// Virtual rate parameter. Effective rate & tempo are calculated from these parameters.
+    float virtualRate;
+
+    /// Virtual tempo parameter. Effective rate & tempo are calculated from these parameters.
+    float virtualTempo;
+
+    /// Virtual pitch parameter. Effective rate & tempo are calculated from these parameters.
+    float virtualPitch;
+
+    /// Flag: Has sample rate been set?
+    BOOL  bSrateSet;
+
+    /// Calculates effective rate & tempo values from 'virtualRate', 'virtualTempo' and
+    /// 'virtualPitch' parameters.
+    void calcEffectiveRateAndTempo();
+
+protected :
+    /// Number of channels
+    uint  channels;
+
+    /// Effective 'rate' value calculated from 'virtualRate', 'virtualTempo' and 'virtualPitch'
+    float rate;
+
+    /// Effective 'tempo' value calculated from 'virtualRate', 'virtualTempo' and 'virtualPitch'
+    float tempo;
+
+public:
+    SoundTouch();
+    virtual ~SoundTouch();
+
+    /// Get SoundTouch library version string
+    static const char *getVersionString();
+
+    /// Get SoundTouch library version Id
+    static uint getVersionId();
+
+    /// Sets new rate control value. Normal rate = 1.0, smaller values
+    /// represent slower rate, larger faster rates.
+    void setRate(float newRate);
+
+    /// Sets new tempo control value. Normal tempo = 1.0, smaller values
+    /// represent slower tempo, larger faster tempo.
+    void setTempo(float newTempo);
+
+    /// Sets new rate control value as a difference in percents compared
+    /// to the original rate (-50 .. +100 %)
+    void setRateChange(float newRate);
+
+    /// Sets new tempo control value as a difference in percents compared
+    /// to the original tempo (-50 .. +100 %)
+    void setTempoChange(float newTempo);
+
+    /// Sets new pitch control value. Original pitch = 1.0, smaller values
+    /// represent lower pitches, larger values higher pitch.
+    void setPitch(float newPitch);
+
+    /// Sets pitch change in octaves compared to the original pitch
+    /// (-1.00 .. +1.00)
+    void setPitchOctaves(float newPitch);
+
+    /// Sets pitch change in semi-tones compared to the original pitch
+    /// (-12 .. +12)
+    void setPitchSemiTones(int newPitch);
+    void setPitchSemiTones(float newPitch);
+
+    /// Sets the number of channels, 1 = mono, 2 = stereo
+    void setChannels(uint numChannels);
+
+    /// Sets sample rate.
+    void setSampleRate(uint srate);
+
+    /// Flushes the last samples from the processing pipeline to the output.
+    /// Also clears the internal processing buffers.
+    //
+    /// Note: This function is meant for extracting the last samples of a sound
+    /// stream. This function may introduce additional blank samples in the end
+    /// of the sound stream, and thus it's not recommended to call this function
+    /// in the middle of a sound stream.
+    void flush();
+
+    /// Adds 'numSamples' pcs of samples from the 'samples' memory position into
+    /// the input of the object. Notice that sample rate _has_to_ be set before
+    /// calling this function, otherwise throws a runtime_error exception.
+    virtual void putSamples(
+            const SAMPLETYPE *samples,  ///< Pointer to sample buffer.
+            uint numSamples             ///< Number of samples in buffer. Notice
+                                        ///< that in case of stereo-sound a single sample
+                                        ///< contains data for both channels.
+            );
+
+    /// Clears all the samples in the object's output and internal processing
+    /// buffers.
+    virtual void clear();
+
+    /// Changes a setting controlling the processing system behaviour. See the
+    /// 'SETTING_...' defines for available setting ID's.
+    ///
+    /// \return 'TRUE' if the setting was successfully changed
+    BOOL setSetting(int settingId,  ///< Setting ID number. see SETTING_... defines.
+                    int value       ///< New setting value.
+                    );
+
+    /// Reads a setting controlling the processing system behaviour. See the
+    /// 'SETTING_...' defines for available setting ID's.
+    ///
+    /// \return the setting value.
+    int getSetting(int settingId    ///< Setting ID number, see SETTING_... defines.
+                   ) const;
+
+    /// Returns number of samples currently unprocessed.
+    virtual uint numUnprocessedSamples() const;
+
+
+    /// Other handy functions that are implemented in the ancestor classes (see
+    /// classes 'FIFOProcessor' and 'FIFOSamplePipe')
+    ///
+    /// - receiveSamples() : Use this function to receive 'ready' processed samples from SoundTouch.
+    /// - numSamples()     : Get number of 'ready' samples that can be received with
+    ///                      function 'receiveSamples()'
+    /// - isEmpty()        : Returns nonzero if there aren't any 'ready' samples.
+    /// - clear()          : Clears all samples from ready/processing buffers.
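+
+    /* End-to-end usage illustration (editorial sketch, not part of the
+       original header; the I/O helpers are hypothetical):
+
+           soundtouch::SoundTouch st;
+           st.setSampleRate(44100);
+           st.setChannels(2);
+           st.setPitchSemiTones(3);            // shift pitch up, keep tempo
+
+           SAMPLETYPE buf[2 * 512];            // interleaved stereo, 512 frames
+           while (readInput(buf, 512))         // hypothetical source
+           {
+               st.putSamples(buf, 512);
+               uint n;
+               do {
+                   n = st.receiveSamples(buf, 512);
+                   writeOutput(buf, n);        // hypothetical sink
+               } while (n != 0);
+           }
+           st.flush();                         // drain the pipeline tail
+    */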
+};
+
+}
+#endif
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sse_optimized.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sse_optimized.cpp
new file mode 100644
index 0000000..ffb6706
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/sse_optimized.cpp
@@ -0,0 +1,361 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// SSE optimized routines for Pentium-III, Athlon-XP and later CPUs. All SSE
+/// optimized functions have been gathered into this single source
+/// code file, regardless of their class or original source code file, in order
+/// to ease porting the library to other compiler and processor platforms.
+///
+/// The SSE-optimizations are programmed using SSE compiler intrinsics that
+/// are supported both by Microsoft Visual C++ and GCC compilers, so this file
+/// should compile with both toolsets.
+///
+/// NOTICE: If using Visual Studio 6.0, you'll need to install the "Visual C++
+/// 6.0 processor pack" update to support SSE instruction set. The update is
+/// available for download at Microsoft Developers Network, see here:
+/// http://msdn.microsoft.com/en-us/vstudio/aa718349.aspx
+///
+/// If the above URL is expired or removed, go to "http://msdn.microsoft.com" and
+/// perform a search with keywords "processor pack".
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-11-08 20:53:01 +0200 (Thu, 08 Nov 2012) $
+// File revision : $Revision: 4 $
+//
+// $Id: sse_optimized.cpp 160 2012-11-08 18:53:01Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#include "cpu_detect.h"
+#include "STTypes.h"
+
+using namespace soundtouch;
+
+#ifdef SOUNDTOUCH_ALLOW_SSE
+
+// SSE routines available only with float sample type
+
+//////////////////////////////////////////////////////////////////////////////
+//
+// implementation of SSE optimized functions of class 'TDStretchSSE'
+//
+//////////////////////////////////////////////////////////////////////////////
+
+#include "TDStretch.h"
+#include <xmmintrin.h>
+#include <math.h>
+
+// Calculates cross correlation of two buffers
+double TDStretchSSE::calcCrossCorr(const float *pV1, const float *pV2) const
+{
+    int i;
+    const float *pVec1;
+    const __m128 *pVec2;
+    __m128 vSum, vNorm;
+
+    // Note. It means a major slow-down if the routine needs to tolerate
+    // unaligned __m128 memory accesses. It's way faster if we can skip
+    // unaligned slots and use _mm_load_ps instruction instead of _mm_loadu_ps.
+    // This can mean up to ~ 10-fold difference (incl. part of which is
+    // due to skipping every second round for stereo sound though).
+    //
+    // Compile-time define SOUNDTOUCH_ALLOW_NONEXACT_SIMD_OPTIMIZATION is provided
+    // for choosing if this little cheating is allowed.
+
+#ifdef SOUNDTOUCH_ALLOW_NONEXACT_SIMD_OPTIMIZATION
+    // Little cheating allowed, return valid correlation only for
+    // aligned locations, meaning every second round for stereo sound.
+
+    #define _MM_LOAD    _mm_load_ps
+
+    if (((ulongptr)pV1) & 15) return -1e50;    // skip unaligned locations
+
+#else
+    // No cheating allowed, use unaligned load & take the resulting
+    // performance hit.
+    #define _MM_LOAD    _mm_loadu_ps
+#endif
+
+    // ensure overlapLength is divisible by 8
+    assert((overlapLength % 8) == 0);
+
+    // Calculates the cross-correlation value between 'pV1' and 'pV2' vectors
+    // Note: pV2 _must_ be aligned to a 16-byte boundary, pV1 need not.
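+    /* Editorial summary (not part of the original sources): the loop below
+       computes a normalized cross-correlation,
+
+           corr = sum_i(pV1[i] * pV2[i]) / sqrt(sum_i(pV1[i] * pV1[i]))
+
+       accumulating four float lanes at a time in vSum / vNorm and summing
+       the lanes horizontally at the end. */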
+    pVec1 = (const float*)pV1;
+    pVec2 = (const __m128*)pV2;
+    vSum = vNorm = _mm_setzero_ps();
+
+    // Unroll the loop by factor of 4 * 4 operations. Use same routine for
+    // stereo & mono, for mono it just means twice the amount of unrolling.
+    for (i = 0; i < channels * overlapLength / 16; i ++)
+    {
+        __m128 vTemp;
+        // vSum += pV1[0..3] * pV2[0..3]
+        vTemp = _MM_LOAD(pVec1);
+        vSum  = _mm_add_ps(vSum,  _mm_mul_ps(vTemp, pVec2[0]));
+        vNorm = _mm_add_ps(vNorm, _mm_mul_ps(vTemp, vTemp));
+
+        // vSum += pV1[4..7] * pV2[4..7]
+        vTemp = _MM_LOAD(pVec1 + 4);
+        vSum  = _mm_add_ps(vSum,  _mm_mul_ps(vTemp, pVec2[1]));
+        vNorm = _mm_add_ps(vNorm, _mm_mul_ps(vTemp, vTemp));
+
+        // vSum += pV1[8..11] * pV2[8..11]
+        vTemp = _MM_LOAD(pVec1 + 8);
+        vSum  = _mm_add_ps(vSum,  _mm_mul_ps(vTemp, pVec2[2]));
+        vNorm = _mm_add_ps(vNorm, _mm_mul_ps(vTemp, vTemp));
+
+        // vSum += pV1[12..15] * pV2[12..15]
+        vTemp = _MM_LOAD(pVec1 + 12);
+        vSum  = _mm_add_ps(vSum,  _mm_mul_ps(vTemp, pVec2[3]));
+        vNorm = _mm_add_ps(vNorm, _mm_mul_ps(vTemp, vTemp));
+
+        pVec1 += 16;
+        pVec2 += 4;
+    }
+
+    // return value = vSum[0] + vSum[1] + vSum[2] + vSum[3]
+    float *pvNorm = (float*)&vNorm;
+    double norm = sqrt(pvNorm[0] + pvNorm[1] + pvNorm[2] + pvNorm[3]);
+    if (norm < 1e-9) norm = 1.0;    // to avoid div by zero
+
+    float *pvSum = (float*)&vSum;
+    return (double)(pvSum[0] + pvSum[1] + pvSum[2] + pvSum[3]) / norm;
+
+    /* This is approximately the corresponding routine in plain C-language,
+       with normalization:
+    double corr, norm;
+    uint i, j;
+
+    // Calculates the cross-correlation value between 'pV1' and 'pV2' vectors
+    corr = norm = 0.0;
+    for (i = 0; i < channels * overlapLength / 16; i ++)
+    {
+        corr += pV1[0] * pV2[0] +
+                pV1[1] * pV2[1] +
+                pV1[2] * pV2[2] +
+                pV1[3] * pV2[3] +
+                pV1[4] * pV2[4] +
+                pV1[5] * pV2[5] +
+                pV1[6] * pV2[6] +
+                pV1[7] * pV2[7] +
+                pV1[8] * pV2[8] +
+                pV1[9] * pV2[9] +
+                pV1[10] * pV2[10] +
+                pV1[11] * pV2[11] +
+                pV1[12] * pV2[12] +
+                pV1[13] * pV2[13] +
+                pV1[14] * pV2[14] +
+                pV1[15] * pV2[15];
+
+        for (j = 0; j < 16; j ++) norm += pV1[j] * pV1[j];
+
+        pV1 += 16;
+        pV2 += 16;
+    }
+    return corr / sqrt(norm);
+    */
+}
+
+
+//////////////////////////////////////////////////////////////////////////////
+//
+// implementation of SSE optimized functions of class 'FIRFilter'
+//
+//////////////////////////////////////////////////////////////////////////////
+
+#include "FIRFilter.h"
+
+FIRFilterSSE::FIRFilterSSE() : FIRFilter()
+{
+    filterCoeffsAlign = NULL;
+    filterCoeffsUnalign = NULL;
+}
+
+
+FIRFilterSSE::~FIRFilterSSE()
+{
+    delete[] filterCoeffsUnalign;
+    filterCoeffsAlign = NULL;
+    filterCoeffsUnalign = NULL;
+}
+
+
+// (overloaded) Calculates filter coefficients for SSE routine
+void FIRFilterSSE::setCoefficients(const float *coeffs, uint newLength, uint uResultDivFactor)
+{
+    uint i;
+    float fDivider;
+
+    FIRFilter::setCoefficients(coeffs, newLength, uResultDivFactor);
+
+    // Scale the filter coefficients so that it won't be necessary to scale the filtering result
+    // also rearrange coefficients suitably for SSE
+    // Ensure that filter coeffs array is aligned to 16-byte boundary
+    delete[] filterCoeffsUnalign;
+    filterCoeffsUnalign = new float[2 * newLength + 4];
+    filterCoeffsAlign = (float *)SOUNDTOUCH_ALIGN_POINTER_16(filterCoeffsUnalign);
+
+    fDivider = (float)resultDivider;
+
+    // rearrange the filter coefficients for mmx routines
+    for (i = 0; i < newLength; i ++)
+    {
+        filterCoeffsAlign[2 * i + 0] =
+        filterCoeffsAlign[2 * i + 1] = coeffs[i + 0] / fDivider;
+    }
+}
+
+
+
+// SSE-optimized version of
the filter routine for stereo sound +uint FIRFilterSSE::evaluateFilterStereo(float *dest, const float *source, uint numSamples) const +{ + int count = (int)((numSamples - length) & (uint)-2); + int j; + + assert(count % 2 == 0); + + if (count < 2) return 0; + + assert(source != NULL); + assert(dest != NULL); + assert((length % 8) == 0); + assert(filterCoeffsAlign != NULL); + assert(((ulongptr)filterCoeffsAlign) % 16 == 0); + + // filter is evaluated for two stereo samples with each iteration, thus use of 'j += 2' + for (j = 0; j < count; j += 2) + { + const float *pSrc; + const __m128 *pFil; + __m128 sum1, sum2; + uint i; + + pSrc = (const float*)source; // source audio data + pFil = (const __m128*)filterCoeffsAlign; // filter coefficients. NOTE: Assumes coefficients + // are aligned to 16-byte boundary + sum1 = sum2 = _mm_setzero_ps(); + + for (i = 0; i < length / 8; i ++) + { + // Unroll loop for efficiency & calculate filter for 2*2 stereo samples + // at each pass + + // sum1 is accu for 2*2 filtered stereo sound data at the primary sound data offset + // sum2 is accu for 2*2 filtered stereo sound data for the next sound sample offset. + + sum1 = _mm_add_ps(sum1, _mm_mul_ps(_mm_loadu_ps(pSrc) , pFil[0])); + sum2 = _mm_add_ps(sum2, _mm_mul_ps(_mm_loadu_ps(pSrc + 2), pFil[0])); + + sum1 = _mm_add_ps(sum1, _mm_mul_ps(_mm_loadu_ps(pSrc + 4), pFil[1])); + sum2 = _mm_add_ps(sum2, _mm_mul_ps(_mm_loadu_ps(pSrc + 6), pFil[1])); + + sum1 = _mm_add_ps(sum1, _mm_mul_ps(_mm_loadu_ps(pSrc + 8) , pFil[2])); + sum2 = _mm_add_ps(sum2, _mm_mul_ps(_mm_loadu_ps(pSrc + 10), pFil[2])); + + sum1 = _mm_add_ps(sum1, _mm_mul_ps(_mm_loadu_ps(pSrc + 12), pFil[3])); + sum2 = _mm_add_ps(sum2, _mm_mul_ps(_mm_loadu_ps(pSrc + 14), pFil[3])); + + pSrc += 16; + pFil += 4; + } + + // Now sum1 and sum2 both have a filtered 2-channel sample each, but we still need + // to sum the two hi- and lo-floats of these registers together. + + // post-shuffle & add the filtered values and store to dest. + _mm_storeu_ps(dest, _mm_add_ps( + _mm_shuffle_ps(sum1, sum2, _MM_SHUFFLE(1,0,3,2)), // s2_1 s2_0 s1_3 s1_2 + _mm_shuffle_ps(sum1, sum2, _MM_SHUFFLE(3,2,1,0)) // s2_3 s2_2 s1_1 s1_0 + )); + source += 4; + dest += 4; + } + + // Ideas for further improvement: + // 1. If it could be guaranteed that 'source' were always aligned to 16-byte + // boundary, a faster aligned '_mm_load_ps' instruction could be used. + // 2. If it could be guaranteed that 'dest' were always aligned to 16-byte + // boundary, a faster '_mm_store_ps' instruction could be used. + + return (uint)count; + + /* original routine in C-language. please notice the C-version has differently + organized coefficients though. + double suml1, suml2; + double sumr1, sumr2; + uint i, j; + + for (j = 0; j < count; j += 2) + { + const float *ptr; + const float *pFil; + + suml1 = sumr1 = 0.0; + suml2 = sumr2 = 0.0; + ptr = src; + pFil = filterCoeffs; + for (i = 0; i < lengthLocal; i ++) + { + // unroll loop for efficiency. 
+
+            suml1 += ptr[0] * pFil[0] +
+                     ptr[2] * pFil[2] +
+                     ptr[4] * pFil[4] +
+                     ptr[6] * pFil[6];
+
+            sumr1 += ptr[1] * pFil[1] +
+                     ptr[3] * pFil[3] +
+                     ptr[5] * pFil[5] +
+                     ptr[7] * pFil[7];
+
+            suml2 += ptr[8] * pFil[0] +
+                     ptr[10] * pFil[2] +
+                     ptr[12] * pFil[4] +
+                     ptr[14] * pFil[6];
+
+            sumr2 += ptr[9] * pFil[1] +
+                     ptr[11] * pFil[3] +
+                     ptr[13] * pFil[5] +
+                     ptr[15] * pFil[7];
+
+            ptr += 16;
+            pFil += 8;
+        }
+        dest[0] = (float)suml1;
+        dest[1] = (float)sumr1;
+        dest[2] = (float)suml2;
+        dest[3] = (float)sumr2;
+
+        src += 4;
+        dest += 4;
+    }
+    */
+}
+
+#endif  // SOUNDTOUCH_ALLOW_SSE
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/td_stretch/TDStretch.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/td_stretch/TDStretch.cpp
new file mode 100644
index 0000000..fd55e70
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/td_stretch/TDStretch.cpp
@@ -0,0 +1,808 @@
+////////////////////////////////////////////////////////////////////////////////
+///
+/// Sampled sound tempo changer/time stretch algorithm. Changes the sound tempo
+/// while maintaining the original pitch by using a time domain WSOLA-like
+/// method with several performance-increasing tweaks.
+///
+/// Note : MMX optimized functions reside in a separate, platform-specific
+/// file, e.g. 'mmx_win.cpp' or 'mmx_gcc.cpp'
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-11-08 20:53:01 +0200 (Thu, 08 Nov 2012) $
+// File revision : $Revision: 1.12 $
+//
+// $Id: TDStretch.cpp 160 2012-11-08 18:53:01Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#include <string.h>
+#include <limits.h>
+#include <assert.h>
+#include <math.h>
+#include <float.h>
+
+#include "STTypes.h"
+#include "cpu_detect.h"
+#include "TDStretch.h"
+
+#include <stdio.h>
+
+using namespace soundtouch;
+
+#define max(x, y) (((x) > (y)) ? (x) : (y))
+
+
+/*****************************************************************************
+ *
+ * Constant definitions
+ *
+ *****************************************************************************/
+
+// Table for the hierarchical mixing position seeking algorithm
+static const short _scanOffsets[5][24]={
+    { 124,  186,  248,  310,  372,  434,  496,  558,  620,  682,  744, 806,
+      868,  930,  992, 1054, 1116, 1178, 1240, 1302, 1364, 1426, 1488,   0},
+    {-100,  -75,  -50,  -25,   25,   50,   75,  100,    0,    0,    0,   0,
+        0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,   0},
+    { -20,  -15,  -10,   -5,    5,   10,   15,   20,    0,    0,    0,   0,
+        0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,   0},
+    {  -4,   -3,   -2,   -1,    1,    2,    3,    4,    0,    0,    0,   0,
+        0,    0,    0,    0,    0,    0,    0,    0,    0,    0,    0,   0},
+    { 121,  114,   97,  114,   98,  105,  108,   32,  104,   99,  117, 111,
+      116,  100,  110,  117,  111,  115,    0,    0,    0,    0,    0,   0}};
+
+/*****************************************************************************
+ *
+ * Implementation of the class 'TDStretch'
+ *
+ *****************************************************************************/
+
+
+TDStretch::TDStretch() : FIFOProcessor(&outputBuffer)
+{
+    bQuickSeek = FALSE;
+    channels = 2;
+
+    pMidBuffer = NULL;
+    pMidBufferUnaligned = NULL;
+    overlapLength = 0;
+
+    bAutoSeqSetting = TRUE;
+    bAutoSeekSetting = TRUE;
+
+//    outDebt = 0;
+    skipFract = 0;
+
+    tempo = 1.0f;
+    setParameters(44100, DEFAULT_SEQUENCE_MS, DEFAULT_SEEKWINDOW_MS, DEFAULT_OVERLAP_MS);
+    setTempo(1.0f);
+
+    clear();
+}
+
+
+
+TDStretch::~TDStretch()
+{
+    delete[] pMidBufferUnaligned;
+}
+
+
+
+// Sets routine control parameters. These are certain time constants
+// defining how the sound is stretched to the desired duration.
+//
+// 'sampleRate' = sample rate of the sound
+// 'sequenceMS' = one processing sequence length in milliseconds (default = 82 ms)
+// 'seekwindowMS' = seeking window length for scanning the best overlapping
+//      position (default = 28 ms)
+// 'overlapMS' = overlapping length (default = 12 ms)
+
+void TDStretch::setParameters(int aSampleRate, int aSequenceMS,
+                              int aSeekWindowMS, int aOverlapMS)
+{
+    // accept only positive parameter values - if zero or negative, use old values instead
+    if (aSampleRate > 0)   this->sampleRate = aSampleRate;
+    if (aOverlapMS > 0)    this->overlapMs = aOverlapMS;
+
+    if (aSequenceMS > 0)
+    {
+        this->sequenceMs = aSequenceMS;
+        bAutoSeqSetting = FALSE;
+    }
+    else if (aSequenceMS == 0)
+    {
+        // if zero, use automatic setting
+        bAutoSeqSetting = TRUE;
+    }
+
+    if (aSeekWindowMS > 0)
+    {
+        this->seekWindowMs = aSeekWindowMS;
+        bAutoSeekSetting = FALSE;
+    }
+    else if (aSeekWindowMS == 0)
+    {
+        // if zero, use automatic setting
+        bAutoSeekSetting = TRUE;
+    }
+
+    calcSeqParameters();
+
+    calculateOverlapLength(overlapMs);
+
+    // set tempo to recalculate 'sampleReq'
+    setTempo(tempo);
+
+}
+
+
+
+/// Get routine control parameters, see setParameters() function.
+/// Any of the parameters to this function can be NULL, in such case corresponding parameter
+/// value isn't returned.
+void TDStretch::getParameters(int *pSampleRate, int *pSequenceMs, int *pSeekWindowMs, int *pOverlapMs) const
+{
+    if (pSampleRate)
+    {
+        *pSampleRate = sampleRate;
+    }
+
+    if (pSequenceMs)
+    {
+        *pSequenceMs = (bAutoSeqSetting) ? (USE_AUTO_SEQUENCE_LEN) : sequenceMs;
+    }
+
+    if (pSeekWindowMs)
+    {
+        *pSeekWindowMs = (bAutoSeekSetting) ? (USE_AUTO_SEEKWINDOW_LEN) : seekWindowMs;
+    }
+
+    if (pOverlapMs)
+    {
+        *pOverlapMs = overlapMs;
+    }
+}
+
+
+// Overlaps samples in 'midBuffer' with the samples in 'pInput'
+void TDStretch::overlapMono(SAMPLETYPE *pOutput, const SAMPLETYPE *pInput) const
+{
+    int i;
+    SAMPLETYPE m1, m2;
+
+    m1 = (SAMPLETYPE)0;
+    m2 = (SAMPLETYPE)overlapLength;
+
+    for (i = 0; i < overlapLength ; i ++)
+    {
+        pOutput[i] = (SAMPLETYPE)((pInput[i] * m1 + pMidBuffer[i] * m2 ) / overlapLength);
+        m1 += 1;
+        m2 -= 1;
+    }
+}
+
+
+
+void TDStretch::clearMidBuffer()
+{
+    memset(pMidBuffer, 0, 2 * sizeof(SAMPLETYPE) * overlapLength);
+}
+
+
+void TDStretch::clearInput()
+{
+    inputBuffer.clear();
+    clearMidBuffer();
+}
+
+
+// Clears the sample buffers
+void TDStretch::clear()
+{
+    outputBuffer.clear();
+    clearInput();
+}
+
+
+
+// Enables/disables the quick position seeking algorithm. Zero to disable, nonzero
+// to enable
+void TDStretch::enableQuickSeek(BOOL enable)
+{
+    bQuickSeek = enable;
+}
+
+
+// Returns nonzero if the quick seeking algorithm is enabled.
+BOOL TDStretch::isQuickSeekEnabled() const
+{
+    return bQuickSeek;
+}
+
+
+// Seeks for the optimal overlap-mixing position.
+int TDStretch::seekBestOverlapPosition(const SAMPLETYPE *refPos)
+{
+    if (bQuickSeek)
+    {
+        return seekBestOverlapPositionQuick(refPos);
+    }
+    else
+    {
+        return seekBestOverlapPositionFull(refPos);
+    }
+}
+
+
+// Overlaps samples in 'midBuffer' with the samples in 'pInputBuffer' at position
+// of 'ovlPos'.
+inline void TDStretch::overlap(SAMPLETYPE *pOutput, const SAMPLETYPE *pInput, uint ovlPos) const
+{
+    if (channels == 2)
+    {
+        // stereo sound
+        overlapStereo(pOutput, pInput + 2 * ovlPos);
+    } else {
+        // mono sound.
+        overlapMono(pOutput, pInput + ovlPos);
+    }
+}
+
+
+
+// Seeks for the optimal overlap-mixing position. The 'full' version of the
+// routine tests every possible position over the permitted range.
+//
+// The best position is determined as the position where the two overlapped
+// sample sequences are 'most alike', in terms of the highest cross-correlation
+// value over the overlapping period
+int TDStretch::seekBestOverlapPositionFull(const SAMPLETYPE *refPos)
+{
+    int bestOffs;
+    double bestCorr, corr;
+    int i;
+
+    bestCorr = -FLT_MAX;   // start below any possible value (FLT_MIN is the smallest *positive* float)
+    bestOffs = 0;
+
+    // Scans for the best correlation value by testing each possible position
+    // over the permitted range.
+    for (i = 0; i < seekLength; i ++)
+    {
+        // Calculates correlation value for the mixing position corresponding
+        // to 'i'
+        corr = calcCrossCorr(refPos + channels * i, pMidBuffer);
+        // heuristic rule to slightly favour values close to mid of the range
+        double tmp = (double)(2 * i - seekLength) / (double)seekLength;
+        corr = ((corr + 0.1) * (1.0 - 0.25 * tmp * tmp));
+
+        // Checks for the highest correlation value
+        if (corr > bestCorr)
+        {
+            bestCorr = corr;
+            bestOffs = i;
+        }
+    }
+    // clear cross correlation routine state if necessary (is so e.g. in MMX routines).
+    clearCrossCorrState();
+
+    return bestOffs;
+}
+
+
+// Seeks for the optimal overlap-mixing position. The 'quick' version of the
+// routine uses a hierarchical search instead of scanning every position.
+//
+// The best position is determined as the position where the two overlapped
+// sample sequences are 'most alike', in terms of the highest cross-correlation
+// value over the overlapping period
+int TDStretch::seekBestOverlapPositionQuick(const SAMPLETYPE *refPos)
+{
+    int j;
+    int bestOffs;
+    double bestCorr, corr;
+    int scanCount, corrOffset, tempOffset;
+
+    bestCorr = -FLT_MAX;   // start below any possible value (FLT_MIN is the smallest *positive* float)
+    bestOffs = _scanOffsets[0][0];
+    corrOffset = 0;
+    tempOffset = 0;
+
+    // Scans for the best correlation value using four-pass hierarchical search.
+    //
+    // The look-up table 'scans' has hierarchical position adjusting steps.
+    // In the first pass the routine searches for the highest correlation with
+    // relatively coarse steps, then rescans the neighbourhood of the highest
+    // correlation with better resolution and so on.
+    for (scanCount = 0; scanCount < 4; scanCount ++)
+    {
+        j = 0;
+        while (_scanOffsets[scanCount][j])
+        {
+            tempOffset = corrOffset + _scanOffsets[scanCount][j];
+            if (tempOffset >= seekLength) break;
+
+            // Calculates correlation value for the mixing position corresponding
+            // to 'tempOffset'
+            corr = (double)calcCrossCorr(refPos + channels * tempOffset, pMidBuffer);
+            // heuristic rule to slightly favour values close to mid of the range
+            double tmp = (double)(2 * tempOffset - seekLength) / seekLength;
+            corr = ((corr + 0.1) * (1.0 - 0.25 * tmp * tmp));
+
+            // Checks for the highest correlation value
+            if (corr > bestCorr)
+            {
+                bestCorr = corr;
+                bestOffs = tempOffset;
+            }
+            j ++;
+        }
+        corrOffset = bestOffs;
+    }
+    // clear cross correlation routine state if necessary (is so e.g. in MMX routines).
+    clearCrossCorrState();
+
+    return bestOffs;
+}
+
+
+
+/// clear cross correlation routine state if necessary
+void TDStretch::clearCrossCorrState()
+{
+    // default implementation is empty.
+}
+
+
+/// Calculates processing sequence length according to tempo setting
+void TDStretch::calcSeqParameters()
+{
+    // Adjust tempo param according to tempo, so that a varying processing sequence length is used
+    // at various tempo settings, between the given low...top limits
+    #define AUTOSEQ_TEMPO_LOW   0.5     // auto setting low tempo range (-50%)
+    #define AUTOSEQ_TEMPO_TOP   2.0     // auto setting top tempo range (+100%)
+
+    // sequence-ms setting values at above low & top tempo
+    #define AUTOSEQ_AT_MIN      125.0
+    #define AUTOSEQ_AT_MAX      50.0
+    #define AUTOSEQ_K           ((AUTOSEQ_AT_MAX - AUTOSEQ_AT_MIN) / (AUTOSEQ_TEMPO_TOP - AUTOSEQ_TEMPO_LOW))
+    #define AUTOSEQ_C           (AUTOSEQ_AT_MIN - (AUTOSEQ_K) * (AUTOSEQ_TEMPO_LOW))
+
+    // seek-window-ms setting values at above low & top tempo
+    #define AUTOSEEK_AT_MIN     25.0
+    #define AUTOSEEK_AT_MAX     15.0
+    #define AUTOSEEK_K          ((AUTOSEEK_AT_MAX - AUTOSEEK_AT_MIN) / (AUTOSEQ_TEMPO_TOP - AUTOSEQ_TEMPO_LOW))
+    #define AUTOSEEK_C          (AUTOSEEK_AT_MIN - (AUTOSEEK_K) * (AUTOSEQ_TEMPO_LOW))
+
+    #define CHECK_LIMITS(x, mi, ma) (((x) < (mi)) ? (mi) : (((x) > (ma)) ? (ma) : (x)))
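+    /* Worked example of the linear mapping above (editorial note): with
+       AUTOSEQ_K = (50 - 125) / (2.0 - 0.5) = -50 and
+       AUTOSEQ_C = 125 - (-50) * 0.5 = 150, the automatic sequence length is
+       seq(tempo) = 150 - 50 * tempo, i.e. 125 ms at tempo 0.5, 100 ms at
+       tempo 1.0 and 50 ms at tempo 2.0, clamped to [50, 125] outside that
+       tempo range. */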
+
+    double seq, seek;
+
+    if (bAutoSeqSetting)
+    {
+        seq = AUTOSEQ_C + AUTOSEQ_K * tempo;
+        seq = CHECK_LIMITS(seq, AUTOSEQ_AT_MAX, AUTOSEQ_AT_MIN);
+        sequenceMs = (int)(seq + 0.5);
+    }
+
+    if (bAutoSeekSetting)
+    {
+        seek = AUTOSEEK_C + AUTOSEEK_K * tempo;
+        seek = CHECK_LIMITS(seek, AUTOSEEK_AT_MAX, AUTOSEEK_AT_MIN);
+        seekWindowMs = (int)(seek + 0.5);
+    }
+
+    // Update seek window lengths
+    seekWindowLength = (sampleRate * sequenceMs) / 1000;
+    if (seekWindowLength < 2 * overlapLength)
+    {
+        seekWindowLength = 2 * overlapLength;
+    }
+    seekLength = (sampleRate * seekWindowMs) / 1000;
+}
+
+
+
+// Sets new target tempo. Normal tempo = 'SCALE', smaller values represent slower
+// tempo, larger values a faster tempo.
+void TDStretch::setTempo(float newTempo)
+{
+    int intskip;
+
+    tempo = newTempo;
+
+    // Calculate new sequence duration
+    calcSeqParameters();
+
+    // Calculate ideal skip length (according to tempo value)
+    nominalSkip = tempo * (seekWindowLength - overlapLength);
+    intskip = (int)(nominalSkip + 0.5f);
+
+    // Calculate how many samples are needed in the 'inputBuffer' to
+    // process another batch of samples
+    //sampleReq = max(intskip + overlapLength, seekWindowLength) + seekLength / 2;
+    sampleReq = max(intskip + overlapLength, seekWindowLength) + seekLength;
+}
+
+
+
+// Sets the number of channels, 1 = mono, 2 = stereo
+void TDStretch::setChannels(int numChannels)
+{
+    assert(numChannels > 0);
+    if (channels == numChannels) return;
+    assert(numChannels == 1 || numChannels == 2);
+
+    channels = numChannels;
+    inputBuffer.setChannels(channels);
+    outputBuffer.setChannels(channels);
+}
+
+
+// nominal tempo, no need for processing, just pass the samples through
+// to outputBuffer
+/*
+void TDStretch::processNominalTempo()
+{
+    assert(tempo == 1.0f);
+
+    if (bMidBufferDirty)
+    {
+        // If there are samples in pMidBuffer waiting for overlapping,
+        // do a single sliding overlapping with them in order to prevent a
+        // clicking distortion in the output sound
+        if (inputBuffer.numSamples() < overlapLength)
+        {
+            // wait until we've got overlapLength input samples
+            return;
+        }
+        // Mix the samples in the beginning of 'inputBuffer' with the
+        // samples in 'midBuffer' using sliding overlapping
+        overlap(outputBuffer.ptrEnd(overlapLength), inputBuffer.ptrBegin(), 0);
+        outputBuffer.putSamples(overlapLength);
+        inputBuffer.receiveSamples(overlapLength);
+        clearMidBuffer();
+        // now we've caught the nominal sample flow and may switch to
+        // bypass mode
+    }
+
+    // Simply bypass samples from input to output
+    outputBuffer.moveSamples(inputBuffer);
+}
+*/
+
+#include <stdio.h>
+
+// Processes as many processing frames of the samples in 'inputBuffer' as
+// possible, and stores the result into 'outputBuffer'
+void TDStretch::processSamples()
+{
+    int ovlSkip, offset;
+    int temp;
+
+    /* Removed this small optimization - can introduce a click to the sound when the
+       tempo setting crosses the nominal value
+    if (tempo == 1.0f)
+    {
+        // tempo not changed from the original, so bypass the processing
+        processNominalTempo();
+        return;
+    }
+    */
+
+    // process samples as long as there are enough samples in 'inputBuffer'
+    // to form a processing frame.
+    while ((int)inputBuffer.numSamples() >= sampleReq)
+    {
+        // If tempo differs from the normal ('SCALE'), scan for the best overlapping
+        // position
+        offset = seekBestOverlapPosition(inputBuffer.ptrBegin());
+
+        // Mix the samples in the 'inputBuffer' at position of 'offset' with the
+        // samples in 'midBuffer' using sliding overlapping
+        // ...
first partially overlap with the end of the previous sequence + // (that's in 'midBuffer') + overlap(outputBuffer.ptrEnd((uint)overlapLength), inputBuffer.ptrBegin(), (uint)offset); + outputBuffer.putSamples((uint)overlapLength); + + // ... then copy sequence samples from 'inputBuffer' to output: + + // length of sequence + temp = (seekWindowLength - 2 * overlapLength); + + // crosscheck that we don't have buffer overflow... + if ((int)inputBuffer.numSamples() < (offset + temp + overlapLength * 2)) + { + continue; // just in case, shouldn't really happen + } + + outputBuffer.putSamples(inputBuffer.ptrBegin() + channels * (offset + overlapLength), (uint)temp); + + // Copies the end of the current sequence from 'inputBuffer' to + // 'midBuffer' for being mixed with the beginning of the next + // processing sequence and so on + assert((offset + temp + overlapLength * 2) <= (int)inputBuffer.numSamples()); + memcpy(pMidBuffer, inputBuffer.ptrBegin() + channels * (offset + temp + overlapLength), + channels * sizeof(SAMPLETYPE) * overlapLength); + + // Remove the processed samples from the input buffer. Update + // the difference between integer & nominal skip step to 'skipFract' + // in order to prevent the error from accumulating over time. + skipFract += nominalSkip; // real skip size + ovlSkip = (int)skipFract; // rounded to integer skip + skipFract -= ovlSkip; // maintain the fraction part, i.e. real vs. integer skip + inputBuffer.receiveSamples((uint)ovlSkip); + } +} + + +// Adds 'numsamples' pcs of samples from the 'samples' memory position into +// the input of the object. +void TDStretch::putSamples(const SAMPLETYPE *samples, uint nSamples) +{ + // Add the samples into the input buffer + inputBuffer.putSamples(samples, nSamples); + // process the samples in input buffer + processSamples(); +} + + + +/// Set new overlap length parameter & reallocate RefMidBuffer if necessary. +void TDStretch::acceptNewOverlapLength(int newOverlapLength) +{ + int prevOvl; + + assert(newOverlapLength >= 0); + prevOvl = overlapLength; + overlapLength = newOverlapLength; + + if (overlapLength > prevOvl) + { + delete[] pMidBufferUnaligned; + + pMidBufferUnaligned = new SAMPLETYPE[overlapLength * 2 + 16 / sizeof(SAMPLETYPE)]; + // ensure that 'pMidBuffer' is aligned to 16 byte boundary for efficiency + pMidBuffer = (SAMPLETYPE *)SOUNDTOUCH_ALIGN_POINTER_16(pMidBufferUnaligned); + + clearMidBuffer(); + } +} + + +// Operator 'new' is overloaded so that it automatically creates a suitable instance +// depending on if we've a MMX/SSE/etc-capable CPU available or not. +void * TDStretch::operator new(size_t s) +{ + // Notice! don't use "new TDStretch" directly, use "newInstance" to create a new instance instead! 
+ ST_THROW_RT_ERROR("Error in TDStretch::new: Don't use 'new TDStretch' directly, use 'newInstance' member instead!"); + return newInstance(); +} + + +TDStretch * TDStretch::newInstance() +{ + uint uExtensions; + + uExtensions = detectCPUextensions(); + + // Check if MMX/SSE instruction set extensions supported by CPU + +#ifdef SOUNDTOUCH_ALLOW_MMX + // MMX routines available only with integer sample types + if (uExtensions & SUPPORT_MMX) + { + return ::new TDStretchMMX; + } + else +#endif // SOUNDTOUCH_ALLOW_MMX + + +#ifdef SOUNDTOUCH_ALLOW_SSE + if (uExtensions & SUPPORT_SSE) + { + // SSE support + return ::new TDStretchSSE; + } + else +#endif // SOUNDTOUCH_ALLOW_SSE + + { + // ISA optimizations not supported, use plain C version + return ::new TDStretch; + } +} + + +////////////////////////////////////////////////////////////////////////////// +// +// Integer arithmetics specific algorithm implementations. +// +////////////////////////////////////////////////////////////////////////////// + +#ifdef SOUNDTOUCH_INTEGER_SAMPLES + +// Overlaps samples in 'midBuffer' with the samples in 'input'. The 'Stereo' +// version of the routine. +void TDStretch::overlapStereo(short *poutput, const short *input) const +{ + int i; + short temp; + int cnt2; + + for (i = 0; i < overlapLength ; i ++) + { + temp = (short)(overlapLength - i); + cnt2 = 2 * i; + poutput[cnt2] = (short)((input[cnt2] * i + pMidBuffer[cnt2] * temp ) / overlapLength); + poutput[cnt2 + 1] = (short)((input[cnt2 + 1] * i + pMidBuffer[cnt2 + 1] * temp ) / overlapLength); + } +} + +// Calculates the x having the closest 2^x value for the given value +static int _getClosest2Power(double value) +{ + return (int)(log(value) / log(2.0) + 0.5); +} + + +/// Calculates overlap period length in samples. +/// Integer version rounds overlap length to closest power of 2 +/// for a divide scaling operation. +void TDStretch::calculateOverlapLength(int aoverlapMs) +{ + int newOvl; + + assert(aoverlapMs >= 0); + + // calculate overlap length so that it's power of 2 - thus it's easy to do + // integer division by right-shifting. Term "-1" at end is to account for + // the extra most significatnt bit left unused in result by signed multiplication + overlapDividerBits = _getClosest2Power((sampleRate * aoverlapMs) / 1000.0) - 1; + if (overlapDividerBits > 9) overlapDividerBits = 9; + if (overlapDividerBits < 3) overlapDividerBits = 3; + newOvl = (int)pow(2.0, (int)overlapDividerBits + 1); // +1 => account for -1 above + + acceptNewOverlapLength(newOvl); + + // calculate sloping divider so that crosscorrelation operation won't + // overflow 32-bit register. Max. sum of the crosscorrelation sum without + // divider would be 2^30*(N^3-N)/3, where N = overlap length + slopingDivider = (newOvl * newOvl - 1) / 3; +} + + +double TDStretch::calcCrossCorr(const short *mixingPos, const short *compare) const +{ + long corr; + long norm; + int i; + + corr = norm = 0; + // Same routine for stereo and mono. For stereo, unroll loop for better + // efficiency and gives slightly better resolution against rounding. 
+ // For mono it same routine, just unrolls loop by factor of 4 + for (i = 0; i < channels * overlapLength; i += 4) + { + corr += (mixingPos[i] * compare[i] + + mixingPos[i + 1] * compare[i + 1] + + mixingPos[i + 2] * compare[i + 2] + + mixingPos[i + 3] * compare[i + 3]) >> overlapDividerBits; + norm += (mixingPos[i] * mixingPos[i] + + mixingPos[i + 1] * mixingPos[i + 1] + + mixingPos[i + 2] * mixingPos[i + 2] + + mixingPos[i + 3] * mixingPos[i + 3]) >> overlapDividerBits; + } + + // Normalize result by dividing by sqrt(norm) - this step is easiest + // done using floating point operation + if (norm == 0) norm = 1; // to avoid div by zero + return (double)corr / sqrt((double)norm); +} + +#endif // SOUNDTOUCH_INTEGER_SAMPLES + +////////////////////////////////////////////////////////////////////////////// +// +// Floating point arithmetics specific algorithm implementations. +// + +#ifdef SOUNDTOUCH_FLOAT_SAMPLES + +// Overlaps samples in 'midBuffer' with the samples in 'pInput' +void TDStretch::overlapStereo(float *pOutput, const float *pInput) const +{ + int i; + float fScale; + float f1; + float f2; + + fScale = 1.0f / (float)overlapLength; + + f1 = 0; + f2 = 1.0f; + + for (i = 0; i < 2 * (int)overlapLength ; i += 2) + { + pOutput[i + 0] = pInput[i + 0] * f1 + pMidBuffer[i + 0] * f2; + pOutput[i + 1] = pInput[i + 1] * f1 + pMidBuffer[i + 1] * f2; + + f1 += fScale; + f2 -= fScale; + } +} + + +/// Calculates overlapInMsec period length in samples. +void TDStretch::calculateOverlapLength(int overlapInMsec) +{ + int newOvl; + + assert(overlapInMsec >= 0); + newOvl = (sampleRate * overlapInMsec) / 1000; + if (newOvl < 16) newOvl = 16; + + // must be divisible by 8 + newOvl -= newOvl % 8; + + acceptNewOverlapLength(newOvl); +} + + +double TDStretch::calcCrossCorr(const float *mixingPos, const float *compare) const +{ + double corr; + double norm; + int i; + + corr = norm = 0; + // Same routine for stereo and mono. For Stereo, unroll by factor of 2. + // For mono it's same routine yet unrollsd by factor of 4. + for (i = 0; i < channels * overlapLength; i += 4) + { + corr += mixingPos[i] * compare[i] + + mixingPos[i + 1] * compare[i + 1]; + + norm += mixingPos[i] * mixingPos[i] + + mixingPos[i + 1] * mixingPos[i + 1]; + + // unroll the loop for better CPU efficiency: + corr += mixingPos[i + 2] * compare[i + 2] + + mixingPos[i + 3] * compare[i + 3]; + + norm += mixingPos[i + 2] * mixingPos[i + 2] + + mixingPos[i + 3] * mixingPos[i + 3]; + } + + if (norm < 1e-9) norm = 1.0; // to avoid div by zero + return corr / sqrt(norm); +} + +#endif // SOUNDTOUCH_FLOAT_SAMPLES diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/td_stretch/TDStretch.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/td_stretch/TDStretch.h new file mode 100644 index 0000000..6d6e735 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/tone_shift/src/td_stretch/TDStretch.h @@ -0,0 +1,268 @@ +//////////////////////////////////////////////////////////////////////////////// +/// +/// Sampled sound tempo changer/time stretch algorithm. Changes the sound tempo +/// while maintaining the original pitch by using a time domain WSOLA-like method +/// with several performance-increasing tweaks. 
+///
+/// Note : MMX/SSE optimized functions reside in separate, platform-specific files
+/// 'mmx_optimized.cpp' and 'sse_optimized.cpp'
+///
+/// Author        : Copyright (c) Olli Parviainen
+/// Author e-mail : oparviai 'at' iki.fi
+/// SoundTouch WWW: http://www.surina.net/soundtouch
+///
+////////////////////////////////////////////////////////////////////////////////
+//
+// Last changed  : $Date: 2012-04-01 22:49:30 +0300 (Sun, 01 Apr 2012) $
+// File revision : $Revision: 4 $
+//
+// $Id: TDStretch.h 137 2012-04-01 19:49:30Z oparviai $
+//
+////////////////////////////////////////////////////////////////////////////////
+//
+// License :
+//
+//  SoundTouch audio processing library
+//  Copyright (c) Olli Parviainen
+//
+//  This library is free software; you can redistribute it and/or
+//  modify it under the terms of the GNU Lesser General Public
+//  License as published by the Free Software Foundation; either
+//  version 2.1 of the License, or (at your option) any later version.
+//
+//  This library is distributed in the hope that it will be useful,
+//  but WITHOUT ANY WARRANTY; without even the implied warranty of
+//  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+//  Lesser General Public License for more details.
+//
+//  You should have received a copy of the GNU Lesser General Public
+//  License along with this library; if not, write to the Free Software
+//  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+//
+////////////////////////////////////////////////////////////////////////////////
+
+#ifndef TDStretch_H
+#define TDStretch_H
+
+#include <stddef.h>
+#include "STTypes.h"
+#include "RateTransposer.h"
+#include "FIFOSamplePipe.h"
+
+namespace soundtouch
+{
+
+/// Default values for sound processing parameters:
+/// Notice that the default parameters are tuned for contemporary popular music
+/// processing. For speech processing applications these parameters suit better:
+///     #define DEFAULT_SEQUENCE_MS     40
+///     #define DEFAULT_SEEKWINDOW_MS   15
+///     #define DEFAULT_OVERLAP_MS      8
+///
+
+/// Default length of a single processing sequence, in milliseconds. This determines
+/// how long the sequences are into which the original sound is chopped by the
+/// time-stretch algorithm.
+///
+/// The larger this value is, the fewer sequences are used in processing. In principle
+/// a bigger value sounds better when slowing down the tempo, but worse when increasing
+/// the tempo, and vice versa.
+///
+/// Increasing this value reduces computational burden & vice versa.
+//#define DEFAULT_SEQUENCE_MS     40
+#define DEFAULT_SEQUENCE_MS     USE_AUTO_SEQUENCE_LEN
+
+/// Giving this value for the sequence length sets automatic parameter value
+/// according to tempo setting (recommended)
+#define USE_AUTO_SEQUENCE_LEN   0
+
+/// Seeking window default length in milliseconds for the algorithm that finds the
+/// best possible overlapping location. This determines how wide a window the
+/// algorithm may scan for an optimal joining location when mixing the sound
+/// sequences back together.
+///
+/// The bigger this window setting is, the higher the possibility to find a better mixing
+/// position will become, but at the same time large values may cause a "drifting" artifact
+/// because consecutive sequences will be taken at more uneven intervals.
+///
+/// If there's a disturbing artifact that sounds as if a constant frequency were drifting
+/// around, try reducing this setting.
+///
+/// Increasing this value increases computational burden & vice versa.
+//#define DEFAULT_SEEKWINDOW_MS 15 +#define DEFAULT_SEEKWINDOW_MS USE_AUTO_SEEKWINDOW_LEN + +/// Giving this value for the seek window length sets automatic parameter value +/// according to tempo setting (recommended) +#define USE_AUTO_SEEKWINDOW_LEN 0 + +/// Overlap length in milliseconds. When the chopped sound sequences are mixed back together, +/// to form a continuous sound stream, this parameter defines over how long period the two +/// consecutive sequences are let to overlap each other. +/// +/// This shouldn't be that critical parameter. If you reduce the DEFAULT_SEQUENCE_MS setting +/// by a large amount, you might wish to try a smaller value on this. +/// +/// Increasing this value increases computational burden & vice versa. +#define DEFAULT_OVERLAP_MS 8 + + +/// Class that does the time-stretch (tempo change) effect for the processed +/// sound. +class TDStretch : public FIFOProcessor +{ +protected: + int channels; + int sampleReq; + float tempo; + + SAMPLETYPE *pMidBuffer; + SAMPLETYPE *pMidBufferUnaligned; + int overlapLength; + int seekLength; + int seekWindowLength; + int overlapDividerBits; + int slopingDivider; + float nominalSkip; + float skipFract; + FIFOSampleBuffer outputBuffer; + FIFOSampleBuffer inputBuffer; + BOOL bQuickSeek; + + int sampleRate; + int sequenceMs; + int seekWindowMs; + int overlapMs; + BOOL bAutoSeqSetting; + BOOL bAutoSeekSetting; + + void acceptNewOverlapLength(int newOverlapLength); + + virtual void clearCrossCorrState(); + void calculateOverlapLength(int overlapMs); + + virtual double calcCrossCorr(const SAMPLETYPE *mixingPos, const SAMPLETYPE *compare) const; + + virtual int seekBestOverlapPositionFull(const SAMPLETYPE *refPos); + virtual int seekBestOverlapPositionQuick(const SAMPLETYPE *refPos); + int seekBestOverlapPosition(const SAMPLETYPE *refPos); + + virtual void overlapStereo(SAMPLETYPE *output, const SAMPLETYPE *input) const; + virtual void overlapMono(SAMPLETYPE *output, const SAMPLETYPE *input) const; + + void clearMidBuffer(); + void overlap(SAMPLETYPE *output, const SAMPLETYPE *input, uint ovlPos) const; + + void calcSeqParameters(); + + /// Changes the tempo of the given sound samples. + /// Returns amount of samples returned in the "output" buffer. + /// The maximum amount of samples that can be returned at a time is set by + /// the 'set_returnBuffer_size' function. + void processSamples(); + +public: + TDStretch(); + virtual ~TDStretch(); + + /// Operator 'new' is overloaded so that it automatically creates a suitable instance + /// depending on if we've a MMX/SSE/etc-capable CPU available or not. + static void *operator new(size_t s); + + /// Use this function instead of "new" operator to create a new instance of this class. + /// This function automatically chooses a correct feature set depending on if the CPU + /// supports MMX/SSE/etc extensions. + static TDStretch *newInstance(); + + /// Returns the output buffer object + FIFOSamplePipe *getOutput() { return &outputBuffer; }; + + /// Returns the input buffer object + FIFOSamplePipe *getInput() { return &inputBuffer; }; + + /// Sets new target tempo. Normal tempo = 'SCALE', smaller values represent slower + /// tempo, larger faster tempo. + void setTempo(float newTempo); + + /// Returns nonzero if there aren't any samples available for outputting. 
+ virtual void clear(); + + /// Clears the input buffer + void clearInput(); + + /// Sets the number of channels, 1 = mono, 2 = stereo + void setChannels(int numChannels); + + /// Enables/disables the quick position seeking algorithm. Zero to disable, + /// nonzero to enable + void enableQuickSeek(BOOL enable); + + /// Returns nonzero if the quick seeking algorithm is enabled. + BOOL isQuickSeekEnabled() const; + + /// Sets routine control parameters. These control are certain time constants + /// defining how the sound is stretched to the desired duration. + // + /// 'sampleRate' = sample rate of the sound + /// 'sequenceMS' = one processing sequence length in milliseconds + /// 'seekwindowMS' = seeking window length for scanning the best overlapping + /// position + /// 'overlapMS' = overlapping length + void setParameters(int sampleRate, ///< Samplerate of sound being processed (Hz) + int sequenceMS = -1, ///< Single processing sequence length (ms) + int seekwindowMS = -1, ///< Offset seeking window length (ms) + int overlapMS = -1 ///< Sequence overlapping length (ms) + ); + + /// Get routine control parameters, see setParameters() function. + /// Any of the parameters to this function can be NULL, in such case corresponding parameter + /// value isn't returned. + void getParameters(int *pSampleRate, int *pSequenceMs, int *pSeekWindowMs, int *pOverlapMs) const; + + /// Adds 'numsamples' pcs of samples from the 'samples' memory position into + /// the input of the object. + virtual void putSamples( + const SAMPLETYPE *samples, ///< Input sample data + uint numSamples ///< Number of samples in 'samples' so that one sample + ///< contains both channels if stereo + ); + + /// return nominal input sample requirement for triggering a processing batch + int getInputSampleReq() const + { + return (int)(nominalSkip + 0.5); + } + + /// return nominal output sample amount when running a processing batch + int getOutputBatchSize() const + { + return seekWindowLength - overlapLength; + } +}; + + + +// Implementation-specific class declarations: + +#ifdef SOUNDTOUCH_ALLOW_MMX + /// Class that implements MMX optimized routines for 16bit integer samples type. + class TDStretchMMX : public TDStretch + { + protected: + double calcCrossCorr(const short *mixingPos, const short *compare) const; + virtual void overlapStereo(short *output, const short *input) const; + virtual void clearCrossCorrState(); + }; +#endif /// SOUNDTOUCH_ALLOW_MMX + + +#ifdef SOUNDTOUCH_ALLOW_SSE + /// Class that implements SSE optimized routines for floating point samples type. 
+    class TDStretchSSE : public TDStretch
+    {
+    protected:
+        double calcCrossCorr(const float *mixingPos, const float *compare) const;
+    };
+
+#endif /// SOUNDTOUCH_ALLOW_SSE
+
+}
+#endif /// TDStretch_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/CMakeLists.txt
new file mode 100644
index 0000000..fc1cfe0
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/CMakeLists.txt
@@ -0,0 +1,4 @@
+include_directories(inc)
+AUX_SOURCE_DIRECTORY(src DIR_WAVES_SRCS)
+add_library(waves ${DIR_WAVES_SRCS})
+#set_target_properties(waves PROPERTIES CXX_VISIBILITY_PRESET hidden)
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/inc/ExtraMono.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/inc/ExtraMono.h
new file mode 100755
index 0000000..280fab0
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/inc/ExtraMono.h
@@ -0,0 +1,230 @@
+
+#include <stdio.h>
+#include <string.h>
+#include <string>
+
+#define SIZE_LONG 4
+#define SIZE_SHORT 2
+
+#define SIZE_FLAG 4
+#define FMT_TAG 0x0001
+
+#define BITS_PER_BYTE 8
+
+#ifndef AFS_CMPL_MAX_WAV
+#define AFS_CMPL_MAX_WAV 15360000 // max duration 16 minutes (960 * 16000)
+#endif
+
+//+---------------------------------------------------------------------------+
+//+ Read one 32-bit value from the file
+//+---------------------------------------------------------------------------+
+unsigned long fa_read_u32(FILE* fp)
+{
+    unsigned long cx;
+    unsigned char temp[SIZE_LONG];
+
+    fread(temp, sizeof(unsigned char), SIZE_LONG, fp);
+    cx = (unsigned long)temp[0];
+    cx |= (unsigned long)temp[1] << 8;
+    cx |= (unsigned long)temp[2] << 16;
+    cx |= (unsigned long)temp[3] << 24;
+    return cx;
+}
+
+//+---------------------------------------------------------------------------+
+//+ Read one 16-bit value from the file
+//+---------------------------------------------------------------------------+
+unsigned short fa_read_u16(FILE *fp)
+{
+    unsigned short cx;
+    unsigned char temp[SIZE_SHORT];
+
+    fread(temp, sizeof(unsigned char), SIZE_SHORT, fp);
+    cx = temp[0] | (temp[1] * 256);
+    return cx;
+}
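+
+// Note: both helpers decode little-endian values, the byte order used throughout
+// RIFF/WAVE files; e.g. the byte sequence 10 00 00 00 decodes to 0x00000010 = 16,
+// the body size of a standard PCM "fmt " chunk.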
+int GetWaveHeadLen(const char* pszFile, unsigned short &channels, int &nPos, int& nLength)
+{
+    //+---------------------------------------------------------------------------+
+    //+ Read the WAVE header information
+    //+---------------------------------------------------------------------------+
+    unsigned char temp[SIZE_FLAG];
+    unsigned short bits_per_sample;
+    unsigned long x_size;
+    unsigned long n_skip;
+
+    unsigned short format;
+    //unsigned short channels;
+    unsigned long sample_rate;
+    unsigned short block_align;
+    unsigned long data_size;
+    int nCnt = 0;
+
+    /* Read the common header fields */
+    FILE* pWavFile = fopen(pszFile, "rb");
+    if ( pWavFile == NULL )
+    {
+        printf("Input file can not be opened!\n");
+        return -1;
+    }
+
+    fseek(pWavFile, 0, SEEK_END );
+    nLength = ftell(pWavFile);
+    fseek(pWavFile, 0, SEEK_SET );
+
+    // Check that the resource tag is "RIFF"
+    fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    if ( memcmp(temp, "RIFF", (size_t)SIZE_FLAG) != 0 )
+    {
+        fprintf(stderr, "Resource flag is not RIFF!\n");
+        fclose(pWavFile);
+
+        return -1;
+    }
+    nCnt += SIZE_FLAG;
+
+    fseek(pWavFile, SIZE_LONG, SEEK_CUR);
+    nCnt += SIZE_LONG;
+
+    // Check that the file tag is "WAVE"
+    fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    if ( memcmp(temp, "WAVE", (size_t)SIZE_FLAG) != 0 )
+    {
+        fprintf(stderr, "File flag is not WAVE\n");
+        fclose(pWavFile);
+
+        return -1;
+    }
+    nCnt += SIZE_FLAG;
+
+    // Check that the format tag is "fmt "
+    fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    if ( memcmp(temp, "fmt ", (size_t)SIZE_FLAG) != 0 )
+    {
+        fprintf(stderr, "Format flag is not FMT!\n");
+        fclose(pWavFile);
+
+        return -1;
+    }
+    nCnt += SIZE_FLAG;
+
+    x_size = fa_read_u32(pWavFile);
+    nCnt += SIZE_LONG;
+
+    // Check that the encoding format is 0x0001 (plain PCM)
+    format = fa_read_u16(pWavFile);
+    nCnt += SIZE_SHORT;
+    if ( format != FMT_TAG )
+    {
+        fprintf(stderr, "Encoding format is not 0x0001!\n");
+        fclose(pWavFile);
+
+        return -1;
+    }
+
+    // Read the channel count and the sample rate
+    channels = fa_read_u16(pWavFile);
+    sample_rate = fa_read_u32(pWavFile);
+
+    fseek(pWavFile, SIZE_LONG, SEEK_CUR);
+
+    // Read the block alignment and the bits per sample
+    block_align = fa_read_u16(pWavFile);
+    bits_per_sample = fa_read_u16(pWavFile);
+
+    /* Skip any extra fmt bytes */
+    x_size -= (4*SIZE_SHORT + 2*SIZE_LONG);
+    if ( x_size != 0 )
+    {
+        fseek(pWavFile, x_size, SEEK_CUR);
+    }
+
+    // Locate the "data" chunk and read the data size
+    fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    while ( memcmp(temp, "data", SIZE_FLAG) != 0 )
+    {
+        n_skip = fa_read_u32(pWavFile);
+        fseek(pWavFile, n_skip, SEEK_CUR);
+
+        fread(temp, sizeof(unsigned char), SIZE_FLAG, pWavFile);
+    }
+
+    data_size = fa_read_u32(pWavFile);
+    fclose(pWavFile);
+
+    //+---------------------------------------------------------------------------+
+    //+ Return the length of the WAVE header
+    //+---------------------------------------------------------------------------+
+    nPos = nCnt;
+    int nHeadLength = nLength - data_size;
+    return nHeadLength;
+}
+
+bool ExtraMono(const std::string &sInput, const std::string &sOutput)
+{
+    FILE *pFile = fopen(sInput.c_str(), "rb");
+    if ( NULL == pFile )
+    {
+        printf("Fopen Error %s", sInput.c_str());
+        return false;
+    }
+
+    FILE *pFile2 = fopen(sOutput.c_str(), "wb");
+    if ( NULL == pFile2 )
+    {
+        printf("Fopen2 Error %s", sOutput.c_str());
+        fclose(pFile);
+        return false;
+    }
+
+    short *pBuf = new short[AFS_CMPL_MAX_WAV];
+    int nLen = 0;
+
+    nLen = fread(pBuf, sizeof(short), AFS_CMPL_MAX_WAV, pFile);
+    if ( nLen <= 0 )
+    {
+        perror("Fread Error!");
+        delete []pBuf;
+        fclose(pFile);
+        fclose(pFile2);
+        return false;
+    }
+
+    unsigned short channels = 0;
+    int nPos;
+    int nLength;
+    int nHeadByte = GetWaveHeadLen(sInput.c_str(), channels, nPos, nLength);
+    if ( nHeadByte <= 0 )
+    {
+        delete []pBuf;
+        fclose(pFile);
+        fclose(pFile2);
+        return false;
+    }
+    int nHeadShort = nHeadByte / 2;
+
+    if (channels == 1)
+    {
+        // Already mono: copy the file through unchanged, header included
+        fwrite(pBuf, sizeof(short), nLen, pFile2);
+    }
+    else
+    {
+        short *pBuf2 = new short[AFS_CMPL_MAX_WAV];
+        memcpy( pBuf2, pBuf, nHeadShort*sizeof(short));
+
+        // Patch the channel-count field of the copied header to 1.
+        // nPos is a byte offset, while pBuf2 indexes 16-bit words.
+        pBuf2[nPos / 2] = 1;
+
+        // Keep only the left channel of the interleaved stereo data
+        short *pWav = pBuf + nHeadShort;
+        nLen -= nHeadShort;
+
+        int halfnlen = nLen / 2;
+        for (int i = 0; i < halfnlen; i++ )
+        {
+            pBuf2[nHeadShort + i] = *(pWav + i * 2);
+        }
+        // NOTE: the size fields inside the copied header still describe the
+        // original stereo stream.
+        fwrite(pBuf2, sizeof(short), nHeadShort + halfnlen, pFile2);
+
+        delete []pBuf2;
+        pBuf2 = NULL;
+    }
+
+    delete []pBuf;
+    pBuf = NULL;
+
+    fclose(pFile);
+    fclose(pFile2);
+    return true;
+}
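+
+// Usage sketch (the file names are placeholders): extract the left channel of a
+// 16-bit PCM stereo WAV into a mono file.
+//
+//     if (!ExtraMono("vocal_stereo.wav", "vocal_mono.wav"))
+//         fprintf(stderr, "mono extraction failed\n");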
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/inc/STWaveFile.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/inc/STWaveFile.h
new file mode 100755
index 0000000..0593058
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/inc/STWaveFile.h
@@ -0,0 +1,74 @@
+#ifndef WAVE_FILE_H
+#define WAVE_FILE_H
+
+#include <stdio.h>
+#include <stdint.h>
+
+
+typedef enum SAMPLE_FORMAT
+{
+    SF_U8 = 8,
+    SF_S16 = 16,
+    SF_S24 = 24,
+    SF_S32 = 32,
+    SF_IEEE_FLOAT = 0x100 + 32,
+    SF_IEEE_DOUBLE = 0x100 + 64,
+    SF_MAX,
+} SAMPLE_FORMAT;
+
+/* Main processing object **/
+class STCWaveFile
+{
+public:
+    /* The constructor takes the file name and whether to write or to read **/
+    STCWaveFile(const char* Filename, bool Write);
+    virtual ~STCWaveFile();
+
+public:
+    int GetChannels();
+    int GetSampleRate();
+    double GetDuration(); // in seconds
+    uint32_t GetChannelMask();
+    void SetChannels(int Channels);
+    void SetSampleRate(int SampleRate);
+    void SetSampleFormat(SAMPLE_FORMAT Format);
+    void SetChannelMask(uint32_t Mask);
+    void Stat();
+    void SetupDone();
+    bool ReadFrameAsS16(short* FrameSamples, int Frames = 1);
+    bool ReadFrameAsDouble(double* FrameSamples, int Frames = 1);
+    bool ReadFrameAsfloat(float* FrameSamples, int Frames = 1);
+    void WriteRaw(void* Raw, int Size);
+    void WriteFrame(uint8_t* FrameSamples, int Frames = 1);
+    void WriteFrame(short* FrameSamples, int Frames = 1);
+    void WriteFrame(int32_t* FrameSamples, int Frames = 1);
+    void WriteFrameS24(int32_t* FrameSamples, int Frames = 1);
+    void WriteFrame(double* FrameSamples, int Frames = 1);
+    void WriteFrame(float* FrameSamples, int Frames=1);
+    void Seek(int FramePos, int Where = SEEK_SET);
+    bool GetStatus();
+    SAMPLE_FORMAT GetFormat();
+    int GetTotalFrames();
+    int GetFramesRead();
+
+
+protected:
+    FILE* File;
+    int Channels;                 /* channel count **/
+    int SampleRate;               /* sample rate **/
+    SAMPLE_FORMAT Format;         /* sample format (precision) **/
+    int SampleSize;               // Measured in Bits
+    unsigned int FrameStartPos;   /* start position of the audio data **/
+    unsigned long TotalFrames;    /* total frame count; with 16-bit samples one short is one frame **/
+    unsigned long FramesRead;
+    double Duration;              /* duration **/
+
+    bool ReadOnly;                /* reading or writing **/
+
+    uint32_t ChannelMask;
+
+    bool m_bOK;                   /* whether the file was opened successfully **/
+};
+
+
+#endif
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/src/STWaveFile.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/src/STWaveFile.cpp
new file mode 100755
index 0000000..29d5b32
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/ref/waves/src/STWaveFile.cpp
@@ -0,0 +1,822 @@
+
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <stdint.h>
+
+#if WIN32
+#else
+#include <unistd.h>
+#endif
+
+#include "STWaveFile.h"
+#define SPEAKER_FRONT_LEFT 0x1
+#define SPEAKER_FRONT_RIGHT 0x2
+#define SPEAKER_FRONT_CENTER 0x4
+#define SPEAKER_LOW_FREQUENCY 0x8
+#define SPEAKER_BACK_LEFT 0x10
+#define SPEAKER_BACK_RIGHT 0x20
+#define SPEAKER_FRONT_LEFT_OF_CENTER 0x40
+#define SPEAKER_FRONT_RIGHT_OF_CENTER 0x80
+#define SPEAKER_BACK_CENTER 0x100
+#define SPEAKER_SIDE_LEFT 0x200
+#define SPEAKER_SIDE_RIGHT 0x400
+#define SPEAKER_TOP_CENTER 0x800
+#define SPEAKER_TOP_FRONT_LEFT 0x1000
+#define SPEAKER_TOP_FRONT_CENTER 0x2000
+#define SPEAKER_TOP_FRONT_RIGHT 0x4000
+#define SPEAKER_TOP_BACK_LEFT 0x8000
+#define SPEAKER_TOP_BACK_CENTER 0x10000
+#define SPEAKER_TOP_BACK_RIGHT 0x20000
+#define SPEAKER_RESERVED 0x80000000
+
+
+#define SPEAKER_REAR_CENTER_SURROUND SPEAKER_BACK_CENTER
+
+#define DCA_MONO 0
+#define DCA_CHANNEL 1
+#define DCA_STEREO 2
+#define DCA_STEREO_SUMDIFF 3
+#define DCA_STEREO_TOTAL 4
+#define DCA_3F 5
+#define DCA_2F1R 6
+#define DCA_3F1R 7
+#define DCA_2F2R 8
+#define DCA_3F2R 9
+#define DCA_4F2R 10
+
+#define DCA_DOLBY 101 /* FIXME */
+
+#define DCA_CHANNEL_MAX DCA_3F2R /* We don't handle anything above that */
+#define DCA_CHANNEL_BITS 6
+#define DCA_CHANNEL_MASK 0x3F
+
+#define DCA_LFE 0x80
+#define DCA_ADJUST_LEVEL 0x100
+
+#define WAVE_FORMAT_PCM 0x0001
+#define WAVE_FORMAT_IEEE_FLOAT 0x0003
+#define WAVE_FORMAT_EXTENSIBLE 0xFFFE
+
+static uint8_t wav_header[] = {
+    'R', 'I', 'F', 'F', 0xfc, 0xff, 0xff, 0xff, 'W', 'A', 'V', 'E',
+    'f', 'm', 't', ' ', 16, 0, 0, 0,
+    WAVE_FORMAT_PCM, WAVE_FORMAT_PCM >> 8,
+    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 16, 0,
+    'd', 'a', 't', 'a', 0xd8, 0xff, 0xff, 0xff
+};
+
+static uint8_t wavmulti_header[] = {
+    'R', 'I', 'F', 'F', 0xf0, 0xff, 0xff, 0xff, 'W', 'A', 'V', 'E',
+    'f', 'm', 't', ' ', 40, 0, 0, 0,
+    (uint8_t)(WAVE_FORMAT_EXTENSIBLE & 0xFF), WAVE_FORMAT_EXTENSIBLE >> 8,
+    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 32, 0, 22, 0,
+    0, 0, 0, 0, 0, 0,
+    WAVE_FORMAT_IEEE_FLOAT, WAVE_FORMAT_IEEE_FLOAT >> 8,
+    0, 0, 0, 0, 0x10, 0x00, 0x80, 0, 0, 0xaa, 0, 0x38, 0x9b, 0x71,
+    'd', 'a', 't', 'a', 0xb4, 0xff, 0xff, 0xff
+};
+
+static void store4 (uint8_t * buf, int value)
+{
+    buf[0] = value;
+    buf[1] = value >> 8;
+    buf[2] = value >> 16;
+    buf[3] = value >> 24;
+}
+
+static void store2 (uint8_t * buf, int value)
+{
+    buf[0] = value;
+    buf[1] = value >> 8;
+}
+
+
+static uint32_t find_chunk(FILE * file, const uint8_t chunk_id[4])
+{
+    uint8_t buffer[8];
+    while (1) {
+        size_t chunksize;
+        size_t s = fread(buffer, 1, 8, file);
+        if (s < 8)
+            return 0;
+        chunksize = (uint32_t)buffer[4] | ((uint32_t)buffer[5] << 8) |
+            ((uint32_t)buffer[6] << 16) | ((uint32_t)buffer[7] << 24);
+        if (!memcmp(buffer, chunk_id, 4))
+            return chunksize;
+        fseek(file, chunksize, SEEK_CUR);
+    }
+}
+
+
+STCWaveFile::STCWaveFile(const char* Filename, bool Write)
+    : Duration(0), ReadOnly(false), m_bOK(false)
+{
+    Channels = 0;
+
+    /* Open the file **/
+    File = fopen(Filename, Write ? "wb":"rb");
+    if ( !File )
+        return;
+
+    /* Set the initial parameters for writing **/
+    if ( Write )
+    {
+        SampleRate = 44100;
+        Channels = 2;
+        Format = SF_S16;
+        SampleSize = 16;
+        ChannelMask = 0;
+        m_bOK = true;
+        return;
+    }
+
+    ReadOnly = true;
+
+    size_t s;
+    uint8_t buffer[8];
+    uint8_t *fmt = NULL;
+    uint32_t v;
+    uint32_t avg_bps;
+    uint32_t block_align;
+    unsigned short FormatType;
+    unsigned short SampleType;
+
+    static const uint8_t riff[4] = { 'R', 'I', 'F', 'F' };
+    static const uint8_t wave[4] = { 'W', 'A', 'V', 'E' };
+    static const uint8_t fmt_[4] = { 'f', 'm', 't', ' ' };
+    static const uint8_t data[4] = { 'd', 'a', 't', 'a' };
+
+    /* The first four bytes must be "RIFF" **/
+    s = fread(buffer, 1, 8, File);
+    if (s < 8)
+        goto err2;
+
+    if (memcmp(buffer, riff, 4))
+        goto err2;
+
+    /* Bytes 8..12 must be "WAVE" **/
+    /* TODO: check size (in buffer[4..8]) */
+    s = fread(buffer, 1, 4, File);
+    if (s < 4)
+        goto err2;
+
+    if (memcmp(buffer, wave, 4))
+        goto err2;
+
+    s = find_chunk(File, fmt_);
+    if ( s != 16 && s != 18 && s != 40 )
+        goto err2;
+
+    fmt = (uint8_t*)malloc(s);
+    if (!fmt)
+        goto err2;
+
+    if (fread(fmt, 1, s, File) != s)
+        goto err3;
+
+    /* wFormatTag */
+    v = (uint32_t)fmt[0] | ((uint32_t)fmt[1] << 8);
+    if (v != WAVE_FORMAT_PCM && v != WAVE_FORMAT_IEEE_FLOAT && v != WAVE_FORMAT_EXTENSIBLE)
+        goto err3;
+
+    FormatType = v;
+
+    if (s == 40 && 0xfffe == v)
+    {
+        // fmt begins at 0x14 of the wave file
+        v = *(unsigned short*)&fmt[0x2C - 0x14];
+    }
+
+    SampleType = v;
+
+    /* wChannels */
+    v = (uint32_t)fmt[2] | ((uint32_t)fmt[3] << 8);
+
+    Channels = v;
+
+    if (v < 1 || v > 32)
+        goto err3;
+
+    /* dwSamplesPerSec */
+    SampleRate = (uint32_t)fmt[4] | ((uint32_t)fmt[5] << 8) |
+        ((uint32_t)fmt[6] << 16) | ((uint32_t)fmt[7] << 24);
+
+    /* dwAvgBytesPerSec */
+    avg_bps = (uint32_t)fmt[8] | ((uint32_t)fmt[9] << 8) |
+        ((uint32_t)fmt[10] << 16) | ((uint32_t)fmt[11] << 24);
+
+    /* wBlockAlign */
+    block_align = (uint32_t)fmt[12] | ((uint32_t)fmt[13] << 8);
+
+    /* wBitsPerSample */
+    SampleSize = (uint32_t)fmt[14] | ((uint32_t)fmt[15] << 8);
+    if (SampleSize != 8 && SampleSize != 16 && SampleSize != 32 && SampleSize != 24 && SampleSize != 64)
+        goto err3;
+
+    switch (SampleSize)
+    {
+    case 8:
+        Format = SF_U8;
+        break;
+    case 16:
+        Format = SF_S16;
+        break;
+    case 24:
+        Format = SF_S24;
+        break;
+    case 32:
+        {
+            if
(SampleType == WAVE_FORMAT_IEEE_FLOAT) + Format = SF_IEEE_FLOAT; + else + Format = SF_S32; + + } + break; + case 64: + if (SampleType != WAVE_FORMAT_IEEE_FLOAT) + goto err3; + Format = SF_IEEE_DOUBLE; + break; + } + + + // Handle 24-bit samples individually +#if 0 + if (SampleSize == 24 && Channels <= 2) + { + int ba24 = Channels * (SampleSize / 8); // Align to 4x + + ba24 = (ba24 + 3) / 4 * 4; + + if (block_align != ba24) + goto err3; + } + else +#endif + { + if (block_align != Channels * (SampleSize / 8)) + goto err3; + } + + if (avg_bps != block_align * SampleRate) + goto err3; + + v = find_chunk(File, data); + + if (v == 0 || v % block_align != 0) + goto err3; + + TotalFrames = v / block_align; + + FramesRead = 0; + + if (FormatType == WAVE_FORMAT_EXTENSIBLE) + { + ChannelMask = *(unsigned int*)(&fmt[0x14]); + } + else + { + ChannelMask = 0; + } + + FrameStartPos = ftell(File); + + free(fmt); + m_bOK = true; + return; + +err3: + free(fmt); +err2: + fclose(File); + + File = NULL; +} + +bool STCWaveFile::GetStatus() +{ + return m_bOK; +} + +SAMPLE_FORMAT STCWaveFile::GetFormat() +{ + return Format; +} + +int STCWaveFile::GetTotalFrames() +{ + return TotalFrames; +} + +int STCWaveFile::GetFramesRead() +{ + return FramesRead; +} + +STCWaveFile::~STCWaveFile() +{ + if (File != NULL) + { + if (!ReadOnly) + { + unsigned int Size = ftell(File) - FrameStartPos;// 44; + + fseek(File, FrameStartPos - 4, SEEK_SET); + fwrite(&Size, 4, 1, File); + + Size += FrameStartPos - 8; + + fseek(File, 4, SEEK_SET); + fwrite(&Size, 4, 1, File); + } + + fclose(File); + } +} + +int STCWaveFile::GetSampleRate() +{ + return SampleRate; +} + +void STCWaveFile::SetSampleRate(int SampleRate) +{ + this->SampleRate = SampleRate; +} + +void STCWaveFile::SetupDone() +{ + unsigned char Header[68]; + + fseek(File, 0, SEEK_SET); + + SampleSize = Format & 0xFF; + + if (ChannelMask) + { + memcpy(Header, wavmulti_header, sizeof(wavmulti_header)); + + if (Format < SF_IEEE_FLOAT) + { + // store2(Header + 20, WAVE_FORMAT_PCM); + store2(Header + 44, WAVE_FORMAT_PCM); + } + + store2(Header + 22, Channels); + store4(Header + 24, SampleRate); + store4(Header + 28, SampleSize / 8 * SampleRate * Channels); + store2(Header + 32, SampleSize / 8 * Channels); + store2(Header + 34, SampleSize / 8 * 8); + + store2(Header + 38, SampleSize / 8 * 8); + store4(Header + 40, ChannelMask); + + fwrite(Header, sizeof(wavmulti_header), 1, File); + } + else + { + memcpy(Header, wav_header, sizeof(wav_header)); + + if (Format >= SF_IEEE_FLOAT) + { + store2(Header + 20, WAVE_FORMAT_IEEE_FLOAT); + } + + store2(Header + 22, Channels); + store4(Header + 24, SampleRate); + store4(Header + 28, SampleSize / 8 * SampleRate * Channels); + store2(Header + 32, SampleSize / 8 * Channels); + store2(Header + 34, SampleSize / 8 * 8); + + fwrite(Header, sizeof(wav_header), 1, File); + } + + + FrameStartPos = ftell(File); +} + + +void STCWaveFile::Seek(int FramePos, int Where) +{ + // Ignoring Where + + fseek(File, FrameStartPos + FramePos * Channels* (SampleSize / 8), Where); + + FramesRead = FramePos; + +} + +int STCWaveFile::GetChannels() +{ + return Channels; +} + +void STCWaveFile::SetChannels(int Channels) +{ + this->Channels = Channels; +} + +void STCWaveFile::SetSampleFormat(SAMPLE_FORMAT Format) +{ + this->Format = Format; +} + +uint32_t STCWaveFile::GetChannelMask() +{ + return ChannelMask; +} + +void STCWaveFile::SetChannelMask(uint32_t Mask) +{ + ChannelMask = Mask; +} + +bool STCWaveFile::ReadFrameAsS16(short* FrameSamples, int Frames) +{ + if (FramesRead 
>= TotalFrames) + return false; + + FramesRead += Frames; + + switch (Format) + { + case SF_U8: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 1, 1, File)) + { + FrameSamples[ch + frame*Channels] = (DirectSample - 128) << 8; + } + else + { + return false; + } + } + } + return true; + } + case SF_S16: + return Frames == fread(FrameSamples, sizeof(FrameSamples[0])*Channels, Frames, File); + case SF_S24: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + unsigned int DirectSample = 0; + if (1 == fread(&DirectSample, 3, 1, File)) + { + FrameSamples[ch + frame*Channels] = (short)(unsigned short)(DirectSample >> 8); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S32: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + unsigned int DirectSample = 0; + if (1 == fread(&DirectSample, 4, 1, File)) + { + FrameSamples[ch + frame*Channels] = (short)(unsigned short)(DirectSample >> 16); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_IEEE_FLOAT: + { + float DirectSamples[Frames * Channels]; + + if (Frames == fread(DirectSamples, sizeof(DirectSamples[0]) * Channels, Frames, File)) + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + FrameSamples[ch + frame*Channels] = (short)(DirectSamples[ch + frame*Channels] * 32768); + } + } + return true; + } + return false; + } + case SF_IEEE_DOUBLE: + { + double DirectSamples[32]; + + if (Frames == fread(DirectSamples, sizeof(DirectSamples[0]) * Channels, Frames, File)) + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + FrameSamples[ch + frame*Channels] = (short)(DirectSamples[ch + frame*Channels] * 32768); + } + } + return true; + } + return false; + } + } + return false; +} + +bool STCWaveFile::ReadFrameAsfloat(float* FrameSamples, int Frames) +{ + if (FramesRead >= TotalFrames) + return false; + + FramesRead += Frames; + + switch (Format) + { + case SF_U8: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 1, 1, File)) + { + FrameSamples[ch + frame*Channels] = (DirectSample - 128) / 128.0; // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S16: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 2, 1, File)) + { + FrameSamples[ch + frame*Channels] = DirectSample / 32768.0; // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S24: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + uint32_t DirectSample = 0; + if (1 == fread(&DirectSample, 3, 1, File)) + { + FrameSamples[ch + frame*Channels] = ((int32_t)((uint32_t)(DirectSample << 8))) / + (double)(((uint32_t)(1 << 31))); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S32: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + uint32_t 
DirectSample = 0; + if (1 == fread(&DirectSample, 4, 1, File)) + { + FrameSamples[ch + frame*Channels] = ((int32_t)((uint32_t)(DirectSample))) / + (double)(((uint32_t)(1 << 31))); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_IEEE_FLOAT: + { + if(fread(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File)) + { + return true; + } + return false; +// float DirectSamples[32]; +// +// if (Frames == fread(DirectSamples, sizeof(DirectSamples[0]) * Channels, Frames, File)) +// { +// for (int frame = 0; frame < Frames; frame++) +// { +// for (int ch = 0; ch < Channels; ch++) +// { +// FrameSamples[ch + frame*Channels] = (double)(DirectSamples[ch + frame*Channels]); +// } +// } +// return true; +// } +// return false; + } + case SF_IEEE_DOUBLE: + { + if (Frames == fread(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File)) + { + return true; + } + return false; + } + } + return false; +} + +bool STCWaveFile::ReadFrameAsDouble(double* FrameSamples, int Frames) +{ + if (FramesRead >= TotalFrames) + return false; + + FramesRead += Frames; + + switch (Format) + { + case SF_U8: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 1, 1, File)) + { + FrameSamples[ch + frame*Channels] = (DirectSample - 128) / 128.0; // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S16: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + short DirectSample = 0; + if (1 == fread(&DirectSample, 2, 1, File)) + { + FrameSamples[ch + frame*Channels] = DirectSample / 32768.0; // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S24: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + uint32_t DirectSample = 0; + if (1 == fread(&DirectSample, 3, 1, File)) + { + FrameSamples[ch + frame*Channels] = ((int32_t)((uint32_t)(DirectSample << 8))) / + (double)(((uint32_t)(1 << 31))); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_S32: + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + uint32_t DirectSample = 0; + if (1 == fread(&DirectSample, 4, 1, File)) + { + FrameSamples[ch + frame*Channels] = ((int32_t)((uint32_t)(DirectSample ))) / + (double)(((uint32_t)(1 << 31))); // (short)(DirectSample * 32767.0 / ((1 << 24) - 1)); + } + else + { + return false; + } + } + } + return true; + } + case SF_IEEE_FLOAT: + { + float DirectSamples[32]; + + if (Frames == fread(DirectSamples, sizeof(DirectSamples[0]) * Channels, Frames, File)) + { + for (int frame = 0; frame < Frames; frame++) + { + for (int ch = 0; ch < Channels; ch++) + { + FrameSamples[ch + frame*Channels] = (double)(DirectSamples[ch + frame*Channels]); + } + } + return true; + } + return false; + } + case SF_IEEE_DOUBLE: + { + if (Frames == fread(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File)) + { + return true; + } + return false; + } + } + return false; +} + +void STCWaveFile::WriteRaw(void* Raw, int Size) +{ + fwrite(Raw, Size, 1, File); +} + + +void STCWaveFile::WriteFrame(uint8_t* FrameSamples, int Frames) +{ + fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File); +} + +void 
STCWaveFile::WriteFrame(short* FrameSamples, int Frames)
+{
+    fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File);
+}
+
+void STCWaveFile::WriteFrame(int32_t* FrameSamples, int Frames)
+{
+    fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File);
+}
+
+void STCWaveFile::WriteFrameS24(int32_t* FrameSamples, int Frames)
+{
+    // write the low three bytes of each 32-bit sample (little-endian packing)
+    for (int f = 0; f < Frames; f++)
+    {
+        for (int c = 0; c < Channels; c++)
+        {
+            fwrite(&FrameSamples[f * Channels + c], 3, 1, File);
+        }
+    }
+}
+
+void STCWaveFile::WriteFrame(double* FrameSamples, int Frames)
+{
+    fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File);
+}
+
+void STCWaveFile::WriteFrame(float* FrameSamples, int Frames)
+{
+    fwrite(FrameSamples, sizeof(FrameSamples[0]) * Channels, Frames, File);
+}
+
+
+double STCWaveFile::GetDuration()
+{
+    return Duration;
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/CAudioEffectsChainApi.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/CAudioEffectsChainApi.cpp
new file mode 100644
index 0000000..29805ae
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/CAudioEffectsChainApi.cpp
@@ -0,0 +1,74 @@
+//
+// Created by yangjianli on 2020-01-09.
+//
+
+#include "CAudioEffectsChainApi.h"
+#include "audio_chain/CAudioEffectsChain.h"
+
+void* ae_create_object()
+{
+    return new CAudioEffectsChain(); // construct
+}
+
+void ae_destory_object(void *p)
+{
+    ae_uninit(p);
+    delete static_cast<CAudioEffectsChain*>(p); // release
+}
+
+AE_ERR ae_init(void *p, int sample_rate, int channel)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    return audio_effect_chain->init(sample_rate, channel);
+}
+
+AE_ERR ae_uninit(void *p)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    return audio_effect_chain->uninit();
+}
+
+AE_ERR ae_reset(void *p)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    return audio_effect_chain->reset();
+}
+
+int ae_get_latency_ms(void *p)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    return audio_effect_chain->get_latency_ms();
+}
+
+AE_ERR ae_set_params(void *p, void *casw, AE_PARAMS *params)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    CAudioSmoothWrapper* audio_smooth_wrapper = static_cast<CAudioSmoothWrapper*>(casw);
+    return audio_effect_chain->set_params(audio_smooth_wrapper, params);
+}
+
+AE_ERR ae_get_params(void *p, void *casw, AE_PARAMS *params)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    CAudioSmoothWrapper* audio_smooth_wrapper = static_cast<CAudioSmoothWrapper*>(casw);
+    return audio_effect_chain->get_params(audio_smooth_wrapper, params);
+}
+
+AE_ERR ae_process(void *p, float *in_buf, float *out_buf, int length)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    return audio_effect_chain->process(in_buf, out_buf, length);
+}
+
+void* ae_add_effect(void *p, AE_EFFECT_TYPE effects_number)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    return audio_effect_chain->add_effect(effects_number);
+}
+
+AE_ERR ae_delete_effect(void *p, void *casw)
+{
+    CAudioEffectsChain* audio_effect_chain = static_cast<CAudioEffectsChain*>(p);
+    CAudioSmoothWrapper* audio_smooth_wrapper = static_cast<CAudioSmoothWrapper*>(casw);
+    return audio_effect_chain->delete_effect(audio_smooth_wrapper);
+}
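+
+// Usage sketch for the C-style API above (error handling omitted; the sample
+// rate, effect type and buffer length are illustrative):
+//
+//     void *chain = ae_create_object();
+//     ae_init(chain, 44100, 2);
+//     void *reverb = ae_add_effect(chain, AE_EFFECT_TYPE_AL_REVERB);
+//     ae_process(chain, in_buf, out_buf, n_samples); // n_samples = frames * channels
+//     ae_destory_object(chain);                      // also uninits the chain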
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/IAudioEffects.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/IAudioEffects.h
new file mode 100644
index 0000000..575178a
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/IAudioEffects.h
@@ -0,0 +1,45 @@
+//
+// Created by yangjianli on 2020-01-09.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_IAUDIOEFFECTS_H
+#define AUDIO_EFFECTS_LIB_IAUDIOEFFECTS_H
+
+/**
+ * Interface implemented by every audio effect
+ */
+#include "manager/Manager.h"
+#include "AudioEffectsDef.h"
+
+class IAudioEffects
+{
+public:
+    IAudioEffects() {};
+    virtual ~IAudioEffects() {}; // virtual destructor for the abstract class, prevents leaks when deleting through the base pointer
+public:
+    virtual int init(int sample_rate, int channel) = 0;
+    virtual int reset() = 0;
+    virtual int uninit() = 0;
+    virtual int process(float* in_buf, float* out_buf, int length) = 0;
+    virtual int get_latency_ms() = 0;
+    virtual int set_params(AE_PARAMS* param) = 0;
+    virtual int get_params(AE_PARAMS* param) = 0; // the caller allocates the output struct
+    virtual int get_effectId() = 0;               // returns the unique effect ID
+};
+
+
+class ICreator
+{
+
+public:
+    ICreator() = delete;
+    explicit ICreator(int type)
+    {
+        registered(type, this);
+    };
+
+public:
+    virtual IAudioEffects* get_inst() = 0;
+};
+
+#endif //AUDIO_EFFECTS_LIB_IAUDIOEFFECTS_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_al_reverb/CAudioAlReverb.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_al_reverb/CAudioAlReverb.cpp
new file mode 100644
index 0000000..cbcc936
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_al_reverb/CAudioAlReverb.cpp
@@ -0,0 +1,93 @@
+//
+// Created by yangjianli on 2020-01-14.
+//
+
+#include "CAudioAlReverb.h"
+#include "al_reverb/inc/AlReverbApi.h"
+
+static CAudioAlReverbCreator gs_al_reverb_api = CAudioAlReverbCreator(AE_EFFECT_TYPE_AL_REVERB);
+
+CAudioAlReverb::CAudioAlReverb()
+{
+    m_al_reverb_api = nullptr;
+    m_ae_params_al_reverb = nullptr;
+}
+
+CAudioAlReverb::~CAudioAlReverb()
+{
+    uninit();
+}
+
+int CAudioAlReverb::init(int sample_rate, int channel)
+{
+    m_al_reverb_api = new SUPERSOUND::ALREVERB::AlReverbApi();
+    m_al_reverb_api->init(sample_rate, channel, 0);
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAlReverb::uninit()
+{
+    if(nullptr != m_al_reverb_api)
+    {
+        m_al_reverb_api->uninit();
+        delete m_al_reverb_api;
+        m_al_reverb_api = nullptr;
+    }
+
+    if(nullptr != m_ae_params_al_reverb)
+    {
+        delete m_ae_params_al_reverb;
+        m_ae_params_al_reverb = nullptr;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAlReverb::reset()
+{
+    m_al_reverb_api->reset();
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAlReverb::get_effectId()
+{
+    return AE_EFFECT_TYPE_AL_REVERB;
+}
+
+int CAudioAlReverb::get_latency_ms()
+{
+    return m_al_reverb_api->get_latency();
+}
+
+int CAudioAlReverb::set_params(AE_PARAMS *param)
+{
+    if(nullptr != param)
+    {
+        AE_PARAMS_AL_REVERB* tp = (AE_PARAMS_AL_REVERB*) param;
+
+        // allocate the cached parameter block on the first call
+        if(nullptr == m_ae_params_al_reverb)
+        {
+            m_ae_params_al_reverb = new AE_PARAMS_AL_REVERB();
+        }
+        memcpy(m_ae_params_al_reverb, tp, sizeof(AE_PARAMS_AL_REVERB));
+    }
+    return m_al_reverb_api->set_param((AE_PARAMS_AL_REVERB*) param);
+}
+
+int CAudioAlReverb::get_params(AE_PARAMS *param)
+{
+    if(nullptr != param && nullptr != m_ae_params_al_reverb)
+    {
+        memcpy(param, m_ae_params_al_reverb, sizeof(AE_PARAMS_AL_REVERB));
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAlReverb::process(float *in_buf, float *out_buf, int length)
+{
+    if(in_buf != out_buf)
+    {
+        memcpy(out_buf, in_buf, sizeof(float) * length);
+    }
+    return m_al_reverb_api->process(out_buf, length);
+}
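+
+// The static gs_al_reverb_api object above is the whole registration mechanism:
+// constructing the creator calls registered(AE_EFFECT_TYPE_AL_REVERB, this)
+// (presumably declared in manager/Manager.h), so the effect chain can later
+// instantiate this effect for that type via CAudioAlReverbCreator::get_inst().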
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_al_reverb/CAudioAlReverb.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_al_reverb/CAudioAlReverb.h
new file mode 100644
index 0000000..cd85bf0
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_al_reverb/CAudioAlReverb.h
@@ -0,0 +1,48 @@
+//
+// Created by yangjianli on 2020-01-14.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CAUDIOALREVERB_H
+#define AUDIO_EFFECTS_LIB_CAUDIOALREVERB_H
+
+#include "IAudioEffects.h"
+namespace SUPERSOUND {
+    namespace ALREVERB {
+        class AlReverbApi;
+    }
+}
+
+class CAudioAlReverb : public IAudioEffects
+{
+public:
+    CAudioAlReverb();
+    ~CAudioAlReverb();
+public:
+    int init(int sample_rate, int channel) override;
+    int reset() override;
+    int uninit() override;
+    int process(float* in_buf, float* out_buf, int length) override;
+    int get_latency_ms() override;
+    int set_params(AE_PARAMS* param) override;
+    int get_params(AE_PARAMS* param) override;
+    int get_effectId() override; // returns the unique effect ID
+
+private:
+    SUPERSOUND::ALREVERB::AlReverbApi* m_al_reverb_api;
+    AE_PARAMS_AL_REVERB* m_ae_params_al_reverb;
+};
+
+
+class CAudioAlReverbCreator : public ICreator
+{
+public:
+    CAudioAlReverbCreator(int type):ICreator(type){};
+
+public:
+    IAudioEffects* get_inst() override
+    {
+        return new CAudioAlReverb();
+    };
+};
+
+#endif //AUDIO_EFFECTS_LIB_CAUDIOALREVERB_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_autotune/CAudioAutoTune.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_autotune/CAudioAutoTune.cpp
new file mode 100644
index 0000000..5db5271
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_autotune/CAudioAutoTune.cpp
@@ -0,0 +1,73 @@
+//
+// Created by yangjianli on 2020-01-13.
+//
+
+#include <stdio.h>
+#include "CAudioAutoTune.h"
+#include "autotune/inc/ATndkWrapper.h"
+
+static CAudioAutoTuneCreator gs_autotune_creator = CAudioAutoTuneCreator(AE_EFFECT_TYPE_AUTOTUNE);
+CAudioAutoTune::CAudioAutoTune()
+{
+    m_atndk_api = nullptr;
+}
+
+CAudioAutoTune::~CAudioAutoTune()
+{
+    uninit();
+}
+int CAudioAutoTune::init(int sample_rate, int channel)
+{
+    m_atndk_api = new CATndkWrapper();
+    int ret = m_atndk_api->init(sample_rate, channel);
+    if(AT_ERR_SUCCESS != ret)
+    {
+        uninit();
+        return ret;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAutoTune::uninit()
+{
+    if(nullptr != m_atndk_api)
+    {
+        m_atndk_api->uninit();
+        delete m_atndk_api;
+        m_atndk_api = nullptr;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAutoTune::reset()
+{
+    m_atndk_api->reset();
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAutoTune::get_effectId()
+{
+    return AE_EFFECT_TYPE_AUTOTUNE;
+}
+
+int CAudioAutoTune::get_latency_ms()
+{
+    return m_atndk_api->get_latency_time_ms();
+}
+
+int CAudioAutoTune::set_params(AE_PARAMS *param)
+{
+    // no parameters to set for this effect
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAutoTune::get_params(AE_PARAMS *param)
+{
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioAutoTune::process(float *in_buf, float *out_buf, int length)
+{
+    // the ms argument is not used internally, so pass 0 here
+    return m_atndk_api->process(in_buf, out_buf, length, 0);
+}
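+
+// Usage sketch of the IAudioEffects interface with this effect as the example
+// (44100/2 and the buffer length are illustrative):
+//
+//     IAudioEffects *fx = new CAudioAutoTune();
+//     if (AE_ERR_SUCCESS == fx->init(44100, 2))
+//     {
+//         fx->process(in_buf, out_buf, length); // length counts float samples
+//         fx->uninit();
+//     }
+//     delete fx;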
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CAUDIOAUTOTUNE_H
+#define AUDIO_EFFECTS_LIB_CAUDIOAUTOTUNE_H
+
+#include "IAudioEffects.h"
+
+class CATndkWrapper;
+class CAudioAutoTune : public IAudioEffects
+{
+public:
+    CAudioAutoTune();
+    ~CAudioAutoTune();
+public:
+    int init(int sample_rate, int channel) override;
+    int reset() override;
+    int uninit() override;
+    int process(float* in_buf, float* out_buf, int length) override;
+    int get_latency_ms() override;
+    int set_params(AE_PARAMS* param) override;
+    int get_params(AE_PARAMS* param) override;
+    int get_effectId() override; // unique effect ID
+
+private:
+    CATndkWrapper* m_atndk_api;
+};
+
+class CAudioAutoTuneCreator : public ICreator
+{
+public:
+    CAudioAutoTuneCreator(int type):ICreator(type){};
+
+public:
+    IAudioEffects* get_inst() override
+    {
+        return new CAudioAutoTune();
+    };
+
+};
+#endif //AUDIO_EFFECTS_LIB_CAUDIOAUTOTUNE_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_chain/CAudioEffectsChain.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_chain/CAudioEffectsChain.cpp
new file mode 100644
index 0000000..20efbc8
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_chain/CAudioEffectsChain.cpp
@@ -0,0 +1,201 @@
+//
+// Created by yangjianli on 2020-01-09.
+//
+
+#include <string.h>
+#include "CAudioEffectsChain.h"
+
+CAudioEffectsChain::CAudioEffectsChain()
+{
+    m_list.clear();
+    m_list_tmp.clear();
+    m_process_list.clear();
+    m_sample_rate = 0;
+    m_channel = 0;
+    m_list_update = false;
+}
+
+CAudioEffectsChain::~CAudioEffectsChain()
+{
+    uninit();
+}
+
+CAudioSmoothWrapper* CAudioEffectsChain::add_effect(AE_EFFECT_TYPE effects_number)
+{
+    if(0 == m_sample_rate || 0 == m_channel)
+    {
+        return nullptr;
+    }
+
+    // custom deleter: uninit() runs automatically right before the instance is freed
+    std::shared_ptr<CAudioSmoothWrapper> sw = std::shared_ptr<CAudioSmoothWrapper>(new CAudioSmoothWrapper(),
+            [](CAudioSmoothWrapper *inst){
+                inst->uninit();
+                delete inst;
+                inst = nullptr;
+            }
+    );
+
+    int ret = sw->init(effects_number, m_sample_rate, m_channel);
+    if(AE_ERR_SUCCESS != ret)
+    {
+        return nullptr;
+    }
+    // lock while appending
+    {
+        std::lock_guard<std::mutex> lock(m_mutex);
+        m_list.push_back(sw);
+        m_list_update = true;
+    }
+    return sw.get();
+}
+
+AE_ERR CAudioEffectsChain::init(int sample_rate, int channel)
+{
+    m_sample_rate = sample_rate;
+    m_channel = channel;
+    return AE_ERR_SUCCESS;
+}
+
+AE_ERR CAudioEffectsChain::uninit()
+{
+    // lock while clearing
+    std::lock_guard<std::mutex> lock(m_mutex);
+    m_list.clear();
+    m_list_tmp.clear();
+    m_process_list.clear();
+
+    m_sample_rate = 0;
+    m_channel = 0;
+    m_list_update = false;
+    return AE_ERR_SUCCESS;
+}
+
+AE_ERR CAudioEffectsChain::reset()
+{
+    // work on a snapshot so an entry cannot be released by process() mid-reset
+    copylist2tmp();
+    for(auto & sw : m_list_tmp)
+    {
+        sw->reset();
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioEffectsChain::get_latency_ms()
+{
+    // work on a snapshot so an entry cannot be released by process() mid-query
+    copylist2tmp();
+    int latency = 0;
+    for(auto & sw : m_list_tmp)
+    {
+        latency += sw->get_latency_ms();
+    }
+    return latency;
+}
+
+AE_ERR CAudioEffectsChain::set_params(CAudioSmoothWrapper* casw, AE_PARAMS *params)
+{
+    copylist2tmp();
+    AE_ERR ret = AE_ERR_EFFECT_NOT_IN_CHAIN;
+    for(auto & sw : m_list_tmp)
+    {
+        if(casw == sw.get())
+        {
+            ret = AE_ERR_SUCCESS;
+            sw->set_param(params);
+            break;
+        }
+    }
+    return ret;
+}
+
+AE_ERR CAudioEffectsChain::get_params(CAudioSmoothWrapper *casw, AE_PARAMS *params)
+{
+    copylist2tmp();
+    AE_ERR ret = AE_ERR_EFFECT_NOT_IN_CHAIN;
+    for(auto & sw : m_list_tmp)
+    {
+        if(casw == sw.get())
+        {
+            ret = AE_ERR_SUCCESS;
+            sw->get_param(params);
+            break;
+        }
+    }
+    return ret;
+}
+
+AE_ERR CAudioEffectsChain::process(float *in_buf, float *out_buf, int length)
+{
+    if(m_list_update){
+        std::lock_guard<std::mutex> lock(m_mutex);
+        m_list_update = false;
+        m_process_list.clear();
+        m_process_list.insert(m_process_list.end(), m_list.begin(), m_list.end());
+    }
+
+    // copy the input so there is still output even when the list is empty
+    if(in_buf != out_buf)
+    {
+        memcpy(out_buf, in_buf, sizeof(float) * length);
+    }
+
+    bool update = false;
+    std::vector<std::shared_ptr<CAudioSmoothWrapper> >::iterator it;
+    for(it=m_process_list.begin(); it != m_process_list.end();)
+    {
+        (*it)->process(in_buf, out_buf, length);
+        if(!(*it)->get_switch_status() && (*it)->get_change_status())
+        {
+            // no manual uninit needed here: the entry is a shared_ptr whose custom
+            // deleter calls uninit() once the last vector lets go of it; erasing only
+            // removes it from this list, so temporary snapshots stay usable.
+            // erase(it) returns the iterator of the next element.
+//            (*it)->uninit();
+            it=m_process_list.erase(it);
+            update = true;
+        }
+        else
+        {
+            ++it;
+        }
+
+        if(in_buf != out_buf)
+        {
+            memcpy(in_buf, out_buf, sizeof(float) * length);
+        }
+    }
+
+    // publish the updated list
+    if(update)
+    {
+        std::lock_guard<std::mutex> lock(m_mutex);
+        m_list.clear();
+        m_list.insert(m_list.end(), m_process_list.begin(), m_process_list.end());
+    }
+    return AE_ERR_SUCCESS;
+}
+
+AE_ERR CAudioEffectsChain::delete_effect(CAudioSmoothWrapper* casw)
+{
+    copylist2tmp();
+    AE_ERR ret = AE_ERR_EFFECT_NOT_IN_CHAIN;
+    for(auto &ae : m_list_tmp)
+    {
+        if (casw == ae.get())
+        {
+            ret = AE_ERR_SUCCESS;
+            ae->close_effect();
+            break;
+        }
+    }
+    return ret;
+}
+
+// copy the list so iteration cannot break while effects are added or removed
+void CAudioEffectsChain::copylist2tmp()
+{
+    std::lock_guard<std::mutex> lock(m_mutex);
+    m_list_tmp.clear();
+    m_list_tmp.insert(m_list_tmp.end(), m_list.begin(), m_list.end());
+}
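process() deliberately avoids taking the lock on every audio block: writers flip m_list_update under the mutex, and the audio thread re-snapshots the list only when that flag is set, holding shared_ptr copies so removed effects stay alive until the block finishes. A distilled, self-contained sketch of that pattern (names shortened; single control thread assumed, as in the chain above):

#include <mutex>
#include <vector>
#include <memory>

struct Node { /* stand-in for an effect wrapper */ };

std::mutex g_mutex;
std::vector<std::shared_ptr<Node>> g_list;     // edited by the control thread under g_mutex
std::vector<std::shared_ptr<Node>> g_snapshot; // owned by the audio thread
bool g_dirty = false;                          // set under g_mutex after every edit

void audio_thread_block()
{
    if (g_dirty) // unlocked read is tolerable: worst case we snapshot one block late
    {
        std::lock_guard<std::mutex> lock(g_mutex);
        g_dirty = false;
        g_snapshot = g_list; // shared_ptr copies keep nodes alive even if removed meanwhile
    }
    // ... iterate g_snapshot without holding the lock ...
}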
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_chain/CAudioEffectsChain.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_chain/CAudioEffectsChain.h
new file mode 100644
index 0000000..9760c4c
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_chain/CAudioEffectsChain.h
@@ -0,0 +1,61 @@
+//
+// Created by yangjianli on 2020-01-09.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CAUDIOEFFECTSCHAIN_H
+#define AUDIO_EFFECTS_LIB_CAUDIOEFFECTSCHAIN_H
+
+#include "audio_smooth_wrapper/CAudioSmoothWrapper.h"
+#include "AudioEffectsDef.h"
+#include "vector"
+#include "map"
+#include "mutex"
+#include <memory>
+/**
+ * Notes:
+ * 1. Call init() before any other operation.
+ * 2. process() runs on its own thread; reset() must run on the process thread,
+ *    and all remaining operations must share a single (control) thread.
+ * 3. uninit() may only run after process() has stopped.
+ * The effect chain is responsible for:
+ * 1. adding effects
+ * 2. removing effects
+ * 3. keeping the processing order
+ * 4. updating effect parameters
+ */
+
+class CAudioEffectsChain
+{
+public:
+    CAudioEffectsChain();
+    ~CAudioEffectsChain();
+
+public:
+    AE_ERR init(int sample_rate, int channel);
+    AE_ERR uninit();
+    AE_ERR reset();
+    int get_latency_ms();
+    AE_ERR set_params(CAudioSmoothWrapper* casw, AE_PARAMS* params);
+    AE_ERR get_params(CAudioSmoothWrapper* casw, AE_PARAMS* params);
+    AE_ERR process(float* in_buf, float* out_buf, int length);
+
+    // returns the effect's address, used externally as an opaque handle for the
+    // operations above; avoid calling through it directly
+    CAudioSmoothWrapper* add_effect(AE_EFFECT_TYPE effects_number);
+    AE_ERR delete_effect(CAudioSmoothWrapper* casw);
+
+private:
+    void copylist2tmp();
+private:
+    std::vector<std::shared_ptr<CAudioSmoothWrapper>> m_list;         // effects in processing order
+    std::vector<std::shared_ptr<CAudioSmoothWrapper>> m_list_tmp;     // snapshot used by control-thread operations
+    std::vector<std::shared_ptr<CAudioSmoothWrapper>> m_process_list; // snapshot used by process()
+    std::mutex m_mutex; // guards m_list against concurrent access from multiple threads
+    int m_sample_rate;
+    int m_channel;
+    // set whenever a non-process thread modifies the list
+    bool m_list_update;
+};
+
+
+#endif //AUDIO_EFFECTS_LIB_CAUDIOEFFECTSCHAIN_H
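Taken together, a caller drives the chain as below. A minimal usage sketch under the threading rules stated in the header (block size and the zero-initialized preset are illustrative; a real caller fills AE_PARAMS_REVERB from one of the library presets):

#include <vector>
// #include "audio_chain/CAudioEffectsChain.h" // path relative to src/, as in the library

void chain_usage_sketch()
{
    CAudioEffectsChain chain;
    chain.init(44100, 2); // must happen before anything else

    // add_effect returns an opaque handle owned by the chain
    CAudioSmoothWrapper* reverb = chain.add_effect(AE_EFFECT_TYPE_REVERB);
    AE_PARAMS_REVERB params{}; // sketch: fill with a real preset before use
    chain.set_params(reverb, (AE_PARAMS*)&params);

    std::vector<float> buf(1024 * 2); // one interleaved stereo block
    chain.process(buf.data(), buf.data(), (int)buf.size()); // audio thread

    chain.delete_effect(reverb); // effect fades out, then drops off the list
    chain.uninit();              // only after process() has stopped
}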
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_eq/CAudioEqApi.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_eq/CAudioEqApi.cpp
new file mode 100644
index 0000000..dc16372
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_eq/CAudioEqApi.cpp
@@ -0,0 +1,105 @@
+//
+// Created by yangjianli on 2020-01-09.
+//
+
+#include "CAudioEqApi.h"
+#include "stdio.h"
+#include <string.h>
+#include "iir_eq/inc/CAudaciousEqApi.h"
+
+static CEqApiCreator gs_eq_creator = CEqApiCreator(AE_EFFECT_TYPE_EQ);
+
+CAudioEqApi::CAudioEqApi()
+{
+    m_eq_api = nullptr;
+    m_eq_param = nullptr;
+}
+
+CAudioEqApi::~CAudioEqApi()
+{
+    uninit();
+}
+
+int CAudioEqApi::init(int sample_rate, int channel)
+{
+    m_eq_api = new CAudaciousEqApi();
+    int ret = m_eq_api->init(sample_rate, channel);
+    if(AUDACIOUS_EQ_ERROR_CODE_SUCCESS != ret)
+    {
+        uninit();
+        return ret;
+    }
+    m_kvs.init(channel);
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioEqApi::uninit()
+{
+    if(nullptr != m_eq_api)
+    {
+        m_eq_api->uninit();
+        delete m_eq_api;
+        m_eq_api = nullptr;
+    }
+
+    if(nullptr != m_eq_param)
+    {
+        delete m_eq_param;
+        m_eq_param = nullptr;
+    }
+
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioEqApi::reset()
+{
+    m_kvs.reset();
+    return m_eq_api->reset();
+}
+
+int CAudioEqApi::get_effectId()
+{
+    return AE_EFFECT_TYPE_EQ;
+}
+
+int CAudioEqApi::get_latency_ms()
+{
+    return m_eq_api->get_latency_ms();
+}
+
+int CAudioEqApi::set_params(AE_PARAMS* param)
+{
+    // forward the pointer in every case; the layer below handles null itself
+    AE_PARAMS_EQ* audio_effects_eq_params = (AE_PARAMS_EQ*) param;
+    if(nullptr != audio_effects_eq_params)
+    {
+        m_eq_api->set_param(audio_effects_eq_params->params);
+        if(nullptr == m_eq_param)
+        {
+            m_eq_param = new AE_PARAMS_EQ();
+        }
+        memcpy(m_eq_param, audio_effects_eq_params, sizeof(AE_PARAMS_EQ));
+    }else
+    {
+        const float* tmp = nullptr;
+        m_eq_api->set_param(tmp);
+    }
+
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioEqApi::get_params(AE_PARAMS *param)
+{
+    if(nullptr != m_eq_param && nullptr != param)
+    {
+        memcpy(param, m_eq_param, sizeof(AE_PARAMS_EQ));
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioEqApi::process(float *in_buf, float *out_buf, int length)
+{
+    m_kvs.pre_process(in_buf, length);
+    int ret = m_eq_api->process(in_buf, out_buf, length);
+    m_kvs.after_process(out_buf, length);
+    return ret;
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_eq/CAudioEqApi.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_eq/CAudioEqApi.h
new file mode 100644
index 0000000..8e5a5f5
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_eq/CAudioEqApi.h
@@ -0,0 +1,46 @@
+//
+// Created by yangjianli on 2020-01-09.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_AUDIOEQAPI_H
+#define AUDIO_EFFECTS_LIB_AUDIOEQAPI_H
+
+#include "IAudioEffects.h"
+#include "common/keep_volume_steady/CKeepVolumeSteady.h"
+class CAudaciousEqApi;
+class CAudioEqApi : public IAudioEffects
+{
+public:
+    CAudioEqApi();
+    ~CAudioEqApi();
+public:
+    int init(int sample_rate, int channel) override;
+    int reset() override;
+    int uninit() override;
+    int process(float* in_buf, float* out_buf, int length) override;
+    int get_latency_ms() override;
+    int set_params(AE_PARAMS* param) override;
+    int get_params(AE_PARAMS* param) override;
+    int get_effectId() override; // unique effect ID
+
+private:
+    CAudaciousEqApi* m_eq_api;
+    AE_PARAMS_EQ* m_eq_param;
+    CKeepVolumeSteady m_kvs;
+};
+
+
+class CEqApiCreator : public ICreator
+{
+
+public:
+    CEqApiCreator(int type):ICreator(type){};
+
+public:
+    IAudioEffects* get_inst() override
+    {
+        return new CAudioEqApi();
+    };
+};
+
+#endif //AUDIO_EFFECTS_LIB_AUDIOEQAPI_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_im_effect/CImEffectApi.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_im_effect/CImEffectApi.cpp
new file mode 100644
index 0000000..6772fde
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_im_effect/CImEffectApi.cpp
@@ -0,0 +1,167 @@
+//
+// Created by yangjianli on 2022/9/7.
+//
+
+// Requirement: each per-channel frame passed in from outside must be <= (1 << (bits - 1)) samples
+
+#include "CImEffectApi.h"
+#include "supersound/inc/supersound_err.h"
+#include "impulse_effect.h"
+#include <math.h>
+#include <string.h>
+static CImEffectApiCreator gs_im_effect_creator = CImEffectApiCreator(AE_EFFECT_TYPE_IM_EFFECT);
+
+CImEffectApi::CImEffectApi()
+{
+    m_impluse_effect = nullptr;
+    m_sample_rate = 0;
+    m_channel = 0;
+    m_latency_ms = 0;
+    m_empty_buf = nullptr;
+    m_empty_buf_len = 0;
+    m_need_push_data = false;
+}
+
+CImEffectApi::~CImEffectApi()
+{
+    uninit();
+}
+
+int CImEffectApi::init(int sample_rate, int channel)
+{
+    m_impluse_effect = new SUPERSOUND::IMPULSE::ImpulseEffect();
+    m_sample_rate = sample_rate;
+    m_channel = channel;
+    m_params = new Impulse_Param();
+    m_latency_ms = 0;
+    return AE_ERR_SUCCESS;
+}
+
+int CImEffectApi::uninit()
+{
+    if (nullptr != m_impluse_effect)
+    {
+        // the effect releases its internal buffers in its own destructor
+        delete m_impluse_effect;
+        m_impluse_effect = nullptr;
+    }
+
+    if (nullptr != m_params)
+    {
+        // audio buffers referenced by the params are owned and managed externally
+        delete m_params;
+        m_params = nullptr;
+    }
+
+    if (nullptr != m_empty_buf)
+    {
+        delete[] m_empty_buf;
+        m_empty_buf = nullptr;
+        m_empty_buf_len = 0;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CImEffectApi::get_effectId()
+{
+    return AE_EFFECT_TYPE_IM_EFFECT;
+}
+
+int CImEffectApi::get_latency_ms()
+{
+    return m_latency_ms;
+}
+
+int CImEffectApi::reset()
+{
+    m_impluse_effect->FlushOut();
+    if (m_need_push_data)
+    {
+        pre_push_data();
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CImEffectApi::set_params(AE_PARAMS *param)
+{
+    int err = 0;
+    if (param != NULL)
+    {
+        Impulse_Param *new_param = (Impulse_Param *) param;
+        copy_impluse_params(m_params, new_param);
+        // the internal frame must be able to hold one external buffer
+        int cur_frame_len = (1 << (new_param->window_bits - 1));
+        while (cur_frame_len < new_param->process_buffer_len)
+        {
+            new_param->window_bits += 1;
+            cur_frame_len = (1 << (new_param->window_bits - 1));
+        }
+
+        // high-performance mode adopts the internal frame length, which may add latency
+        int process_buffer_len = new_param->process_buffer_len;
+        if (new_param->high_performance)
+        {
+            // clamp to a minimum FFT size
+            if (new_param->window_bits <= 10)
+            {
+                new_param->window_bits = 10;
+                cur_frame_len = (1 << (new_param->window_bits - 1));
+            }
+            new_param->process_buffer_len = cur_frame_len;
+        }
+
+        new_param->fs = m_sample_rate;
+        new_param->in_channels = m_channel;
+        new_param->out_channels = m_channel;
+        err = m_impluse_effect->SetParam(param);
+        if (err != 0)
+        {
+            return err;
+        }
+
+        // if the external buffer length equals the internal frame length, processing is
+        // direct and latency is 0; if it is smaller, a full frame of zeros is pre-pushed
+        // so that from then on every push of N samples pops exactly N samples.
+        m_latency_ms = 0;
+        m_need_push_data = process_buffer_len != m_impluse_effect->GetFrameLen();
+    }
+    return err;
+}
+
+int CImEffectApi::get_params(AE_PARAMS *param)
+{
+    copy_impluse_params((Impulse_Param*)param, m_params);
+    return 0;
+}
+
+int CImEffectApi::process(float *in_buf, float *out_buf, int length)
+{
+    int out_length = 0;
+    m_impluse_effect->ProcessfInput(in_buf, length, out_length);
+    if (out_length < length)
+    {
+        // should not happen in practice
+        memset(out_buf, 0, sizeof(float) * length);
+        return 0;
+    }
+    m_impluse_effect->ProcessfOutput(out_buf, length, out_length);
+    return 0;
+}
+
+// Pre-fill one frame of zeros so later output stays in lockstep (only the very
+// start of the stream is silent). This is needed after set_params or after reset,
+// but never both back to back; the wrapper layer always calls reset() right after
+// set_params, so doing it in reset() alone is sufficient.
+void CImEffectApi::pre_push_data()
+{
+    if (m_empty_buf == nullptr || m_empty_buf_len < m_impluse_effect->GetFrameLen() * m_channel)
+    {
+        if (m_empty_buf != nullptr)
+        {
+            delete [] m_empty_buf;
+        }
+        m_empty_buf_len = m_impluse_effect->GetFrameLen() * m_channel;
+        m_empty_buf = new float[m_empty_buf_len];
+        memset(m_empty_buf, 0, sizeof(float) * m_empty_buf_len);
+    }
+    int out_length = 0;
+    m_impluse_effect->ProcessfInput(m_empty_buf, m_impluse_effect->GetFrameLen() * m_channel, out_length);
+    m_latency_ms = round(m_impluse_effect->GetFrameLen() * 1.0 / m_sample_rate * 1000);
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_im_effect/CImEffectApi.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_im_effect/CImEffectApi.h
new file mode 100644
index 0000000..43b1dca
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_im_effect/CImEffectApi.h
@@ -0,0 +1,60 @@
+//
+// Created by yangjianli on 2022/9/7.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CIMEFFECTAPI_H
+#define AUDIO_EFFECTS_LIB_CIMEFFECTAPI_H
+#include <stdio.h>
+#include "IAudioEffects.h"
+namespace SUPERSOUND
+{
+    namespace IMPULSE
+    {
+        class ImpulseEffect;
+    }
+}
+
+class CImEffectApi : public IAudioEffects
+{
+public:
+    CImEffectApi();
+    ~CImEffectApi();
+public:
+    int init(int sample_rate, int channel) override;
+    int reset() override;
+    int uninit() override;
+    int process(float* in_buf, float* out_buf, int length) override;
+    int get_latency_ms() override;
+    int set_params(AE_PARAMS* param) override;
+    int get_params(AE_PARAMS* param) override;
+    int get_effectId() override; // unique effect ID
+
+private:
+    void pre_push_data();
+private:
+    SUPERSOUND::IMPULSE::ImpulseEffect* m_impluse_effect;
+    Impulse_Param * m_params;
+    int32_t m_sample_rate;
+    int32_t m_channel;
+    int32_t m_latency_ms;
+    float* m_empty_buf;
+    int32_t m_empty_buf_len;
+    bool m_need_push_data;
+};
+
+
+class CImEffectApiCreator : public ICreator
+{
+
+public:
+    CImEffectApiCreator(int type):ICreator(type){};
+
+public:
+    IAudioEffects* get_inst() override
+    {
+        printf("IM Create !\n");
+        return new CImEffectApi();
+    };
+};
+
+
+#endif //AUDIO_EFFECTS_LIB_CIMEFFECTAPI_H
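The latency bookkeeping above is easiest to see with concrete numbers. A worked example, assuming a 44.1 kHz stream and window_bits = 11, i.e. an internal frame of 1024 samples per channel (values chosen purely for illustration):

// high_performance forces process_buffer_len up to the internal frame length:
//   window_bits = 11  ->  internal frame = 1 << (11 - 1) = 1024 samples per channel
// If the caller then feeds blocks of 512 samples per channel, one zero frame is
// pre-pushed and every later push of N samples pops exactly N samples, so:
//   latency_ms = round(1024 / 44100.0 * 1000) = 23 ms
// If the caller's block already equals 1024, nothing is pre-pushed and latency is 0.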
+// + +#include "CAudioPhonograph.h" +#include "phonograph/inc/CPhonograph.h" + +#define APG_VOLUME_RATE 1.68 //保持音量响度不变需要的倍数 + +static CAudioPhonographCreator gs_audio_phonograph_creator = CAudioPhonographCreator(AE_EFFECT_TYPE_PHONOGRAPH); + +CAudioPhonograph::CAudioPhonograph() +{ + m_phonogh_api = nullptr; +} + +CAudioPhonograph::~CAudioPhonograph() +{ + uninit(); +} + +int CAudioPhonograph::init(int sample_rate, int channel) +{ + m_phonogh_api = new CPhonograph(); + int ret = m_phonogh_api->init(sample_rate, channel); + if(0 != ret) + { + uninit(); + return ret; + } + return AE_ERR_SUCCESS; +} + +int CAudioPhonograph::uninit() +{ + if(nullptr != m_phonogh_api) + { + m_phonogh_api->uninit(); + delete m_phonogh_api; + m_phonogh_api = nullptr; + } + return AE_ERR_SUCCESS; +} + +int CAudioPhonograph::get_effectId() +{ + return AE_EFFECT_TYPE_PHONOGRAPH; +} + +int CAudioPhonograph::get_latency_ms() +{ + return 0; +} + +int CAudioPhonograph::reset() +{ + m_phonogh_api->reset(); + return AE_ERR_SUCCESS; +} + +int CAudioPhonograph::set_params(AE_PARAMS *param) +{ + return AE_ERR_SUCCESS; +} + +int CAudioPhonograph::get_params(AE_PARAMS *param) +{ + return AE_ERR_SUCCESS; +} + +int CAudioPhonograph::process(float *in_buf, float *out_buf, int length) { + if (in_buf != out_buf) { + memcpy(out_buf, in_buf, sizeof(float) * length); + } + int ret = m_phonogh_api->process(out_buf, length); + for (int i = 0; i < length; i++) + { + out_buf[i] *= APG_VOLUME_RATE; + } + return ret; +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_phonograph/CAudioPhonograph.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_phonograph/CAudioPhonograph.h new file mode 100644 index 0000000..bca5b04 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_phonograph/CAudioPhonograph.h @@ -0,0 +1,46 @@ +// +// Created by yangjianli on 2020-01-14. +// + +#ifndef AUDIO_EFFECTS_LIB_CAUDIOPHONOGRAPH_H +#define AUDIO_EFFECTS_LIB_CAUDIOPHONOGRAPH_H + + +#include "IAudioEffects.h" +#include "common/keep_volume_steady/CKeepVolumeSteady.h" +class CPhonograph; +class CAudioPhonograph : public IAudioEffects +{ +public: + CAudioPhonograph(); + ~CAudioPhonograph(); +public: + int init(int sample_rate, int channel) override; + int reset() override; + int uninit() override; + int process(float* in_buf, float* out_buf, int length) override; + int get_latency_ms() override; + int set_params(AE_PARAMS* param) override; + int get_params(AE_PARAMS* param) override; + int get_effectId() override; // 获取唯一ID + +private: + CPhonograph* m_phonogh_api; +}; + + +class CAudioPhonographCreator : public ICreator +{ + +public: + CAudioPhonographCreator(int type):ICreator(type){}; + +public: + IAudioEffects* get_inst() override + { + return new CAudioPhonograph(); + }; +}; + + +#endif //AUDIO_EFFECTS_LIB_CAUDIOPHONOGRAPH_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_reverb/CAudioReverbApi.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_reverb/CAudioReverbApi.cpp new file mode 100644 index 0000000..0a35fa2 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_reverb/CAudioReverbApi.cpp @@ -0,0 +1,115 @@ +// +// Created by yangjianli on 2020-01-14. 
+// + +#include "CAudioReverbApi.h" +#include "reverb/inc/CReverb.h" + +#define RB_VOLUME_RATE 1.68 // 对于DISTINCT需要保持不变 + +static CAudioReverbApiCreator gs_reverb_api = CAudioReverbApiCreator(AE_EFFECT_TYPE_REVERB); +CAudioReverbApi::CAudioReverbApi() +{ + m_reverb_api = nullptr; + m_reverb_param = nullptr; + + m_rate = 1.0; +} + +CAudioReverbApi::~CAudioReverbApi() +{ + uninit(); +} + +int CAudioReverbApi::init(int sample_rate, int channel) +{ + m_reverb_api = new CReverb(); + int ret = m_reverb_api->init(sample_rate, channel); + if(ret != RB_ERR_SUCCESS) + { + uninit(); + return ret; + } + return AE_ERR_SUCCESS; +} + +int CAudioReverbApi::uninit() +{ + if(nullptr != m_reverb_api) + { + m_reverb_api->uninit(); + delete m_reverb_api; + m_reverb_api = nullptr; + } + + if(nullptr != m_reverb_param) + { + delete m_reverb_param; + m_reverb_param = nullptr; + } + return AE_ERR_SUCCESS; +} + +int CAudioReverbApi::reset() +{ + m_reverb_api->reset(); + return AE_ERR_SUCCESS; +} + +int CAudioReverbApi::get_effectId() +{ + return AE_EFFECT_TYPE_REVERB; +} + +int CAudioReverbApi::get_latency_ms() +{ + return m_reverb_api->get_latency(); +} + +int CAudioReverbApi::set_params(AE_PARAMS *param) +{ + AE_PARAMS_REVERB* tp = (AE_PARAMS_REVERB*) param; + if(tp != nullptr) + { + if(nullptr == m_reverb_param) + { + m_reverb_param = new AE_PARAMS_REVERB(); + } + memcpy(m_reverb_param, tp, sizeof(AE_PARAMS_REVERB)); + + // 判断新输入的值是否与DISTINCT相等 + m_rate = params_cmp(tp, + (AE_PARAMS_REVERB*)&(gs_ae_params_reverb_params[AE_PARAMS_TYPE_REVERB_ID_15 - AE_PARAMS_TYPE_RERVERB])) + ? RB_VOLUME_RATE : 1.0; + + } + return m_reverb_api->set_params(tp); +} + +int CAudioReverbApi::get_params(AE_PARAMS *param) +{ + if(nullptr != param && nullptr != m_reverb_param) + { + memcpy(param, m_reverb_param, sizeof(AE_PARAMS_REVERB)); + } + return AE_ERR_SUCCESS; +} + +int CAudioReverbApi::process(float *in_buf, float *out_buf, int length) +{ + m_reverb_api->process(in_buf, length, out_buf, length); + if(m_rate != 1.0) + { + for(int i=0;iroom_size == b->room_size && a->wet == b->wet && a->width == b->width + && a->dry == b->dry && a->damp == b->damp && a->mode == b->mode); +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_reverb/CAudioReverbApi.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_reverb/CAudioReverbApi.h new file mode 100644 index 0000000..bf531a5 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_reverb/CAudioReverbApi.h @@ -0,0 +1,44 @@ +// +// Created by yangjianli on 2020-01-14. 
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CAUDIOREVERBAPI_H
+#define AUDIO_EFFECTS_LIB_CAUDIOREVERBAPI_H
+
+#include "IAudioEffects.h"
+class CReverb;
+class CAudioReverbApi : public IAudioEffects
+{
+public:
+    CAudioReverbApi();
+    ~CAudioReverbApi();
+public:
+    int init(int sample_rate, int channel) override;
+    int reset() override;
+    int uninit() override;
+    int process(float* in_buf, float* out_buf, int length) override;
+    int get_latency_ms() override;
+    int set_params(AE_PARAMS* param) override;
+    int get_params(AE_PARAMS* param) override;
+    int get_effectId() override; // unique effect ID
+private:
+    bool params_cmp(AE_PARAMS_REVERB* a, AE_PARAMS_REVERB* b);
+private:
+    CReverb* m_reverb_api;
+    AE_PARAMS_REVERB* m_reverb_param;
+    float m_rate;
+};
+
+class CAudioReverbApiCreator : public ICreator
+{
+public:
+    CAudioReverbApiCreator(int type):ICreator(type){};
+
+public:
+    IAudioEffects* get_inst() override
+    {
+        return new CAudioReverbApi();
+    };
+};
+
+#endif //AUDIO_EFFECTS_LIB_CAUDIOREVERBAPI_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_saudio_effects/CAudioSAudioEffectsApi.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_saudio_effects/CAudioSAudioEffectsApi.cpp
new file mode 100644
index 0000000..54b8a20
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_saudio_effects/CAudioSAudioEffectsApi.cpp
@@ -0,0 +1,99 @@
+//
+// Created by yangjianli on 2020-01-10.
+//
+
+#include "CAudioSAudioEffectsApi.h"
+#include "saudio_effects/inc/SAudioEffectsApi.h"
+
+static CAudioSAudioEffectsCreator gs_eq_creator = CAudioSAudioEffectsCreator(AE_EFFECT_TYPE_SAE);
+
+CAudioSAudioEffectsApi::CAudioSAudioEffectsApi()
+{
+    m_sae_api = nullptr;
+    m_ae_params_sae = nullptr;
+}
+
+CAudioSAudioEffectsApi::~CAudioSAudioEffectsApi()
+{
+    uninit();
+}
+
+int CAudioSAudioEffectsApi::init(int sample_rate, int channel)
+{
+    m_sae_api = new SAudioEffectsApi();
+    int ret = m_sae_api->init(sample_rate, channel);
+    if(ERROR_CODE_SUCCESS != ret)
+    {
+        uninit();
+        return ret;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSAudioEffectsApi::uninit()
+{
+    if(nullptr != m_sae_api)
+    {
+        m_sae_api->uninit();
+        delete m_sae_api;
+        m_sae_api = nullptr;
+    }
+
+    if(nullptr != m_ae_params_sae)
+    {
+        delete m_ae_params_sae;
+        m_ae_params_sae = nullptr;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSAudioEffectsApi::reset()
+{
+    m_sae_api->reset();
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSAudioEffectsApi::get_effectId()
+{
+    return AE_EFFECT_TYPE_SAE;
+}
+
+int CAudioSAudioEffectsApi::get_latency_ms()
+{
+    return m_sae_api->get_latency();
+}
+
+int CAudioSAudioEffectsApi::set_params(AE_PARAMS *param)
+{
+    if(nullptr != param)
+    {
+        if(nullptr == m_ae_params_sae)
+        {
+            m_ae_params_sae = new AE_PARAMS_SAE();
+        }
+
+        AE_PARAMS_SAE* tp = (AE_PARAMS_SAE*) param;
+        m_ae_params_sae->params_list.assign(
+                tp->params_list.begin(),tp->params_list.end()
+        );
+    }
+    return m_sae_api->set_audio_effect(param);
+}
+
+int CAudioSAudioEffectsApi::get_params(AE_PARAMS *param)
+{
+    if(nullptr != param && nullptr != m_ae_params_sae)
+    {
+        AE_PARAMS_SAE* tp = (AE_PARAMS_SAE*) param;
+        tp->params_list.assign(
+                m_ae_params_sae->params_list.begin(),
+                m_ae_params_sae->params_list.end()
+        );
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSAudioEffectsApi::process(float *in_buf, float *out_buf, int length)
+{
+    return m_sae_api->process(in_buf, out_buf, length);
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_saudio_effects/CAudioSAudioEffectsApi.h
b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_saudio_effects/CAudioSAudioEffectsApi.h
new file mode 100644
index 0000000..33348b1
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_saudio_effects/CAudioSAudioEffectsApi.h
@@ -0,0 +1,40 @@
+//
+// Created by yangjianli on 2020-01-10.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CAUDIOSAUDIOEFFECTSAPI_H
+#define AUDIO_EFFECTS_LIB_CAUDIOSAUDIOEFFECTSAPI_H
+
+#include "IAudioEffects.h"
+
+class SAudioEffectsApi;
+class CAudioSAudioEffectsApi : public IAudioEffects
+{
+public:
+    CAudioSAudioEffectsApi();
+    ~CAudioSAudioEffectsApi();
+public:
+    int init(int sample_rate, int channel) override;
+    int reset() override;
+    int uninit() override;
+    int process(float* in_buf, float* out_buf, int length) override;
+    int get_latency_ms() override;
+    int set_params(AE_PARAMS* param) override;
+    int get_params(AE_PARAMS* param) override;
+    int get_effectId() override; // unique effect ID
+private:
+    SAudioEffectsApi* m_sae_api;
+    AE_PARAMS_SAE* m_ae_params_sae;
+};
+
+class CAudioSAudioEffectsCreator : public ICreator {
+public:
+    CAudioSAudioEffectsCreator(int type):ICreator(type){};
+
+public:
+    IAudioEffects* get_inst() override
+    {
+        return new CAudioSAudioEffectsApi();
+    };
+};
+#endif //AUDIO_EFFECTS_LIB_CAUDIOSAUDIOEFFECTSAPI_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_slow_flanging/CAudioSlowFlanging.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_slow_flanging/CAudioSlowFlanging.cpp
new file mode 100644
index 0000000..c972bf6
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_slow_flanging/CAudioSlowFlanging.cpp
@@ -0,0 +1,71 @@
+//
+// Created by yangjianli on 2020-01-14.
+//
+
+#include "CAudioSlowFlanging.h"
+#include "slow_flanging/inc/CSlowFlanging.h"
+
+static CAudioSlowFlangingCreator gs_audio_slow_flaging_creator = CAudioSlowFlangingCreator(AE_EFFECT_TYPE_SLOWFLANGING);
+CAudioSlowFlanging::CAudioSlowFlanging()
+{
+    m_slow_flanging_api = nullptr;
+}
+
+CAudioSlowFlanging::~CAudioSlowFlanging()
+{
+    uninit();
+}
+
+int CAudioSlowFlanging::init(int sample_rate, int channel)
+{
+    m_slow_flanging_api = new CSlowFlanging();
+    int ret = m_slow_flanging_api->init(channel, sample_rate);
+    if(0 != ret)
+    {
+        uninit();
+        return ret;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSlowFlanging::uninit()
+{
+    if(nullptr != m_slow_flanging_api)
+    {
+        m_slow_flanging_api->uninit();
+        delete m_slow_flanging_api;
+        m_slow_flanging_api = nullptr;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSlowFlanging::get_effectId()
+{
+    return AE_EFFECT_TYPE_SLOWFLANGING;
+}
+
+int CAudioSlowFlanging::get_latency_ms()
+{
+    return 0;
+}
+
+int CAudioSlowFlanging::reset()
+{
+    m_slow_flanging_api->reset();
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSlowFlanging::set_params(AE_PARAMS *param)
+{
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSlowFlanging::get_params(AE_PARAMS *param)
+{
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSlowFlanging::process(float *in_buf, float *out_buf, int length)
+{
+    return m_slow_flanging_api->process(in_buf, out_buf, length);
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_slow_flanging/CAudioSlowFlanging.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_slow_flanging/CAudioSlowFlanging.h
new file mode 100644
index 0000000..001b4bb
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_slow_flanging/CAudioSlowFlanging.h
@@ -0,0 +1,42 @@
+//
+// Created by yangjianli on 2020-01-14.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CAUDIOSLOWFLANGING_H
+#define AUDIO_EFFECTS_LIB_CAUDIOSLOWFLANGING_H
+
+
+#include "IAudioEffects.h"
+
+class CSlowFlanging;
+class CAudioSlowFlanging : public IAudioEffects
+{
+public:
+    CAudioSlowFlanging();
+    ~CAudioSlowFlanging();
+public:
+    int init(int sample_rate, int channel) override;
+    int reset() override;
+    int uninit() override;
+    int process(float* in_buf, float* out_buf, int length) override;
+    int get_latency_ms() override;
+    int set_params(AE_PARAMS* param) override;
+    int get_params(AE_PARAMS* param) override;
+    int get_effectId() override; // unique effect ID
+private:
+    CSlowFlanging* m_slow_flanging_api;
+};
+
+class CAudioSlowFlangingCreator : public ICreator {
+public:
+    CAudioSlowFlangingCreator(int type):ICreator(type){};
+
+public:
+    IAudioEffects* get_inst() override
+    {
+        return new CAudioSlowFlanging();
+    };
+};
+
+
+#endif //AUDIO_EFFECTS_LIB_CAUDIOSLOWFLANGING_H
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_smooth_wrapper/CAudioSmoothWrapper.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_smooth_wrapper/CAudioSmoothWrapper.cpp
new file mode 100644
index 0000000..29344ec
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_smooth_wrapper/CAudioSmoothWrapper.cpp
@@ -0,0 +1,219 @@
+//
+// Created by yangjianli on 2020-01-02.
+//
+
+#include <string.h>
+#include "CAudioSmoothWrapper.h"
+#include "common/utils.h"
+
+CAudioSmoothWrapper::CAudioSmoothWrapper()
+{
+    m_update = false;
+    m_last_ms = 0;
+    m_tmp_in_buf = nullptr;
+    m_tmp_out_buf = nullptr;
+    m_current_iaudio = nullptr;
+    m_new_iaudio = nullptr;
+}
+
+CAudioSmoothWrapper::~CAudioSmoothWrapper()
+{
+    uninit();
+}
+
+int CAudioSmoothWrapper::init(int type, int sample_rate, int channel)
+{
+    m_sample_rate = sample_rate;
+    m_channel = channel;
+    m_current_iaudio = get_inst(type);
+    m_new_iaudio = get_inst(type);
+    if(!m_current_iaudio || !m_new_iaudio)
+    {
+        return AE_ERR_NO_EFFECTS;
+    }
+
+    m_new_iaudio->init(m_sample_rate, m_channel);
+    m_current_iaudio->init(m_sample_rate, m_channel);
+
+    m_update = false;
+    m_last_ms = 0;
+    m_change_status = false;
+
+    m_current_switch = false;
+    m_new_switch = false;
+    m_fade_in = false; // freshly initialized: the effect starts switched off, data is copied straight through
+
+    m_tmp_in_buf = nullptr;
+    m_tmp_out_buf = nullptr;
+    m_tmp_buf_len = 0;
+
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSmoothWrapper::uninit()
+{
+    if(nullptr != m_tmp_in_buf)
+    {
+        delete [] m_tmp_in_buf;
+        m_tmp_in_buf = nullptr;
+    }
+
+    if(nullptr != m_tmp_out_buf)
+    {
+        delete [] m_tmp_out_buf;
+        m_tmp_out_buf = nullptr;
+    }
+
+    if(nullptr != m_current_iaudio)
+    {
+        m_current_iaudio->uninit();
+        delete m_current_iaudio;
+        m_current_iaudio = nullptr;
+    }
+    if(nullptr != m_new_iaudio)
+    {
+        m_new_iaudio->uninit();
+        delete m_new_iaudio;
+        m_new_iaudio = nullptr;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+
+int CAudioSmoothWrapper::set_param(AE_PARAMS *param)
+{
+    std::lock_guard<std::mutex> lock(m_mutex);
+
+    m_new_iaudio->set_params(param);
+    m_new_iaudio->reset();
+
+    // flip the flags only after the heavy work, to keep the locked window short
+    m_update = true;
+    m_last_ms = 0;
+    m_change_status = false;
+    m_new_switch = true;
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSmoothWrapper::get_param(AE_PARAMS *param)
+{
+    m_current_iaudio->get_params(param);
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSmoothWrapper::reset()
+{
+    m_new_iaudio->reset();
+    m_current_iaudio->reset();
+    m_last_ms = 0;
+    m_fade_in = true;
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSmoothWrapper::get_latency_ms()
+{
+    return m_current_switch ? m_current_iaudio->get_latency_ms() : 0;
+}
+
+// switch this effect off
+int CAudioSmoothWrapper::close_effect()
+{
+    std::lock_guard<std::mutex> lock(m_mutex);
+    m_new_switch = false;
+    m_update = true;
+    m_last_ms = 0;
+    m_change_status = false;
+    return AE_ERR_SUCCESS;
+}
+
+// length is the total count: samples * channels
+int CAudioSmoothWrapper::process(float *in_buf, float *out_buf, int length)
+{
+    // reuse the scratch buffers across blocks
+    if (length != m_tmp_buf_len) {
+        if (nullptr != m_tmp_in_buf) {
+            delete[] m_tmp_in_buf;
+        }
+        if(nullptr != m_tmp_out_buf)
+        {
+            delete [] m_tmp_out_buf;
+        }
+        m_tmp_buf_len = length;
+        m_tmp_in_buf = new float[m_tmp_buf_len];
+        m_tmp_out_buf = new float[m_tmp_buf_len];
+    }
+
+    // after init/reset: fade in to avoid a step discontinuity
+    if(m_fade_in)
+    {
+        m_fade_in = false;
+        au_float_fade_in(in_buf, length, m_channel);
+    }
+
+    // keep a copy of the input for the incoming effect instance
+    memcpy(m_tmp_in_buf, in_buf, sizeof(float) * length);
+    if(m_current_switch)
+    {
+        m_current_iaudio->process(in_buf, out_buf, length);
+    }else if(in_buf != out_buf)
+    {
+        // effect switched off: pass the data straight through
+        memcpy(out_buf, in_buf, sizeof(float) * length);
+    }
+
+    if(m_update)
+    {
+        std::lock_guard<std::mutex> lock(m_mutex);
+        if(0 == m_last_ms)
+        {
+            au_float_fade_in(m_tmp_in_buf, length, m_channel);
+        }
+        if(m_new_switch)
+        {
+            m_new_iaudio->process(m_tmp_in_buf, m_tmp_out_buf, length);
+        }else
+        {
+            memcpy(m_tmp_out_buf, m_tmp_in_buf, sizeof(float) * length);
+        }
+
+        // once the new effect has settled, cross-fade and swap
+        int nLatency = m_new_switch ? m_new_iaudio->get_latency_ms() : 0;
+        if(m_last_ms >= nLatency)
+        {
+            au_float_fade_in(m_tmp_out_buf, length, m_channel);
+            au_float_cross_fade(m_tmp_out_buf, out_buf,out_buf,
+                    length, m_channel);
+
+            // swap the effect instances
+            IAudioEffects* tmp;
+            tmp = m_new_iaudio;
+            m_new_iaudio = m_current_iaudio;
+            m_current_iaudio = tmp;
+
+            // swap the on/off state
+            m_current_switch = m_new_switch;
+
+            // reset the bookkeeping
+            m_last_ms = 0;
+            m_update = false;
+            m_change_status = true;
+        } else {
+            m_last_ms += float(length * 1.0 / m_channel / m_sample_rate * 1000);
+        }
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioSmoothWrapper::get_change_status()
+{
+    return m_change_status;
+}
+
+int CAudioSmoothWrapper::get_effect_id()
+{
+    return m_current_iaudio->get_effectId();
+}
+
+int CAudioSmoothWrapper::get_switch_status()
+{
+    return m_current_switch;
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_smooth_wrapper/CAudioSmoothWrapper.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_smooth_wrapper/CAudioSmoothWrapper.h
new file mode 100644
index 0000000..92abb40
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_smooth_wrapper/CAudioSmoothWrapper.h
@@ -0,0 +1,57 @@
+//
+// Created by yangjianli on 2020-01-09.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CAUDIOSMOOTHWRAPPER_H
+#define AUDIO_EFFECTS_LIB_CAUDIOSMOOTHWRAPPER_H
+
+#include <mutex>
+#include "IAudioEffects.h"
+
+/**
+ * Wraps an IAudioEffects instance so that parameter changes
+ * cross-fade to a second instance and switch over smoothly,
+ * without audible glitches.
+ */
+
+class CAudioSmoothWrapper
+{
+public:
+    CAudioSmoothWrapper();
+    ~CAudioSmoothWrapper();
+
+public:
+    // type selects which effect to instantiate
+    int init(int type,int sample_rate, int channel);
+    int uninit();
+    int set_param(AE_PARAMS* param);
+    int get_param(AE_PARAMS* param);
+    int reset();
+    int get_latency_ms();
+    int process(float* in_buf, float* out_buf, int length);
+
+    // reports that the switch to the new effect is complete; the caller may only
+    // re-adjust its delay compensation after that, otherwise artifacts appear
+    int get_change_status();
+    int close_effect();     // switch this effect off
+    int get_switch_status();// whether the effect is currently on
+    int get_effect_id();    // unique effect ID
+
+private:
+    IAudioEffects* m_current_iaudio;
+    IAudioEffects* m_new_iaudio;
+
+    int m_sample_rate;
+    int m_channel;
+
+    float m_last_ms;        // time elapsed so far in the current switch-over
+    std::mutex m_mutex;     // guards the swap state
+    bool m_update;          // a switch to the new effect instance is pending
+    bool m_change_status;
+    bool m_current_switch;  // whether the effect is currently on
+    bool m_new_switch;
+    bool m_fade_in;         // fade in after reset
+
+    float* m_tmp_in_buf;
+    float* m_tmp_out_buf;
+    int m_tmp_buf_len;
+};
+#endif //AUDIO_EFFECTS_LIB_CAUDIOSMOOTHWRAPPER_H
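The swap logic is time-based: the new instance runs in parallel on a private copy of the input until it has flushed its own latency, and only then does a cross-fade hand the output over. A worked timeline, assuming blocks of 1024 frames at 44.1 kHz and a new effect reporting 30 ms latency (numbers purely illustrative):

// each process() call adds 1024 / 44100.0 * 1000 ≈ 23.2 ms to m_last_ms
// call 1: m_last_ms = 0    -> 0 < 30: run both instances, m_last_ms becomes 23.2
// call 2: m_last_ms = 23.2 -> 23.2 < 30: keep cross-running, m_last_ms becomes 46.4
// call 3: m_last_ms = 46.4 -> >= 30: fade the new output in, cross-fade the old one
//         out, swap m_new_iaudio/m_current_iaudio; get_change_status() now returns 1.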
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_tone_shift/CAudioToneShift.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_tone_shift/CAudioToneShift.cpp
new file mode 100644
index 0000000..e3dfcd0
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_tone_shift/CAudioToneShift.cpp
@@ -0,0 +1,123 @@
+//
+// Created by yangjianli on 2020-01-15.
+//
+
+#include <string.h>
+#include "CAudioToneShift.h"
+#include "tone_shift/inc/CToneShift.h"
+#include "common/simple_delay/CSimpleDelayWrapper.h"
+static CAudioToneShiftCreator gs_audio_tone_shift_creator = CAudioToneShiftCreator(AE_EFFECT_TYPE_TONE_SHIFT);
+
+CAudioToneShift::CAudioToneShift()
+{
+    m_tone_shift_api = nullptr;
+    m_need_process = false;
+    m_ae_params_tone_shift = nullptr;
+    m_simple_delay = nullptr;
+}
+
+CAudioToneShift::~CAudioToneShift()
+{
+    uninit();
+}
+
+int CAudioToneShift::init(int sample_rate, int channel)
+{
+    m_tone_shift_api = new CToneShift();
+    m_tone_shift_api->init(sample_rate, channel);
+    int samples = int(sample_rate * 1.0 / 1000 * m_tone_shift_api->get_latence());
+    m_simple_delay = new CSimpleDelayWrapper();
+    m_simple_delay->init(samples, channel);
+    m_need_process = false;
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioToneShift::uninit() {
+    if (nullptr != m_tone_shift_api)
+    {
+        m_tone_shift_api->uninit();
+        delete m_tone_shift_api;
+        m_tone_shift_api = nullptr;
+    }
+
+    if(nullptr != m_ae_params_tone_shift)
+    {
+        delete m_ae_params_tone_shift;
+        m_ae_params_tone_shift = nullptr;
+    }
+
+    if (nullptr != m_simple_delay)
+    {
+        delete m_simple_delay;
+        m_simple_delay = nullptr;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioToneShift::get_effectId()
+{
+    return AE_EFFECT_TYPE_TONE_SHIFT;
+}
+
+int CAudioToneShift::get_latency_ms()
+{
+    return m_tone_shift_api->get_latence();
+}
+
+int CAudioToneShift::reset()
+{
+    m_tone_shift_api->reset();
+    m_simple_delay->reset();
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioToneShift::set_params(AE_PARAMS *param)
+{
+    if(param != nullptr)
+    {
+        AE_PARAMS_TONE_SHIFT* tp = (AE_PARAMS_TONE_SHIFT*) param;
+        if(tp->shift_value != 0)
+        {
+            m_need_process = true;
+            m_tone_shift_api->set_shift_value(tp->shift_value);
+            if(nullptr == m_ae_params_tone_shift)
+            {
+                m_ae_params_tone_shift = new AE_PARAMS_TONE_SHIFT();
+                m_ae_params_tone_shift->max_value = MAX_TONE_SHIFT_VALUE;
+                m_ae_params_tone_shift->min_value = MIN_TONE_SHIFT_VALUE;
+            }
+            memcpy(m_ae_params_tone_shift, tp, sizeof(AE_PARAMS_TONE_SHIFT));
+        }
+        else
+        {
+            m_need_process = false;
+        }
+    }else
+    {
+        m_need_process = false;
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioToneShift::get_params(AE_PARAMS *param)
+{
+    if(nullptr != param && nullptr != m_ae_params_tone_shift)
+    {
+        memcpy(param, m_ae_params_tone_shift, sizeof(AE_PARAMS_TONE_SHIFT));
+    }
+    return AE_ERR_SUCCESS;
+}
+
+int CAudioToneShift::process(float *in_buf, float *out_buf, int length)
+{
+    if(in_buf != out_buf)
+    {
+        memcpy(out_buf, in_buf, sizeof(float) * length);
+    }
+
+    if(m_need_process)
+    {
+        return m_tone_shift_api->process(in_buf, length, out_buf, length);
+    }
+    m_simple_delay->process(in_buf, out_buf, length);
+    return AE_ERR_SUCCESS;
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_tone_shift/CAudioToneShift.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_tone_shift/CAudioToneShift.h
new file mode 100644
index 0000000..51d9229
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/audio_tone_shift/CAudioToneShift.h
@@ -0,0 +1,48 @@
+//
+// Created by yangjianli on 2020-01-15.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CAUDIOTONESHIFT_H
+#define AUDIO_EFFECTS_LIB_CAUDIOTONESHIFT_H
+
+#include "IAudioEffects.h"
+
+class CToneShift;
+class CSimpleDelayWrapper;
+class CAudioToneShift : public IAudioEffects
+{
+public:
+    CAudioToneShift();
+    ~CAudioToneShift();
+public:
+    int init(int sample_rate, int channel) override;
+    int reset() override;
+    int uninit() override;
+    int process(float* in_buf, float* out_buf, int length) override;
+    int get_latency_ms() override;
+    int set_params(AE_PARAMS* param) override;
+    int get_params(AE_PARAMS* param) override;
+    int get_effectId() override; // unique effect ID
+
+private:
+    CToneShift* m_tone_shift_api;
+    AE_PARAMS_TONE_SHIFT* m_ae_params_tone_shift;
+    CSimpleDelayWrapper* m_simple_delay;
+    bool m_need_process;
+};
+
+
+class CAudioToneShiftCreator : public ICreator
+{
+
+public:
+    CAudioToneShiftCreator(int type):ICreator(type){};
+
+public:
+    IAudioEffects* get_inst() override
+    {
+        return new CAudioToneShift();
+    };
+};
+
+#endif //AUDIO_EFFECTS_LIB_CAUDIOTONESHIFT_H
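When shift_value is 0 the pitch shifter is bypassed, but the bypassed path is still delayed by the shifter's reported latency so that toggling the shift on or off never moves the voice in time. A worked example with a 44.1 kHz stream and a hypothetical 20 ms shifter latency:

// samples = int(sample_rate / 1000.0 * latency_ms)
//         = int(44100 / 1000.0 * 20) = 882 samples per channel
// m_simple_delay->init(882, channel) then delays the bypassed path by exactly
// the amount the active pitch shifter would, so A/B toggles stay time-aligned.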
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/keep_volume_steady/CKeepVolumeSteady.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/keep_volume_steady/CKeepVolumeSteady.cpp
new file mode 100644
index 0000000..9c4f058
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/keep_volume_steady/CKeepVolumeSteady.cpp
@@ -0,0 +1,40 @@
+//
+// Created by yangjianli on 2020-02-05.
+//
+
+#include "CKeepVolumeSteady.h"
+#include "common/utils.h"
+#include "stdio.h"
+CKeepVolumeSteady::CKeepVolumeSteady()
+{
+    m_channel = 1; // default to mono so a missing init() cannot trigger bugs
+}
+
+CKeepVolumeSteady::~CKeepVolumeSteady()
+{
+
+}
+
+void CKeepVolumeSteady::init(int channel)
+{
+    m_channel = channel;
+    reset();
+}
+
+void CKeepVolumeSteady::reset()
+{
+    m_current_gain = 1.0;
+}
+
+void CKeepVolumeSteady::pre_process(float *buf, int len)
+{
+    m_before_rms = au_calc_rms(buf, len, m_channel);
+}
+
+void CKeepVolumeSteady::after_process(float *buf, int len)
+{
+    float after_rms = au_calc_rms(buf, len, m_channel);
+    float new_gain = after_rms > 0 ? m_before_rms / after_rms : 1.0;
+    au_float_gain_crossfade(m_current_gain, new_gain, buf, len, m_channel);
+    m_current_gain = new_gain;
+}
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/keep_volume_steady/CKeepVolumeSteady.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/keep_volume_steady/CKeepVolumeSteady.h
new file mode 100644
index 0000000..fc8f72c
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/keep_volume_steady/CKeepVolumeSteady.h
@@ -0,0 +1,32 @@
+//
+// Created by yangjianli on 2020-02-05.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CKEEPVOLUMESTEADY_H
+#define AUDIO_EFFECTS_LIB_CKEEPVOLUMESTEADY_H
+
+/**
+ * Keeps overall loudness steady by holding the RMS of the output
+ * equal to the RMS of the input.
+ * The approach works poorly for effects with long tails, e.g. echo.
+ */
+#include "AudioEffectsConf.h"
+class CKeepVolumeSteady {
+public:
+    CKeepVolumeSteady();
+    ~CKeepVolumeSteady();
+
+public:
+    void init(int channel);
+    void reset();
+
+    void pre_process(float* buf, int len);
+    void after_process(float* buf, int len);
+
+private:
+    int m_channel;
+    float m_current_gain;
+    float m_before_rms;
+};
+
+
+#endif //AUDIO_EFFECTS_LIB_CKEEPVOLUMESTEADY_H
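The RMS-matching above reduces to: measure input power, measure output power, scale the output so the two match, and smooth the gain between blocks to avoid zipper noise. A self-contained sketch of the same idea (not the class above; the utils crossfade is replaced by a plain linear ramp for clarity):

#include <cmath>

// RMS over channel 0 of an interleaved buffer, as the library's au_calc_rms does.
static float rms_ch0(const float* buf, int len, int channel)
{
    float acc = 0.f;
    int frames = len / channel;
    for (int i = 0; i < len; i += channel) acc += buf[i] * buf[i];
    return frames > 0 ? std::sqrt(acc / frames) : 0.f;
}

// Scale out so its RMS matches in, ramping from the previous gain.
// Returns the new gain, to be fed back in as prev_gain for the next block.
static float match_rms(const float* in, float* out, int len, int channel, float prev_gain)
{
    float before = rms_ch0(in, len, channel);
    float after  = rms_ch0(out, len, channel);
    float gain   = after > 0.f ? before / after : 1.f;
    for (int i = 0; i < len; i++)
    {
        float t = (float)i / len;                     // 0 -> 1 across the block
        out[i] *= prev_gain + (gain - prev_gain) * t; // linear gain ramp
    }
    return gain;
}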
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/simple_delay/CSimpleDelay.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/simple_delay/CSimpleDelay.cpp
new file mode 100644
index 0000000..536c5de
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/simple_delay/CSimpleDelay.cpp
@@ -0,0 +1,96 @@
+//
+// Created by yangjianli on 2020/12/11.
+//
+
+#include "CSimpleDelay.h"
+#include <string.h>
+int32_t simple_delay_next_power_2(int32_t x)
+{
+    if(x > 0)
+    {
+        x--;
+        x |= x >> 1;
+        x |= x >> 2;
+        x |= x >> 4;
+        x |= x >> 8;
+        x |= x >> 16;
+    }
+    return x + 1;
+}
+
+CSimpleDelay::CSimpleDelay()
+{
+    m_idx = 0;
+    m_mask = 0;
+    m_buffer_len = 0;
+    m_delay_len = 0;
+    m_cache = new float[1];
+    m_cache[0] = 0;
+}
+
+CSimpleDelay::~CSimpleDelay()
+{
+    m_idx = 0;
+    m_mask = 0;
+    m_buffer_len = 0;
+    m_delay_len = 0;
+
+    if(m_cache)
+    {
+        delete [] m_cache;
+        m_cache = NULL;
+    }
+}
+
+void CSimpleDelay::reset()
+{
+    if(m_cache)
+    {
+        memset(m_cache, 0, m_buffer_len * sizeof(float));
+    }
+}
+
+bool CSimpleDelay::set_delay(int delay_len)
+{
+    // delay unchanged: nothing to do
+    if(m_delay_len == delay_len)
+    {
+        return true;
+    }
+
+    if(m_buffer_len > delay_len)
+    {
+        reset();
+        m_delay_len = delay_len;
+        return true;
+    }
+
+    int len = simple_delay_next_power_2(delay_len);
+    float * buffer = new float[len];
+    memset(buffer, 0, len * sizeof(float));
+
+    if(m_cache)
+    {
+        delete [] m_cache;
+        m_cache = NULL;
+    }
+
+    m_idx = 0;
+    m_mask = len - 1;
+    m_buffer_len = len;
+    m_delay_len = delay_len;
+    m_cache = buffer;
+
+    return true;
+}
+
+void CSimpleDelay::process(float * buffer, int len)
+{
+    if(m_delay_len > 0)
+    {
+        for(int i = 0; i < len; i++)
+        {
+            buffer[i] = process(buffer[i]);
+        }
+    }
+}
diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/simple_delay/CSimpleDelay.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/simple_delay/CSimpleDelay.h
new file mode 100644
index 0000000..5a4d627
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/common/simple_delay/CSimpleDelay.h
@@ -0,0 +1,43 @@
+//
+// Created by yangjianli on 2020/12/11.
+//
+
+#ifndef AUDIO_EFFECTS_LIB_CSIMPLEDELAY_H
+#define AUDIO_EFFECTS_LIB_CSIMPLEDELAY_H
+
+#include "stdint.h"
+class CSimpleDelay
+{
+public:
+    CSimpleDelay();
+    ~CSimpleDelay();
+
+public:
+    bool set_delay(int delay_len);
+    void reset();
+    void process(float * buffer, int len);
+    inline float process(float in)
+    {
+        int idx = (m_idx + m_delay_len) & m_mask;
+
+        float out = m_cache[m_idx];
+
+        m_cache[idx] = in;
+
+        m_idx = (m_idx + 1) & m_mask;
+
+        return out;
+    }
+
+private:
+    int m_idx;
+    int m_mask;
+    int m_buffer_len;
+    int m_delay_len;
+    float * m_cache;
+};
+
+
+
+#endif //AUDIO_EFFECTS_LIB_CSIMPLEDELAY_H
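The power-of-two sizing exists so the ring-buffer wrap is a single AND instead of a modulo. A worked example with delay_len = 100 (values illustrative):

// simple_delay_next_power_2(100) = 128, so m_mask = 127
// write index: idx   = (m_idx + 100) & 127  // where the current input sample lands
// read  index: m_idx                        // 100 samples behind the write point
// advance:     m_idx = (m_idx + 1) & 127    // wraps 127 -> 0 with no branch or modulo
// next_power_2 smears the highest set bit of (x - 1) rightward with the shift/or
// cascade, producing all-ones below it (99 -> 127), then adds 1 (-> 128).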
+// + +#include "utils.h" +#include "math.h" + +void au_short_fade_in(short *buffer, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + buffer[i] = (short)(buffer[i] * i / size); + } + } + else + { + for(int i = 0; i < size; i += 2) + { + buffer[i] = (short)(buffer[i] * i / size); + buffer[i + 1] = (short)(buffer[i + 1] * i / size); + } + } +} + +void au_float_fade_in(float *buffer, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + buffer[i] = buffer[i] * i / size; + } + } + else + { + for(int i = 0; i < size; i += 2) + { + buffer[i] = buffer[i] * i / size; + buffer[i + 1] = buffer[i + 1] * i / size; + } + } +} + +void au_short_fade_out(short *buffer, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + buffer[i] = (short)(buffer[i] * (size - i) / size); + } + } + else + { + for(int i = 0; i < size; i += 2) + { + buffer[i] = (short)(buffer[i] * (size - i) / size); + buffer[i + 1] = (short)(buffer[i + 1] * (size - i) / size); + } + } +} + +void au_float_fade_out(float *buffer, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + buffer[i] = buffer[i] * (size - i) / size; + } + } + else + { + for(int i = 0; i < size; i += 2) + { + buffer[i] = buffer[i] * (size - i) / size; + buffer[i + 1] = buffer[i + 1] * (size - i) / size; + } + } +} + + + +void ShortToFloat(short * in, float * out, int num) +{ + for(int i = 0; i < num; i++) + { + out[i] = in[i] / 32768.0f; + } +} + +void au_float_cross_fade(float *fadein_buf, float *fadeout_buf, float *out, int size, int channel) +{ + if(1 == channel) + { + for(int i = 0; i < size; i++) + { + out[i] = fadein_buf[i] + fadeout_buf[i] * (size - i) / size; + } + } + else + { + for(int i = 0; i < size; i += 2) + { + out[i] = fadein_buf[i] + fadeout_buf[i] * (size - i) / size; + out[i + 1] = fadein_buf[i + 1] + fadeout_buf[i + 1] * (size - i) / size; + } + } +} + +float au_calc_rms(float *in, int len, int channel) +{ + float rms = 0; + // 只取用第一个声道数据 + for(int i=0;idst_gain增益平滑增长 +void au_float_gain_crossfade(float src_gain, float dst_gain, float *in, int size, int channel); + +#endif //AUDIO_EFFECTS_LIB_UTILS_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/manager/Manager.cpp b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/manager/Manager.cpp new file mode 100644 index 0000000..7f09124 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/manager/Manager.cpp @@ -0,0 +1,33 @@ +// +// Created by yangjianli on 2020-01-09. 
+// + +#include "Manager.h" +#include "IAudioEffects.h" +#include "map" + +// 通过这个方式保证静态变量的顺序 +// 因为不同的类属于不同的编译单元,不同的编译单元之间,其全局变量的初始化顺序不一致 +// 通过这个方式保证该变量被调用的时候,一定进行过初始化 +static std::map* get_map() +{ + static std::map ae_creator_map; + return &ae_creator_map; +} + +void registered(int type, ICreator* creator) +{ + std::map* ae_map = get_map(); + ae_map->insert(std::make_pair(type, creator)); +} + +IAudioEffects* get_inst(int type) +{ + std::map* ae_map = get_map(); + std::map::iterator it = ae_map->find(type); + if(it != ae_map->end()) + { + return it->second->get_inst(); + } + return nullptr; +} \ No newline at end of file diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/manager/Manager.h b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/manager/Manager.h new file mode 100644 index 0000000..5c40f36 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/src/manager/Manager.h @@ -0,0 +1,16 @@ +// +// Created by yangjianli on 2020-01-09. +// + +#ifndef AUDIO_EFFECTS_LIB_MANAGER_H +#define AUDIO_EFFECTS_LIB_MANAGER_H +#include "AudioEffectsConf.h" +class IAudioEffects; +class ICreator; + + +void registered(int type, ICreator* creator); + +IAudioEffects* get_inst(int type); + +#endif //AUDIO_EFFECTS_LIB_MANAGER_H diff --git a/AutoCoverTool/ref/tools/mixer/audio_effects_lib/toolchain/ios.toolchain.cmake b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/toolchain/ios.toolchain.cmake new file mode 100644 index 0000000..a56ea82 --- /dev/null +++ b/AutoCoverTool/ref/tools/mixer/audio_effects_lib/toolchain/ios.toolchain.cmake @@ -0,0 +1,429 @@ +# This file is part of the ios-cmake project. It was retrieved from +# https://github.com/cristeab/ios-cmake.git, which is a fork of +# https://code.google.com/p/ios-cmake/. Which in turn is based off of +# the Platform/Darwin.cmake and Platform/UnixPaths.cmake files which +# are included with CMake 2.8.4 +# +# The ios-cmake project is licensed under the new BSD license. +# +# Copyright (c) 2014, Bogdan Cristea and LTE Engineering Software, +# Kitware, Inc., Insight Software Consortium. All rights reserved. +# Redistribution and use in source and binary forms, with or without +# modification, are permitted provided that the following conditions +# are met: +# 1. Redistributions of source code must retain the above copyright +# notice, this list of conditions and the following disclaimer. +# +# 2. Redistributions in binary form must reproduce the above copyright +# notice, this list of conditions and the following disclaimer in the +# documentation and/or other materials provided with the distribution. +# +# 3. Neither the name of the copyright holder nor the names of its +# contributors may be used to endorse or promote products derived from +# this software without specific prior written permission. +# +# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS +# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT +# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS +# FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL THE +# COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, +# INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, +# BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; +# LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT +# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN +# ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE +# POSSIBILITY OF SUCH DAMAGE. +# +# This file is based off of the Platform/Darwin.cmake and +# Platform/UnixPaths.cmake files which are included with CMake 2.8.4 +# It has been altered for iOS development. +# +# Updated by Alex Stewart (alexs.mac@gmail.com) +# +# ***************************************************************************** +# Now maintained by Alexander Widerberg (widerbergaren [at] gmail.com) +# under the BSD-3-Clause license +# ***************************************************************************** +# +# INFORMATION / HELP +# +# The following variables control the behaviour of this toolchain: +# +# IOS_PLATFORM: OS (default) or SIMULATOR or SIMULATOR64 or TVOS or SIMULATOR_TVOS +# OS = Build for iPhoneOS. +# SIMULATOR = Build for x86 i386 iPhone Simulator. +# SIMULATOR64 = Build for x86_64 iPhone Simulator. +# TVOS = Build for AppleTVOS. +# SIMULATOR_TVOS = Build for x86_64 AppleTV Simulator. +# CMAKE_OSX_SYSROOT: Path to the iOS SDK to use. By default this is +# automatically determined from IOS_PLATFORM and xcodebuild, but +# can also be manually specified (although this should not be required). +# CMAKE_IOS_DEVELOPER_ROOT: Path to the Developer directory for the iOS platform +# being compiled for. By default this is automatically determined from +# CMAKE_OSX_SYSROOT, but can also be manually specified (although this should +# not be required). +# ENABLE_BITCODE: (1|0) Enables or disables bitcode support. Default 1 (true) +# ENABLE_ARC: (1|0) Enables or disables ARC support. Default 1 (true, ARC enabled by default) +# ENABLE_VISIBILITY: (1|0) Enables or disables symbol visibility support. Default 0 (false, visibility hidden by default) +# IOS_ARCH: (armv7 armv7s arm64 i386 x86_64) If specified, will override the default architectures for the given IOS_PLATFORM +# OS = armv7 armv7s arm64 +# SIMULATOR = i386 +# SIMULATOR64 = x86_64 +# TVOS = arm64 +# SIMULATOR_TVOS = x86_64 +# +# This toolchain defines the following variables for use externally: +# +# XCODE_VERSION: Version number (not including Build version) of Xcode detected. +# IOS_SDK_VERSION: Version of iOS SDK being used. +# CMAKE_OSX_ARCHITECTURES: Architectures being compiled for (generated from +# IOS_PLATFORM). +# +# This toolchain defines the following macros for use externally: +# +# set_xcode_property (TARGET XCODE_PROPERTY XCODE_VALUE XCODE_VARIANT) +# A convenience macro for setting xcode specific properties on targets. +# Available variants are: All, Release, RelWithDebInfo, Debug, MinSizeRel +# example: set_xcode_property (myioslib IPHONEOS_DEPLOYMENT_TARGET "3.1" "all"). +# +# find_host_package (PROGRAM ARGS) +# A macro used to find executable programs on the host system, not within the +# iOS environment. Thanks to the android-cmake project for providing the +# command. + +# Fix for PThread library not in path +set(CMAKE_THREAD_LIBS_INIT "-lpthread") +set(CMAKE_HAVE_THREADS_LIBRARY 1) +set(CMAKE_USE_WIN32_THREADS_INIT 0) +set(CMAKE_USE_PTHREADS_INIT 1) + +# Get the Xcode version being used. 
+execute_process(COMMAND xcodebuild -version
+    OUTPUT_VARIABLE XCODE_VERSION
+    ERROR_QUIET
+    OUTPUT_STRIP_TRAILING_WHITESPACE)
+string(REGEX MATCH "Xcode [0-9\\.]+" XCODE_VERSION "${XCODE_VERSION}")
+string(REGEX REPLACE "Xcode ([0-9\\.]+)" "\\1" XCODE_VERSION "${XCODE_VERSION}")
+message(STATUS "Building with Xcode version: ${XCODE_VERSION}")
+# Default to building for iPhoneOS if not specified otherwise, and we cannot
+# determine the platform from the CMAKE_OSX_ARCHITECTURES variable. The use
+# of CMAKE_OSX_ARCHITECTURES is such that try_compile() projects can correctly
+# determine the value of IOS_PLATFORM from the root project, as
+# CMAKE_OSX_ARCHITECTURES is propagated to them by CMake.
+if (NOT DEFINED IOS_PLATFORM)
+    if (CMAKE_OSX_ARCHITECTURES)
+        if (CMAKE_OSX_ARCHITECTURES MATCHES ".*arm.*")
+            set(IOS_PLATFORM "OS")
+        elseif (CMAKE_OSX_ARCHITECTURES MATCHES "i386")
+            set(IOS_PLATFORM "SIMULATOR")
+        elseif (CMAKE_OSX_ARCHITECTURES MATCHES "x86_64")
+            set(IOS_PLATFORM "SIMULATOR64")
+        endif()
+    endif()
+    if (NOT IOS_PLATFORM)
+        set(IOS_PLATFORM "OS")
+    endif()
+endif()
+set(IOS_PLATFORM ${IOS_PLATFORM} CACHE STRING
+    "Type of iOS platform for which to build.")
+# Determine the platform name and architectures for use in xcodebuild commands
+# from the specified IOS_PLATFORM name.
+if (IOS_PLATFORM STREQUAL "OS")
+    set(XCODE_IOS_PLATFORM iphoneos)
+    if(NOT IOS_ARCH)
+        set(IOS_ARCH armv7 armv7s arm64)
+    endif()
+elseif (IOS_PLATFORM STREQUAL "SIMULATOR")
+    set(XCODE_IOS_PLATFORM iphonesimulator)
+    if(NOT IOS_ARCH)
+        set(IOS_ARCH i386)
+    endif()
+elseif(IOS_PLATFORM STREQUAL "SIMULATOR64")
+    set(XCODE_IOS_PLATFORM iphonesimulator)
+    if(NOT IOS_ARCH)
+        set(IOS_ARCH x86_64)
+    endif()
+elseif (IOS_PLATFORM STREQUAL "TVOS")
+    set(XCODE_IOS_PLATFORM appletvos)
+    if(NOT IOS_ARCH)
+        set(IOS_ARCH arm64)
+    endif()
+elseif (IOS_PLATFORM STREQUAL "SIMULATOR_TVOS")
+    set(XCODE_IOS_PLATFORM appletvsimulator)
+    if(NOT IOS_ARCH)
+        set(IOS_ARCH x86_64)
+    endif()
+else()
+    message(FATAL_ERROR "Invalid IOS_PLATFORM: ${IOS_PLATFORM}")
+endif()
+message(STATUS "Configuring iOS build for platform: ${IOS_PLATFORM}, "
+    "architecture(s): ${IOS_ARCH}")
+# If user did not specify the SDK root to use, then query xcodebuild for it.
+if (NOT CMAKE_OSX_SYSROOT)
+    execute_process(COMMAND xcodebuild -version -sdk ${XCODE_IOS_PLATFORM} Path
+        OUTPUT_VARIABLE CMAKE_OSX_SYSROOT
+        ERROR_QUIET
+        OUTPUT_STRIP_TRAILING_WHITESPACE)
+    message(STATUS "Using SDK: ${CMAKE_OSX_SYSROOT} for platform: ${IOS_PLATFORM}")
+endif()
+if (NOT EXISTS ${CMAKE_OSX_SYSROOT})
+    message(FATAL_ERROR "Invalid CMAKE_OSX_SYSROOT: ${CMAKE_OSX_SYSROOT} "
+        "does not exist.")
+endif()
+# Specify minimum version of deployment target.
+if (NOT DEFINED IOS_DEPLOYMENT_TARGET)
+    # Unless specified, SDK version 8.0 is used by default as minimum target version.
+    set(IOS_DEPLOYMENT_TARGET "8.0"
+        CACHE STRING "Minimum iOS version to build for." )
+    message(STATUS "Using the default min-version since IOS_DEPLOYMENT_TARGET not provided!")
+endif()
+# Use bitcode or not
+if (NOT DEFINED ENABLE_BITCODE AND NOT IOS_ARCH MATCHES "((^|, )(i386|x86_64))+")
+    # Unless specified, enable bitcode support by default
+    set(ENABLE_BITCODE TRUE CACHE BOOL "Whether or not to enable bitcode")
+    message(STATUS "Enabling bitcode support by default. ENABLE_BITCODE not provided!")
+endif()
+if (NOT DEFINED ENABLE_BITCODE)
+    message(STATUS "Disabling bitcode support by default on simulators. ENABLE_BITCODE not provided for override!")
ENABLE_BITCODE not provided for override!") +endif() +# Use ARC or not +if (NOT DEFINED ENABLE_ARC) + # Unless specified, enable ARC support by default + set(ENABLE_ARC TRUE CACHE BOOL "Whether or not to enable ARC") + message(STATUS "Enabling ARC support by default. ENABLE_ARC not provided!") +endif() +# Use hidden visibility or not +if (NOT DEFINED ENABLE_VISIBILITY) + # Unless specified, disable symbols visibility by default + set(ENABLE_VISIBILITY FALSE CACHE BOOL "Whether or not to hide symbols (-fvisibility=hidden)") + message(STATUS "Hiding symbols visibility by default. ENABLE_VISIBILITY not provided!") +endif() +# Get the SDK version information. +execute_process(COMMAND xcodebuild -sdk ${CMAKE_OSX_SYSROOT} -version SDKVersion + OUTPUT_VARIABLE IOS_SDK_VERSION + ERROR_QUIET + OUTPUT_STRIP_TRAILING_WHITESPACE) +# Find the Developer root for the specific iOS platform being compiled for +# from CMAKE_OSX_SYSROOT. Should be ../../ from SDK specified in +# CMAKE_OSX_SYSROOT. There does not appear to be a direct way to obtain +# this information from xcrun or xcodebuild. +if (NOT CMAKE_IOS_DEVELOPER_ROOT) + get_filename_component(IOS_PLATFORM_SDK_DIR ${CMAKE_OSX_SYSROOT} PATH) + get_filename_component(CMAKE_IOS_DEVELOPER_ROOT ${IOS_PLATFORM_SDK_DIR} PATH) +endif() +if (NOT EXISTS ${CMAKE_IOS_DEVELOPER_ROOT}) + message(FATAL_ERROR "Invalid CMAKE_IOS_DEVELOPER_ROOT: " + "${CMAKE_IOS_DEVELOPER_ROOT} does not exist.") +endif() +# Find the C & C++ compilers for the specified SDK. +if (NOT CMAKE_C_COMPILER) + execute_process(COMMAND xcrun -sdk ${CMAKE_OSX_SYSROOT} -find clang + OUTPUT_VARIABLE CMAKE_C_COMPILER + ERROR_QUIET + OUTPUT_STRIP_TRAILING_WHITESPACE) + message(STATUS "Using C compiler: ${CMAKE_C_COMPILER}") +endif() +if (NOT CMAKE_CXX_COMPILER) + execute_process(COMMAND xcrun -sdk ${CMAKE_OSX_SYSROOT} -find clang++ + OUTPUT_VARIABLE CMAKE_CXX_COMPILER + ERROR_QUIET + OUTPUT_STRIP_TRAILING_WHITESPACE) + message(STATUS "Using CXX compiler: ${CMAKE_CXX_COMPILER}") +endif() +# Find (Apple's) libtool. +execute_process(COMMAND xcrun -sdk ${CMAKE_OSX_SYSROOT} -find libtool + OUTPUT_VARIABLE IOS_LIBTOOL + ERROR_QUIET + OUTPUT_STRIP_TRAILING_WHITESPACE) +message(STATUS "Using libtool: ${IOS_LIBTOOL}") +# Configure libtool to be used instead of ar + ranlib to build static libraries. +# This is required on Xcode 7+, but should also work on previous versions of +# Xcode. +set(CMAKE_C_CREATE_STATIC_LIBRARY + "${IOS_LIBTOOL} -static -o ") +set(CMAKE_CXX_CREATE_STATIC_LIBRARY + "${IOS_LIBTOOL} -static -o ") +# Get the version of Darwin (OS X) of the host. +execute_process(COMMAND uname -r + OUTPUT_VARIABLE CMAKE_HOST_SYSTEM_VERSION + ERROR_QUIET + OUTPUT_STRIP_TRAILING_WHITESPACE) +# Standard settings. +set(CMAKE_SYSTEM_NAME Darwin CACHE INTERNAL "") +set(CMAKE_SYSTEM_VERSION ${IOS_SDK_VERSION} CACHE INTERNAL "") +set(UNIX TRUE CACHE BOOL "") +set(APPLE TRUE CACHE BOOL "") +set(IOS TRUE CACHE BOOL "") +set(CMAKE_AR ar CACHE FILEPATH "" FORCE) +set(CMAKE_RANLIB ranlib CACHE FILEPATH "" FORCE) +# Force unset of OS X-specific deployment target (otherwise autopopulated), +# required as of cmake 2.8.10. +set(CMAKE_OSX_DEPLOYMENT_TARGET "" CACHE STRING + "Must be empty for iOS builds." FORCE) +# Set the architectures for which to build. +set(CMAKE_OSX_ARCHITECTURES ${IOS_ARCH} CACHE STRING "Build architecture for iOS") +# Skip the platform compiler checks for cross compiling. 
+set(CMAKE_CXX_COMPILER_FORCED TRUE)
+set(CMAKE_CXX_COMPILER_WORKS TRUE)
+set(CMAKE_C_COMPILER_FORCED TRUE)
+set(CMAKE_C_COMPILER_WORKS TRUE)
+# All iOS/Darwin specific settings - some may be redundant.
+set(CMAKE_SHARED_LIBRARY_PREFIX "lib")
+set(CMAKE_SHARED_LIBRARY_SUFFIX ".dylib")
+set(CMAKE_SHARED_MODULE_PREFIX "lib")
+set(CMAKE_SHARED_MODULE_SUFFIX ".so")
+set(CMAKE_C_COMPILER_ABI ELF)
+set(CMAKE_CXX_COMPILER_ABI ELF)
+set(CMAKE_C_HAS_ISYSROOT 1)
+set(CMAKE_CXX_HAS_ISYSROOT 1)
+set(CMAKE_MODULE_EXISTS 1)
+set(CMAKE_DL_LIBS "")
+set(CMAKE_C_OSX_COMPATIBILITY_VERSION_FLAG "-compatibility_version ")
+set(CMAKE_C_OSX_CURRENT_VERSION_FLAG "-current_version ")
+set(CMAKE_CXX_OSX_COMPATIBILITY_VERSION_FLAG "${CMAKE_C_OSX_COMPATIBILITY_VERSION_FLAG}")
+set(CMAKE_CXX_OSX_CURRENT_VERSION_FLAG "${CMAKE_C_OSX_CURRENT_VERSION_FLAG}")
+
+if(IOS_ARCH MATCHES "((^|, )(arm64|x86_64))+")
+    set(CMAKE_C_SIZEOF_DATA_PTR 8)
+    set(CMAKE_CXX_SIZEOF_DATA_PTR 8)
+    message(STATUS "Using a data_ptr size of 8")
+else()
+    set(CMAKE_C_SIZEOF_DATA_PTR 4)
+    set(CMAKE_CXX_SIZEOF_DATA_PTR 4)
+    message(STATUS "Using a data_ptr size of 4")
+endif()
+
+message(STATUS "Building for minimum iOS version: ${IOS_DEPLOYMENT_TARGET}"
+    " (SDK version: ${IOS_SDK_VERSION})")
+# Note that only Xcode 7+ supports the newer more specific:
+# -m${XCODE_IOS_PLATFORM}-version-min flags, older versions of Xcode use:
+# -m(ios/ios-simulator)-version-min instead.
+if (IOS_PLATFORM STREQUAL "OS")
+    if (XCODE_VERSION VERSION_LESS 7.0)
+        set(XCODE_IOS_PLATFORM_VERSION_FLAGS
+            "-mios-version-min=${IOS_DEPLOYMENT_TARGET}")
+    else()
+        # Xcode 7.0+ uses flags we can build directly from XCODE_IOS_PLATFORM.
+        set(XCODE_IOS_PLATFORM_VERSION_FLAGS
+            "-m${XCODE_IOS_PLATFORM}-version-min=${IOS_DEPLOYMENT_TARGET}")
+    endif()
+elseif (IOS_PLATFORM STREQUAL "TVOS")
+    set(XCODE_IOS_PLATFORM_VERSION_FLAGS
+        "-mtvos-version-min=${IOS_DEPLOYMENT_TARGET}")
+elseif (IOS_PLATFORM STREQUAL "SIMULATOR_TVOS")
+    set(XCODE_IOS_PLATFORM_VERSION_FLAGS
+        "-mtvos-simulator-version-min=${IOS_DEPLOYMENT_TARGET}")
+else()
+    # SIMULATOR or SIMULATOR64 both use -mios-simulator-version-min.
+    set(XCODE_IOS_PLATFORM_VERSION_FLAGS
+        "-mios-simulator-version-min=${IOS_DEPLOYMENT_TARGET}")
+endif()
+message(STATUS "Version flags set to: ${XCODE_IOS_PLATFORM_VERSION_FLAGS}")
+
+if (ENABLE_BITCODE)
+    set(BITCODE "-fembed-bitcode")
+    set(HEADER_PAD "")
+    message(STATUS "Enabling bitcode support.")
+else()
+    set(BITCODE "")
+    set(HEADER_PAD "-headerpad_max_install_names")
+    message(STATUS "Disabling bitcode support.")
+endif()
+
+if (ENABLE_ARC)
+    set(FOBJC_ARC "-fobjc-arc")
+    message(STATUS "Enabling ARC support.")
+else()
+    set(FOBJC_ARC "-fno-objc-arc")
+    message(STATUS "Disabling ARC support.")
+endif()
+
+if (NOT ENABLE_VISIBILITY)
+    set(VISIBILITY "-fvisibility=hidden")
+    message(STATUS "Hiding symbols (-fvisibility=hidden).")
+else()
+    set(VISIBILITY "")
+endif()
+
+set(CMAKE_C_FLAGS
+    "${XCODE_IOS_PLATFORM_VERSION_FLAGS} ${BITCODE} -fobjc-abi-version=2 ${FOBJC_ARC} ${C_FLAGS}")
+# Hidden visibility is required for C++ on iOS.
+set(CMAKE_CXX_FLAGS
+    "${XCODE_IOS_PLATFORM_VERSION_FLAGS} ${BITCODE} ${VISIBILITY} -fvisibility-inlines-hidden -fobjc-abi-version=2 ${FOBJC_ARC} ${CXX_FLAGS}")
+set(CMAKE_CXX_FLAGS_MINSIZEREL "${CMAKE_CXX_FLAGS} -DNDEBUG -Os -fomit-frame-pointer -ffast-math ${BITCODE} ${CXX_FLAGS_MINSIZEREL}")
+set(CMAKE_CXX_FLAGS_RELWITHDEBINFO "${CMAKE_CXX_FLAGS} -DNDEBUG -O2 -g -fomit-frame-pointer -ffast-math ${BITCODE} ${CXX_FLAGS_RELWITHDEBINFO}")
+set(CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS} -DNDEBUG -O3 -fomit-frame-pointer -ffast-math ${BITCODE} ${CXX_FLAGS_RELEASE}")
+set(CMAKE_C_LINK_FLAGS "${XCODE_IOS_PLATFORM_VERSION_FLAGS} -Wl,-search_paths_first ${C_LINK_FLAGS}")
+set(CMAKE_CXX_LINK_FLAGS "${XCODE_IOS_PLATFORM_VERSION_FLAGS} -Wl,-search_paths_first ${CXX_LINK_FLAGS}")
+
+# In order to ensure that the updated compiler flags are used in try_compile()
+# tests, we have to forcibly set them in the CMake cache, not merely set them
+# in the local scope.
+list(APPEND VARS_TO_FORCE_IN_CACHE
+    CMAKE_C_FLAGS
+    CMAKE_CXX_FLAGS
+    CMAKE_CXX_FLAGS_RELWITHDEBINFO
+    CMAKE_CXX_FLAGS_MINSIZEREL
+    CMAKE_CXX_FLAGS_RELEASE
+    CMAKE_C_LINK_FLAGS
+    CMAKE_CXX_LINK_FLAGS)
+foreach(VAR_TO_FORCE ${VARS_TO_FORCE_IN_CACHE})
+    set(${VAR_TO_FORCE} "${${VAR_TO_FORCE}}" CACHE STRING "" FORCE)
+endforeach()
+
+set(CMAKE_PLATFORM_HAS_INSTALLNAME 1)
+set (CMAKE_SHARED_LINKER_FLAGS "-rpath @executable_path/Frameworks -rpath @loader_path/Frameworks")
+set(CMAKE_SHARED_LIBRARY_CREATE_C_FLAGS "-dynamiclib ${HEADER_PAD}")
+set(CMAKE_SHARED_MODULE_CREATE_C_FLAGS "-bundle ${HEADER_PAD}")
+set(CMAKE_SHARED_MODULE_LOADER_C_FLAG "-Wl,-bundle_loader,")
+set(CMAKE_SHARED_MODULE_LOADER_CXX_FLAG "-Wl,-bundle_loader,")
+set(CMAKE_FIND_LIBRARY_SUFFIXES ".dylib" ".so" ".a")
+
+# Hack: if a new cmake (which uses CMAKE_INSTALL_NAME_TOOL) runs on an old
+# build tree (where install_name_tool was hardcoded) and where
+# CMAKE_INSTALL_NAME_TOOL isn't in the cache and still cmake didn't fail in
+# CMakeFindBinUtils.cmake (because it isn't rerun) hardcode
+# CMAKE_INSTALL_NAME_TOOL here to install_name_tool, so it behaves as it did
+# before, Alex.
+if (NOT DEFINED CMAKE_INSTALL_NAME_TOOL)
+    find_program(CMAKE_INSTALL_NAME_TOOL install_name_tool)
+endif (NOT DEFINED CMAKE_INSTALL_NAME_TOOL)
+
+# Set the find root to the iOS developer roots and to user defined paths.
+set(CMAKE_FIND_ROOT_PATH ${CMAKE_IOS_DEVELOPER_ROOT} ${CMAKE_OSX_SYSROOT}
+    ${CMAKE_PREFIX_PATH} CACHE string "iOS find search path root" FORCE)
+# Default to searching for frameworks first.
+set(CMAKE_FIND_FRAMEWORK FIRST)
+# Set up the default search directories for frameworks.
+set(CMAKE_SYSTEM_FRAMEWORK_PATH
+    ${CMAKE_OSX_SYSROOT}/System/Library/Frameworks
+    ${CMAKE_OSX_SYSROOT}/System/Library/PrivateFrameworks
+    ${CMAKE_OSX_SYSROOT}/Developer/Library/Frameworks)
+# Only search the specified iOS SDK, not the remainder of the host filesystem.
+set(CMAKE_FIND_ROOT_PATH_MODE_PROGRAM ONLY)
+set(CMAKE_FIND_ROOT_PATH_MODE_LIBRARY ONLY)
+set(CMAKE_FIND_ROOT_PATH_MODE_INCLUDE ONLY)
+# This little macro lets you set any Xcode specific property.
+macro(set_xcode_property TARGET XCODE_PROPERTY XCODE_VALUE XCODE_RELVERSION)
+    set(XCODE_RELVERSION_I "${XCODE_RELVERSION}")
+    if (XCODE_RELVERSION_I STREQUAL "All")
+        set_property(TARGET ${TARGET} PROPERTY
+            XCODE_ATTRIBUTE_${XCODE_PROPERTY} "${XCODE_VALUE}")
+    else()
+        set_property(TARGET ${TARGET} PROPERTY
+            XCODE_ATTRIBUTE_${XCODE_PROPERTY}[variant=${XCODE_RELVERSION_I}] "${XCODE_VALUE}")
+    endif()
+endmacro(set_xcode_property)
+# This macro lets you find executable programs on the host system.
+macro(find_host_package)
+    set(CMAKE_FIND_ROOT_PATH_MODE_PROGRAM NEVER)
+    set(CMAKE_FIND_ROOT_PATH_MODE_LIBRARY NEVER)
+    set(CMAKE_FIND_ROOT_PATH_MODE_INCLUDE NEVER)
+    set(IOS FALSE)
+    find_package(${ARGN})
+    set(IOS TRUE)
+    set(CMAKE_FIND_ROOT_PATH_MODE_PROGRAM ONLY)
+    set(CMAKE_FIND_ROOT_PATH_MODE_LIBRARY ONLY)
+    set(CMAKE_FIND_ROOT_PATH_MODE_INCLUDE ONLY)
+endmacro(find_host_package)
diff --git a/AutoCoverTool/ref/tools/mixer/audio_mixer/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/audio_mixer/CMakeLists.txt
new file mode 100644
index 0000000..22884c4
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_mixer/CMakeLists.txt
@@ -0,0 +1,3 @@
+include_directories(inc)
+AUX_SOURCE_DIRECTORY(src DIR_AUDIO_MIXER_SRCS)
+add_library(audio_mixer ${DIR_AUDIO_MIXER_SRCS})
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/audio_mixer/inc/AudioMixer.h b/AutoCoverTool/ref/tools/mixer/audio_mixer/inc/AudioMixer.h
new file mode 100644
index 0000000..57d24fc
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_mixer/inc/AudioMixer.h
@@ -0,0 +1,78 @@
+
+#ifndef __CAUDIO_MIXER_H__
+#define __CAUDIO_MIXER_H__
+
+#define AUMIX_VOLUME_MAX (DEFAULT_VOLUME * 2 * 10)
+#define AUMIX_VOLUME_MIN 0
+#define AUMIX_VOLUME_NO_CHANGE DEFAULT_VOLUME
+
+#define AUMIX_FLT_MIN -1
+#define AUMIX_FLT_MAX 0.99996f
+#define AUMIX_LIMIT_HIGH 0.91556f
+#define AUMIX_LIMIT_LOW -0.91556f
+
+#include "alimiter.h"
+
+class CFastDelay
+{
+public:
+    CFastDelay();
+    ~CFastDelay();
+
+public:
+    bool set_delay(int delay_len);
+    void reset();
+    void process(float * buffer, int len);
+    inline float process(float in)
+    {
+        int idx = (m_idx + m_delay_len) & m_mask;
+
+        m_cache[idx] = in;
+
+        float out = m_cache[m_idx];
+
+        m_idx = (m_idx + 1) & m_mask;
+
+        return out;
+    }
+
+private:
+    int m_idx;
+    int m_mask;
+    int m_buffer_len;
+    int m_delay_len;
+    float * m_cache;
+};
+
+class CAudioMixer
+{
+public:
+    CAudioMixer();
+    ~CAudioMixer();
+
+public:
+    bool init(int fs, int nChannels);
+    int get_latency();
+    void process(float * vocal, float * acc, float * out, int len);
+    int set_acc_delay(int delay_len);
+    void set_vocal_volume(int volume);
+    void set_acc_volume(int volume);
+    void reset();
+    void uninit();
+
+private:
+    void quick_agc(float * buffer, int len, float * max);
+
+private:
+    int m_nChannels;
+    int m_vocal_volume;
+    int m_acc_volume;
+    float m_factor_last[2];
+    int m_current_acc_delay_len;
+    int m_new_acc_delay_len;
+    CFastDelay * m_acc_delay;
+    SUPERSOUND::Alimiter* m_alimiter;
+
+};
+
+#endif // !__CAUDIO_MIXER_H__
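For orientation: the volume parameters in this header are plain integers where DEFAULT_VOLUME (50) means unity gain, since CAudioMixer::process divides the volume by AUMIX_VOLUME_NO_CHANGE. A minimal standalone sketch of that mapping (illustration only, not part of the library):

#include <algorithm>
#include <cstdio>

static float volume_to_gain(int volume)
{
    const int kDefaultVolume = 50;  // AUMIX_VOLUME_NO_CHANGE
    // clamp to [AUMIX_VOLUME_MIN, AUMIX_VOLUME_MAX] = [0, 1000], i.e. up to 20x gain
    volume = std::max(0, std::min(volume, kDefaultVolume * 2 * 10));
    return volume / (float)kDefaultVolume;  // same formula as CAudioMixer::process
}

int main()
{
    std::printf("%.2f %.2f %.2f\n",
                volume_to_gain(25),    // 0.50 -> roughly -6 dB
                volume_to_gain(50),    // 1.00 -> unchanged
                volume_to_gain(100));  // 2.00 -> roughly +6 dB
    return 0;
}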
diff --git a/AutoCoverTool/ref/tools/mixer/audio_mixer/inc/common.h b/AutoCoverTool/ref/tools/mixer/audio_mixer/inc/common.h
new file mode 100644
index 0000000..2a16ec3
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_mixer/inc/common.h
@@ -0,0 +1,149 @@
+//
+// Created by 杨将 on 2017/6/27.
+//
+
+#ifndef __COMMON_H__
+#define __COMMON_H__
+
+//#include
+#include <stdio.h>   // bracketed header names were lost in extraction;
+#include <stdlib.h>  // the standard stdio/stdlib headers are assumed here
+//#include
+
+#ifdef ST_DEBUG
+#include <assert.h>
+#define ASSERT(e) assert(e)
+#else
+#define ASSERT(e)
+#endif
+
+
+// Commonly used macros and constants
+
+// Length (ms) of the ring buffers used for recording, playback and decoding
+#define RECORDER_CIRCLE_BUFFER_TIME ((int)200)
+
+// Default sample rate of vocal data written to file
+#define FILE_VOCAL_SAMPLERATE ((int)44100)
+
+// Seeks closer than this need not actually be performed
+#define SEEK_NO_OPRATE (1.01)
+
+// Base length for file reads
+#define FILE_OPERATE_LEN ((int)2048)
+// Maximum fade length applied inside a vocal file
+#define FILE_FADE_LEN ((int)240)
+// Maximum number of channels; this value must not be changed (channels may still be 1)
+#define MAX_CHANNEL ((int)2)
+
+// Midpoint of the low-level volume scale
+#define DEFAULT_VOLUME ((int)50)
+
+// Baseline loudness for the accompaniment (dB)
+#define DEFAULT_BASELINE_DB ((float)-14.57f)
+
+// Safely close a file
+#ifndef SAFE_CLOSE_FILE
+#define SAFE_CLOSE_FILE(file) \
+{ \
+    if(file) \
+    { \
+        fclose(file); \
+        file = NULL; \
+    } \
+}
+#endif //SAFE_CLOSE_FILE
+
+// Safely free memory
+#ifndef SAFE_FREE
+#define SAFE_FREE(ptr) \
+{ \
+    if(ptr) \
+    { \
+        free(ptr); \
+        ptr = NULL; \
+    } \
+}
+#endif //SAFE_FREE
+
+// Safely delete an object
+#ifndef SAFE_DELETE_OBJ
+#define SAFE_DELETE_OBJ(obj) \
+{ \
+    if(obj) \
+    { \
+        delete obj; \
+        obj = NULL; \
+    } \
+}
+#endif //SAFE_DELETE_OBJ
+
+// Safely uninitialize and delete an object
+#ifndef SAFE_UNINIT_DELETE_OBJ
+#define SAFE_UNINIT_DELETE_OBJ(obj) \
+{ \
+    if(obj) \
+    { \
+        obj->uninit(); \
+        delete obj; \
+        obj = NULL; \
+    } \
+}
+#endif //SAFE_UNINIT_DELETE_OBJ
+
+// Safely close and delete an object
+#ifndef SAFE_CLOSE_DELETE_OBJ
+#define SAFE_CLOSE_DELETE_OBJ(obj) \
+{ \
+    if(obj) \
+    { \
+        obj->close(); \
+        delete obj; \
+        obj = NULL; \
+    } \
+}
+#endif //SAFE_CLOSE_DELETE_OBJ
+
+// Safely delete an array
+#ifndef SAFE_DELETE_ARRAY
+#define SAFE_DELETE_ARRAY(array) \
+{ \
+    if(array) \
+    { \
+        delete [] array; \
+        array = NULL; \
+    } \
+}
+#endif //SAFE_DELETE_ARRAY
+
+// Maximum of two values
+#ifndef GLOBAL_MAX
+#define GLOBAL_MAX(a, b) (((a) > (b)) ? (a) : (b))
+#endif
+
+// Minimum of two values
+#ifndef GLOBAL_MIN
+#define GLOBAL_MIN(a,b) (((a) < (b)) ? (a) : (b))
+#endif
+
+// Middle value (clamp)
+#ifndef GLOBAL_MID
+#define GLOBAL_MID(a, b, c) (GLOBAL_MAX(a, GLOBAL_MIN(b, c)))
+#endif
+
+// Absolute value
+#ifndef GLOBAL_ABS
+#define GLOBAL_ABS(a) ((a) < 0 ? (-(a)) : (a))
+#endif
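Two of these helpers merit a quick illustration: the SAFE_* macros null the pointer after releasing it, so an accidental second release becomes a no-op, and GLOBAL_MID(a, b, c) clamps b into the range [a, c]. A hypothetical standalone sketch (not part of the repo):

#include <cstdlib>

#define GLOBAL_MAX(a, b) (((a) > (b)) ? (a) : (b))
#define GLOBAL_MIN(a, b) (((a) < (b)) ? (a) : (b))
#define GLOBAL_MID(a, b, c) (GLOBAL_MAX(a, GLOBAL_MIN(b, c)))

int main()
{
    // GLOBAL_MID(lo, x, hi): clamp x into [lo, hi]
    int v = GLOBAL_MID(0, 1200, 1000);  // -> 1000, an AUMIX_VOLUME_MAX-style clamp
    (void)v;

    // SAFE_FREE(p) expands to: if(p) { free(p); p = NULL; }
    float* p = (float*)malloc(16 * sizeof(float));
    if (p) { free(p); p = NULL; }  // releases and nulls the pointer
    if (p) { free(p); p = NULL; }  // second pass is a harmless no-op
    return 0;
}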
+
+
+#ifndef CHECK_FLOAT_EQUAL
+#define CHECK_FLOAT_EQUAL(a, b) (fabs(a - b) < 0.001f)
+#endif
+
+
+//extern GlobParam gGlobparm;
+
+#define TYPE_PLAY_ORIGIN 1
+#define TYPE_PLAY_CORRECTION 2
+
+#endif //__COMMON_H__
diff --git a/AutoCoverTool/ref/tools/mixer/audio_mixer/src/AudioMixer.cpp b/AutoCoverTool/ref/tools/mixer/audio_mixer/src/AudioMixer.cpp
new file mode 100644
index 0000000..808f0fa
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/audio_mixer/src/AudioMixer.cpp
@@ -0,0 +1,318 @@
+
+#include <stdio.h>   // bracketed header names were lost in extraction;
+#include <stdlib.h>  // the standard C headers below are assumed
+#include <string.h>  // memset
+#include <math.h>    // fabs
+#include <new>       // std::nothrow
+#include "AudioMixer.h"
+#include "common.h"
+#include "alimiter.h"
+
+int32_t supersound_next_power_2(int32_t x)
+{
+    if(x > 0)
+    {
+        x--;
+        x |= x >> 1;
+        x |= x >> 2;
+        x |= x >> 4;
+        x |= x >> 8;
+        x |= x >> 16;
+    }
+    return x + 1;
+}
+
+CFastDelay::CFastDelay()
+{
+    m_idx = 0;
+    m_mask = 0;
+    m_buffer_len = 0;
+    m_delay_len = 0;
+    m_cache = new float[1];
+    m_cache[0] = 0;
+}
+
+CFastDelay::~CFastDelay()
+{
+    m_idx = 0;
+    m_mask = 0;
+    m_buffer_len = 0;
+    m_delay_len = 0;
+
+    if(m_cache)
+    {
+        delete [] m_cache;
+        m_cache = NULL;
+    }
+}
+
+void CFastDelay::reset()
+{
+    if(m_cache)
+    {
+        memset(m_cache, 0, m_buffer_len * sizeof(float));
+    }
+}
+
+bool CFastDelay::set_delay(int delay_len)
+{
+    // Nothing to do if the delay length is unchanged
+    if(m_delay_len == delay_len)
+    {
+        return true;
+    }
+
+    if(m_buffer_len > delay_len)
+    {
+        reset();
+        m_delay_len = delay_len;
+        return true;
+    }
+
+    // +1 so a power-of-two delay_len still gets a strictly larger buffer;
+    // with m_buffer_len == delay_len, (m_idx + m_delay_len) & m_mask would
+    // wrap back onto m_idx and the delay would silently become zero.
+    int len = supersound_next_power_2(delay_len + 1);
+    float * buffer = new float[len];
+    memset(buffer, 0, len * sizeof(float));
+
+    if(m_cache)
+    {
+        delete [] m_cache;
+        m_cache = NULL;
+    }
+
+    m_idx = 0;
+    m_mask = len - 1;
+    m_buffer_len = len;
+    m_delay_len = delay_len;
+    m_cache = buffer;
+
+    return true;
+}
+
+void CFastDelay::process(float * buffer, int len)
+{
+    if(m_delay_len > 0)
+    {
+        for(int i = 0; i < len; i++)
+        {
+            buffer[i] = process(buffer[i]);
+        }
+    }
+}
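Aside: CFastDelay rounds its capacity up to a power of two so the ring-buffer wrap is a single AND with (capacity - 1) instead of a modulo. A standalone sketch of the same trick (illustration only, not repo code):

#include <cstdio>

int main()
{
    const int delay = 3;
    const int cap = 8;            // a power of two larger than the delay
    const int mask = cap - 1;
    float cache[cap] = {0};
    int idx = 0;

    for (int n = 1; n <= 6; n++)  // feed samples 1..6
    {
        cache[(idx + delay) & mask] = (float)n;  // write "delay" slots ahead
        float out = cache[idx];                  // read what was written delay steps ago
        idx = (idx + 1) & mask;                  // wrap via AND, not modulo
        std::printf("in=%d out=%g\n", n, out);   // out lags in by 3 samples
    }
    return 0;
}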
+CAudioMixer::CAudioMixer()
+{
+    m_vocal_volume = AUMIX_VOLUME_NO_CHANGE;
+    m_acc_volume = AUMIX_VOLUME_NO_CHANGE;
+    m_factor_last[0] = 1;
+    m_factor_last[1] = 1;
+
+    m_current_acc_delay_len = 0;
+    m_new_acc_delay_len = 0;
+    m_acc_delay = NULL;
+}
+
+CAudioMixer::~CAudioMixer()
+{
+    uninit();
+}
+
+bool CAudioMixer::init(int fs, int nChannels)
+{
+    if ((nChannels != 2) && (nChannels != 1))
+    {
+        return false;
+    }
+
+    m_nChannels = nChannels;
+
+    m_acc_delay = new(std::nothrow) CFastDelay();
+    if(NULL == m_acc_delay)
+    {
+        return false;
+    }
+    m_alimiter = new(std::nothrow) SUPERSOUND::Alimiter();
+    if(NULL == m_alimiter)
+    {
+        return false;
+    }
+    m_alimiter->SetParam(fs, nChannels);
+    return true;
+}
+
+int CAudioMixer::get_latency()
+{
+    return 0;
+}
+
+void CAudioMixer::reset()
+{
+    m_factor_last[0] = 1;
+    m_factor_last[1] = 1;
+
+    if(m_acc_delay)
+    {
+        m_acc_delay->reset();
+    }
+
+//    if(m_alimiter)
+//    {
+//        m_alimiter->Flush();
+//    }
+}
+
+int CAudioMixer::set_acc_delay(int delay_len)
+{
+    if(m_new_acc_delay_len != delay_len)
+    {
+        m_new_acc_delay_len = delay_len;
+    }
+
+    return 0;
+}
+
+void CAudioMixer::process(float * vocal, float * acc, float * out, int len)
+{
+    float vocal_gain = m_vocal_volume / (float)AUMIX_VOLUME_NO_CHANGE;
+    float acc_gain = m_acc_volume / (float)AUMIX_VOLUME_NO_CHANGE;
+
+    float value = 0;
+    float max[2];
+    max[0] = max[1] = 0;
+
+    if(m_new_acc_delay_len != m_current_acc_delay_len)
+    {
+        m_current_acc_delay_len = m_new_acc_delay_len;
+        m_acc_delay->set_delay(m_current_acc_delay_len * m_nChannels);
+    }
+
+    m_acc_delay->process(acc, len);
+
+    for (int i = 0; i < len; i += m_nChannels)
+    {
+        for (int j = 0; j < m_nChannels; j++)
+        {
+            out[i + j] = vocal[i + j] * vocal_gain + acc[i + j] * acc_gain;
+            value = (float)fabs(out[i + j]);
+            if (max[j] < value)
+            {
+                max[j] = value;
+            }
+        }
+    }
+
+    quick_agc(out, len, max);
+    for (int i = 0; i < len; i++)
+    {
+        out[i] = out[i] > AUMIX_FLT_MAX ? AUMIX_FLT_MAX : (out[i] < AUMIX_FLT_MIN ? AUMIX_FLT_MIN : out[i]);
+    }
+//    float* tp = new float[len];
+//    memset(tp, 0, sizeof(float)*len);
+//    m_alimiter->Filter(out, tp, len);
+//    for(int i = 0; i < len; i++)
+//    {
+////        if(fabs(out[i] - tp[i]) > 0.5)
+////        {
+////            continue;
+////        }
+//        out[i] = tp[i];
+//    }
+//    delete [] tp;
+
+
+}
+
+void CAudioMixer::set_vocal_volume(int volume)
+{
+    if (volume == m_vocal_volume)
+        return ;
+
+    if (volume > AUMIX_VOLUME_MAX)
+        volume = AUMIX_VOLUME_MAX;
+    else if (volume < AUMIX_VOLUME_MIN)
+        volume = AUMIX_VOLUME_MIN;
+
+    m_vocal_volume = volume;
+}
+
+void CAudioMixer::set_acc_volume(int volume)
+{
+    if (volume == m_acc_volume)
+        return;
+
+    if (volume > AUMIX_VOLUME_MAX)
+        volume = AUMIX_VOLUME_MAX;
+    else if (volume < AUMIX_VOLUME_MIN)
+        volume = AUMIX_VOLUME_MIN;
+
+    m_acc_volume = volume;
+}
+
+void CAudioMixer::quick_agc(float * buffer, int len, float * max)
+{
+    float fdeta[2];
+    float fts[2];
+    int idx = len / m_nChannels / 8;
+
+    for (int i = 0; i < m_nChannels; i++)
+    {
+        if (max[i] <= AUMIX_LIMIT_HIGH)
+        {
+            fts[i] = m_factor_last[i] + 0.1f;
+            if (fts[i] > 1)
+                fts[i] = 1;
+        }
+        else
+        {
+            fts[i] = AUMIX_LIMIT_HIGH / max[i];
+            if (fts[i] < 0.34f)
+                fts[i] = 0.34f;
+        }
+
+        fdeta[i] = (fts[i] - m_factor_last[i]) / idx;
+    }
+
+    idx *= m_nChannels;
+    for (int i = 0; i < idx; i += m_nChannels)
+    {
+        for (int j = 0; j < m_nChannels; j++)
+        {
+            buffer[i + j] *= m_factor_last[j];
+            m_factor_last[j] += fdeta[j];
+        }
+    }
+    for (int i = idx; i < len; i += m_nChannels)
+    {
+        for (int j = 0; j < m_nChannels; j++)
+        {
+            buffer[i + j] *= m_factor_last[j];
+        }
+    }
+
+    for (int i = 0; i < m_nChannels; i++)
+    {
+        m_factor_last[i] = fts[i];
+    }
+}
+
+void CAudioMixer::uninit()
+{
+    m_vocal_volume = AUMIX_VOLUME_NO_CHANGE;
+    m_acc_volume = AUMIX_VOLUME_NO_CHANGE;
+    m_factor_last[0] = 1;
+    m_factor_last[1] = 1;
+
+    m_current_acc_delay_len = 0;
+    m_new_acc_delay_len = 0;
+
+    if(m_acc_delay)
+    {
+        delete m_acc_delay;
+        m_acc_delay = NULL;
+    }
+
+    if(m_alimiter)
+    {
+        delete m_alimiter;
+        m_alimiter = NULL;
+    }
+}
+
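How the pieces fit together: init with the sample rate and channel count, set integer volumes (50 is unity), then feed interleaved float buffers in [-1, 1] through process. A hypothetical driver (names come from the real header; the buffer contents are made up, real callers read them from wav files):

#include "AudioMixer.h"   // assumes the audio_mixer include path
#include <vector>

int main()
{
    const int fs = 44100, channels = 2, frames = 1024;
    std::vector<float> vocal(frames * channels, 0.1f);  // interleaved samples
    std::vector<float> acc(frames * channels, 0.2f);
    std::vector<float> out(frames * channels, 0.0f);

    CAudioMixer mixer;
    if (!mixer.init(fs, channels))
        return -1;
    mixer.set_vocal_volume(50);  // 50 == DEFAULT_VOLUME == unity gain
    mixer.set_acc_volume(60);    // mild accompaniment boost
    mixer.set_acc_delay(441);    // ~10 ms in frames; scaled by channel count internally

    // len counts interleaved samples, matching CAudioMixer::process
    mixer.process(vocal.data(), acc.data(), out.data(), frames * channels);
    mixer.uninit();
    return 0;
}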
diff --git a/AutoCoverTool/ref/tools/mixer/denoise.cpp b/AutoCoverTool/ref/tools/mixer/denoise.cpp
new file mode 100644
index 0000000..bd49530
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/denoise.cpp
@@ -0,0 +1,225 @@
+//
+// Created by yangjianli on 2019-09-09.
+//
+/**
+ * Takes an input vocal and an accompaniment and mixes them automatically.
+ * gated_loudness: measured loudness of the input
+ * gain: gain expected to reach the baseline loudness
+ */
+#include <iostream>
+#include "WaveFile.h"
+#include <math.h>
+#include "ebur128.h"
+#include "AudioMixer.h"
+#include "alimiter.h"
+#include "waves/inc/WaveFile.h"
+#include "CAudioEffectsChainApi.h"
+#include <string>
+#include "ae_server/CAeServer.h"
+#include <stdio.h>    // the five bracketed headers here were stripped in
+#include <stdlib.h>   // extraction; common standard headers are assumed
+#include <string.h>
+#include <stdint.h>
+#include <vector>
+#include "denoise/webrtc/include/WebrtcDenoise.h"
+
+#define PROC_LEN 1024
+#define DEFAULT_BASELINE_DB (float)-14.57f
+
+int short2float(short *pInBuf, int nLen, float *pOutBuf)
+{
+    for (int i = 0; i < nLen; i++)
+    {
+        pOutBuf[i] = pInBuf[i] * 1.0 / 32768;
+    }
+    return 0;
+}
+
+int float2short(float *pInBuf, int nLen, short *pOutBuf)
+{
+    for (int i = 0; i < nLen; i++)
+    {
+        pOutBuf[i] = int(pInBuf[i] * 32768);
+    }
+    return 0;
+}
+
+/**
+ * Measure the integrated loudness and derive the gain needed to reach the
+ * baseline loudness
+ * @param nChannel
+ * @param nSampleRate
+ * @param pData
+ * @param nLength
+ * @param gated_loudness
+ * @param gain
+ * @return
+ */
+int ebur128_whole(int nChannel, int nSampleRate, short *pData, const int nLength, double &gated_loudness, double &gain)
+{
+    printf("ebur128_init start .. %d\n", nLength);
+    ebur128_state *st = NULL;
+    st = ebur128_init(nChannel, nSampleRate, EBUR128_MODE_I);
+    if (NULL == st)
+    {
+        return -1;
+    }
+    int nPos = 0;
+    int nTmpLength = 0;
+    int nRet;
+    printf("process start ..\n");
+    while (nPos < nLength)
+    {
+        nTmpLength = PROC_LEN;
+        if (nLength - nPos < PROC_LEN)
+        {
+            nTmpLength = nLength - nPos;
+        }
+        nRet = ebur128_add_frames_short(st, pData + nPos, nTmpLength / nChannel);
+        if (nRet != 0)
+        {
+            ebur128_destroy(&st);   // don't leak the state on error
+            return -2;
+        }
+        nPos += nTmpLength;
+    }
+    printf("process ok..\n");
+    gated_loudness = -1;
+    ebur128_loudness_global(st, &gated_loudness);
+    float db = (DEFAULT_BASELINE_DB - gated_loudness) / 20.f;
+    gain = pow(10, db);
+    printf("gated_loudness = %f db = %f gain = %f\n", gated_loudness, db, gain);
+    ebur128_destroy(&st);
+    return 0;
+}
+
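Worked example of the gain formula above: the dB gap between the baseline (-14.57 LUFS) and the measured loudness is converted to a linear amplitude factor via 10^(dB/20). The numbers below are illustrative:

#include <cstdio>
#include <cmath>

int main()
{
    const double baseline = -14.57;  // DEFAULT_BASELINE_DB, the target loudness
    const double measured = -20.57;  // e.g. a quiet vocal stem
    const double db = (baseline - measured) / 20.0;  // 6 dB gap -> 0.3
    const double gain = std::pow(10.0, db);          // ~1.995x amplitude
    std::printf("boost by %.2f dB -> linear gain %.3f\n", db * 20.0, gain);
    return 0;
}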
+/**
+ * Mix the vocal and the accompaniment
+ * @param pVocalIn
+ * @param pAccIn
+ * @param nLength
+ * @param gainVocal
+ * @param gainAcc
+ * @param pOutBuf
+ * @return
+ */
+int mix(float *pVocalIn, float *pAccIn, int nLength, double gainVocal, double gainAcc, float *pOutBuf,
+        int nSampleRate, int nChannel, int nDelay, std::string effect_file)
+{
+
+    CAudioMixer *cAudioMixer = new CAudioMixer();
+    cAudioMixer->init(nSampleRate, nChannel);
+    cAudioMixer->set_acc_delay(nDelay);
+    cAudioMixer->set_vocal_volume(int(gainVocal * 50));
+    cAudioMixer->set_acc_volume(int(gainAcc * 50));
+
+    int nPos = 0;
+    int nStep = 1024;
+    cAudioMixer->reset();
+    int cnt = 0;
+
+    CAeServer cAeServer;
+    cAeServer.init(nSampleRate, nChannel, nStep / nChannel);
+    AE_PARAMS_IM_EFFECT im_params = {
+            .effect_path = effect_file,
+    };
+    cAeServer.set_params(AE_TYPE_IM_EFFECT, (void *) &im_params);
+
+
+    while (nPos < nLength)
+    {
+        if (nLength - nPos < nStep)
+        {
+            nStep = nLength - nPos;
+        }
+        cnt++;
+        cAeServer.process(pVocalIn + nPos, pVocalIn + nPos, nStep);
+        cAudioMixer->process(pVocalIn + nPos, pAccIn + nPos, pOutBuf + nPos, nStep);
+        nPos += nStep;
+    }
+    cAeServer.uninit();
+    delete cAudioMixer;
+    return 0;
+}
+
+int denoise_webrtc(short *pInBuf, int nLength, int nChannel, int nSampleRate)
+{
+    CWebrtcDenoise cWebrtcDenoise;
+    cWebrtcDenoise.init(nSampleRate, nChannel);
+    float *pTmp = new float[nLength];
+    for (int i = 0; i < nLength; i++)
+    {
+        pTmp[i] = pInBuf[i] * 1.0 / 32768;
+    }
+    cWebrtcDenoise.set_level(kHigh);
+    int nStep = 512 * nChannel;
+
+    // Linear fade-in over the first block to avoid a click at the start
+    for (int i = 0; i < nStep; i++)
+    {
+        pTmp[i] = pTmp[i] * i * 1.0 / nStep;
+    }
+
+    // Process in fixed blocks of 512 samples per channel; a trailing partial
+    // block is left un-denoised
+    for (int i = 0, cnt = 0; i < nLength; i += nStep, cnt++)
+    {
+        if (nLength - i < nStep) continue;
+        cWebrtcDenoise.process(pTmp + i, nStep);
+    }
+
+    for (int i = 0; i < nLength; i++)
+    {
+        pInBuf[i] = short(pTmp[i] * 32768);
+    }
+    delete[] pTmp;
+    return 0;
+}
+
+double calc_power_rate(float *in_data, int32_t in_len, float *ref_data, int32_t ref_len)
+{
+    double in_power = 0;
+    double ref_power = 0;
+    int32_t min_len = in_len > ref_len ? ref_len : in_len;
+    for (int i = 0; i < min_len; i++)
+    {
+        in_power += (in_data[i]) * (in_data[i]);
+        ref_power += (ref_data[i]) * (ref_data[i]);
+    }
+    return ref_power / in_power;
+}
+
+
+int main(int argc, char *argv[])
+{
+    if (argc != 3)
+    {
+        printf("input error! example: ./main vocal_path dst_vocal_path\n");
+        return -1;
+    }
+    std::string sVocal = argv[1];
+    std::string sDstVocal = argv[2];
+
+    // Read the vocal
+    CWaveFile *oWaveFile = new CWaveFile(sVocal.c_str(), false);
+    short *pVocalBuf = new short[oWaveFile->GetTotalFrames() * oWaveFile->GetChannels()];
+    oWaveFile->ReadFrameAsS16(pVocalBuf, oWaveFile->GetTotalFrames());
+
+    // Denoise the vocal
+    denoise_webrtc(pVocalBuf, oWaveFile->GetTotalFrames() * oWaveFile->GetChannels(),
+                   oWaveFile->GetChannels(), oWaveFile->GetSampleRate());
+
+    // Write the result to file
+    printf("write2file nLength:%d path:%s!\n", oWaveFile->GetTotalFrames(), sDstVocal.c_str());
+    CWaveFile *oWaveFile2 = new CWaveFile(sDstVocal.c_str(), true);
+    oWaveFile2->SetSampleFormat(SF_S16);
+    oWaveFile2->SetSampleRate(oWaveFile->GetSampleRate());
+    oWaveFile2->SetChannels(oWaveFile->GetChannels());
+    oWaveFile2->SetupDone();
+    oWaveFile2->WriteFrame(pVocalBuf, oWaveFile->GetTotalFrames());
+
+    delete oWaveFile;
+    delete oWaveFile2;
+
+    delete[] pVocalBuf;
+    return 0;
+}
\ No newline at end of file
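One subtlety in the conversions above: float2short computes int(pInBuf[i] * 32768), and for a sample at exactly full scale that yields 32768, which does not fit in a 16-bit short. A defensive variant, as a sketch:

#include <cstdio>

static short float_to_s16_clamped(float x)
{
    int v = (int)(x * 32768.0f);
    if (v >  32767) v =  32767;   // full-scale positive must be clamped
    if (v < -32768) v = -32768;
    return (short)v;
}

int main()
{
    std::printf("%d %d %d\n",
                float_to_s16_clamped(1.0f),   // 32767, not a wrapped -32768
                float_to_s16_clamped(-1.0f),  // -32768
                float_to_s16_clamped(0.5f));  // 16384
    return 0;
}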
diff --git a/AutoCoverTool/ref/tools/mixer/denoise/CMakeLists.txt b/AutoCoverTool/ref/tools/mixer/denoise/CMakeLists.txt
new file mode 100644
index 0000000..a5b6167
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/denoise/CMakeLists.txt
@@ -0,0 +1,14 @@
+cmake_minimum_required(VERSION 2.8)
+project(denoise)
+#set(LIBRARY_OUTPUT_PATH ${PROJECT_SOURCE_DIR}/lib)
+set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=c++11")
+set(NOT_CROSSCOMPILE 0)
+
+include_directories(./)
+add_subdirectory(webrtc)
+if(NOT_CROSSCOMPILE)
+    add_subdirectory(waves)
+    add_executable(test test.cpp)
+    target_link_libraries(test ${LIBRARY_OUTPUT_PATH}/libwebrtc.a
+            ${LIBRARY_OUTPUT_PATH}/libwaves.a)
+endif()
\ No newline at end of file
diff --git a/AutoCoverTool/ref/tools/mixer/denoise/build_android.sh b/AutoCoverTool/ref/tools/mixer/denoise/build_android.sh
new file mode 100755
index 0000000..d24b9a8
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/denoise/build_android.sh
@@ -0,0 +1,64 @@
+#!/bin/sh
+
+# @Time    : 2019-06-18 17:50
+# @Author  : AlanWang
+# @FileName: build_android.sh
+
+# MY_NDK and MY_CMAKE must be changed to the corresponding paths in your own NDK installation
+MY_NDK="/Users/yangjianli/Library/Android/sdk/ndk-bundle"
+MY_CMAKE="/Users/yangjianli/Library/Android/sdk/cmake/3.6.4111459/bin/cmake"
+
+if [ -z "$MY_NDK" ]; then
+    echo "Please set MY_NDK to the Android NDK folder"
+    exit 1
+fi
+
+if [ -z "$MY_CMAKE" ]; then
+    echo "Please set MY_CMAKE to the Android CMake folder"
+    exit 1
+fi
+
+OUTPUT_LIBS="./build/libs/android"
+ANDROID_NATIVE_API_LEVEL="android-16"
+
+# arme_abis=(armeabi armeabi-v7a arm64-v8a x86 x86_64 mips mips64)
+arme_abis=(armeabi-v7a arm64-v8a x86 x86_64)
+
+function build_with_armeabi() {
+    ARME_ABI=$1
+    echo ${ARME_ABI}
+
+    BUILD_DIR="./build/android/${ARME_ABI}"
+    BUILD_REF_DIR="./build/android/${ARME_ABI}/ref"
+    OUTPUT_SO_DIR="${BUILD_DIR}/build/android/libs/${ARME_ABI}"
+
+    PRE_EXE_DIR=$(pwd)
+    echo ${PRE_EXE_DIR}
+
+    ${MY_CMAKE} \
+        -H"./" \
+        -B"${BUILD_DIR}" \
+        -DANDROID_ABI="${ARME_ABI}" \
+        -DANDROID_NDK="${MY_NDK}" \
+        -DCMAKE_LIBRARY_OUTPUT_DIRECTORY="./build/android/libs/${ARME_ABI}" \
+        -DCMAKE_BUILD_TYPE="Release" \
+        -DCMAKE_TOOLCHAIN_FILE="${MY_NDK}/build/cmake/android.toolchain.cmake" \
+        -DANDROID_NATIVE_API_LEVEL=${ANDROID_NATIVE_API_LEVEL} \
+        -DANDROID_TOOLCHAIN="clang" \
+        -DCMAKE_C_FLAGS="-fpic -fexceptions -frtti -Wno-narrowing" \
+        -DCMAKE_CXX_FLAGS="-fpic -fexceptions -frtti -Wno-narrowing" \
+        -DANDROID_STL="c++_static"
+
+    cd ${BUILD_DIR}
+    make
+
+    cd ${PRE_EXE_DIR}
+    mkdir -p ${OUTPUT_LIBS}/${ARME_ABI}/
+    mv ${PRE_EXE_DIR}/lib/* ${OUTPUT_LIBS}/${ARME_ABI}/
+    rm -r ./build/android
+}
+
+for i in ${arme_abis[@]}; do
+    build_with_armeabi $i
+done
diff --git a/AutoCoverTool/ref/tools/mixer/denoise/build_ios.sh b/AutoCoverTool/ref/tools/mixer/denoise/build_ios.sh
new file mode 100755
index 0000000..689d274
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/denoise/build_ios.sh
@@ -0,0 +1,39 @@
+#!/bin/sh
+
+OUTPUT_LIBS="./build/libs/ios"
+
+function build_with_platform_and_armeabi() {
+    PLATFORM=$1
+    ARME_ABI=$2
+    echo ${PLATFORM}
+    echo ${ARME_ABI}
+
+    BUILD_DIR="./build/ios/${ARME_ABI}"
+    PRE_EXE_DIR=$(pwd)
+    echo ${PRE_EXE_DIR}
+
+    cmake \
+        -H"./" \
+        -B"${BUILD_DIR}" \
+        -DCMAKE_BUILD_TYPE="Release" \
+        -DCMAKE_TOOLCHAIN_FILE="./toolchain/ios.toolchain.cmake" \
+        -DIOS_PLATFORM=${PLATFORM} \
+        -DIOS_ARCH=${ARME_ABI}
+
+    # Build the targets
+    cd ${BUILD_DIR}
+    make
+
+    # Move the build artifacts to the output directory
+    cd ${PRE_EXE_DIR}
+    mkdir -p ${OUTPUT_LIBS}/${ARME_ABI}/
+    mv ${PRE_EXE_DIR}/lib/* ${OUTPUT_LIBS}/${ARME_ABI}/
+    rm -r ./build/ios
+}
+
+build_with_platform_and_armeabi "OS" "armv7"
+build_with_platform_and_armeabi "OS" "armv7s"
+build_with_platform_and_armeabi "OS" "arm64"
+
+build_with_platform_and_armeabi "SIMULATOR64" "x86_64"
+build_with_platform_and_armeabi "SIMULATOR" "i386"
diff --git a/AutoCoverTool/ref/tools/mixer/denoise/test.cpp b/AutoCoverTool/ref/tools/mixer/denoise/test.cpp
new file mode 100644
index 0000000..d3b2e3b
--- /dev/null
+++ b/AutoCoverTool/ref/tools/mixer/denoise/test.cpp
@@ -0,0 +1,96 @@
+//
+// Created by yangjianli on 2020-02-13.
+//
+#include <cstdio>
+#include <iostream>
+#include "webrtc/include/WebrtcDenoise.h"
+#include <string>
+#include "waves/inc/WaveFile.h"
+/**
+ * Split the input into four segments and test the four denoise levels.
+ * https://people.xiph.org/~jm/demo/rnnoise/
+ * Noisy test material can be taken from that page.
+ * @param pInBuf
+ * @param nLength
+ * @param nChannel
+ * @param nSampleRate
+ * @return
+ */
+int denoise_webrtc(short* pInBuf, int nLength, int nChannel, int nSampleRate)
+{
+    CWebrtcDenoise cWebrtcDenoise;
+    cWebrtcDenoise.init(nSampleRate, nChannel);
+    float* pTmp = new float[nLength];
+    for(int i = 0; i < nLength; i++)
+    {
+        pTmp[i] = pInBuf[i] * 1.0 / 32768;
+    }
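test.cpp breaks off above; judging from its header comment, the intent is to run each quarter of the input through one of the four denoise levels. A hypothetical sketch of that staging (level names other than kHigh, which appears in denoise.cpp, are invented for illustration):

#include <cstdio>

enum DenoiseLevel { kNone = 0, kLow, kMid, kHigh };  // only kHigh is confirmed by denoise.cpp

static void process_stub(float* buf, int len, DenoiseLevel level)
{
    (void)buf;
    std::printf("processing %d samples at level %d\n", len, (int)level);
}

int main()
{
    const int nLength = 4096;
    float buf[4096] = {0};
    const DenoiseLevel levels[4] = { kNone, kLow, kMid, kHigh };
    const int seg = nLength / 4;
    for (int s = 0; s < 4; s++)
    {
        // one quarter of the audio per denoise level, so the levels
        // can be compared side by side in a single output file
        process_stub(buf + s * seg, seg, levels[s]);
    }
    return 0;
}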