mirror of
https://github.com/DrKLO/Telegram.git
synced 2025-01-21 16:04:43 +01:00
82 lines
3 KiB
C
82 lines
3 KiB
C
/*
|
|
* Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include "common_audio/vad/vad_gmm.h"
|
|
|
|
#include "common_audio/signal_processing/include/signal_processing_library.h"
|
|
|
|
static const int32_t kCompVar = 22005;
|
|
static const int16_t kLog2Exp = 5909; // log2(exp(1)) in Q12.
|
|
|
|
// For a normal distribution, the probability of `input` is calculated and
|
|
// returned (in Q20). The formula for normal distributed probability is
|
|
//
|
|
// 1 / s * exp(-(x - m)^2 / (2 * s^2))
|
|
//
|
|
// where the parameters are given in the following Q domains:
|
|
// m = `mean` (Q7)
|
|
// s = `std` (Q7)
|
|
// x = `input` (Q4)
|
|
// in addition to the probability we output `delta` (in Q11) used when updating
|
|
// the noise/speech model.
|
|
int32_t WebRtcVad_GaussianProbability(int16_t input,
|
|
int16_t mean,
|
|
int16_t std,
|
|
int16_t* delta) {
|
|
int16_t tmp16, inv_std, inv_std2, exp_value = 0;
|
|
int32_t tmp32;
|
|
|
|
// Calculate `inv_std` = 1 / s, in Q10.
|
|
// 131072 = 1 in Q17, and (`std` >> 1) is for rounding instead of truncation.
|
|
// Q-domain: Q17 / Q7 = Q10.
|
|
tmp32 = (int32_t) 131072 + (int32_t) (std >> 1);
|
|
inv_std = (int16_t) WebRtcSpl_DivW32W16(tmp32, std);
|
|
|
|
// Calculate `inv_std2` = 1 / s^2, in Q14.
|
|
tmp16 = (inv_std >> 2); // Q10 -> Q8.
|
|
// Q-domain: (Q8 * Q8) >> 2 = Q14.
|
|
inv_std2 = (int16_t)((tmp16 * tmp16) >> 2);
|
|
// TODO(bjornv): Investigate if changing to
|
|
// inv_std2 = (int16_t)((inv_std * inv_std) >> 6);
|
|
// gives better accuracy.
|
|
|
|
tmp16 = (input << 3); // Q4 -> Q7
|
|
tmp16 = tmp16 - mean; // Q7 - Q7 = Q7
|
|
|
|
// To be used later, when updating noise/speech model.
|
|
// `delta` = (x - m) / s^2, in Q11.
|
|
// Q-domain: (Q14 * Q7) >> 10 = Q11.
|
|
*delta = (int16_t)((inv_std2 * tmp16) >> 10);
|
|
|
|
// Calculate the exponent `tmp32` = (x - m)^2 / (2 * s^2), in Q10. Replacing
|
|
// division by two with one shift.
|
|
// Q-domain: (Q11 * Q7) >> 8 = Q10.
|
|
tmp32 = (*delta * tmp16) >> 9;
|
|
|
|
// If the exponent is small enough to give a non-zero probability we calculate
|
|
// `exp_value` ~= exp(-(x - m)^2 / (2 * s^2))
|
|
// ~= exp2(-log2(exp(1)) * `tmp32`).
|
|
if (tmp32 < kCompVar) {
|
|
// Calculate `tmp16` = log2(exp(1)) * `tmp32`, in Q10.
|
|
// Q-domain: (Q12 * Q10) >> 12 = Q10.
|
|
tmp16 = (int16_t)((kLog2Exp * tmp32) >> 12);
|
|
tmp16 = -tmp16;
|
|
exp_value = (0x0400 | (tmp16 & 0x03FF));
|
|
tmp16 ^= 0xFFFF;
|
|
tmp16 >>= 10;
|
|
tmp16 += 1;
|
|
// Get `exp_value` = exp(-`tmp32`) in Q10.
|
|
exp_value >>= tmp16;
|
|
}
|
|
|
|
// Calculate and return (1 / s) * exp(-(x - m)^2 / (2 * s^2)), in Q20.
|
|
// Q-domain: Q10 * Q10 = Q20.
|
|
return inv_std * exp_value;
|
|
}
|