/*
Copyright (C) 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012
Her Majesty the Queen in Right of Canada (Communications Research
Center Canada)
Copyright (C) 2014
Matthias P. Braendli, matthias.braendli@mpb.li
http://opendigitalradio.org
*/
/*
This file is part of ODR-DabMod.
ODR-DabMod is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as
published by the Free Software Foundation, either version 3 of the
License, or (at your option) any later version.
ODR-DabMod is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with ODR-DabMod. If not, see .
*/
#include "GainControl.h"
#include "PcDebug.h"
#include
#include
#include
#ifdef __SSE__
# include
union __u128 {
__m128 m;
float f[4];
};
#endif
using namespace std;
GainControl::GainControl(size_t framesize,
GainMode mode,
float& digGain,
float normalise) :
ModCodec(),
RemoteControllable("gain"),
#ifdef __SSE__
m_frameSize(framesize * sizeof(complexf) / sizeof(__m128)),
#else // !__SSE__
m_frameSize(framesize),
#endif
m_digGain(digGain),
m_normalise(normalise)
{
PDEBUG("GainControl::GainControl(%zu, %u) @ %p\n", framesize, mode, this);
/* register the parameters that can be remote controlled */
RC_ADD_PARAMETER(digital, "Digital Gain");
switch(mode) {
case GainMode::GAIN_FIX:
PDEBUG("Gain mode: fix\n");
computeGain = computeGainFix;
break;
case GainMode::GAIN_MAX:
PDEBUG("Gain mode: max\n");
computeGain = computeGainMax;
break;
case GainMode::GAIN_VAR:
PDEBUG("Gain mode: var\n");
computeGain = computeGainVar;
break;
default:
throw std::runtime_error(
"GainControl::GainControl invalid computation gain mode!");
}
}
GainControl::~GainControl()
{
PDEBUG("GainControl::~GainControl() @ %p\n", this);
}
int GainControl::process(Buffer* const dataIn, Buffer* dataOut)
{
PDEBUG("GainControl::process"
"(dataIn: %p, dataOut: %p)\n",
dataIn, dataOut);
dataOut->setLength(dataIn->getLength());
#ifdef __SSE__
const __m128* in = reinterpret_cast(dataIn->getData());
__m128* out = reinterpret_cast<__m128*>(dataOut->getData());
size_t sizeIn = dataIn->getLength() / sizeof(__m128);
size_t sizeOut = dataOut->getLength() / sizeof(__m128);
__u128 gain128;
if ((sizeIn % m_frameSize) != 0) {
PDEBUG("%zu != %zu\n", sizeIn, m_frameSize);
throw std::runtime_error(
"GainControl::process input size not valid!");
}
for (size_t i = 0; i < sizeIn; i += m_frameSize) {
gain128.m = computeGain(in, m_frameSize);
gain128.m = _mm_mul_ps(gain128.m, _mm_set1_ps(m_normalise * m_digGain));
PDEBUG("********** Gain: %10f **********\n", gain128.f[0]);
////////////////////////////////////////////////////////////////////////
// Applying gain to output data
////////////////////////////////////////////////////////////////////////
for (size_t sample = 0; sample < m_frameSize; ++sample) {
out[sample] = _mm_mul_ps(in[sample], gain128.m);
}
in += m_frameSize;
out += m_frameSize;
}
#else // !__SSE__
const complexf* in = reinterpret_cast(dataIn->getData());
complexf* out = reinterpret_cast(dataOut->getData());
size_t sizeIn = dataIn->getLength() / sizeof(complexf);
size_t sizeOut = dataOut->getLength() / sizeof(complexf);
float gain;
if ((sizeIn % m_frameSize) != 0) {
PDEBUG("%zu != %zu\n", sizeIn, m_frameSize);
throw std::runtime_error(
"GainControl::process input size not valid!");
}
for (size_t i = 0; i < sizeIn; i += m_frameSize) {
gain = m_normalise * m_digGain * computeGain(in, m_frameSize);
PDEBUG("********** Gain: %10f **********\n", gain);
////////////////////////////////////////////////////////////////////////
// Applying gain to output data
////////////////////////////////////////////////////////////////////////
for (size_t sample = 0; sample < m_frameSize; ++sample) {
out[sample] = in[sample] * gain;
}
in += m_frameSize;
out += m_frameSize;
}
#endif // __SSE__
return sizeOut;
}
#ifdef __SSE__
__m128 GainControl::computeGainFix(const __m128* in, size_t sizeIn)
{
return _mm_set1_ps(512.0f);
}
__m128 GainControl::computeGainMax(const __m128* in, size_t sizeIn)
{
__u128 gain128;
__u128 min128;
__u128 max128;
__u128 tmp128;
static const __m128 factor128 = _mm_set1_ps(0x7fff);
////////////////////////////////////////////////////////////////////////
// Computing max, min and average
////////////////////////////////////////////////////////////////////////
min128.m = _mm_set1_ps(__FLT_MAX__);
max128.m = _mm_set1_ps(__FLT_MIN__);
for (size_t sample = 0; sample < sizeIn; ++sample) {
min128.m = _mm_min_ps(in[sample], min128.m);
max128.m = _mm_max_ps(in[sample], max128.m);
}
// Merging min
tmp128.m = _mm_shuffle_ps(min128.m, min128.m, _MM_SHUFFLE(0, 1, 2, 3));
min128.m = _mm_min_ps(min128.m, tmp128.m);
tmp128.m = _mm_shuffle_ps(min128.m, min128.m, _MM_SHUFFLE(1, 0, 3, 2));
min128.m = _mm_min_ps(min128.m, tmp128.m);
PDEBUG("********** Min: %10f **********\n", min128.f[0]);
// Merging max
tmp128.m = _mm_shuffle_ps(max128.m, max128.m, _MM_SHUFFLE(0, 1, 2, 3));
max128.m = _mm_max_ps(max128.m, tmp128.m);
tmp128.m = _mm_shuffle_ps(max128.m, max128.m, _MM_SHUFFLE(1, 0, 3, 2));
max128.m = _mm_max_ps(max128.m, tmp128.m);
PDEBUG("********** Max: %10f **********\n", max128.f[0]);
////////////////////////////////////////////////////////////////////////////
// Computing gain
////////////////////////////////////////////////////////////////////////////
// max = max(-min, max)
max128.m = _mm_max_ps(_mm_mul_ps(min128.m, _mm_set1_ps(-1.0f)), max128.m);
// Detect NULL
if ((int)max128.f[0] != 0) {
gain128.m = _mm_div_ps(factor128, max128.m);
}
else {
gain128.m = _mm_set1_ps(1.0f);
}
return gain128.m;
}
__m128 GainControl::computeGainVar(const __m128* in, size_t sizeIn)
{
__u128 gain128;
__u128 mean128;
__u128 var128;
__u128 tmp128;
static const __m128 factor128 = _mm_set1_ps(0x7fff);
mean128.m = _mm_setzero_ps();
for (size_t sample = 0; sample < sizeIn; ++sample) {
__m128 delta128 = _mm_sub_ps(in[sample], mean128.m);
__m128 i128 = _mm_set1_ps(sample + 1);
__m128 q128 = _mm_div_ps(delta128, i128);
mean128.m = _mm_add_ps(mean128.m, q128);
/*
tmp128.m = in[sample];
printf("S %zu, %.2f+%.2fj\t",
sample,
tmp128.f[0], tmp128.f[1]);
printf(": %.2f+%.2fj\n", mean128.f[0], mean128.f[1]);
printf("S %zu, %.2f+%.2fj\t",
sample,
tmp128.f[2], tmp128.f[3]);
printf(": %.2f+%.2fj\n", mean128.f[2], mean128.f[3]);
*/
}
// Merging average
tmp128.m = _mm_shuffle_ps(mean128.m, mean128.m, _MM_SHUFFLE(1, 0, 3, 2));
mean128.m = _mm_add_ps(mean128.m, tmp128.m);
mean128.m = _mm_mul_ps(mean128.m, _mm_set1_ps(0.5f));
PDEBUG("********** Mean: %10f + %10fj %10f + %10fj **********\n",
mean128.f[0], mean128.f[1], mean128.f[2], mean128.f[3]);
////////////////////////////////////////////////////////////////////////
// Computing standard deviation
////////////////////////////////////////////////////////////////////////
var128.m = _mm_setzero_ps();
for (size_t sample = 0; sample < sizeIn; ++sample) {
__m128 diff128 = _mm_sub_ps(in[sample], mean128.m);
__m128 delta128 = _mm_sub_ps(_mm_mul_ps(diff128, diff128), var128.m);
__m128 i128 = _mm_set1_ps(sample + 1);
__m128 q128 = _mm_div_ps(delta128, i128);
var128.m = _mm_add_ps(var128.m, q128);
/*
__u128 udiff128; udiff128.m = diff128;
__u128 udelta128; udelta128.m = delta128;
for (int off=0; off<4; off+=2) {
printf("S %zu, %.2f+%.2fj\t",
sample,
udiff128.f[off], udiff128.f[1+off]);
printf(": %.2f+%.2fj\t", udelta128.f[off], udelta128.f[1+off]);
printf(": %.2f+%.2fj\n", var128.f[off], var128.f[1+off]);
}
*/
}
PDEBUG("********** Vars: %10f + %10fj, %10f + %10fj **********\n",
var128.f[0], var128.f[1], var128.f[2], var128.f[3]);
// Merging standard deviations
tmp128.m = _mm_shuffle_ps(var128.m, var128.m, _MM_SHUFFLE(1, 0, 3, 2));
var128.m = _mm_add_ps(var128.m, tmp128.m);
var128.m = _mm_mul_ps(var128.m, _mm_set1_ps(0.5f));
var128.m = _mm_sqrt_ps(var128.m);
PDEBUG("********** Var: %10f + %10fj, %10f + %10fj **********\n",
var128.f[0], var128.f[1], var128.f[2], var128.f[3]);
var128.m = _mm_mul_ps(var128.m, _mm_set1_ps(4.0f));
PDEBUG("********** 4*Var: %10f + %10fj, %10f + %10fj **********\n",
var128.f[0], var128.f[1], var128.f[2], var128.f[3]);
////////////////////////////////////////////////////////////////////////////
// Computing gain
////////////////////////////////////////////////////////////////////////////
// gain = factor128 / max(real, imag)
// Detect NULL
if ((int)var128.f[0] != 0) {
gain128.m = _mm_div_ps(factor128,
_mm_max_ps(var128.m,
_mm_shuffle_ps(var128.m, var128.m, _MM_SHUFFLE(2, 3, 0, 1))));
} else {
gain128.m = _mm_set1_ps(1.0f);
}
return gain128.m;
}
#else // !__SSE__
float GainControl::computeGainFix(const complexf* in, size_t sizeIn)
{
return 512.0f;
}
float GainControl::computeGainMax(const complexf* in, size_t sizeIn)
{
float gain;
float min;
float max;
static const float factor = 0x7fff;
////////////////////////////////////////////////////////////////////////
// Computing max, min and average
////////////////////////////////////////////////////////////////////////
min = __FLT_MAX__;
max = __FLT_MIN__;
for (size_t sample = 0; sample < sizeIn; ++sample) {
if (in[sample].real() < min) {
min = in[sample].real();
}
if (in[sample].real() > max) {
max = in[sample].real();
}
if (in[sample].imag() < min) {
min = in[sample].imag();
}
if (in[sample].imag() > max) {
max = in[sample].imag();
}
}
PDEBUG("********** Min: %10f **********\n", min);
PDEBUG("********** Max: %10f **********\n", max);
////////////////////////////////////////////////////////////////////////////
// Computing gain
////////////////////////////////////////////////////////////////////////////
// gain = factor128 / max(-min, max)
min = -min;
if (min > max) {
max = min;
}
// Detect NULL
if ((int)max != 0) {
gain = factor / max;
}
else {
gain = 1.0f;
}
return gain;
}
float GainControl::computeGainVar(const complexf* in, size_t sizeIn)
{
complexf mean;
/* The variance calculation is a bit strange, because we
* emulate the exact same functionality as the SSE code,
* which is the most used one.
*
* TODO: verify that this actually corresponds to the
* gain mode suggested in EN 300 798 Clause 5.3 Numerical Range.
*/
complexf var1;
complexf var2;
static const float factor = 0x7fff;
mean = complexf(0.0f, 0.0f);
for (size_t sample = 0; sample < sizeIn; ++sample) {
complexf delta = in[sample] - mean;
float i = sample + 1;
complexf q = delta / i;
mean = mean + q;
/*
printf("F %zu, %.2f+%.2fj\t",
sample,
in[sample].real(), in[sample].imag());
printf(": %.2f+%.2fj\n", mean.real(), mean.imag());
*/
}
PDEBUG("********** Mean: %10f + %10fj **********\n", mean.real(), mean.imag());
////////////////////////////////////////////////////////////////////////
// Computing standard deviation
////////////////////////////////////////////////////////////////////////
var1 = complexf(0.0f, 0.0f);
var2 = complexf(0.0f, 0.0f);
for (size_t sample = 0; sample < sizeIn; ++sample) {
complexf diff = in[sample] - mean;
complexf delta;
complexf q;
float i = (sample/2) + 1;
if (sample % 2 == 0) {
delta = complexf(diff.real() * diff.real(),
diff.imag() * diff.imag()) - var1;
q = delta / i;
var1 += q;
}
else {
delta = complexf(diff.real() * diff.real(),
diff.imag() * diff.imag()) - var2;
q = delta / i;
var2 += q;
}
/*
printf("F %zu, %.2f+%.2fj\t",
sample,
diff.real(), diff.imag());
printf(": %.2f+%.2fj\t", delta.real(), delta.imag());
printf(": %.2f+%.2fj\t", var1.real(), var1.imag());
printf(": %.2f+%.2fj\n", var2.real(), var2.imag());
*/
}
PDEBUG("********** Vars: %10f + %10fj, %10f + %10fj **********\n",
var1.real(), var1.imag(),
var2.real(), var2.imag());
// Merge standard deviations in the same way the SSE version does it
complexf tmpvar = (var1 + var2) * 0.5f;
complexf var(sqrt(tmpvar.real()), sqrt(tmpvar.imag()));
PDEBUG("********** Var: %10f + %10fj **********\n", var.real(), var.imag());
var = var * 4.0f;
PDEBUG("********** 4*Var: %10f + %10fj **********\n", var.real(), var.imag());
////////////////////////////////////////////////////////////////////////////
// Computing gain
////////////////////////////////////////////////////////////////////////////
float gain = var.real();
// gain = factor128 / max(real, imag)
if (var.imag() > gain) {
gain = var.imag();
}
// Ignore zero variance samples and apply no gain
if ((int)gain == 0) {
gain = 1.0f;
}
else {
gain = factor / gain;
}
return gain;
}
#endif // !__SSE__
void GainControl::set_parameter(const string& parameter, const string& value)
{
stringstream ss(value);
ss.exceptions ( stringstream::failbit | stringstream::badbit );
if (parameter == "digital") {
float new_factor;
ss >> new_factor;
m_digGain = new_factor;
}
else {
stringstream ss;
ss << "Parameter '" << parameter
<< "' is not exported by controllable " << get_rc_name();
throw ParameterError(ss.str());
}
}
const string GainControl::get_parameter(const string& parameter) const
{
stringstream ss;
if (parameter == "digital") {
ss << std::fixed << m_digGain;
}
else {
ss << "Parameter '" << parameter <<
"' is not exported by controllable " << get_rc_name();
throw ParameterError(ss.str());
}
return ss.str();
}