wdsp/firmin.c
Uladzimir Karpenka 89c8a0e2b5 first commit
2026-06-01 15:58:45 +03:00

492 lines
14 KiB
C

/* firmin.c
This file is part of a program that implements a Software-Defined Radio.
Copyright (C) 2016, 2025 Warren Pratt, NR0V
This program is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License
as published by the Free Software Foundation; either version 2
of the License, or (at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
The author can be reached by email at
warren@wpratt.com
*/
#include "comm.h"
/********************************************************************************************************
* *
* Time-Domain FIR *
* *
********************************************************************************************************/
void calc_firmin (FIRMIN a)
{
a->h = fir_bandpass (a->nc, a->f_low, a->f_high, a->samplerate, a->wintype, 1, a->gain);
a->rsize = a->nc;
a->mask = a->rsize - 1;
a->ring = (double *) malloc0 (a->rsize * sizeof (complex));
a->idx = 0;
}
FIRMIN create_firmin (int run, int position, int size, double* in, double* out,
int nc, double f_low, double f_high, int samplerate, int wintype, double gain)
{
FIRMIN a = (FIRMIN) malloc0 (sizeof (firmin));
a->run = run;
a->position = position;
a->size = size;
a->in = in;
a->out = out;
a->nc = nc;
a->f_low = f_low;
a->f_high = f_high;
a->samplerate = samplerate;
a->wintype = wintype;
a->gain = gain;
calc_firmin (a);
return a;
}
void destroy_firmin (FIRMIN a)
{
_aligned_free (a->ring);
_aligned_free (a->h);
_aligned_free (a);
}
void flush_firmin (FIRMIN a)
{
memset (a->ring, 0, a->rsize * sizeof (complex));
a->idx = 0;
}
void xfirmin (FIRMIN a, int pos)
{
if (a->run && a->position == pos)
{
int i, j, k;
for (i = 0; i < a->size; i++)
{
a->ring[2 * a->idx + 0] = a->in[2 * i + 0];
a->ring[2 * a->idx + 1] = a->in[2 * i + 1];
a->out[2 * i + 0] = 0.0;
a->out[2 * i + 1] = 0.0;
k = a->idx;
for (j = 0; j < a->nc; j++)
{
a->out[2 * i + 0] += a->h[2 * j + 0] * a->ring[2 * k + 0] - a->h[2 * j + 1] * a->ring[2 * k + 1];
a->out[2 * i + 1] += a->h[2 * j + 0] * a->ring[2 * k + 1] + a->h[2 * j + 1] * a->ring[2 * k + 0];
k = (k + a->mask) & a->mask;
}
a->idx = (a->idx + 1) & a->mask;
}
}
else if (a->in != a->out)
memcpy (a->out, a->in, a->size * sizeof (complex));
}
void setBuffers_firmin (FIRMIN a, double* in, double* out)
{
a->in = in;
a->out = out;
}
void setSamplerate_firmin (FIRMIN a, int rate)
{
a->samplerate = (double)rate;
calc_firmin (a);
}
void setSize_firmin (FIRMIN a, int size)
{
a->size = size;
}
void setFreqs_firmin (FIRMIN a, double f_low, double f_high)
{
a->f_low = f_low;
a->f_high = f_high;
calc_firmin (a);
}
/********************************************************************************************************
* *
* Standalone Partitioned Overlap-Save Bandpass *
* *
********************************************************************************************************/
void plan_firopt (FIROPT a)
{
// must call for change in 'nc', 'size', 'out'
int i;
a->nfor = a->nc / a->size;
a->buffidx = 0;
a->idxmask = a->nfor - 1;
a->fftin = (double *) malloc0 (2 * a->size * sizeof (complex));
a->fftout = (double **) malloc0 (a->nfor * sizeof (double *));
a->fmask = (double **) malloc0 (a->nfor * sizeof (double *));
a->maskgen = (double *) malloc0 (2 * a->size * sizeof (complex));
a->pcfor = (fftw_plan *) malloc0 (a->nfor * sizeof (fftw_plan));
a->maskplan = (fftw_plan *) malloc0 (a->nfor * sizeof (fftw_plan));
for (i = 0; i < a->nfor; i++)
{
a->fftout[i] = (double *) malloc0 (2 * a->size * sizeof (complex));
a->fmask[i] = (double *) malloc0 (2 * a->size * sizeof (complex));
a->pcfor[i] = fftw_plan_dft_1d(2 * a->size, (fftw_complex *)a->fftin, (fftw_complex *)a->fftout[i], FFTW_FORWARD, FFTW_PATIENT);
a->maskplan[i] = fftw_plan_dft_1d(2 * a->size, (fftw_complex *)a->maskgen, (fftw_complex *)a->fmask[i], FFTW_FORWARD, FFTW_PATIENT);
}
a->accum = (double *) malloc0 (2 * a->size * sizeof (complex));
a->crev = fftw_plan_dft_1d(2 * a->size, (fftw_complex *)a->accum, (fftw_complex *)a->out, FFTW_BACKWARD, FFTW_PATIENT);
}
void calc_firopt (FIROPT a)
{
// call for change in frequency, rate, wintype, gain
// must also call after a call to plan_firopt()
int i;
double* impulse = fir_bandpass (a->nc, a->f_low, a->f_high, a->samplerate, a->wintype, 1, a->gain);
a->buffidx = 0;
for (i = 0; i < a->nfor; i++)
{
// I right-justified the impulse response => take output from left side of output buff, discard right side
// Be careful about flipping an asymmetrical impulse response.
memcpy (&(a->maskgen[2 * a->size]), &(impulse[2 * a->size * i]), a->size * sizeof(complex));
fftw_execute (a->maskplan[i]);
}
_aligned_free (impulse);
}
FIROPT create_firopt (int run, int position, int size, double* in, double* out,
int nc, double f_low, double f_high, int samplerate, int wintype, double gain)
{
FIROPT a = (FIROPT) malloc0 (sizeof (firopt));
a->run = run;
a->position = position;
a->size = size;
a->in = in;
a->out = out;
a->nc = nc;
a->f_low = f_low;
a->f_high = f_high;
a->samplerate = samplerate;
a->wintype = wintype;
a->gain = gain;
plan_firopt (a);
calc_firopt (a);
return a;
}
void deplan_firopt (FIROPT a)
{
int i;
fftw_destroy_plan (a->crev);
_aligned_free (a->accum);
for (i = 0; i < a->nfor; i++)
{
_aligned_free (a->fftout[i]);
_aligned_free (a->fmask[i]);
fftw_destroy_plan (a->pcfor[i]);
fftw_destroy_plan (a->maskplan[i]);
}
_aligned_free (a->maskplan);
_aligned_free (a->pcfor);
_aligned_free (a->maskgen);
_aligned_free (a->fmask);
_aligned_free (a->fftout);
_aligned_free (a->fftin);
}
void destroy_firopt (FIROPT a)
{
deplan_firopt (a);
_aligned_free (a);
}
void flush_firopt (FIROPT a)
{
int i;
memset (a->fftin, 0, 2 * a->size * sizeof (complex));
for (i = 0; i < a->nfor; i++)
memset (a->fftout[i], 0, 2 * a->size * sizeof (complex));
a->buffidx = 0;
}
void xfiropt (FIROPT a, int pos)
{
if (a->run && (a->position == pos))
{
int i, j, k;
memcpy (&(a->fftin[2 * a->size]), a->in, a->size * sizeof (complex));
fftw_execute (a->pcfor[a->buffidx]);
k = a->buffidx;
memset (a->accum, 0, 2 * a->size * sizeof (complex));
for (j = 0; j < a->nfor; j++)
{
for (i = 0; i < 2 * a->size; i++)
{
a->accum[2 * i + 0] += a->fftout[k][2 * i + 0] * a->fmask[j][2 * i + 0] - a->fftout[k][2 * i + 1] * a->fmask[j][2 * i + 1];
a->accum[2 * i + 1] += a->fftout[k][2 * i + 0] * a->fmask[j][2 * i + 1] + a->fftout[k][2 * i + 1] * a->fmask[j][2 * i + 0];
}
k = (k + a->idxmask) & a->idxmask;
}
a->buffidx = (a->buffidx + 1) & a->idxmask;
fftw_execute (a->crev);
memcpy (a->fftin, &(a->fftin[2 * a->size]), a->size * sizeof(complex));
}
else if (a->in != a->out)
memcpy (a->out, a->in, a->size * sizeof (complex));
}
void setBuffers_firopt (FIROPT a, double* in, double* out)
{
a->in = in;
a->out = out;
deplan_firopt (a);
plan_firopt (a);
calc_firopt (a);
}
void setSamplerate_firopt (FIROPT a, int rate)
{
a->samplerate = rate;
calc_firopt (a);
}
void setSize_firopt (FIROPT a, int size)
{
a->size = size;
deplan_firopt (a);
plan_firopt (a);
calc_firopt (a);
}
void setFreqs_firopt (FIROPT a, double f_low, double f_high)
{
a->f_low = f_low;
a->f_high = f_high;
calc_firopt (a);
}
/********************************************************************************************************
* *
* Partitioned Overlap-Save Filter Kernel *
* *
********************************************************************************************************/
void plan_fircore (FIRCORE a)
{
// must call for change in 'nc', 'size', 'out'
int i;
a->nfor = a->nc / a->size;
a->cset = 0;
a->buffidx = 0;
a->idxmask = a->nfor - 1;
a->fftin = (double *) malloc0 (2 * a->size * sizeof (complex));
a->fftout = (double **) malloc0 (a->nfor * sizeof (double *));
a->fmask = (double ***) malloc0 (2 * sizeof (double **));
a->fmask[0] = (double **) malloc0 (a->nfor * sizeof (double *));
a->fmask[1] = (double **) malloc0 (a->nfor * sizeof (double *));
a->maskgen = (double *) malloc0 (2 * a->size * sizeof (complex));
a->pcfor = (fftw_plan *) malloc0 (a->nfor * sizeof (fftw_plan));
a->maskplan = (fftw_plan **) malloc0 (2 * sizeof (fftw_plan *));
a->maskplan[0] = (fftw_plan *) malloc0 (a->nfor * sizeof (fftw_plan));
a->maskplan[1] = (fftw_plan *) malloc0 (a->nfor * sizeof (fftw_plan));
for (i = 0; i < a->nfor; i++)
{
a->fftout[i] = (double *) malloc0 (2 * a->size * sizeof (complex));
a->fmask[0][i] = (double *) malloc0 (2 * a->size * sizeof (complex));
a->fmask[1][i] = (double *) malloc0 (2 * a->size * sizeof (complex));
a->pcfor[i] = fftw_plan_dft_1d(2 * a->size, (fftw_complex *)a->fftin, (fftw_complex *)a->fftout[i], FFTW_FORWARD, FFTW_PATIENT);
a->maskplan[0][i] = fftw_plan_dft_1d(2 * a->size, (fftw_complex *)a->maskgen, (fftw_complex *)a->fmask[0][i], FFTW_FORWARD, FFTW_PATIENT);
a->maskplan[1][i] = fftw_plan_dft_1d(2 * a->size, (fftw_complex *)a->maskgen, (fftw_complex *)a->fmask[1][i], FFTW_FORWARD, FFTW_PATIENT);
}
a->accum = (double *) malloc0 (2 * a->size * sizeof (complex));
a->crev = fftw_plan_dft_1d(2 * a->size, (fftw_complex *)a->accum, (fftw_complex *)a->out, FFTW_BACKWARD, FFTW_PATIENT);
a->masks_ready = 0;
}
void calc_fircore (FIRCORE a, int flip)
{
// call for change in frequency, rate, wintype, gain
// must also call after a call to plan_firopt()
int i;
if (a->mp)
mp_imp (a->nc, a->impulse, a->imp, 16, 0);
else
memcpy (a->imp, a->impulse, a->nc * sizeof (complex));
for (i = 0; i < a->nfor; i++)
{
// I right-justified the impulse response => take output from left side of output buff, discard right side
// Be careful about flipping an asymmetrical impulse response.
memcpy (&(a->maskgen[2 * a->size]), &(a->imp[2 * a->size * i]), a->size * sizeof(complex));
fftw_execute (a->maskplan[1 - a->cset][i]);
}
a->masks_ready = 1;
if (flip)
{
EnterCriticalSection (&a->update);
a->cset = 1 - a->cset;
LeaveCriticalSection (&a->update);
a->masks_ready = 0;
}
}
FIRCORE create_fircore (int size, double* in, double* out, int nc, int mp, double* impulse)
{
FIRCORE a = (FIRCORE) malloc0 (sizeof (fircore));
a->size = size;
a->in = in;
a->out = out;
a->nc = nc;
a->mp = mp;
InitializeCriticalSectionAndSpinCount (&a->update, 2500);
plan_fircore (a);
a->impulse = (double *) malloc0 (a->nc * sizeof (complex));
a->imp = (double *) malloc0 (a->nc * sizeof (complex));
memcpy (a->impulse, impulse, a->nc * sizeof (complex));
calc_fircore (a, 1);
return a;
}
void deplan_fircore (FIRCORE a)
{
int i;
fftw_destroy_plan (a->crev);
_aligned_free (a->accum);
for (i = 0; i < a->nfor; i++)
{
_aligned_free (a->fftout[i]);
_aligned_free (a->fmask[0][i]);
_aligned_free (a->fmask[1][i]);
fftw_destroy_plan (a->pcfor[i]);
fftw_destroy_plan (a->maskplan[0][i]);
fftw_destroy_plan (a->maskplan[1][i]);
}
_aligned_free (a->maskplan[0]);
_aligned_free (a->maskplan[1]);
_aligned_free (a->maskplan);
_aligned_free (a->pcfor);
_aligned_free (a->maskgen);
_aligned_free (a->fmask[0]);
_aligned_free (a->fmask[1]);
_aligned_free (a->fmask);
_aligned_free (a->fftout);
_aligned_free (a->fftin);
}
void destroy_fircore (FIRCORE a)
{
deplan_fircore (a);
_aligned_free (a->imp);
_aligned_free (a->impulse);
DeleteCriticalSection (&a->update);
_aligned_free (a);
}
void flush_fircore (FIRCORE a)
{
int i;
memset (a->fftin, 0, 2 * a->size * sizeof (complex));
for (i = 0; i < a->nfor; i++)
memset (a->fftout[i], 0, 2 * a->size * sizeof (complex));
a->buffidx = 0;
}
void xfircore (FIRCORE a)
{
int i, j, k;
memcpy (&(a->fftin[2 * a->size]), a->in, a->size * sizeof (complex));
fftw_execute (a->pcfor[a->buffidx]);
k = a->buffidx;
memset (a->accum, 0, 2 * a->size * sizeof (complex));
EnterCriticalSection (&a->update);
double* accum = a->accum;
double** fftout = a->fftout;
double*** fmask = a->fmask;
int cset = a->cset;
int idxmask = a->idxmask;
int sz = a->size;
int nfor = a->nfor;
for (j = 0; j < nfor; j++)
{
for (i = 0; i < 2 * sz; i++)
{
accum[2 * i + 0] += fftout[k][2 * i + 0] * fmask[cset][j][2 * i + 0] - fftout[k][2 * i + 1] * fmask[cset][j][2 * i + 1];
accum[2 * i + 1] += fftout[k][2 * i + 0] * fmask[cset][j][2 * i + 1] + fftout[k][2 * i + 1] * fmask[cset][j][2 * i + 0];
}
k = (k + idxmask) & idxmask;
}
LeaveCriticalSection (&a->update);
a->buffidx = (a->buffidx + 1) & idxmask;
fftw_execute (a->crev);
memcpy (a->fftin, &(a->fftin[2 * a->size]), a->size * sizeof(complex));
}
void setBuffers_fircore (FIRCORE a, double* in, double* out)
{
a->in = in;
a->out = out;
deplan_fircore (a);
plan_fircore (a);
calc_fircore (a, 1);
}
void setSize_fircore (FIRCORE a, int size)
{
a->size = size;
deplan_fircore (a);
plan_fircore (a);
calc_fircore (a, 1);
}
void setImpulse_fircore (FIRCORE a, double* impulse, int update)
{
memcpy (a->impulse, impulse, a->nc * sizeof (complex));
calc_fircore (a, update);
}
void setNc_fircore (FIRCORE a, int nc, double* impulse)
{
// because of FFT planning, this will probably cause a glitch in audio if done during dataflow
deplan_fircore (a);
_aligned_free (a->impulse);
_aligned_free (a->imp);
a->nc = nc;
plan_fircore (a);
a->imp = (double *) malloc0 (a->nc * sizeof (complex));
a->impulse = (double *) malloc0 (a->nc * sizeof (complex));
memcpy (a->impulse, impulse, a->nc * sizeof (complex));
calc_fircore (a, 1);
}
void setMp_fircore (FIRCORE a, int mp)
{
a->mp = mp;
calc_fircore (a, 1);
}
void setUpdate_fircore (FIRCORE a)
{
if (a->masks_ready)
{
EnterCriticalSection (&a->update);
a->cset = 1 - a->cset;
LeaveCriticalSection (&a->update);
a->masks_ready = 0;
}
}