228 lines
		
	
	
		
			6.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			228 lines
		
	
	
		
			6.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * This file is part of FFmpeg.
 | |
|  *
 | |
|  * FFmpeg is free software; you can redistribute it and/or
 | |
|  * modify it under the terms of the GNU Lesser General Public
 | |
|  * License as published by the Free Software Foundation; either
 | |
|  * version 2.1 of the License, or (at your option) any later version.
 | |
|  *
 | |
|  * FFmpeg is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | |
|  * Lesser General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU Lesser General Public
 | |
|  * License along with FFmpeg; if not, write to the Free Software
 | |
|  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 | |
|  */
 | |
| 
 | |
| #undef ZERO
 | |
| #undef ONE
 | |
| #undef ftype
 | |
| #undef SAMPLE_FORMAT
 | |
| #if DEPTH == 32
 | |
| #define SAMPLE_FORMAT float
 | |
| #define ftype float
 | |
| #define ONE 1.f
 | |
| #define ZERO 0.f
 | |
| #else
 | |
| #define SAMPLE_FORMAT double
 | |
| #define ftype double
 | |
| #define ONE 1.0
 | |
| #define ZERO 0.0
 | |
| #endif
 | |
| 
 | |
| #define fn3(a,b)   a##_##b
 | |
| #define fn2(a,b)   fn3(a,b)
 | |
| #define fn(a)      fn2(a, SAMPLE_FORMAT)
 | |
| 
 | |
| #if DEPTH == 64
 | |
| static double scalarproduct_double(const double *v1, const double *v2, int len)
 | |
| {
 | |
|     double p = 0.0;
 | |
| 
 | |
|     for (int i = 0; i < len; i++)
 | |
|         p += v1[i] * v2[i];
 | |
| 
 | |
|     return p;
 | |
| }
 | |
| #endif
 | |
| 
 | |
| static ftype fn(fir_sample)(AudioAPContext *s, ftype sample, ftype *delay,
 | |
|                             ftype *coeffs, ftype *tmp, int *offset)
 | |
| {
 | |
|     const int order = s->order;
 | |
|     ftype output;
 | |
| 
 | |
|     delay[*offset] = sample;
 | |
| 
 | |
|     memcpy(tmp, coeffs + order - *offset, order * sizeof(ftype));
 | |
| #if DEPTH == 32
 | |
|     output = s->fdsp->scalarproduct_float(delay, tmp, s->kernel_size);
 | |
| #else
 | |
|     output = scalarproduct_double(delay, tmp, s->kernel_size);
 | |
| #endif
 | |
| 
 | |
|     if (--(*offset) < 0)
 | |
|         *offset = order - 1;
 | |
| 
 | |
|     return output;
 | |
| }
 | |
| 
 | |
| static int fn(lup_decompose)(ftype **MA, const int N, const ftype tol, int *P)
 | |
| {
 | |
|     for (int i = 0; i <= N; i++)
 | |
|         P[i] = i;
 | |
| 
 | |
|     for (int i = 0; i < N; i++) {
 | |
|         ftype maxA = ZERO;
 | |
|         int imax = i;
 | |
| 
 | |
|         for (int k = i; k < N; k++) {
 | |
|             ftype absA = fabs(MA[k][i]);
 | |
|             if (absA > maxA) {
 | |
|                 maxA = absA;
 | |
|                 imax = k;
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         if (maxA < tol)
 | |
|             return 0;
 | |
| 
 | |
|         if (imax != i) {
 | |
|             FFSWAP(int, P[i], P[imax]);
 | |
|             FFSWAP(ftype *, MA[i], MA[imax]);
 | |
|             P[N]++;
 | |
|         }
 | |
| 
 | |
|         for (int j = i + 1; j < N; j++) {
 | |
|             MA[j][i] /= MA[i][i];
 | |
| 
 | |
|             for (int k = i + 1; k < N; k++)
 | |
|                 MA[j][k] -= MA[j][i] * MA[i][k];
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return 1;
 | |
| }
 | |
| 
 | |
| static void fn(lup_invert)(ftype *const *MA, const int *P, const int N, ftype **IA)
 | |
| {
 | |
|     for (int j = 0; j < N; j++) {
 | |
|         for (int i = 0; i < N; i++) {
 | |
|             IA[i][j] = P[i] == j ? ONE : ZERO;
 | |
| 
 | |
|             for (int k = 0; k < i; k++)
 | |
|                 IA[i][j] -= MA[i][k] * IA[k][j];
 | |
|         }
 | |
| 
 | |
|         for (int i = N - 1; i >= 0; i--) {
 | |
|             for (int k = i + 1; k < N; k++)
 | |
|                 IA[i][j] -= MA[i][k] * IA[k][j];
 | |
| 
 | |
|             IA[i][j] /= MA[i][i];
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| static ftype fn(process_sample)(AudioAPContext *s, ftype input, ftype desired, int ch)
 | |
| {
 | |
|     ftype *dcoeffs = (ftype *)s->dcoeffs->extended_data[ch];
 | |
|     ftype *coeffs = (ftype *)s->coeffs->extended_data[ch];
 | |
|     ftype *delay = (ftype *)s->delay->extended_data[ch];
 | |
|     ftype **itmpmp = (ftype **)&s->itmpmp[s->projection * ch];
 | |
|     ftype **tmpmp = (ftype **)&s->tmpmp[s->projection * ch];
 | |
|     ftype *tmpm = (ftype *)s->tmpm->extended_data[ch];
 | |
|     ftype *tmp = (ftype *)s->tmp->extended_data[ch];
 | |
|     ftype *e = (ftype *)s->e->extended_data[ch];
 | |
|     ftype *x = (ftype *)s->x->extended_data[ch];
 | |
|     ftype *w = (ftype *)s->w->extended_data[ch];
 | |
|     int *p = (int *)s->p->extended_data[ch];
 | |
|     int *offset = (int *)s->offset->extended_data[ch];
 | |
|     const int projection = s->projection;
 | |
|     const ftype delta = s->delta;
 | |
|     const int order = s->order;
 | |
|     const int length = projection + order;
 | |
|     const ftype mu = s->mu;
 | |
|     const ftype tol = 0.00001f;
 | |
|     ftype output;
 | |
| 
 | |
|     x[offset[2] + length] = x[offset[2]] = input;
 | |
|     delay[offset[0] + order] = input;
 | |
| 
 | |
|     output = fn(fir_sample)(s, input, delay, coeffs, tmp, offset);
 | |
|     e[offset[1]] = e[offset[1] + projection] = desired - output;
 | |
| 
 | |
|     for (int i = 0; i < projection; i++) {
 | |
|         const int iprojection = i * projection;
 | |
| 
 | |
|         for (int j = i; j < projection; j++) {
 | |
|             ftype sum = ZERO;
 | |
|             for (int k = 0; k < order; k++)
 | |
|                 sum += x[offset[2] + i + k] * x[offset[2] + j + k];
 | |
|             tmpm[iprojection + j] = sum;
 | |
|             if (i != j)
 | |
|                 tmpm[j * projection + i] = sum;
 | |
|         }
 | |
| 
 | |
|         tmpm[iprojection + i] += delta;
 | |
|     }
 | |
| 
 | |
|     fn(lup_decompose)(tmpmp, projection, tol, p);
 | |
|     fn(lup_invert)(tmpmp, p, projection, itmpmp);
 | |
| 
 | |
|     for (int i = 0; i < projection; i++) {
 | |
|         ftype sum = ZERO;
 | |
|         for (int j = 0; j < projection; j++)
 | |
|             sum += itmpmp[i][j] * e[j + offset[1]];
 | |
|         w[i] = sum;
 | |
|     }
 | |
| 
 | |
|     for (int i = 0; i < order; i++) {
 | |
|         ftype sum = ZERO;
 | |
|         for (int j = 0; j < projection; j++)
 | |
|             sum += x[offset[2] + i + j] * w[j];
 | |
|         dcoeffs[i] = sum;
 | |
|     }
 | |
| 
 | |
|     for (int i = 0; i < order; i++)
 | |
|         coeffs[i] = coeffs[i + order] = coeffs[i] + mu * dcoeffs[i];
 | |
| 
 | |
|     if (--offset[1] < 0)
 | |
|         offset[1] = projection - 1;
 | |
| 
 | |
|     if (--offset[2] < 0)
 | |
|         offset[2] = length - 1;
 | |
| 
 | |
|     switch (s->output_mode) {
 | |
|     case IN_MODE:      output = input;            break;
 | |
|     case DESIRED_MODE: output = desired;          break;
 | |
|     case OUT_MODE:     output = desired - output; break;
 | |
|     case NOISE_MODE:   output = input - output;   break;
 | |
|     case ERROR_MODE:                              break;
 | |
|     }
 | |
|     return output;
 | |
| }
 | |
| 
 | |
| static int fn(filter_channels)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
 | |
| {
 | |
|     AudioAPContext *s = ctx->priv;
 | |
|     AVFrame *out = arg;
 | |
|     const int start = (out->ch_layout.nb_channels * jobnr) / nb_jobs;
 | |
|     const int end = (out->ch_layout.nb_channels * (jobnr+1)) / nb_jobs;
 | |
| 
 | |
|     for (int c = start; c < end; c++) {
 | |
|         const ftype *input = (const ftype *)s->frame[0]->extended_data[c];
 | |
|         const ftype *desired = (const ftype *)s->frame[1]->extended_data[c];
 | |
|         ftype *output = (ftype *)out->extended_data[c];
 | |
| 
 | |
|         for (int n = 0; n < out->nb_samples; n++) {
 | |
|             output[n] = fn(process_sample)(s, input[n], desired[n], c);
 | |
|             if (ctx->is_disabled)
 | |
|                 output[n] = input[n];
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return 0;
 | |
| }
 |