/* Spa */ /* SPDX-FileCopyrightText: Copyright © 2019 Wim Taymans */ /* SPDX-License-Identifier: MIT */ #include #include #include "resample.h" typedef void (*resample_func_t)(struct resample *r, const void * SPA_RESTRICT src[], uint32_t ioffs, uint32_t *in_len, void * SPA_RESTRICT dst[], uint32_t ooffs, uint32_t *out_len); struct resample_info { uint32_t format; resample_func_t process_copy; const char *copy_name; resample_func_t process_full; const char *full_name; resample_func_t process_inter; const char *inter_name; uint32_t cpu_flags; }; struct native_data { double rate; uint32_t n_taps; uint32_t n_phases; uint32_t in_rate; uint32_t out_rate; float phase; uint32_t inc; uint32_t frac; uint32_t filter_stride; uint32_t filter_stride_os; uint32_t hist; float **history; resample_func_t func; float *filter; float *hist_mem; const struct resample_info *info; }; #define DEFINE_RESAMPLER(type,arch) \ void do_resample_##type##_##arch(struct resample *r, \ const void * SPA_RESTRICT src[], uint32_t ioffs, uint32_t *in_len, \ void * SPA_RESTRICT dst[], uint32_t ooffs, uint32_t *out_len) #define MAKE_RESAMPLER_COPY(arch) \ DEFINE_RESAMPLER(copy,arch) \ { \ struct native_data *data = r->data; \ uint32_t index, n_taps = data->n_taps, n_taps2 = n_taps/2; \ uint32_t c, olen = *out_len, ilen = *in_len, ch = r->channels; \ \ index = ioffs; \ if (ooffs < olen && index + n_taps <= ilen) { \ uint32_t to_copy = SPA_MIN(olen - ooffs, \ ilen - (index + n_taps) + 1); \ for (c = 0; c < ch; c++) { \ const float *s = src[c]; \ float *d = dst[c]; \ spa_memcpy(&d[ooffs], &s[index + n_taps2], \ to_copy * sizeof(float)); \ } \ index += to_copy; \ ooffs += to_copy; \ } \ *in_len = index; \ *out_len = ooffs; \ } #define INC(index,phase,n_phases) \ index += inc; \ phase += frac; \ if (phase >= n_phases) { \ phase -= n_phases; \ index += 1; \ } #define MAKE_RESAMPLER_FULL(arch) \ DEFINE_RESAMPLER(full,arch) \ { \ struct native_data *data = r->data; \ uint32_t n_taps = data->n_taps, stride = data->filter_stride_os; \ uint32_t index, phase, n_phases = data->out_rate; \ uint32_t c, o, olen = *out_len, ilen = *in_len; \ uint32_t inc = data->inc, frac = data->frac, ch = r->channels; \ \ index = ioffs; \ phase = (uint32_t)data->phase; \ for (o = ooffs; o < olen && index + n_taps <= ilen; o++) { \ float *filter = &data->filter[phase * stride]; \ for (c = 0; c < ch; c++) { \ const float *s = src[c]; \ float *d = dst[c]; \ inner_product_##arch(&d[o], &s[index], \ filter, n_taps); \ } \ INC(index, phase, n_phases); \ } \ *in_len = index; \ *out_len = o; \ data->phase = phase; \ } #define MAKE_RESAMPLER_INTER(arch) \ DEFINE_RESAMPLER(inter,arch) \ { \ struct native_data *data = r->data; \ uint32_t index, stride = data->filter_stride; \ uint32_t n_phases = data->n_phases, out_rate = data->out_rate; \ uint32_t n_taps = data->n_taps; \ uint32_t c, o, olen = *out_len, ilen = *in_len; \ uint32_t inc = data->inc, frac = data->frac, ch = r->channels; \ float phase; \ \ index = ioffs; \ phase = data->phase; \ for (o = ooffs; o < olen && index + n_taps <= ilen; o++) { \ float ph = phase * n_phases / out_rate; \ uint32_t offset = (uint32_t)floorf(ph); \ float *filter0 = &data->filter[(offset+0) * stride]; \ float *filter1 = &data->filter[(offset+1) * stride]; \ float pho = ph - offset; \ for (c = 0; c < ch; c++) { \ const float *s = src[c]; \ float *d = dst[c]; \ inner_product_ip_##arch(&d[o], &s[index], \ filter0, filter1, pho, n_taps); \ } \ INC(index, phase, out_rate); \ } \ *in_len = index; \ *out_len = o; \ data->phase = phase; \ } DEFINE_RESAMPLER(copy,c); DEFINE_RESAMPLER(full,c); DEFINE_RESAMPLER(inter,c); #if defined (HAVE_NEON) DEFINE_RESAMPLER(full,neon); DEFINE_RESAMPLER(inter,neon); #endif #if defined (HAVE_SSE) DEFINE_RESAMPLER(full,sse); DEFINE_RESAMPLER(inter,sse); #endif #if defined (HAVE_SSSE3) DEFINE_RESAMPLER(full,ssse3); DEFINE_RESAMPLER(inter,ssse3); #endif #if defined (HAVE_AVX) && defined(HAVE_FMA) DEFINE_RESAMPLER(full,avx); DEFINE_RESAMPLER(inter,avx); #endif