/* fft/hc_pass_n.c
 *
 * Copyright (C) 1996, 1997, 1998, 1999, 2000, 2007 Brian Gough
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 3 of the License, or (at
 * your option) any later version.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 */

static void
Packit 67cb25
FUNCTION(fft_halfcomplex,pass_n) (const BASE in[],
Packit 67cb25
                                  const size_t istride,
Packit 67cb25
                                  BASE out[],
Packit 67cb25
                                  const size_t ostride,
Packit 67cb25
                                  const size_t factor,
Packit 67cb25
                                  const size_t product,
Packit 67cb25
                                  const size_t n,
Packit 67cb25
                                  const TYPE(gsl_complex) twiddle[])
Packit 67cb25
{
Packit 67cb25
Packit 67cb25
  size_t k, k1;
Packit 67cb25
Packit 67cb25
  const size_t m = n / factor;
Packit 67cb25
  const size_t q = n / product;
Packit 67cb25
  const size_t product_1 = product / factor;
Packit 67cb25
Packit 67cb25
  size_t e1, e2;
Packit 67cb25
Packit 67cb25
  const double d_theta = 2.0 * M_PI / ((double) factor);
Packit 67cb25
  const ATOMIC cos_d_theta = cos (d_theta);
Packit 67cb25
  const ATOMIC sin_d_theta = sin (d_theta);
Packit 67cb25
Packit 67cb25
  for (k1 = 0; k1 < product_1; k1++)
Packit 67cb25
    {
Packit 67cb25
      /* compute z = W(factor) x, for x halfcomplex */
Packit 67cb25
Packit 67cb25
      ATOMIC dw_real = 1.0, dw_imag = 0.0;
Packit 67cb25
Packit 67cb25
      for (e1 = 0; e1 < factor; e1++)
Packit 67cb25
        {
Packit 67cb25
          ATOMIC sum_real = 0.0;
Packit 67cb25
          ATOMIC w_real = 1.0, w_imag = 0.0;
Packit 67cb25
Packit 67cb25
          if (e1 > 0)
Packit 67cb25
            {
Packit 67cb25
              ATOMIC tmp_real = dw_real * cos_d_theta - dw_imag * sin_d_theta;
Packit 67cb25
              ATOMIC tmp_imag = dw_real * sin_d_theta + dw_imag * cos_d_theta;
Packit 67cb25
              dw_real = tmp_real;
Packit 67cb25
              dw_imag = tmp_imag;
Packit 67cb25
            }
Packit 67cb25
Packit 67cb25
          for (e2 = 0; e2 <= factor - e2; e2++)
Packit 67cb25
            {
Packit 67cb25
              ATOMIC z_real, z_imag;
Packit 67cb25
Packit 67cb25
              if (e2 > 0)
Packit 67cb25
                {
Packit 67cb25
                  ATOMIC tmp_real = dw_real * w_real - dw_imag * w_imag;
Packit 67cb25
                  ATOMIC tmp_imag = dw_real * w_imag + dw_imag * w_real;
Packit 67cb25
                  w_real = tmp_real;
Packit 67cb25
                  w_imag = tmp_imag;
Packit 67cb25
                }
Packit 67cb25
Packit 67cb25
              if (e2 == 0)
Packit 67cb25
                {
Packit 67cb25
                  size_t from_idx = factor * k1 * q;
Packit 67cb25
                  z_real = VECTOR(in,istride,from_idx);
Packit 67cb25
                  z_imag = 0.0;
Packit 67cb25
                  sum_real += w_real * z_real - w_imag * z_imag;
Packit 67cb25
                }
Packit 67cb25
              else if (e2 == factor - e2)
Packit 67cb25
                {
Packit 67cb25
                  size_t from_idx = factor * q * k1 + 2 * e2 * q - 1;
Packit 67cb25
                  z_real = VECTOR(in,istride,from_idx);
Packit 67cb25
                  z_imag = 0.0;
Packit 67cb25
                  sum_real += w_real * z_real;
Packit 67cb25
                }
Packit 67cb25
              else
Packit 67cb25
                {
Packit 67cb25
                  size_t from_idx = factor * q * k1 + 2 * e2 * q - 1;
Packit 67cb25
                  z_real = VECTOR(in,istride,from_idx);
Packit 67cb25
                  z_imag = VECTOR(in,istride,from_idx + 1);
Packit 67cb25
                  sum_real += 2 * (w_real * z_real - w_imag * z_imag);
Packit 67cb25
                }
Packit 67cb25
Packit 67cb25
            }
Packit 67cb25
Packit 67cb25
          {
Packit 67cb25
            const size_t to_idx = q * k1 + e1 * m;
Packit 67cb25
            VECTOR(out,ostride,to_idx) = sum_real;
Packit 67cb25
          }
Packit 67cb25
        }
Packit 67cb25
    }
Packit 67cb25
Packit 67cb25
  if (q == 1)
Packit 67cb25
    return;
Packit 67cb25
Packit 67cb25
  for (k = 1; k < (q + 1) / 2; k++)
Packit 67cb25
    {
Packit 67cb25
      for (k1 = 0; k1 < product_1; k1++)
Packit 67cb25
        {
Packit 67cb25
Packit 67cb25
          ATOMIC dw_real = 1.0, dw_imag = 0.0;
Packit 67cb25
Packit 67cb25
          for (e1 = 0; e1 < factor; e1++)
Packit 67cb25
            {
Packit 67cb25
              ATOMIC z_real, z_imag;
Packit 67cb25
              ATOMIC sum_real = 0.0;
Packit 67cb25
              ATOMIC sum_imag = 0.0;
Packit 67cb25
              ATOMIC w_real = 1.0, w_imag = 0.0;
Packit 67cb25
Packit 67cb25
              if (e1 > 0)
Packit 67cb25
                {
Packit 67cb25
                  ATOMIC t_real = dw_real * cos_d_theta - dw_imag * sin_d_theta;
Packit 67cb25
                  ATOMIC t_imag = dw_real * sin_d_theta + dw_imag * cos_d_theta;
Packit 67cb25
                  dw_real = t_real;
Packit 67cb25
                  dw_imag = t_imag;
Packit 67cb25
                }
Packit 67cb25
Packit 67cb25
              for (e2 = 0; e2 < factor; e2++)
Packit 67cb25
                {
Packit 67cb25
Packit 67cb25
                  if (e2 > 0)
Packit 67cb25
                    {
Packit 67cb25
                      ATOMIC tmp_real = dw_real * w_real - dw_imag * w_imag;
Packit 67cb25
                      ATOMIC tmp_imag = dw_real * w_imag + dw_imag * w_real;
Packit 67cb25
                      w_real = tmp_real;
Packit 67cb25
                      w_imag = tmp_imag;
Packit 67cb25
                    }
Packit 67cb25
Packit 67cb25
                  if (e2 < factor - e2)
Packit 67cb25
                    {
Packit 67cb25
                      const size_t from0 = factor * k1 * q + 2 * k + 2 * e2 * q - 1;
Packit 67cb25
                      z_real = VECTOR(in,istride,from0);
Packit 67cb25
                      z_imag = VECTOR(in,istride,from0 + 1);
Packit 67cb25
                    }
Packit 67cb25
                  else
Packit 67cb25
                    {
Packit 67cb25
                      const size_t from0 = factor * k1 * q - 2 * k + 2 * (factor - e2) * q - 1;
Packit 67cb25
                      z_real = VECTOR(in,istride,from0);
Packit 67cb25
                      z_imag = -VECTOR(in,istride,from0 + 1);
Packit 67cb25
                    }
Packit 67cb25
Packit 67cb25
                  sum_real += w_real * z_real - w_imag * z_imag;
Packit 67cb25
                  sum_imag += w_real * z_imag + w_imag * z_real;
Packit 67cb25
                }
Packit 67cb25
Packit 67cb25
              if (k == 0 || e1 == 0)
Packit 67cb25
                {
Packit 67cb25
                  w_real = 1.0;
Packit 67cb25
                  w_imag = 0.0;
Packit 67cb25
                }
Packit 67cb25
              else
Packit 67cb25
                {
Packit 67cb25
                  size_t tskip = (q + 1) / 2 - 1;
Packit 67cb25
                  w_real = GSL_REAL(twiddle[k - 1 + tskip * (e1 - 1)]);
Packit 67cb25
                  w_imag = GSL_IMAG(twiddle[k - 1 + tskip * (e1 - 1)]);
Packit 67cb25
                }
Packit 67cb25
Packit 67cb25
              {
Packit 67cb25
                const size_t to0 = k1 * q + 2 * k + e1 * m - 1;
Packit 67cb25
                VECTOR(out,ostride,to0) = w_real * sum_real - w_imag * sum_imag;
Packit 67cb25
                VECTOR(out,ostride,to0 + 1) = w_real * sum_imag + w_imag * sum_real;
Packit 67cb25
              }
Packit 67cb25
Packit 67cb25
            }
Packit 67cb25
        }
Packit 67cb25
    }
Packit 67cb25
Packit 67cb25
Packit 67cb25
  if (q % 2 == 1)
Packit 67cb25
    return;
Packit 67cb25
Packit 67cb25
  {
Packit 67cb25
    double tw_arg = M_PI / ((double) factor);
Packit 67cb25
    ATOMIC cos_tw_arg = cos (tw_arg);
Packit 67cb25
    ATOMIC sin_tw_arg = sin (tw_arg);
Packit 67cb25
Packit 67cb25
    for (k1 = 0; k1 < product_1; k1++)
Packit 67cb25
      {
Packit 67cb25
Packit 67cb25
        ATOMIC dw_real = 1.0, dw_imag = 0.0;
Packit 67cb25
        ATOMIC tw_real = 1.0, tw_imag = 0.0;
Packit 67cb25
Packit 67cb25
        for (e1 = 0; e1 < factor; e1++)
Packit 67cb25
          {
Packit 67cb25
            ATOMIC w_real, w_imag, z_real, z_imag;
Packit 67cb25
Packit 67cb25
            ATOMIC sum_real = 0.0;
Packit 67cb25
Packit 67cb25
            if (e1 > 0)
Packit 67cb25
              {
Packit 67cb25
                ATOMIC tmp_real = tw_real * cos_tw_arg - tw_imag * sin_tw_arg;
Packit 67cb25
                ATOMIC tmp_imag = tw_real * sin_tw_arg + tw_imag * cos_tw_arg;
Packit 67cb25
                tw_real = tmp_real;
Packit 67cb25
                tw_imag = tmp_imag;
Packit 67cb25
              }
Packit 67cb25
Packit 67cb25
            w_real = tw_real;
Packit 67cb25
            w_imag = tw_imag;
Packit 67cb25
Packit 67cb25
            if (e1 > 0)
Packit 67cb25
              {
Packit 67cb25
                ATOMIC t_real = dw_real * cos_d_theta - dw_imag * sin_d_theta;
Packit 67cb25
                ATOMIC t_imag = dw_real * sin_d_theta + dw_imag * cos_d_theta;
Packit 67cb25
                dw_real = t_real;
Packit 67cb25
                dw_imag = t_imag;
Packit 67cb25
              }
Packit 67cb25
Packit 67cb25
            for (e2 = 0; e2 <= factor - e2 - 1; e2++)
Packit 67cb25
              {
Packit 67cb25
Packit 67cb25
                if (e2 > 0)
Packit 67cb25
                  {
Packit 67cb25
                    ATOMIC tmp_real = dw_real * w_real - dw_imag * w_imag;
Packit 67cb25
                    ATOMIC tmp_imag = dw_real * w_imag + dw_imag * w_real;
Packit 67cb25
                    w_real = tmp_real;
Packit 67cb25
                    w_imag = tmp_imag;
Packit 67cb25
                  }
Packit 67cb25
Packit 67cb25
Packit 67cb25
                if (e2 == factor - e2 - 1)
Packit 67cb25
                  {
Packit 67cb25
                    const size_t from0 = factor * k1 * q + q + 2 * e2 * q - 1;
Packit 67cb25
                    z_real = VECTOR(in,istride,from0);
Packit 67cb25
                    z_imag = 0.0;
Packit 67cb25
                    sum_real += w_real * z_real - w_imag * z_imag;
Packit 67cb25
                  }
Packit 67cb25
                else
Packit 67cb25
                  {
Packit 67cb25
                    const size_t from0 = factor * k1 * q + q + 2 * e2 * q - 1;
Packit 67cb25
                    z_real = VECTOR(in,istride,from0);
Packit 67cb25
                    z_imag = VECTOR(in,istride,from0 + 1);
Packit 67cb25
                    sum_real += 2 * (w_real * z_real - w_imag * z_imag);
Packit 67cb25
                  }
Packit 67cb25
Packit 67cb25
              }
Packit 67cb25
Packit 67cb25
            {
Packit 67cb25
              const size_t to0 = k1 * q + q + e1 * m - 1;
Packit 67cb25
              VECTOR(out,ostride,to0) = sum_real;
Packit 67cb25
            }
Packit 67cb25
          }
Packit 67cb25
      }
Packit 67cb25
  }
Packit 67cb25
  return;
Packit 67cb25
}