wrappers_r4d.c

/*****************************************************************************
! Copyright(C) 2006-2013 Intel Corporation. All Rights Reserved.
! 
! The source code, information  and  material ("Material") contained herein is
! owned  by Intel Corporation or its suppliers or licensors, and title to such
! Material remains  with Intel Corporation  or its suppliers or licensors. The
! Material  contains proprietary information  of  Intel or  its  suppliers and
! licensors. The  Material is protected by worldwide copyright laws and treaty
! provisions. No  part  of  the  Material  may  be  used,  copied, reproduced,
! modified, published, uploaded, posted, transmitted, distributed or disclosed
! in any way  without Intel's  prior  express written  permission. No  license
! under  any patent, copyright  or  other intellectual property rights  in the
! Material  is  granted  to  or  conferred  upon  you,  either  expressly,  by
! implication, inducement,  estoppel or  otherwise.  Any  license  under  such
! intellectual  property  rights must  be express  and  approved  by  Intel in
! writing.
! 
! *Third Party trademarks are the property of their respective owners.
! 
! Unless otherwise  agreed  by Intel  in writing, you may not remove  or alter
! this  notice or  any other notice embedded  in Materials by Intel or Intel's
! suppliers or licensors in any way.
!
!*****************************************************************************
! Content:
!    MKL Cluster DFT using FFTW interface (via wrappers)
!    example program (C-interface)
!
!    Forward-Backward 4D real-to-complex transform for double/single
!    precision data.
!
!*****************************************************************************
! Configuration parameters:
!    DFTI_FORWARD_DOMAIN = DFTI_REAL                         (obligatory)
!    DFTI_PRECISION      = DFTI_DOUBLE/DFTI_SINGLE           (obligatory)
!    DFTI_DIMENSION      = 4                                 (obligatory)
!    DFTI_LENGTHS        = {len[0],len[1],len[2],len[3]}     (obligatory)
!    DFTI_FORWARD_SCALE  = 1.0                               (default)
!    DFTI_BACKWARD_SCALE = 1.0/(len[0]*len[1]*len[2]*len[3]) (default=1.0)
!
!****************************************************************************/

#include <stdlib.h>
#include <math.h>
#include "rfftw_mpi.h"

#ifdef FFTW_ENABLE_FLOAT
    #define EPS 1.0E-6
#else
    #define EPS 1.0E-12
#endif

int main(int argc,char *argv[])
{

    fftw_real *local,*work;
    fftw_real *preal,t,err,g_err,scale;
    int i0,i1,i2,i3,PrS,PrR;
    rfftwnd_mpi_plan plan;

    int nx,nx_out,start_x,start_x_out,size;
    int len[4], len3_padded;
    int failure = 0;

    MPI_Init(&argc,&argv);
    MPI_Comm_size(MPI_COMM_WORLD,&PrS);
    MPI_Comm_rank(MPI_COMM_WORLD,&PrR);
    len[0]=64;
    len[1]=32;
    len[2]=80;
    len[3]=20;
    len3_padded = 2*(len[3]/2+1);

/*--- Usage of MPI FFTW for Real-to-Complex Multi-dimensional Transforms (work==NULL) n=4. rfftwnd_create_plan ---*/

    if (PrR==0) printf("Usage of MPI FFTW for Real-to-Complex Multi-dimensional Transforms (work==NULL) n=4.\nPlan = rfftwnd_mpi_create_plan(...)\n");
    if (PrR==0) printf("PrS=%d, lengths={%d,%d,%d,%d}\n",PrS,len[0],len[1],len[2],len[3]);

    plan=rfftwnd_mpi_create_plan(MPI_COMM_WORLD,4,len,FFTW_FORWARD,FFTW_ESTIMATE);

    if (PrR==0) printf("     CreatePlan for Forward....DONE\n");

    rfftwnd_mpi_local_sizes(plan,&nx,&start_x,&nx_out,&start_x_out,&size);
    if (PrR==0) printf("     LocalSizes................DONE\n");
    local=(fftw_real*)fftw_malloc(size*sizeof(fftw_complex));
    preal=(fftw_real*)local;
    srand(PrR*100);
    for (i0=0;i0<nx;i0++)
        for (i1=0;i1<len[1];i1++)
            for (i2=0;i2<len[2];i2++)
                for (i3=0;i3<len[3];i3++)
                    preal[i3+(i2+i1*len[2]+i0*len[1]*len[2])*len3_padded]=(fftw_real)rand()/RAND_MAX;

    rfftwnd_mpi(plan,1,local,NULL,FFTW_NORMAL_ORDER);
    if (PrR==0) printf("     Forward FFTW..............DONE\n");

    rfftwnd_mpi_destroy_plan(plan);
    if (PrR==0) printf("     Destroy plan for Forward..DONE\n");

    plan=rfftwnd_mpi_create_plan(MPI_COMM_WORLD,4,len,FFTW_BACKWARD,FFTW_ESTIMATE);
    if (PrR==0) printf("     CreatePlan for Backward...DONE\n");

    rfftwnd_mpi(plan,1,local,NULL,FFTW_NORMAL_ORDER);
    scale=1.0/len[1]/len[2]/len[3]/len[0];
    if (PrR==0) printf("     Backward FFTW.............DONE\n");

    for (i0=0;i0<nx;i0++)
        for (i1=0;i1<len[1];i1++)
            for (i2=0;i2<len[2];i2++)
                for (i3=0;i3<len[3];i3++)
                    preal[i3+(i2+i1*len[2]+i0*len[1]*len[2])*len3_padded]*=scale;

    rfftwnd_mpi_destroy_plan(plan);
    if (PrR==0) printf("     Destroy plan for Backward.DONE\n");
    srand(PrR*100);
    err=0.0;
    for (i0=0;i0<nx;i0++)
        for (i1=0;i1<len[1];i1++)
            for (i2=0;i2<len[2];i2++)
                for (i3=0;i3<len[3];i3++) {
                    t=fabs(preal[i3+(i2+i1*len[2]+i0*len[1]*len[2])*len3_padded]-(fftw_real)rand()/RAND_MAX);
                    if (t>err) err=t;
                }
    fftw_free(local);
#ifdef FFTW_ENABLE_FLOAT
    MPI_Reduce(&err,&g_err,1,MPI_FLOAT,MPI_MAX,0,MPI_COMM_WORLD);
#else
    MPI_Reduce(&err,&g_err,1,MPI_DOUBLE,MPI_MAX,0,MPI_COMM_WORLD);
#endif
    if (PrR==0) {
        printf("     Error=%e\n",g_err);
        if (g_err<EPS) {
            printf(" TEST OK\n\n");
        } else {
            printf(" TEST FAILED\n\n");
            failure++;
        }
    }

/*--- Usage of MPI FFTW for Real-to-Complex Multi-dimensional Transforms n=4. rfftwnd_create_plan ---*/

    if (PrR==0) printf("Usage of MPI FFTW for Real-to-Complex Multi-dimensional Transforms n=4.\nPlan = rfftwnd_mpi_create_plan(...)\n");
    if (PrR==0) printf("PrS=%d, lengths={%d,%d,%d,%d}\n",PrS,len[0],len[1],len[2],len[3]);
    plan=rfftwnd_mpi_create_plan(MPI_COMM_WORLD,4,len,FFTW_FORWARD,FFTW_ESTIMATE);
    if (PrR==0) printf("     CreatePlan for Forward....DONE\n");

    rfftwnd_mpi_local_sizes(plan,&nx,&start_x,&nx_out,&start_x_out,&size);
    if (PrR==0) printf("     LocalSizes................DONE\n");
    local=(fftw_real*)fftw_malloc(size*sizeof(fftw_complex));
    work=(fftw_real*)fftw_malloc(size*sizeof(fftw_complex));
    preal=(fftw_real*)local;

    srand(PrR*100);

    for (i0=0;i0<nx;i0++)
        for (i1=0;i1<len[1];i1++)
            for (i2=0;i2<len[2];i2++)
                for (i3=0;i3<len[3];i3++)
                    preal[i3+(i2+i1*len[2]+i0*len[1]*len[2])*len3_padded]=(fftw_real)rand()/RAND_MAX;

    rfftwnd_mpi(plan,1,local,work,FFTW_NORMAL_ORDER);
    if (PrR==0) printf("     Forward FFTW..............DONE\n");

    rfftwnd_mpi_destroy_plan(plan);
    if (PrR==0) printf("     Destroy plan for Forward..DONE\n");

    plan=rfftwnd_mpi_create_plan(MPI_COMM_WORLD,4,len,FFTW_BACKWARD,FFTW_ESTIMATE);
    if (PrR==0) printf("     CreatePlan for Backward...DONE\n");

    rfftwnd_mpi(plan,1,local,work,FFTW_NORMAL_ORDER);
    scale=1.0/len[1]/len[2]/len[3]/len[0];
    if (PrR==0) printf("     Backward FFTW.............DONE\n");

    for (i0=0;i0<nx;i0++)
        for (i1=0;i1<len[1];i1++)
            for (i2=0;i2<len[2];i2++)
                for (i3=0;i3<len[3];i3++)
                    preal[i3+(i2+i1*len[2]+i0*len[1]*len[2])*len3_padded]*=scale;

    rfftwnd_mpi_destroy_plan(plan);
    if (PrR==0) printf("     Destroy plan for Backward.DONE\n");
    srand(PrR*100);
    err=0.0;
    for (i0=0;i0<nx;i0++)
        for (i1=0;i1<len[1];i1++)
            for (i2=0;i2<len[2];i2++)
                for (i3=0;i3<len[3];i3++) {
                    t=fabs(preal[i3+(i2+i1*len[2]+i0*len[1]*len[2])*len3_padded]-(fftw_real)rand()/RAND_MAX);
                    if (t>err) err=t;
                }
    fftw_free(local);
    fftw_free(work);
#ifdef FFTW_ENABLE_FLOAT
    MPI_Reduce(&err,&g_err,1,MPI_FLOAT,MPI_MAX,0,MPI_COMM_WORLD);
#else
    MPI_Reduce(&err,&g_err,1,MPI_DOUBLE,MPI_MAX,0,MPI_COMM_WORLD);
#endif
    MPI_Finalize();

    if (PrR==0) {
        printf("     Error=%e\n",g_err);
        if (g_err<EPS) {
            printf(" TEST PASSED\n");
        } else {
            printf(" TEST FAILED\n");
            return 1;
        }
    }

    if (failure)
        return 1;

    if (PrR==0) printf(" END OF TEST\n");

    return 0;
}
For more complete information about compiler optimizations, see our Optimization Notice.