fasp/PreAMGSetupSA_8c_source.html

#include <math.h>

#include <time.h>


#ifdef _OPENMP

#include <omp.h>

#endif


#include "fasp.h"

#include "fasp_functs.h"


/*---------------------------------*/

/*--  Declare Private Functions  --*/

/*---------------------------------*/


#include "PreAMGAggregation.inl"

#include "PreAMGAggregationCSR.inl"


static SHORT amg_setup_smoothP_smoothR (AMG_data *, AMG_param *);

static SHORT amg_setup_smoothP_unsmoothR (AMG_data *, AMG_param *);

static void smooth_agg (dCSRmat *, dCSRmat *, dCSRmat *, AMG_param *, dCSRmat *);


/*---------------------------------*/

/*--      Public Functions       --*/

/*---------------------------------*/


/**
 * \fn SHORT fasp_amg_setup_sa (AMG_data *mgl, AMG_param *param)
 *
 * \brief Set up phase of smoothed aggregation AMG
 *
 * \param mgl    Pointer to AMG data: AMG_data
 * \param param  Pointer to AMG parameters: AMG_param
 *
 * \return       Status reported by the setup routine that was selected
 *
 * \note  This is only a dispatcher: when param->smooth_restriction is
 *        nonzero the smoothed-P/smoothed-R setup is run, otherwise the
 *        smoothed-P/unsmoothed-R setup is run.
 */
SHORT fasp_amg_setup_sa (AMG_data   *mgl,
                         AMG_param  *param)
{
    const SHORT prtlvl = param->print_level;
    SHORT       status;

    // Announce the setup phase unless output is switched off
    if ( prtlvl > PRINT_NONE ) printf("\nSetting up SA AMG ...\n");

#if DEBUG_MODE > 0
    printf("### DEBUG: [-Begin-] %s ...\n", __FUNCTION__);
    printf("### DEBUG: nr=%d, nc=%d, nnz=%d\n",
           mgl[0].A.row, mgl[0].A.col, mgl[0].A.nnz);
#endif

    // Default: smoothed P with smoothed R; alternative: smoothed P, unsmoothed R
    status = param->smooth_restriction
           ? amg_setup_smoothP_smoothR(mgl, param)
           : amg_setup_smoothP_unsmoothR(mgl, param);

#if DEBUG_MODE > 0
    printf("### DEBUG: [--End--] %s ...\n", __FUNCTION__);
#endif

    return status;
}


/*---------------------------------*/

/*--      Private Functions      --*/

/*---------------------------------*/


/**
 * \fn static void smooth_agg (dCSRmat *A, dCSRmat *tentp, dCSRmat *P,
 *                             AMG_param *param, dCSRmat *N)
 *
 * \brief Smooth the tentative prolongation: P = S * tentp
 *
 * \param A      Pointer to the coefficient matrix on the current level
 * \param tentp  Pointer to the tentative prolongation
 * \param P      Pointer to the resulting (smoothed) prolongation
 * \param param  Pointer to AMG parameters; reads smooth_filter and
 *               tentative_smooth
 * \param N      Pointer to the strongly coupled neighbourhood matrix; only
 *               read (and modified in place) when param->smooth_filter == ON
 *
 * \note  S has the sparsity pattern of M and entries
 *            S = I - tentative_smooth * D^{-1} * M,
 *        where M = A without filtering and M = filtered N with filtering,
 *        and D is the diagonal of M. Diagonal entries with magnitude
 *        below 1e-6 are replaced by 1.0 before dividing.
 */
static void smooth_agg (dCSRmat    *A,
                        dCSRmat    *tentp,
                        dCSRmat    *P,
                        AMG_param  *param,
                        dCSRmat    *N)
{
    const INT   nrow  = A->row;
    const INT   ncol  = A->col;
    const REAL  omega = param->tentative_smooth;

    dCSRmat    *M = A;   // matrix the damped Jacobi smoother is built from
    dCSRmat     S;       // smoother S = I - omega * D^{-1} * M
    dvector     diag;    // diagonal entries of M
    INT         i, k;

    /* Step 1. Form smoother */

    if ( param->smooth_filter == ON ) {

        REAL offdiag_A, offdiag_N;

        /* Form filtered A and store in N: shift every diagonal entry of N by
           the difference of the off-diagonal row sums of A and N */
#ifdef _OPENMP
#pragma omp parallel for private(k, offdiag_A, offdiag_N) if (nrow>OPENMP_HOLDS)
#endif
        for ( i = 0; i < nrow; ++i ) {

            offdiag_A = 0.0;
            for ( k = A->IA[i]; k < A->IA[i+1]; ++k ) {
                if ( A->JA[k] != i ) offdiag_A += A->val[k];
            }

            offdiag_N = 0.0;
            for ( k = N->IA[i]; k < N->IA[i+1]; ++k ) {
                if ( N->JA[k] != i ) offdiag_N += N->val[k];
            }

            for ( k = N->IA[i]; k < N->IA[i+1]; ++k ) {
                // The original paper has a wrong sign!!! --Chensong
                if ( N->JA[k] == i ) N->val[k] += offdiag_A - offdiag_N;
            }
        }

        // From here on the smoother is built from the filtered matrix
        M = N;
    }

    // copy the sparsity structure of M into S
    S = fasp_dcsr_create(nrow, ncol, M->IA[nrow]);

#ifdef _OPENMP
#pragma omp parallel for if(nrow>OPENMP_HOLDS)
#endif
    for ( i = 0; i <= nrow; ++i ) S.IA[i] = M->IA[i];

    for ( i = 0; i < S.IA[S.row]; ++i ) S.JA[i] = M->JA[i];

    // get the diagonal entries of M
    fasp_dcsr_getdiag(0, M, &diag);

    // check the diagonal entries:
    // if one is too small, use Richardson smoother for the corresponding row
#ifdef _OPENMP
#pragma omp parallel for if(nrow>OPENMP_HOLDS)
#endif
    for ( i = 0; i < nrow; ++i ) {
        if ( ABS(diag.val[i]) < 1e-6 ) diag.val[i] = 1.0;
    }

    // fill in the values of S row by row
#ifdef _OPENMP
#pragma omp parallel for if(nrow>OPENMP_HOLDS) private(k)
#endif
    for ( i = 0; i < nrow; ++i ) {
        for ( k = S.IA[i]; k < S.IA[i+1]; ++k ) {
            const REAL scaled = omega * M->val[k] / diag.val[i];
            S.val[k] = ( S.JA[k] == i ) ? 1 - scaled : -scaled;
        }
    }

    fasp_dvec_free(&diag);

    /* Step 2. Smooth the tentative prolongation P = S*tentp */
    fasp_blas_dcsr_mxm(&S, tentp, P); // Note: think twice about this.
    P->nnz = P->IA[P->row];

    fasp_dcsr_free(&S);
}


/**
 * \fn static SHORT amg_setup_smoothP_smoothR (AMG_data *mgl, AMG_param *param)
 *
 * \brief Setup phase of smoothed aggregation AMG, using smoothed P and smoothed R
 *
 * \param mgl    Pointer to AMG data: AMG_data; mgl[0].A must hold the fine
 *               level matrix, coarser levels are filled in by this routine
 * \param param  Pointer to AMG parameters: AMG_param; ILU_levels, SWZ_levels,
 *               pair_number and amli_coef may be modified
 *
 * \return       FASP_SUCCESS, or the (non-negative) status of the last
 *               aggregation step; a failed aggregation only stops coarsening
 *
 * \note  On every level: aggregate, build the tentative prolongation, smooth
 *        it into P, set R = P^T and form the coarse matrix R*A*P. Coarsening
 *        stops when the matrix is small enough, max_levels is reached,
 *        aggregation fails, or one of the coarsening-quality checks rejects
 *        the newly built P (in which case that level is not created).
 */
static SHORT amg_setup_smoothP_smoothR (AMG_data   *mgl,
                                        AMG_param  *param)
{
    const SHORT prtlvl     = param->print_level;
    const SHORT cycle_type = param->cycle_type;
    const SHORT csolver    = param->coarse_solver;
    // INT rather than SHORT: this bound is compared with INT row counts and
    // must not be narrowed when param->coarse_dof is large
    const INT   min_cdof   = MAX(param->coarse_dof,50);
    const INT   m          = mgl[0].A.row;

    // local variables
    SHORT       max_levels = param->max_levels, lvl = 0, status = FASP_SUCCESS;
    INT         i, j;
    REAL        setup_start, setup_end;
    ILU_param   iluparam;
    SWZ_param   swzparam;

#if DEBUG_MODE > 0
    printf("### DEBUG: [-Begin-] %s ...\n", __FUNCTION__);
#endif

    fasp_gettime(&setup_start);

    // level info (fine: 0; coarse: 1)
    ivector *vertices = (ivector *)fasp_mem_calloc(max_levels,sizeof(ivector));

    // each level stores the information of the number of aggregations
    INT *num_aggs = (INT *)fasp_mem_calloc(max_levels,sizeof(INT));

    // each level stores the information of the strongly coupled neighbourhood
    dCSRmat *Neighbor = (dCSRmat *)fasp_mem_calloc(max_levels,sizeof(dCSRmat));

    // each level stores the information of the tentative prolongations
    dCSRmat *tentp = (dCSRmat *)fasp_mem_calloc(max_levels,sizeof(dCSRmat));

    // Initialize level information
    for ( i = 0; i < max_levels; ++i ) num_aggs[i] = 0;

    // Near kernel space: a single constant vector of ones
    mgl[0].near_kernel_dim   = 1;
    mgl[0].near_kernel_basis = (REAL **)fasp_mem_calloc(mgl->near_kernel_dim,sizeof(REAL*));

    for ( i = 0; i < mgl->near_kernel_dim; ++i ) {
        mgl[0].near_kernel_basis[i] = (REAL *)fasp_mem_calloc(m,sizeof(REAL));
        for ( j = 0; j < m; ++j ) mgl[0].near_kernel_basis[i][j] = 1.0;
    }

    // Initialize ILU parameters
    mgl->ILU_levels = param->ILU_levels;
    if ( param->ILU_levels > 0 ) {
        iluparam.print_level = param->print_level;
        iluparam.ILU_lfil    = param->ILU_lfil;
        iluparam.ILU_droptol = param->ILU_droptol;
        iluparam.ILU_relax   = param->ILU_relax;
        iluparam.ILU_type    = param->ILU_type;
    }

    // Initialize Schwarz parameters
    mgl->SWZ_levels = param->SWZ_levels;
    if ( param->SWZ_levels > 0 ) {
        swzparam.SWZ_mmsize = param->SWZ_mmsize;
        swzparam.SWZ_maxlvl = param->SWZ_maxlvl;
        swzparam.SWZ_type   = param->SWZ_type;
        swzparam.SWZ_blksolver = param->SWZ_blksolver;
    }

    // Initialize AMLI coefficients
    if ( cycle_type == AMLI_CYCLE ) {
        const INT amlideg = param->amli_degree;
        param->amli_coef = (REAL *)fasp_mem_calloc(amlideg+1,sizeof(REAL));
        REAL lambda_max = 2.0, lambda_min = lambda_max/4;
        fasp_amg_amli_coef(lambda_max, lambda_min, amlideg, param->amli_coef);
    }

#if DIAGONAL_PREF
    fasp_dcsr_diagpref(&mgl[0].A); // reorder each row to make diagonal appear first
#endif

    /*----------------------------*/
    /*--- checking aggregation ---*/
    /*----------------------------*/
    if ( param->aggregation_type == PAIRWISE )
        param->pair_number = MIN(param->pair_number, max_levels);

    // Main AMG setup loop
    while ( (mgl[lvl].A.row > min_cdof) && (lvl < max_levels-1) ) {

#if DEBUG_MODE > 2
        printf("### DEBUG: level = %d, row = %d, nnz = %d\n",
               lvl, mgl[lvl].A.row, mgl[lvl].A.nnz);
#endif

        /*-- setup ILU decomposition if necessary */
        if ( lvl < param->ILU_levels ) {
            status = fasp_ilu_dcsr_setup(&mgl[lvl].A, &mgl[lvl].LU, &iluparam);
            if ( status < 0 ) {
                if ( prtlvl > PRINT_MIN ) {
                    printf("### WARNING: ILU setup on level-%d failed!\n", lvl);
                    printf("### WARNING: Disable ILU for level >= %d.\n", lvl);
                }
                param->ILU_levels = lvl;
            }
        }

        /* -- setup Schwarz smoother if necessary */
        if ( lvl < param->SWZ_levels ) {
            mgl[lvl].Schwarz.A = fasp_dcsr_sympart(&mgl[lvl].A);
            fasp_dcsr_shift(&(mgl[lvl].Schwarz.A), 1);
            status = fasp_swz_dcsr_setup(&mgl[lvl].Schwarz, &swzparam);
            if ( status < 0 ) {
                if ( prtlvl > PRINT_MIN ) {
                    printf("### WARNING: Schwarz on level-%d failed!\n", lvl);
                    printf("### WARNING: Disable Schwarz for level >= %d.\n", lvl);
                }
                param->SWZ_levels = lvl;
            }
        }

        /*-- Aggregation --*/
        status = aggregation_vmb(&mgl[lvl].A, &vertices[lvl], param, lvl+1,
                                 &Neighbor[lvl], &num_aggs[lvl]);

        // Check 1: Did coarsening step succeed?
        if ( status < 0 ) {
            // When error happens, stop at the current multigrid level!
            if ( prtlvl > PRINT_MIN ) {
                printf("### WARNING: Forming aggregates on level-%d failed!\n", lvl);
            }
            status = FASP_SUCCESS;
            fasp_ivec_free(&vertices[lvl]);
            fasp_dcsr_free(&Neighbor[lvl]);
            break;
        }

        /* -- Form Tentative prolongation --*/
        form_tentative_p(&vertices[lvl], &tentp[lvl], mgl[0].near_kernel_basis,
                         num_aggs[lvl]);

        /* -- Form smoothed prolongation -- */
        smooth_agg(&mgl[lvl].A, &tentp[lvl], &mgl[lvl].P, param, &Neighbor[lvl]);

        // Check 2: Is coarse space too small?
        if ( mgl[lvl].P.col < MIN_CDOF ) {
            fasp_ivec_free(&vertices[lvl]);
            fasp_dcsr_free(&Neighbor[lvl]);
            fasp_dcsr_free(&tentp[lvl]);
            break;
        }

        // Check 3: Is this coarsening step too aggressive?
        if ( mgl[lvl].P.row > mgl[lvl].P.col * MAX_CRATE ) {
            if ( prtlvl > PRINT_MIN ) {
                printf("### WARNING: Coarsening might be too aggressive!\n");
                printf("### WARNING: Fine level = %d, coarse level = %d. Discard!\n",
                       mgl[lvl].P.row, mgl[lvl].P.col);
            }
            fasp_ivec_free(&vertices[lvl]);
            fasp_dcsr_free(&Neighbor[lvl]);
            fasp_dcsr_free(&tentp[lvl]);
            break;
        }

        // Check 4: Is this coarsening ratio too small?
        // This must look at the P that was just built for the current level,
        // i.e. before lvl is advanced; evaluated after ++lvl it would read the
        // prolongation of a level that has not been set up yet. Rejecting here
        // (before R and the coarse matrix exist) really discards the level, as
        // the message says and as the unsmoothed-R setup does.
        if ( (REAL)mgl[lvl].P.col > mgl[lvl].P.row * MIN_CRATE ) {
            if ( prtlvl > PRINT_MIN ) {
                printf("### WARNING: Coarsening rate is too small!\n");
                printf("### WARNING: Fine level = %d, coarse level = %d. Discard!\n",
                       mgl[lvl].P.row, mgl[lvl].P.col);
            }
            fasp_ivec_free(&vertices[lvl]);
            fasp_dcsr_free(&Neighbor[lvl]);
            fasp_dcsr_free(&tentp[lvl]);
            break;
        }

        /*-- Form restriction --*/
        fasp_dcsr_trans(&mgl[lvl].P, &mgl[lvl].R);

        /*-- Form coarse level stiffness matrix --*/
        fasp_blas_dcsr_rap(&mgl[lvl].R, &mgl[lvl].A, &mgl[lvl].P, &mgl[lvl+1].A);

        // Per-level work data is no longer needed once the coarse matrix exists
        fasp_dcsr_free(&Neighbor[lvl]);
        fasp_dcsr_free(&tentp[lvl]);
        fasp_ivec_free(&vertices[lvl]);

        ++lvl;

#if DIAGONAL_PREF
        // reorder each row to make diagonal appear first
        fasp_dcsr_diagpref(&mgl[lvl].A);
#endif

    } // end of the main while loop

    // Setup coarse level systems for direct solvers
    switch (csolver) {

#if WITH_MUMPS
        case SOLVER_MUMPS: {
            // Setup MUMPS direct solver on the coarsest level
            mgl[lvl].mumps.job = 1;
            fasp_solver_mumps_steps(&mgl[lvl].A, &mgl[lvl].b, &mgl[lvl].x, &mgl[lvl].mumps);
            break;
        }
#endif

#if WITH_UMFPACK
        case SOLVER_UMFPACK: {
            // Need to sort the matrix A for UMFPACK to work
            dCSRmat Ac_tran;
            Ac_tran = fasp_dcsr_create(mgl[lvl].A.row, mgl[lvl].A.col, mgl[lvl].A.nnz);
            fasp_dcsr_transz(&mgl[lvl].A, NULL, &Ac_tran);
            // It is equivalent to do transpose and then sort
            //     fasp_dcsr_trans(&mgl[lvl].A, &Ac_tran);
            //     fasp_dcsr_sort(&Ac_tran);
            fasp_dcsr_cp(&Ac_tran, &mgl[lvl].A);
            fasp_dcsr_free(&Ac_tran);
            mgl[lvl].Numeric = fasp_umfpack_factorize(&mgl[lvl].A, 0);
            break;
        }
#endif

#if WITH_PARDISO
        case SOLVER_PARDISO: {
             fasp_dcsr_sort(&mgl[lvl].A);
             fasp_pardiso_factorize(&mgl[lvl].A, &mgl[lvl].pdata, prtlvl);
             break;
         }
#endif

        default:
            // Do nothing!
            break;
    }

    // setup total level number and current level
    mgl[0].num_levels = max_levels = lvl+1;
    mgl[0].w          = fasp_dvec_create(m);

    // A failed ILU/Schwarz setup lowers param->ILU_levels / param->SWZ_levels
    // inside the loop; refresh the level-0 record so it does not keep the
    // value stored before the loop (same formula as for lvl >= 1 below).
    mgl[0].ILU_levels = param->ILU_levels;
    mgl[0].SWZ_levels = param->SWZ_levels;

    for ( lvl = 1; lvl < max_levels; ++lvl) {
        INT mm = mgl[lvl].A.row;
        mgl[lvl].num_levels = max_levels;
        mgl[lvl].b          = fasp_dvec_create(mm);
        mgl[lvl].x          = fasp_dvec_create(mm);

        mgl[lvl].cycle_type = cycle_type; // initialize cycle type!
        mgl[lvl].ILU_levels = param->ILU_levels - lvl; // initialize ILU levels!
        mgl[lvl].SWZ_levels = param->SWZ_levels -lvl; // initialize Schwarz!

        // work space: nonlinear AMLI needs three vectors, other cycles two
        if ( cycle_type == NL_AMLI_CYCLE )
            mgl[lvl].w = fasp_dvec_create(3*mm);
        else
            mgl[lvl].w = fasp_dvec_create(2*mm);
    }

#if MULTI_COLOR_ORDER
    INT Colors,rowmax;
#ifdef _OPENMP
    int threads = fasp_get_num_threads();
    if (threads  > max_levels-1  ) threads = max_levels-1;
    // num_threads() requires a positive value; a one-level hierarchy would
    // otherwise request zero threads
    if (threads  < 1 ) threads = 1;
#pragma omp parallel for private(lvl,rowmax,Colors) schedule(static, 1) num_threads(threads)
#endif
    for (lvl=0; lvl<max_levels-1; lvl++){

#if 1
        dCSRmat_Multicoloring(&mgl[lvl].A, &rowmax, &Colors);
#else
        dCSRmat_Multicoloring_Theta(&mgl[lvl].A, mgl[lvl].GS_Theta, &rowmax, &Colors);
#endif
        if ( prtlvl > 1 )
            printf("mgl[%3d].A.row = %12d, rowmax = %5d, rowavg = %7.2lf, colors = %5d, Theta = %le.\n",
            lvl, mgl[lvl].A.row, rowmax, (double)mgl[lvl].A.nnz/mgl[lvl].A.row,
            mgl[lvl].A.color, mgl[lvl].GS_Theta);
    }
#endif

    if ( prtlvl > PRINT_NONE ) {
        fasp_gettime(&setup_end);
        fasp_amgcomplexity(mgl,prtlvl);
        fasp_cputime("Smoothed aggregation setup", setup_end - setup_start);
    }

    // Release the per-level bookkeeping arrays (their contents were freed
    // level by level inside the loop)
    fasp_mem_free(vertices); vertices = NULL;
    fasp_mem_free(num_aggs); num_aggs = NULL;
    fasp_mem_free(Neighbor); Neighbor = NULL;
    fasp_mem_free(tentp);    tentp    = NULL;

#if DEBUG_MODE > 0
    printf("### DEBUG: [--End--] %s ...\n", __FUNCTION__);
#endif

    return status;
}


/**
 * \fn static SHORT amg_setup_smoothP_unsmoothR (AMG_data *mgl, AMG_param *param)
 *
 * \brief Setup phase of smoothed aggregation AMG, using smoothed P and
 *        tentative (unsmoothed) transfer operators for the coarse matrix
 *
 * \param mgl    Pointer to AMG data: AMG_data; mgl[0].A must hold the fine
 *               level matrix, coarser levels are filled in by this routine
 * \param param  Pointer to AMG parameters: AMG_param; ILU_levels, SWZ_levels
 *               and amli_coef may be modified
 *
 * \return       FASP_SUCCESS, or the (non-negative) status of the last
 *               aggregation step; a failed aggregation only stops coarsening
 *
 * \note  On every level: aggregate, build the tentative prolongation, smooth
 *        it into mgl[lvl].P and store its transpose in mgl[lvl].R. The coarse
 *        matrix is formed with fasp_blas_dcsr_rap_agg from the tentative
 *        prolongation and its transpose. Coarsening stops when the matrix is
 *        small enough, max_levels is reached, aggregation fails, or one of
 *        the coarsening-quality checks rejects the newly built P.
 */
static SHORT amg_setup_smoothP_unsmoothR (AMG_data   *mgl,
                                          AMG_param  *param)
{
    const SHORT prtlvl     = param->print_level;
    const SHORT cycle_type = param->cycle_type;
    const SHORT csolver    = param->coarse_solver;
    // INT rather than SHORT: this bound is compared with INT row counts and
    // must not be narrowed when param->coarse_dof is large
    const INT   min_cdof   = MAX(param->coarse_dof,50);
    const INT   m          = mgl[0].A.row;

    // local variables
    SHORT       max_levels = param->max_levels, lvl = 0, status = FASP_SUCCESS;
    INT         i, j;
    REAL        setup_start, setup_end;
    ILU_param   iluparam;
    SWZ_param   swzparam;

#if DEBUG_MODE > 0
    printf("### DEBUG: [-Begin-] %s ...\n", __FUNCTION__);
#endif

    fasp_gettime(&setup_start);

    // level info (fine: 0; coarse: 1)
    ivector *vertices = (ivector *)fasp_mem_calloc(max_levels,sizeof(ivector));

    // each level stores the information of the number of aggregations
    INT *num_aggs = (INT *)fasp_mem_calloc(max_levels,sizeof(INT));

    // each level stores the information of the strongly coupled neighbourhood
    dCSRmat *Neighbor = (dCSRmat *)fasp_mem_calloc(max_levels,sizeof(dCSRmat));

    // each level stores the information of the tentative prolongations
    // and of their transposes
    dCSRmat *tentp = (dCSRmat *)fasp_mem_calloc(max_levels,sizeof(dCSRmat));
    dCSRmat *tentr = (dCSRmat *)fasp_mem_calloc(max_levels,sizeof(dCSRmat));

    // Initialize level information
    for ( i = 0; i < max_levels; ++i ) num_aggs[i] = 0;

    // Near kernel space: a single constant vector of ones
    mgl[0].near_kernel_dim   = 1;
    mgl[0].near_kernel_basis = (REAL **)fasp_mem_calloc(mgl->near_kernel_dim,sizeof(REAL*));

    for ( i = 0; i < mgl->near_kernel_dim; ++i ) {
        mgl[0].near_kernel_basis[i] = (REAL *)fasp_mem_calloc(m,sizeof(REAL));
        for ( j = 0; j < m; ++j ) mgl[0].near_kernel_basis[i][j] = 1.0;
    }

    // Initialize ILU parameters
    // (level 0 is recorded here as well, in line with the Schwarz setting
    //  below and with the smoothed-R setup routine)
    mgl->ILU_levels = param->ILU_levels;
    if ( param->ILU_levels > 0 ) {
        iluparam.print_level = param->print_level;
        iluparam.ILU_lfil    = param->ILU_lfil;
        iluparam.ILU_droptol = param->ILU_droptol;
        iluparam.ILU_relax   = param->ILU_relax;
        iluparam.ILU_type    = param->ILU_type;
    }

    // Initialize Schwarz parameters
    mgl->SWZ_levels = param->SWZ_levels;
    if ( param->SWZ_levels > 0 ) {
        swzparam.SWZ_mmsize = param->SWZ_mmsize;
        swzparam.SWZ_maxlvl = param->SWZ_maxlvl;
        swzparam.SWZ_type   = param->SWZ_type;
        swzparam.SWZ_blksolver = param->SWZ_blksolver;
    }

    // Initialize AMLI coefficients
    if ( cycle_type == AMLI_CYCLE ) {
        const INT amlideg = param->amli_degree;
        param->amli_coef = (REAL *)fasp_mem_calloc(amlideg+1,sizeof(REAL));
        REAL lambda_max = 2.0, lambda_min = lambda_max/4;
        fasp_amg_amli_coef(lambda_max, lambda_min, amlideg, param->amli_coef);
    }

    // Main AMG setup loop
    while ( (mgl[lvl].A.row > min_cdof) && (lvl < max_levels-1) ) {

        /*-- setup ILU decomposition if necessary */
        if ( lvl < param->ILU_levels ) {
            status = fasp_ilu_dcsr_setup(&mgl[lvl].A, &mgl[lvl].LU, &iluparam);
            if ( status < 0 ) {
                if ( prtlvl > PRINT_MIN ) {
                    printf("### WARNING: ILU setup on level-%d failed!\n", lvl);
                    printf("### WARNING: Disable ILU for level >= %d.\n", lvl);
                }
                param->ILU_levels = lvl;
            }
        }

        /* -- setup Schwarz smoother if necessary */
        if ( lvl < param->SWZ_levels ) {
            mgl[lvl].Schwarz.A = fasp_dcsr_sympart(&mgl[lvl].A);
            fasp_dcsr_shift(&(mgl[lvl].Schwarz.A), 1);
            status = fasp_swz_dcsr_setup(&mgl[lvl].Schwarz, &swzparam);
            if ( status < 0 ) {
                if ( prtlvl > PRINT_MIN ) {
                    printf("### WARNING: Schwarz on level-%d failed!\n", lvl);
                    printf("### WARNING: Disable Schwarz for level >= %d.\n", lvl);
                }
                param->SWZ_levels = lvl;
            }
        }

        /*-- Aggregation --*/
        status = aggregation_vmb(&mgl[lvl].A, &vertices[lvl], param, lvl+1,
                                 &Neighbor[lvl], &num_aggs[lvl]);

        // Check 1: Did coarsening step succeed?
        if ( status < 0 ) {
            // When error happens, stop at the current multigrid level!
            if ( prtlvl > PRINT_MIN ) {
                printf("### WARNING: Stop coarsening on level=%d!\n", lvl);
            }
            status = FASP_SUCCESS;
            // release whatever the failed aggregation left behind
            fasp_ivec_free(&vertices[lvl]);
            fasp_dcsr_free(&Neighbor[lvl]);
            break;
        }

        /* -- Form Tentative prolongation --*/
        form_tentative_p(&vertices[lvl], &tentp[lvl], mgl[0].near_kernel_basis,
                         num_aggs[lvl]);

        /* -- Form smoothed prolongation -- */
        smooth_agg(&mgl[lvl].A, &tentp[lvl], &mgl[lvl].P, param, &Neighbor[lvl]);

        // Check 2: Is coarse space too small?
        if ( mgl[lvl].P.col < MIN_CDOF ) {
            fasp_ivec_free(&vertices[lvl]);
            fasp_dcsr_free(&Neighbor[lvl]);
            fasp_dcsr_free(&tentp[lvl]);
            break;
        }

        // Check 3: Is this coarsening step too aggressive?
        if ( mgl[lvl].P.row > mgl[lvl].P.col * MAX_CRATE ) {
            if ( prtlvl > PRINT_MIN ) {
                printf("### WARNING: Coarsening might be too aggressive!\n");
                printf("### WARNING: Fine level = %d, coarse level = %d. Discard!\n",
                       mgl[lvl].P.row, mgl[lvl].P.col);
            }
            fasp_ivec_free(&vertices[lvl]);
            fasp_dcsr_free(&Neighbor[lvl]);
            fasp_dcsr_free(&tentp[lvl]);
            break;
        }

        // Check 4: Is this coarsening ratio too small?
        if ( (REAL)mgl[lvl].P.col > mgl[lvl].P.row * MIN_CRATE ) {
            if ( prtlvl > PRINT_MIN ) {
                printf("### WARNING: Coarsening rate is too small!\n");
                printf("### WARNING: Fine level = %d, coarse level = %d. Discard!\n",
                       mgl[lvl].P.row, mgl[lvl].P.col);
            }
            fasp_ivec_free(&vertices[lvl]);
            fasp_dcsr_free(&Neighbor[lvl]);
            fasp_dcsr_free(&tentp[lvl]);
            break;
        }

        /*-- Form restriction --*/
        fasp_dcsr_trans(&mgl[lvl].P, &mgl[lvl].R);
        fasp_dcsr_trans(&tentp[lvl], &tentr[lvl]);

        /*-- Form coarse level stiffness matrix --*/
        fasp_blas_dcsr_rap_agg(&tentr[lvl], &mgl[lvl].A, &tentp[lvl], &mgl[lvl+1].A);

        // Per-level work data is no longer needed once the coarse matrix
        // exists; tentr[lvl] in particular is only an input of the product
        // above and must be released here, since freeing the tentr array at
        // the end does not free the matrices stored in it.
        fasp_dcsr_free(&Neighbor[lvl]);
        fasp_dcsr_free(&tentp[lvl]);
        fasp_dcsr_free(&tentr[lvl]);
        fasp_ivec_free(&vertices[lvl]);

        ++lvl;
    }

    // Setup coarse level systems for direct solvers
    switch (csolver) {

#if WITH_MUMPS
        case SOLVER_MUMPS: {
            // Setup MUMPS direct solver on the coarsest level
            mgl[lvl].mumps.job = 1;
            fasp_solver_mumps_steps(&mgl[lvl].A, &mgl[lvl].b, &mgl[lvl].x, &mgl[lvl].mumps);
            break;
        }
#endif

#if WITH_UMFPACK
        case SOLVER_UMFPACK: {
            // Need to sort the matrix A for UMFPACK to work
            dCSRmat Ac_tran;
            Ac_tran = fasp_dcsr_create(mgl[lvl].A.row, mgl[lvl].A.col, mgl[lvl].A.nnz);
            fasp_dcsr_transz(&mgl[lvl].A, NULL, &Ac_tran);
            // It is equivalent to do transpose and then sort
            //     fasp_dcsr_trans(&mgl[lvl].A, &Ac_tran);
            //     fasp_dcsr_sort(&Ac_tran);
            fasp_dcsr_cp(&Ac_tran, &mgl[lvl].A);
            fasp_dcsr_free(&Ac_tran);
            mgl[lvl].Numeric = fasp_umfpack_factorize(&mgl[lvl].A, 0);
            break;
        }
#endif

#if WITH_PARDISO
        case SOLVER_PARDISO: {
             fasp_dcsr_sort(&mgl[lvl].A);
             fasp_pardiso_factorize(&mgl[lvl].A, &mgl[lvl].pdata, prtlvl);
             break;
         }
#endif

        default:
            // Do nothing!
            break;
    }

    // setup total level number and current level
    mgl[0].num_levels = max_levels = lvl+1;
    mgl[0].w          = fasp_dvec_create(m);

    // A failed ILU/Schwarz setup lowers param->ILU_levels / param->SWZ_levels
    // inside the loop; refresh the level-0 record so it does not keep the
    // value stored before the loop (same formula as for lvl >= 1 below).
    mgl[0].ILU_levels = param->ILU_levels;
    mgl[0].SWZ_levels = param->SWZ_levels;

    for ( lvl = 1; lvl < max_levels; ++lvl) {
        INT mm = mgl[lvl].A.row;
        mgl[lvl].num_levels = max_levels;
        mgl[lvl].b          = fasp_dvec_create(mm);
        mgl[lvl].x          = fasp_dvec_create(mm);

        mgl[lvl].cycle_type     = cycle_type; // initialize cycle type!
        mgl[lvl].ILU_levels     = param->ILU_levels - lvl; // initialize ILU levels!
        mgl[lvl].SWZ_levels = param->SWZ_levels -lvl; // initialize Schwarz!

        // work space: nonlinear AMLI needs three vectors, other cycles two
        if ( cycle_type == NL_AMLI_CYCLE )
            mgl[lvl].w = fasp_dvec_create(3*mm);
        else
            mgl[lvl].w = fasp_dvec_create(2*mm);
    }

#if MULTI_COLOR_ORDER
    INT Colors,rowmax;
#ifdef _OPENMP
    int threads = fasp_get_num_threads();
    if (threads  > max_levels-1  ) threads = max_levels-1;
    // num_threads() requires a positive value; a one-level hierarchy would
    // otherwise request zero threads
    if (threads  < 1 ) threads = 1;
#pragma omp parallel for private(lvl,rowmax,Colors) schedule(static, 1) num_threads(threads)
#endif
    for (lvl=0; lvl<max_levels-1; lvl++){

#if 1
        dCSRmat_Multicoloring(&mgl[lvl].A, &rowmax, &Colors);
#else
        dCSRmat_Multicoloring_Theta(&mgl[lvl].A, mgl[lvl].GS_Theta, &rowmax, &Colors);
#endif
        if ( prtlvl > 1 )
            printf("mgl[%3d].A.row = %12d, rowmax = %5d, rowavg = %7.2lf, colors = %5d, Theta = %le.\n",
            lvl, mgl[lvl].A.row, rowmax, (double)mgl[lvl].A.nnz/mgl[lvl].A.row,
            mgl[lvl].A.color, mgl[lvl].GS_Theta);
    }
#endif

    if ( prtlvl > PRINT_NONE ) {
        fasp_gettime(&setup_end);
        fasp_amgcomplexity(mgl,prtlvl);
        fasp_cputime("Smoothed aggregation 1/2 setup", setup_end - setup_start);
    }

    // Release the per-level bookkeeping arrays (their contents were freed
    // level by level inside the loop)
    fasp_mem_free(vertices); vertices = NULL;
    fasp_mem_free(num_aggs); num_aggs = NULL;
    fasp_mem_free(Neighbor); Neighbor = NULL;
    fasp_mem_free(tentp);    tentp    = NULL;
    fasp_mem_free(tentr);    tentr    = NULL;

#if DEBUG_MODE > 0
    printf("### DEBUG: [--End--] %s ...\n", __FUNCTION__);
#endif

    return status;
}


/*---------------------------------*/

/*--        End of File          --*/

/*---------------------------------*/

fasp_mem_free
void fasp_mem_free(void *mem)
Free up previously allocated memory body and set pointer to NULL.
Definition: AuxMemory.c:152

fasp_mem_calloc
void * fasp_mem_calloc(const unsigned int size, const unsigned int type)
Allocate, initiate, and check memory.
Definition: AuxMemory.c:65

fasp_cputime
void fasp_cputime(const char *message, const REAL cputime)
Print CPU walltime.
Definition: AuxMessage.c:179

fasp_amgcomplexity
void fasp_amgcomplexity(const AMG_data *mgl, const SHORT prtlvl)
Print level and complexity information of AMG.
Definition: AuxMessage.c:84

fasp_gettime
void fasp_gettime(REAL *time)
Get system time.
Definition: AuxTiming.c:37

fasp_dvec_free
void fasp_dvec_free(dvector *u)
Free vector data space of REAL type.
Definition: AuxVector.c:145

fasp_ivec_free
void fasp_ivec_free(ivector *u)
Free vector data space of INT type.
Definition: AuxVector.c:164

fasp_dvec_create
dvector fasp_dvec_create(const INT m)
Create dvector data space of REAL type.
Definition: AuxVector.c:62

fasp_ilu_dcsr_setup
SHORT fasp_ilu_dcsr_setup(dCSRmat *A, ILU_data *iludata, ILU_param *iluparam)
Get ILU decomposition of a CSR matrix A.
Definition: BlaILUSetupCSR.c:40

fasp_swz_dcsr_setup
INT fasp_swz_dcsr_setup(SWZ_data *swzdata, SWZ_param *swzparam)
Setup phase for the Schwarz methods.
Definition: BlaSchwarzSetup.c:46

fasp_dcsr_diagpref
void fasp_dcsr_diagpref(dCSRmat *A)
Re-order the column and data arrays of a CSR matrix, so that the first entry in each row is the diagonal entry.
Definition: BlaSparseCSR.c:680

fasp_dcsr_create
dCSRmat fasp_dcsr_create(const INT m, const INT n, const INT nnz)
Create CSR sparse matrix data memory space.
Definition: BlaSparseCSR.c:47

fasp_dcsr_shift
void fasp_dcsr_shift(dCSRmat *A, const INT offset)
Re-index a REAL matrix in CSR format to make the index starting from 0 or 1.
Definition: BlaSparseCSR.c:1212

dCSRmat_Multicoloring_Theta
void dCSRmat_Multicoloring_Theta(dCSRmat *A, REAL theta, INT *rowmax, INT *groups)
Use the greedy multicoloring algorithm to get color groups for the adjacency graph of A.
Definition: BlaSparseCSR.c:1984

fasp_dcsr_free
void fasp_dcsr_free(dCSRmat *A)
Free CSR sparse matrix data memory space.
Definition: BlaSparseCSR.c:184

fasp_dcsr_transz
void fasp_dcsr_transz(dCSRmat *A, INT *p, dCSRmat *AT)
Generalized transpose of A: (n x m) matrix given in dCSRmat format.
Definition: BlaSparseCSR.c:1416

fasp_dcsr_sort
void fasp_dcsr_sort(dCSRmat *A)
Sort each row of A in ascending order w.r.t. column indices.
Definition: BlaSparseCSR.c:385

dCSRmat_Multicoloring
void dCSRmat_Multicoloring(dCSRmat *A, INT *rowmax, INT *groups)
Use the greedy multicoloring algorithm to get color groups for the adjacency graph of A.
Definition: BlaSparseCSR.c:1687

fasp_dcsr_cp
void fasp_dcsr_cp(const dCSRmat *A, dCSRmat *B)
copy a dCSRmat to a new one B=A
Definition: BlaSparseCSR.c:851

fasp_dcsr_getdiag
void fasp_dcsr_getdiag(INT n, const dCSRmat *A, dvector *diag)
Get first n diagonal entries of a CSR matrix A.
Definition: BlaSparseCSR.c:537

fasp_dcsr_sympart
dCSRmat fasp_dcsr_sympart(dCSRmat *A)
Get symmetric part of a dCSRmat matrix.
Definition: BlaSparseCSR.c:1357

fasp_dcsr_trans
INT fasp_dcsr_trans(const dCSRmat *A, dCSRmat *AT)
Find transpose of dCSRmat matrix A.
Definition: BlaSparseCSR.c:952

fasp_blas_dcsr_mxm
void fasp_blas_dcsr_mxm(const dCSRmat *A, const dCSRmat *B, dCSRmat *C)
Sparse matrix multiplication C=A*B.
Definition: BlaSpmvCSR.c:893

fasp_blas_dcsr_rap_agg
void fasp_blas_dcsr_rap_agg(const dCSRmat *R, const dCSRmat *A, const dCSRmat *P, dCSRmat *RAP)
Triple sparse matrix multiplication B=R*A*P (nonzeros of R, P = 1)
Definition: BlaSpmvCSR.c:1276

fasp_blas_dcsr_rap
void fasp_blas_dcsr_rap(const dCSRmat *R, const dCSRmat *A, const dCSRmat *P, dCSRmat *RAP)
Triple sparse matrix multiplication B=R*A*P.
Definition: BlaSpmvCSR.c:999

fasp_amg_setup_sa
SHORT fasp_amg_setup_sa(AMG_data *mgl, AMG_param *param)
Set up phase of smoothed aggregation AMG.
Definition: PreAMGSetupSA.c:63

fasp_amg_amli_coef
void fasp_amg_amli_coef(const REAL lambda_max, const REAL lambda_min, const INT degree, REAL *coef)
Compute the coefficients of the polynomial used by AMLI-cycle.
Definition: PreMGRecurAMLI.c:791

fasp_solver_mumps_steps
int fasp_solver_mumps_steps(dCSRmat *ptrA, dvector *b, dvector *u, Mumps_data *mumps)
Solve Ax=b by MUMPS in three steps.
Definition: XtrMumps.c:196

fasp.h
Main header file for the FASP project.

MIN
#define MIN(a, b)
Definition: fasp.h:83

REAL
#define REAL
Definition: fasp.h:75

SHORT
#define SHORT
FASP integer and floating point numbers.
Definition: fasp.h:71

ABS
#define ABS(a)
Definition: fasp.h:84

MAX
#define MAX(a, b)
Definition of max, min, abs.
Definition: fasp.h:82

INT
#define INT
Definition: fasp.h:72

AMLI_CYCLE
#define AMLI_CYCLE
Definition: fasp_const.h:181

SOLVER_PARDISO
#define SOLVER_PARDISO
Definition: fasp_const.h:126

NL_AMLI_CYCLE
#define NL_AMLI_CYCLE
Definition: fasp_const.h:182

FASP_SUCCESS
#define FASP_SUCCESS
Definition of return status and error messages.
Definition: fasp_const.h:19

MAX_CRATE
#define MAX_CRATE
Definition: fasp_const.h:262

SOLVER_MUMPS
#define SOLVER_MUMPS
Definition: fasp_const.h:125

PAIRWISE
#define PAIRWISE
Definition of aggregation types.
Definition: fasp_const.h:170

SOLVER_UMFPACK
#define SOLVER_UMFPACK
Definition: fasp_const.h:124

MIN_CRATE
#define MIN_CRATE
Definition: fasp_const.h:261

ON
#define ON
Definition of switch.
Definition: fasp_const.h:67

PRINT_NONE
#define PRINT_NONE
Print level for all subroutines – not including DEBUG output.
Definition: fasp_const.h:73

MIN_CDOF
#define MIN_CDOF
Definition: fasp_const.h:260

PRINT_MIN
#define PRINT_MIN
Definition: fasp_const.h:74

AMG_data
Data for AMG methods.
Definition: fasp.h:804

AMG_data::near_kernel_dim
INT near_kernel_dim
dimension of the near kernel for SAMG
Definition: fasp.h:849

AMG_data::A
dCSRmat A
pointer to the matrix at level level_num
Definition: fasp.h:817

AMG_data::cycle_type
INT cycle_type
cycle type
Definition: fasp.h:869

AMG_data::mumps
Mumps_data mumps
data for MUMPS
Definition: fasp.h:866

AMG_data::Schwarz
SWZ_data Schwarz
data of Schwarz smoother
Definition: fasp.h:860

AMG_data::b
dvector b
pointer to the right-hand side at level level_num
Definition: fasp.h:826

AMG_data::near_kernel_basis
REAL ** near_kernel_basis
basis of near kernel space for SAMG
Definition: fasp.h:852

AMG_data::Numeric
void * Numeric
pointer to the numerical factorization from UMFPACK
Definition: fasp.h:834

AMG_data::ILU_levels
INT ILU_levels
number of levels that use the ILU smoother
Definition: fasp.h:843

AMG_data::SWZ_levels
INT SWZ_levels
number of levels that use the Schwarz smoother
Definition: fasp.h:857

AMG_data::x
dvector x
pointer to the iterative solution at level level_num
Definition: fasp.h:829

AMG_data::num_levels
SHORT num_levels
number of levels in use <= max_levels
Definition: fasp.h:812

AMG_data::w
dvector w
temporary work space
Definition: fasp.h:863

AMG_param
Parameters for AMG methods.
Definition: fasp.h:455

AMG_param::ILU_lfil
INT ILU_lfil
level of fill-in for ILUs and ILUk
Definition: fasp.h:566

AMG_param::ILU_relax
REAL ILU_relax
relaxation for ILUs
Definition: fasp.h:572

AMG_param::SWZ_mmsize
INT SWZ_mmsize
maximal block size
Definition: fasp.h:581

AMG_param::print_level
SHORT print_level
print level for AMG
Definition: fasp.h:461

AMG_param::SWZ_maxlvl
INT SWZ_maxlvl
maximal levels
Definition: fasp.h:584

AMG_param::aggregation_type
SHORT aggregation_type
aggregation type
Definition: fasp.h:518

AMG_param::smooth_filter
SHORT smooth_filter
switch for filtered matrix used for smoothing the tentative prolongation
Definition: fasp.h:554

AMG_param::amli_coef
REAL * amli_coef
coefficients of the polynomial used by AMLI cycle
Definition: fasp.h:509

AMG_param::ILU_levels
SHORT ILU_levels
number of levels that use the ILU smoother
Definition: fasp.h:560

AMG_param::coarse_solver
SHORT coarse_solver
coarse solver type
Definition: fasp.h:500

AMG_param::cycle_type
SHORT cycle_type
type of AMG cycle
Definition: fasp.h:476

AMG_param::amli_degree
SHORT amli_degree
degree of the polynomial used by AMLI cycle
Definition: fasp.h:506

AMG_param::ILU_type
SHORT ILU_type
ILU type for smoothing.
Definition: fasp.h:563

AMG_param::SWZ_blksolver
INT SWZ_blksolver
type of Schwarz block solver
Definition: fasp.h:590

AMG_param::SWZ_type
INT SWZ_type
type of Schwarz method
Definition: fasp.h:587

AMG_param::coarse_dof
INT coarse_dof
max number of coarsest level DOF
Definition: fasp.h:473

AMG_param::ILU_droptol
REAL ILU_droptol
drop tolerance for ILUt
Definition: fasp.h:569

AMG_param::tentative_smooth
REAL tentative_smooth
relaxation parameter for smoothing the tentative prolongation
Definition: fasp.h:551

AMG_param::SWZ_levels
INT SWZ_levels
number of levels that use the Schwarz smoother
Definition: fasp.h:578

AMG_param::pair_number
INT pair_number
number of pairwise matchings
Definition: fasp.h:542

AMG_param::max_levels
SHORT max_levels
max number of levels of AMG
Definition: fasp.h:470

AMG_param::smooth_restriction
SHORT smooth_restriction
smooth the restriction for SA methods or not
Definition: fasp.h:557

ILU_param
Parameters for ILU.
Definition: fasp.h:404

ILU_param::ILU_lfil
INT ILU_lfil
level of fill-in for ILUk
Definition: fasp.h:413

ILU_param::ILU_relax
REAL ILU_relax
add the sum of dropped elements to the diagonal element, in proportion to relax
Definition: fasp.h:419

ILU_param::print_level
SHORT print_level
print level
Definition: fasp.h:407

ILU_param::ILU_type
SHORT ILU_type
ILU type for decomposition.
Definition: fasp.h:410

ILU_param::ILU_droptol
REAL ILU_droptol
drop tolerance for ILUt
Definition: fasp.h:416

Mumps_data::job
INT job
work for MUMPS
Definition: fasp.h:615

SWZ_data::A
dCSRmat A
pointer to the original coefficient matrix
Definition: fasp.h:731

SWZ_param
Parameters for Schwarz method.
Definition: fasp.h:430

SWZ_param::SWZ_mmsize
INT SWZ_mmsize
maximal size of blocks
Definition: fasp.h:442

SWZ_param::SWZ_maxlvl
INT SWZ_maxlvl
maximal level for constructing the blocks
Definition: fasp.h:439

SWZ_param::SWZ_blksolver
INT SWZ_blksolver
type of Schwarz block solver
Definition: fasp.h:445

SWZ_param::SWZ_type
SHORT SWZ_type
type for Schwarz method
Definition: fasp.h:436

dCSRmat
Sparse matrix of REAL type in CSR format.
Definition: fasp.h:151

dCSRmat::col
INT col
number of columns of matrix A, n
Definition: fasp.h:157

dCSRmat::val
REAL * val
nonzero entries of A
Definition: fasp.h:169

dCSRmat::row
INT row
number of rows of matrix A, m
Definition: fasp.h:154

dCSRmat::IA
INT * IA
integer array of row pointers, the size is m+1
Definition: fasp.h:163

dCSRmat::nnz
INT nnz
number of nonzero entries
Definition: fasp.h:160

dCSRmat::JA
INT * JA
integer array of column indexes, the size is nnz
Definition: fasp.h:166

dvector
Vector with n entries of REAL type.
Definition: fasp.h:354

dvector::val
REAL * val
actual vector entries
Definition: fasp.h:360

ivector
Vector with n entries of INT type.
Definition: fasp.h:368