fasp/PreMGRecurAMLI_8c_source.html

#include <math.h>

#include <time.h>


#include "fasp.h"

#include "fasp_functs.h"


/*---------------------------------*/

/*--  Declare Private Functions  --*/

/*---------------------------------*/


#include "PreMGRecurAMLI.inl"

#include "PreMGSmoother.inl"

#include "PreMGUtil.inl"


/*---------------------------------*/

/*--      Public Functions       --*/

/*---------------------------------*/


/**
 * Recursive AMLI-cycle applied on level l of the multigrid hierarchy mgl.
 *
 * mgl    array of per-level AMG data; mgl[l] is treated as the fine level and
 *        mgl[l + 1] as the coarse level of this call
 * param  AMG parameters (smoother, AMLI degree and coefficients, coarse solver)
 * l      index of the current level
 *
 * On every level except the last one (l < mgl[l].num_levels - 1) the routine
 * pre-smooths, restricts the residual, performs amli_degree + 1 recursive
 * coarse solves combined through param->amli_coef, prolongates the (optionally
 * rescaled) correction and post-smooths.  On the last level the system is
 * handed to the solver selected by param->coarse_solver.
 */
void fasp_solver_amli(AMG_data* mgl, AMG_param* param, INT l)
{
    // settings read once from param
    const SHORT amg_kind   = param->AMG_type;
    const SHORT verbosity  = param->print_level;
    const SHORT smth_kind  = param->smoother;
    const SHORT smth_order = param->smooth_order;
    const SHORT crs_solver = param->coarse_solver;
    const SHORT poly_deg   = param->amli_degree;
    const REAL  weight     = param->relaxation;
    const REAL  crs_tol    = param->tol * 1e-4; // tolerance handed to the coarsest iterative solver
    const SHORT smth_deg   = param->polynomial_degree;

    REAL        scaling = 1.0;              // step length used in the prolongation
    REAL* const poly    = param->amli_coef; // AMLI polynomial coefficients

    // right-hand sides and iterates on the two levels involved
    dvector* const rhs_f = &mgl[l].b;
    dvector* const sol_f = &mgl[l].x;
    dvector* const rhs_c = &mgl[l + 1].b;
    dvector* const sol_c = &mgl[l + 1].x;

    // operators on the two levels and their row counts
    dCSRmat* const A_f = &mgl[l].A;
    dCSRmat* const A_c = &mgl[l + 1].A;
    const INT      n_f = A_f->row;
    const INT      n_c = A_c->row;

    INT* const      perm  = mgl[l].cfmark.val;        // ordering passed to the smoother
    ILU_data* const ilu   = &mgl[l].LU;               // ILU data of the fine level
    REAL* const     res_f = mgl[l].w.val;             // fine residual workspace
    REAL* const     res_c = mgl[l + 1].w.val + n_c;   // coarse workspace, offset by n_c entries

    // Schwarz options: only the block solver is filled in here
    SWZ_param swz_opts;
    if (param->SWZ_levels > 0) swz_opts.SWZ_blksolver = param->SWZ_blksolver;

#if DEBUG_MODE > 0
    printf("### DEBUG: [-Begin-] %s ...\n", __FUNCTION__);
    printf("### DEBUG: n=%d, nnz=%d\n", mgl[0].A.row, mgl[0].A.nnz);
#endif

    if (verbosity >= PRINT_MOST) printf("AMLI level %d, smoother %d.\n", l, smth_kind);

    if (l >= mgl[l].num_levels - 1) {

        // ---- last level: solve with the configured coarse solver ----
        switch (crs_solver) {

#if WITH_PARDISO
            case SOLVER_PARDISO:
                // Intel MKL PARDISO direct solve
                fasp_pardiso_solve(A_f, rhs_f, sol_f, &mgl[l].pdata, 0);
                break;
#endif

#if WITH_SuperLU
            case SOLVER_SUPERLU:
                // SuperLU direct solve
                fasp_solver_superlu(A_f, rhs_f, sol_f, 0);
                break;
#endif

#if WITH_UMFPACK
            case SOLVER_UMFPACK:
                // UMFPACK direct solve
                fasp_umfpack_solve(A_f, rhs_f, sol_f, mgl[l].Numeric, 0);
                break;
#endif

#if WITH_MUMPS
            case SOLVER_MUMPS:
                // MUMPS direct solve; job is set to 2 before the call
                mgl[l].mumps.job = 2;
                fasp_solver_mumps_steps(A_f, rhs_f, sol_f, &mgl[l].mumps);
                break;
#endif

            default:
                // fall back to the iterative coarse solver
                fasp_coarse_itsolver(A_f, rhs_f, sol_f, crs_tol, verbosity);
        }

    } else {

        INT k;

        // ---- pre-smoothing: ILU, then Schwarz, then the generic smoother ----
        if (l < mgl[l].ILU_levels) {
            fasp_smoother_dcsr_ilu(A_f, rhs_f, sol_f, ilu);
        } else if (l < mgl->SWZ_levels) {
            if (mgl[l].Schwarz.SWZ_type == SCHWARZ_SYMMETRIC) {
                fasp_dcsr_swz_forward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
                fasp_dcsr_swz_backward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
            } else {
                fasp_dcsr_swz_forward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
            }
        } else {
#if MULTI_COLOR_ORDER
            fasp_smoother_dcsr_gs_multicolor(sol_f, A_f, rhs_f, param->presmooth_iter, 1);
#else
            fasp_dcsr_presmoothing(smth_kind, A_f, rhs_f, sol_f, param->presmooth_iter,
                                   0, n_f - 1, 1, weight, smth_deg, smth_order, perm);
#endif
        }

        // ---- fine residual: res_f = rhs_f - A_f * sol_f ----
        fasp_darray_cp(n_f, rhs_f->val, res_f);
        fasp_blas_dcsr_aAxpy(-1.0, A_f, sol_f->val, res_f);

        // ---- restriction: rhs_c = R * res_f ----
        if (amg_kind == UA_AMG) {
            fasp_blas_dcsr_mxv_agg(&mgl[l].R, res_f, rhs_c->val);
        } else {
            fasp_blas_dcsr_mxv(&mgl[l].R, res_f, rhs_c->val);
        }

        // ---- coarse grid correction ----
        // keep the restricted residual; rhs_c is overwritten inside the loop
        fasp_darray_cp(n_c, rhs_c->val, res_c);

        // coefficients are visited from poly[poly_deg - 1] down to poly[0]
        for (k = poly_deg - 1; k >= 0; k--) {
            fasp_dvec_set(n_c, sol_c, 0.0);
            fasp_solver_amli(mgl, param, l + 1);

            // rhs_c = A_c * sol_c + (poly[k] / poly[poly_deg]) * res_c
            fasp_blas_dcsr_mxv(A_c, sol_c->val, rhs_c->val);
            fasp_blas_darray_axpy(n_c, poly[k] / poly[poly_deg], res_c, rhs_c->val);
        }

        // final coarse solve with the accumulated right-hand side
        fasp_dvec_set(n_c, sol_c, 0.0);
        fasp_solver_amli(mgl, param, l + 1);

        // ---- scale the correction ----
        fasp_blas_darray_ax(n_c, poly[poly_deg], sol_c->val);
        if (param->coarse_scaling == ON) {
            // scaling = (sol_c, res_c) / (A_c sol_c, sol_c), capped at 1
            scaling = fasp_blas_darray_dotprod(n_c, sol_c->val, res_c) /
                      fasp_blas_dcsr_vmv(A_c, sol_c->val, sol_c->val);
            scaling = MIN(scaling, 1.0);
        }

        // ---- prolongation: sol_f += scaling * P * sol_c ----
        if (amg_kind == UA_AMG) {
            fasp_blas_dcsr_aAxpy_agg(scaling, &mgl[l].P, sol_c->val, sol_f->val);
        } else {
            fasp_blas_dcsr_aAxpy(scaling, &mgl[l].P, sol_c->val, sol_f->val);
        }

        // ---- post-smoothing: same selection as above, sweeps reversed ----
        if (l < mgl[l].ILU_levels) {
            fasp_smoother_dcsr_ilu(A_f, rhs_f, sol_f, ilu);
        } else if (l < mgl->SWZ_levels) {
            if (mgl[l].Schwarz.SWZ_type == SCHWARZ_SYMMETRIC) {
                fasp_dcsr_swz_backward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
                fasp_dcsr_swz_forward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
            } else {
                fasp_dcsr_swz_backward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
            }
        } else {
#if MULTI_COLOR_ORDER
            fasp_smoother_dcsr_gs_multicolor(sol_f, A_f, rhs_f, param->postsmooth_iter, -1);
#else
            fasp_dcsr_postsmoothing(smth_kind, A_f, rhs_f, sol_f, param->postsmooth_iter,
                                    0, n_f - 1, -1, weight, smth_deg, smth_order, perm);
#endif
        }
    }

#if DEBUG_MODE > 0
    printf("### DEBUG: [--End--] %s ...\n", __FUNCTION__);
#endif
}


/**
 * Recursive nonlinear AMLI-cycle for CSR matrices.
 *
 * mgl         array of per-level AMG data; mgl[l] is the fine level of this
 *             call and mgl[l + 1] the coarse level
 * param       AMG parameters
 * l           index of the current level inside mgl
 * num_levels  number of levels counted from mgl[0]
 *
 * While l < num_levels - 1 the routine pre-smooths, restricts the residual,
 * obtains a coarse correction, prolongates it and post-smooths.  The coarse
 * correction is a plain recursive call when mgl[l + 1].cycle_type <= 1 and a
 * Kcycle GCG/GCR solve preconditioned by fasp_precond_namli otherwise.  On the
 * last level the solver chosen by param->coarse_solver is used.
 */
void fasp_solver_namli(AMG_data* mgl, AMG_param* param, INT l, INT num_levels)
{
    // settings read once from param
    const SHORT amg_kind   = param->AMG_type;
    const SHORT verbosity  = param->print_level;
    const SHORT smth_kind  = param->smoother;
    const SHORT smth_order = param->smooth_order;
    const SHORT crs_solver = param->coarse_solver;
    const REAL  weight     = param->relaxation;
    const REAL  crs_tol    = param->tol * 1e-4; // tolerance handed to the coarsest iterative solver
    const SHORT smth_deg   = param->polynomial_degree;

    // right-hand sides and iterates on the two levels involved
    dvector* const rhs_f = &mgl[l].b;
    dvector* const sol_f = &mgl[l].x;
    dvector* const rhs_c = &mgl[l + 1].b;
    dvector* const sol_c = &mgl[l + 1].x;

    // operators on the two levels and their row counts
    dCSRmat* const A_f = &mgl[l].A;
    dCSRmat* const A_c = &mgl[l + 1].A;
    const INT      n_f = A_f->row;
    const INT      n_c = A_c->row;

    INT* const      perm  = mgl[l].cfmark.val; // ordering passed to the smoother
    ILU_data* const ilu   = &mgl[l].LU;        // ILU data of the fine level
    REAL* const     res_f = mgl[l].w.val;      // fine residual workspace

    // coarse iterate for the Krylov solve, stored in the coarse workspace at offset n_c
    dvector krylov_sol;

    // Schwarz options: only the block solver is filled in here
    SWZ_param swz_opts;

    krylov_sol.row = n_c;
    krylov_sol.val = mgl[l + 1].w.val + n_c;

    if (param->SWZ_levels > 0) swz_opts.SWZ_blksolver = param->SWZ_blksolver;

#if DEBUG_MODE > 0
    printf("### DEBUG: [-Begin-] %s ...\n", __FUNCTION__);
    printf("### DEBUG: n=%d, nnz=%d\n", mgl[0].A.row, mgl[0].A.nnz);
#endif

    // note: the value printed as "level" is num_levels, not l
    if (verbosity >= PRINT_MOST)
        printf("Nonlinear AMLI level %d, smoother %d.\n", num_levels, smth_kind);

    if (l >= num_levels - 1) {

        // ---- last level: solve with the configured coarse solver ----
        switch (crs_solver) {

#if WITH_PARDISO
            case SOLVER_PARDISO:
                // Intel MKL PARDISO direct solve
                fasp_pardiso_solve(A_f, rhs_f, sol_f, &mgl[l].pdata, 0);
                break;
#endif

#if WITH_SuperLU
            case SOLVER_SUPERLU:
                // SuperLU direct solve
                fasp_solver_superlu(A_f, rhs_f, sol_f, 0);
                break;
#endif

#if WITH_UMFPACK
            case SOLVER_UMFPACK:
                // UMFPACK direct solve
                fasp_umfpack_solve(A_f, rhs_f, sol_f, mgl[l].Numeric, 0);
                break;
#endif

#if WITH_MUMPS
            case SOLVER_MUMPS:
                // MUMPS direct solve; job is set to 2 before the call
                mgl[l].mumps.job = 2;
                fasp_solver_mumps_steps(A_f, rhs_f, sol_f, &mgl[l].mumps);
                break;
#endif

            default:
                // fall back to the iterative coarse solver
                fasp_coarse_itsolver(A_f, rhs_f, sol_f, crs_tol, verbosity);
        }

    } else {

        // ---- pre-smoothing: ILU, then Schwarz, then the generic smoother ----
        if (l < mgl[l].ILU_levels) {
            fasp_smoother_dcsr_ilu(A_f, rhs_f, sol_f, ilu);
        } else if (l < mgl->SWZ_levels) {
            if (mgl[l].Schwarz.SWZ_type == SCHWARZ_SYMMETRIC) {
                fasp_dcsr_swz_forward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
                fasp_dcsr_swz_backward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
            } else {
                fasp_dcsr_swz_forward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
            }
        } else {
#if MULTI_COLOR_ORDER
            fasp_smoother_dcsr_gs_multicolor(sol_f, A_f, rhs_f, param->presmooth_iter, 1);
#else
            fasp_dcsr_presmoothing(smth_kind, A_f, rhs_f, sol_f, param->presmooth_iter,
                                   0, n_f - 1, 1, weight, smth_deg, smth_order, perm);
#endif
        }

        // ---- fine residual: res_f = rhs_f - A_f * sol_f ----
        fasp_darray_cp(n_f, rhs_f->val, res_f);
        fasp_blas_dcsr_aAxpy(-1.0, A_f, sol_f->val, res_f);

        // ---- restriction: rhs_c = R * res_f ----
        if (amg_kind == UA_AMG) {
            fasp_blas_dcsr_mxv_agg(&mgl[l].R, res_f, rhs_c->val);
        } else {
            fasp_blas_dcsr_mxv(&mgl[l].R, res_f, rhs_c->val);
        }

        // ---- coarse correction, starting from a zero iterate ----
        fasp_dvec_set(n_c, sol_c, 0.0);

        if (mgl[l + 1].cycle_type <= 1) {

            // single recursive call; the hierarchy is re-based at mgl[l + 1]
            fasp_solver_namli(&mgl[l + 1], param, 0, num_levels - 1);

        } else {

            // Krylov solve on the coarse level, preconditioned by the
            // nonlinear AMLI-cycle on the remaining levels
            precond_data pcdata;
            precond      pc;

            fasp_param_amg_to_prec(&pcdata, param);
            pcdata.maxit      = 1;
            pcdata.max_levels = num_levels - 1;
            pcdata.mgl_data   = &mgl[l + 1];

            pc.data = &pcdata;
            pc.fct  = fasp_precond_namli;

            // the Krylov routine iterates on a copy held in the workspace
            fasp_darray_cp(n_c, sol_c->val, krylov_sol.val);

            if (param->nl_amli_krylov_type == SOLVER_GCG) {
                Kcycle_dcsr_pgcg(A_c, rhs_c, &krylov_sol, &pc);
            } else {
                Kcycle_dcsr_pgcr(A_c, rhs_c, &krylov_sol, &pc);
            }

            fasp_darray_cp(n_c, krylov_sol.val, sol_c->val);
        }

        // ---- prolongation: sol_f += P * sol_c ----
        if (amg_kind == UA_AMG) {
            fasp_blas_dcsr_aAxpy_agg(1.0, &mgl[l].P, sol_c->val, sol_f->val);
        } else {
            fasp_blas_dcsr_aAxpy(1.0, &mgl[l].P, sol_c->val, sol_f->val);
        }

        // ---- post-smoothing: same selection as above, sweeps reversed ----
        if (l < mgl[l].ILU_levels) {
            fasp_smoother_dcsr_ilu(A_f, rhs_f, sol_f, ilu);
        } else if (l < mgl->SWZ_levels) {
            if (mgl[l].Schwarz.SWZ_type == SCHWARZ_SYMMETRIC) {
                fasp_dcsr_swz_backward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
                fasp_dcsr_swz_forward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
            } else {
                fasp_dcsr_swz_backward(&mgl[l].Schwarz, &swz_opts, sol_f, rhs_f);
            }
        } else {
#if MULTI_COLOR_ORDER
            fasp_smoother_dcsr_gs_multicolor(sol_f, A_f, rhs_f, param->postsmooth_iter, -1);
#else
            fasp_dcsr_postsmoothing(smth_kind, A_f, rhs_f, sol_f, param->postsmooth_iter,
                                    0, n_f - 1, -1, weight, smth_deg, smth_order, perm);
#endif
        }
    }

#if DEBUG_MODE > 0
    printf("### DEBUG: [--End--] %s ...\n", __FUNCTION__);
#endif
}


/**
 * Recursive nonlinear AMLI-cycle for BSR matrices.
 *
 * mgl         array of per-level BSR AMG data; mgl[l] is the fine level of
 *             this call and mgl[l + 1] the coarse level
 * param       AMG parameters
 * l           index of the current level inside mgl
 * num_levels  number of levels counted from mgl[0]
 *
 * While l < num_levels - 1 the routine pre-smooths, restricts the residual,
 * obtains a coarse correction, prolongates it and post-smooths.  On the second
 * coarsest level the correction is one direct recursive call; on finer levels
 * it is a variable-restart FGMRES solve preconditioned by
 * fasp_precond_dbsr_namli.  On the last level the matrix mgl[l].Ac is handed
 * to the solver chosen by param->coarse_solver.
 */
void fasp_solver_namli_bsr(AMG_data_bsr* mgl, AMG_param* param, INT l, INT num_levels)
{
    const SHORT prtlvl        = param->print_level;
    const SHORT smoother      = param->smoother;
    const SHORT coarse_solver = param->coarse_solver;
    const REAL  relax         = param->relaxation;
    // NOTE(review): used unscaled for the coarsest iterative solver, whereas
    // the CSR cycles in this file use param->tol * 1e-4 -- confirm intended.
    const REAL  tol           = param->tol;
    INT         i;

    dvector *b0 = &mgl[l].b, *e0 = &mgl[l].x;         // fine level b and x
    dvector *b1 = &mgl[l + 1].b, *e1 = &mgl[l + 1].x; // coarse level b and x

    dBSRmat*  A0 = &mgl[l].A;                         // fine level matrix
    dBSRmat*  A1 = &mgl[l + 1].A;                     // coarse level matrix
    const INT m0 = A0->ROW * A0->nb, m1 = A1->ROW * A1->nb; // vector lengths

    ILU_data* LU_level = &mgl[l].LU;   // fine level ILU decomposition
    REAL*     r        = mgl[l].w.val; // work array for the fine residual

    // Coarse iterate and right-hand side for the Krylov solve, stored in the
    // coarse work array at offsets m1 and 2*m1.
    dvector uH, bH;
    uH.row = m1;
    uH.val = mgl[l + 1].w.val + m1;
    bH.row = m1;
    bH.val = mgl[l + 1].w.val + 2 * m1;

#if DEBUG_MODE > 0
    printf("### DEBUG: [-Begin-] %s ...\n", __FUNCTION__);
    printf("### DEBUG: n=%d, nnz=%d\n", mgl[0].A.ROW, mgl[0].A.NNZ);
#endif

    if (prtlvl >= PRINT_MOST)
        printf("Nonlinear AMLI: level %d, smoother %d.\n", l, smoother);

    if (l < num_levels - 1) {

        // pre smoothing
        // NOTE(review): the direct recursive call below always passes l = 0
        // with a shifted mgl, so on that path this test compares 0 against
        // param->ILU_levels on every level -- confirm that is intended.
        if (l < param->ILU_levels) {
            fasp_smoother_dbsr_ilu(A0, b0, e0, LU_level);
        } else {
            const SHORT steps = param->presmooth_iter;

            if (steps > 0) {
                switch (smoother) {
                    case SMOOTHER_JACOBI:
                        for (i = 0; i < steps; i++)
                            fasp_smoother_dbsr_jacobi1(A0, b0, e0, mgl[l].diaginv.val);
                        break;
                    case SMOOTHER_GS:
                        // ascending sweeps using the stored block-diagonal inverses
                        for (i = 0; i < steps; i++)
                            fasp_smoother_dbsr_gs1(A0, b0, e0, ASCEND, NULL,
                                                   mgl[l].diaginv.val);
                        break;
                    case SMOOTHER_SOR:
                        for (i = 0; i < steps; i++)
                            fasp_smoother_dbsr_sor1(A0, b0, e0, ASCEND, NULL,
                                                    mgl[l].diaginv.val, relax);
                        break;
                    default:
                        printf("### ERROR: Unknown smoother type %d!\n", smoother);
                        fasp_chkerr(ERROR_SOLVER_TYPE, __FUNCTION__);
                }
            }
        }

        // form residual r = b - A x
        fasp_darray_cp(m0, b0->val, r);
        fasp_blas_dbsr_aAxpy(-1.0, A0, e0->val, r);

        // restriction b1 = R * r
        fasp_blas_dbsr_mxv(&mgl[l].R, r, b1->val);

        // call nonlinear AMLI-cycle recursively
        {
            fasp_dvec_set(m1, e1, 0.0);

            // The coarsest problem is solved exactly.
            // No need to call Krylov method on second coarsest level
            if (l == num_levels - 2) {
                fasp_solver_namli_bsr(&mgl[l + 1], param, 0, num_levels - 1);
            } else { // recursively call preconditioned Krylov method on coarse grid
                precond_data_bsr pcdata;
                precond          pc;
                // iteration cap for the coarse Krylov solve
                const INT        maxit = param->amli_degree + 1;

                fasp_param_amg_to_precbsr(&pcdata, param);
                pcdata.maxit      = 1;
                pcdata.max_levels = num_levels - 1;
                pcdata.mgl_data   = &mgl[l + 1];

                pc.data = &pcdata;
                pc.fct  = fasp_precond_dbsr_namli;

                // work on copies so b1/e1 stay available to the preconditioner
                fasp_darray_cp(m1, b1->val, bH.val);
                fasp_darray_cp(m1, e1->val, uH.val);

                // the solver's return value is not inspected
                fasp_solver_dbsr_pvfgmres(A1, &bH, &uH, &pc, param->tol,
                                          param->tol * 1e-8, maxit, MIN(maxit, 30), 1,
                                          PRINT_NONE);

                fasp_darray_cp(m1, bH.val, b1->val);
                fasp_darray_cp(m1, uH.val, e1->val);
            }
        }

        // prolongation e0 = e0 + P * e1
        fasp_blas_dbsr_aAxpy(1.0, &mgl[l].P, e1->val, e0->val);

        // post smoothing (same selection as pre smoothing, descending sweeps)
        if (l < param->ILU_levels) {
            fasp_smoother_dbsr_ilu(A0, b0, e0, LU_level);
        } else {
            const SHORT steps = param->postsmooth_iter;

            if (steps > 0) {
                switch (smoother) {
                    case SMOOTHER_JACOBI:
                        for (i = 0; i < steps; i++)
                            fasp_smoother_dbsr_jacobi1(A0, b0, e0, mgl[l].diaginv.val);
                        break;
                    case SMOOTHER_GS:
                        for (i = 0; i < steps; i++)
                            fasp_smoother_dbsr_gs1(A0, b0, e0, DESCEND, NULL,
                                                   mgl[l].diaginv.val);
                        break;
                    case SMOOTHER_SOR:
                        for (i = 0; i < steps; i++)
                            fasp_smoother_dbsr_sor1(A0, b0, e0, DESCEND, NULL,
                                                    mgl[l].diaginv.val, relax);
                        break;
                    default:
                        printf("### ERROR: Unknown smoother type %d!\n", smoother);
                        fasp_chkerr(ERROR_SOLVER_TYPE, __FUNCTION__);
                }
            }
        }

    }

    else { // coarsest level solver

        switch (coarse_solver) {

#if WITH_PARDISO
            case SOLVER_PARDISO:
                {
                    /* use Intel MKL PARDISO direct solver on the coarsest level */
                    fasp_pardiso_solve(&mgl[l].Ac, b0, e0, &mgl[l].pdata, 0);
                    break;
                }
#endif

#if WITH_SuperLU
            case SOLVER_SUPERLU:
                /* use SuperLU direct solver on the coarsest level */
                fasp_solver_superlu(&mgl[l].Ac, b0, e0, 0);
                break;
#endif

#if WITH_UMFPACK
            case SOLVER_UMFPACK:
                /* use UMFPACK direct solver on the coarsest level */
                fasp_umfpack_solve(&mgl[l].Ac, b0, e0, mgl[l].Numeric, 0);
                break;
#endif

#if WITH_MUMPS
            case SOLVER_MUMPS:
                /* use MUMPS direct solver on the coarsest level */
                mgl[l].mumps.job = 2;
                fasp_solver_mumps_steps(&mgl[l].Ac, b0, e0, &mgl[l].mumps);
                break;
#endif

            default:
                /* use iterative solver on the coarsest level */
                fasp_coarse_itsolver(&mgl[l].Ac, b0, e0, tol, prtlvl);
        }
    }

#if DEBUG_MODE > 0
    printf("### DEBUG: [--End--] %s ...\n", __FUNCTION__);
#endif
}


/**
 * Compute the coefficients of the polynomial used by the AMLI-cycle.
 *
 * lambda_max  upper spectral bound; used as a divisor
 * lambda_min  lower spectral bound; used as a divisor
 * degree      polynomial degree, must be >= 0
 * coef        output array, entries coef[0] .. coef[degree] are written
 *
 * Degrees 0 and 1 are given in closed form.  Higher degrees follow the
 * three-term recurrence
 *     q_k = a + (1 + b) * q_{k-1} - a * t * q_{k-1} - b * q_{k-2}
 * expressed on coefficient arrays.  The recurrence is evaluated iteratively
 * from k = 2 up to degree with one scratch allocation, instead of recursing
 * into both degree - 1 and degree - 2 on every call.
 *
 * A negative degree prints an error and calls fasp_chkerr.
 */
void fasp_amg_amli_coef(const REAL lambda_max,
                        const REAL lambda_min,
                        const INT  degree,
                        REAL*      coef)
{
    const REAL mu0 = 1.0 / lambda_max, mu1 = 1.0 / lambda_min;
    const REAL c = (sqrt(mu0) + sqrt(mu1)) * (sqrt(mu0) + sqrt(mu1));
    const REAL a = (4 * mu0 * mu1) / (c);

    const REAL kappa = lambda_max / lambda_min; // condition number
    const REAL delta = (sqrt(kappa) - 1.0) / (sqrt(kappa) + 1.0);
    const REAL b     = delta * delta;

    if (degree < 0) {
        printf("### ERROR: Wrong AMLI degree %d!\n", degree);
        fasp_chkerr(ERROR_INPUT_PAR, __FUNCTION__);
        return;
    }

    if (degree == 0) {
        coef[0] = 0.5 * (mu0 + mu1);
        return;
    }

    if (degree == 1) {
        coef[0] = 0.5 * c;
        coef[1] = -1.0 * mu0 * mu1;
        return;
    }

    {
        INT i, k;

        // Scratch layout (2*degree - 1 entries in total):
        //   q_km1 holds q_{k-1}, at most degree entries;
        //   q_km2 holds q_{k-2}, at most degree - 1 entries.
        REAL* work  = (REAL*)fasp_mem_calloc(2 * degree - 1, sizeof(REAL));
        REAL* q_km1 = work;
        REAL* q_km2 = work + degree;

        // seeds: q_0 and q_1
        q_km2[0] = 0.5 * (mu0 + mu1);
        q_km1[0] = 0.5 * c;
        q_km1[1] = -1.0 * mu0 * mu1;

        for (k = 2; k <= degree; k++) {

            // q_k is written into coef, which has room for degree + 1 entries
            coef[0] = a - b * q_km2[0] + (1 + b) * q_km1[0];

            for (i = 1; i < k - 1; i++) {
                coef[i] = -b * q_km2[i] + (1 + b) * q_km1[i] - a * q_km1[i - 1];
            }

            // the two leading coefficients have no q_{k-2} contribution
            coef[k - 1] = (1 + b) * q_km1[k - 1] - a * q_km1[k - 2];
            coef[k]     = -a * q_km1[k - 1];

            // shift the window for the next step: q_{k-1} -> q_{k-2}, q_k -> q_{k-1}
            if (k < degree) {
                for (i = 0; i < k; i++) q_km2[i] = q_km1[i];
                for (i = 0; i <= k; i++) q_km1[i] = coef[i];
            }
        }

        // clean memory
        fasp_mem_free(work);
    }

    return;
}


/*---------------------------------*/

/*--        End of File          --*/

/*---------------------------------*/

fasp_darray_cp
void fasp_darray_cp(const INT n, const REAL *x, REAL *y)
Copy an array to the other y=x.
Definition: AuxArray.c:210

fasp_mem_free
void fasp_mem_free(void *mem)
Free up previously allocated memory body and set pointer to NULL.
Definition: AuxMemory.c:152

fasp_mem_calloc
void * fasp_mem_calloc(const unsigned int size, const unsigned int type)
Allocate, initialize, and check memory.
Definition: AuxMemory.c:65

fasp_chkerr
void fasp_chkerr(const SHORT status, const char *fctname)
Check error status and print out error messages before quit.
Definition: AuxMessage.c:213

fasp_param_amg_to_prec
void fasp_param_amg_to_prec(precond_data *pcdata, const AMG_param *amgparam)
Set precond_data with AMG_param.
Definition: AuxParam.c:782

fasp_param_amg_to_precbsr
void fasp_param_amg_to_precbsr(precond_data_bsr *pcdata, const AMG_param *amgparam)
Set precond_data_bsr with AMG_param.
Definition: AuxParam.c:848

fasp_dvec_set
void fasp_dvec_set(INT n, dvector *x, const REAL val)
Initialize dvector x[i]=val for i=0:n-1.
Definition: AuxVector.c:222

fasp_blas_darray_dotprod
REAL fasp_blas_darray_dotprod(const INT n, const REAL *x, const REAL *y)
Inner product of two arrays x and y.
Definition: BlaArray.c:771

fasp_blas_darray_ax
void fasp_blas_darray_ax(const INT n, const REAL a, REAL *x)
x = a*x
Definition: BlaArray.c:43

fasp_blas_darray_axpy
void fasp_blas_darray_axpy(const INT n, const REAL a, const REAL *x, REAL *y)
y = a*x + y
Definition: BlaArray.c:90

fasp_dcsr_swz_forward
void fasp_dcsr_swz_forward(SWZ_data *swzdata, SWZ_param *swzparam, dvector *x, dvector *b)
Schwarz smoother: forward sweep.
Definition: BlaSchwarzSetup.c:218

fasp_dcsr_swz_backward
void fasp_dcsr_swz_backward(SWZ_data *swzdata, SWZ_param *swzparam, dvector *x, dvector *b)
Schwarz smoother: backward sweep.
Definition: BlaSchwarzSetup.c:328

fasp_blas_dbsr_aAxpy
void fasp_blas_dbsr_aAxpy(const REAL alpha, const dBSRmat *A, const REAL *x, REAL *y)
Compute y := alpha*A*x + y.
Definition: BlaSpmvBSR.c:514

fasp_blas_dbsr_mxv
void fasp_blas_dbsr_mxv(const dBSRmat *A, const REAL *x, REAL *y)
Compute y := A*x.
Definition: BlaSpmvBSR.c:1055

fasp_blas_dcsr_mxv_agg
void fasp_blas_dcsr_mxv_agg(const dCSRmat *A, const REAL *x, REAL *y)
Matrix-vector multiplication y = A*x (nonzeros of A = 1)
Definition: BlaSpmvCSR.c:438

fasp_blas_dcsr_mxv
void fasp_blas_dcsr_mxv(const dCSRmat *A, const REAL *x, REAL *y)
Matrix-vector multiplication y = A*x.
Definition: BlaSpmvCSR.c:242

fasp_blas_dcsr_aAxpy_agg
void fasp_blas_dcsr_aAxpy_agg(const REAL alpha, const dCSRmat *A, const REAL *x, REAL *y)
Matrix-vector multiplication y = alpha*A*x + y (nonzeros of A = 1)
Definition: BlaSpmvCSR.c:727

fasp_blas_dcsr_vmv
REAL fasp_blas_dcsr_vmv(const dCSRmat *A, const REAL *x, const REAL *y)
vector-Matrix-vector multiplication alpha = y'*A*x
Definition: BlaSpmvCSR.c:839

fasp_blas_dcsr_aAxpy
void fasp_blas_dcsr_aAxpy(const REAL alpha, const dCSRmat *A, const REAL *x, REAL *y)
Matrix-vector multiplication y = alpha*A*x + y.
Definition: BlaSpmvCSR.c:494

fasp_smoother_dbsr_gs1
void fasp_smoother_dbsr_gs1(dBSRmat *A, dvector *b, dvector *u, INT order, INT *mark, REAL *diaginv)
Gauss-Seidel relaxation.
Definition: ItrSmootherBSR.c:520

fasp_smoother_dbsr_gs_descend1
void fasp_smoother_dbsr_gs_descend1(dBSRmat *A, dvector *b, dvector *u)
Gauss-Seidel relaxation in the descending order.
Definition: ItrSmootherBSR.c:751

fasp_smoother_dbsr_jacobi1
void fasp_smoother_dbsr_jacobi1(dBSRmat *A, dvector *b, dvector *u, REAL *diaginv)
Jacobi relaxation.
Definition: ItrSmootherBSR.c:263

fasp_smoother_dbsr_gs_ascend1
void fasp_smoother_dbsr_gs_ascend1(dBSRmat *A, dvector *b, dvector *u)
Gauss-Seidel relaxation in the ascending order.
Definition: ItrSmootherBSR.c:619

fasp_smoother_dbsr_ilu
void fasp_smoother_dbsr_ilu(dBSRmat *A, dvector *b, dvector *x, void *data)
ILU method as the smoother in solving Au=b with multigrid method.
Definition: ItrSmootherBSR.c:1479

fasp_smoother_dbsr_sor1
void fasp_smoother_dbsr_sor1(dBSRmat *A, dvector *b, dvector *u, INT order, INT *mark, REAL *diaginv, REAL weight)
SOR relaxation.
Definition: ItrSmootherBSR.c:1075

fasp_smoother_dcsr_ilu
void fasp_smoother_dcsr_ilu(dCSRmat *A, dvector *b, dvector *x, void *data)
ILU method as a smoother.
Definition: ItrSmootherCSR.c:1279

fasp_solver_dbsr_pvfgmres
INT fasp_solver_dbsr_pvfgmres(dBSRmat *A, dvector *b, dvector *x, precond *pc, const REAL tol, const REAL abstol, const INT MaxIt, const SHORT restart, const SHORT StopType, const SHORT PrtLvl)
Solve "Ax=b" using PFGMRES(right preconditioned) iterative method in which the restart parameter can ...
Definition: KryPvfgmres.c:386

fasp_precond_dbsr_namli
void fasp_precond_dbsr_namli(REAL *r, REAL *z, void *data)
Nonlinear AMLI-cycle AMG preconditioner.
Definition: PreBSR.c:1294

fasp_precond_namli
void fasp_precond_namli(REAL *r, REAL *z, void *data)
Nonlinear AMLI AMG preconditioner.
Definition: PreCSR.c:515

fasp_solver_namli
void fasp_solver_namli(AMG_data *mgl, AMG_param *param, INT l, INT num_levels)
Solve Ax=b with recursive nonlinear AMLI-cycle.
Definition: PreMGRecurAMLI.c:291

fasp_amg_amli_coef
void fasp_amg_amli_coef(const REAL lambda_max, const REAL lambda_min, const INT degree, REAL *coef)
Compute the coefficients of the polynomial used by AMLI-cycle.
Definition: PreMGRecurAMLI.c:791

fasp_solver_namli_bsr
void fasp_solver_namli_bsr(AMG_data_bsr *mgl, AMG_param *param, INT l, INT num_levels)
Solve Ax=b with recursive nonlinear AMLI-cycle.
Definition: PreMGRecurAMLI.c:528

fasp_solver_amli
void fasp_solver_amli(AMG_data *mgl, AMG_param *param, INT l)
Solve Ax=b with recursive AMLI-cycle.
Definition: PreMGRecurAMLI.c:58

fasp_solver_mumps_steps
int fasp_solver_mumps_steps(dCSRmat *ptrA, dvector *b, dvector *u, Mumps_data *mumps)
Solve Ax=b by MUMPS in three steps.
Definition: XtrMumps.c:196

fasp_solver_superlu
int fasp_solver_superlu(dCSRmat *ptrA, dvector *b, dvector *u, const SHORT prtlvl)
Solve Au=b by SuperLU.
Definition: XtrSuperlu.c:47

fasp.h
Main header file for the FASP project.

MIN
#define MIN(a, b)
Definition: fasp.h:83

REAL
#define REAL
Definition: fasp.h:75

SHORT
#define SHORT
FASP integer and floating point numbers.
Definition: fasp.h:71

INT
#define INT
Definition: fasp.h:72

SMOOTHER_SOR
#define SMOOTHER_SOR
Definition: fasp_const.h:195

SOLVER_PARDISO
#define SOLVER_PARDISO
Definition: fasp_const.h:126

SMOOTHER_JACOBI
#define SMOOTHER_JACOBI
Definition: fasp_const.h:190

PRINT_MOST
#define PRINT_MOST
Definition: fasp_const.h:77

ASCEND
#define ASCEND
Definition: fasp_const.h:249

SOLVER_MUMPS
#define SOLVER_MUMPS
Definition: fasp_const.h:125

ERROR_SOLVER_TYPE
#define ERROR_SOLVER_TYPE
Definition: fasp_const.h:41

SOLVER_SUPERLU
#define SOLVER_SUPERLU
Definition: fasp_const.h:123

SCHWARZ_SYMMETRIC
#define SCHWARZ_SYMMETRIC
Definition: fasp_const.h:158

SMOOTHER_GS
#define SMOOTHER_GS
Definition: fasp_const.h:191

SOLVER_UMFPACK
#define SOLVER_UMFPACK
Definition: fasp_const.h:124

DESCEND
#define DESCEND
Definition: fasp_const.h:250

ERROR_INPUT_PAR
#define ERROR_INPUT_PAR
Definition: fasp_const.h:24

ON
#define ON
Definition of switch.
Definition: fasp_const.h:67

PRINT_NONE
#define PRINT_NONE
Print level for all subroutines – not including DEBUG output.
Definition: fasp_const.h:73

SOLVER_GCG
#define SOLVER_GCG
Definition: fasp_const.h:109

UA_AMG
#define UA_AMG
Definition: fasp_const.h:165

AMG_data_bsr
Data for multigrid levels in dBSRmat format.
Definition: fasp_block.h:146

AMG_data_bsr::A
dBSRmat A
pointer to the matrix at level level_num
Definition: fasp_block.h:155

AMG_data_bsr::mumps
Mumps_data mumps
data for MUMPS
Definition: fasp_block.h:245

AMG_data_bsr::b
dvector b
pointer to the right-hand side at level level_num
Definition: fasp_block.h:164

AMG_data_bsr::x
dvector x
pointer to the iterative solution at level level_num
Definition: fasp_block.h:167

AMG_data_bsr::w
dvector w
temporary work space
Definition: fasp_block.h:242

AMG_data_bsr::LU
ILU_data LU
ILU matrix for ILU smoother.
Definition: fasp_block.h:220

AMG_data
Data for AMG methods.
Definition: fasp.h:804

AMG_data::A
dCSRmat A
pointer to the matrix at level level_num
Definition: fasp.h:817

AMG_data::mumps
Mumps_data mumps
data for MUMPS
Definition: fasp.h:866

AMG_data::b
dvector b
pointer to the right-hand side at level level_num
Definition: fasp.h:826

AMG_data::x
dvector x
pointer to the iterative solution at level level_num
Definition: fasp.h:829

AMG_data::w
dvector w
temporary work space
Definition: fasp.h:863

AMG_data::cfmark
ivector cfmark
pointer to the CF marker at level level_num
Definition: fasp.h:840

AMG_data::LU
ILU_data LU
ILU matrix for ILU smoother.
Definition: fasp.h:846

AMG_param
Parameters for AMG methods.
Definition: fasp.h:455

AMG_param::print_level
SHORT print_level
print level for AMG
Definition: fasp.h:461

AMG_param::polynomial_degree
SHORT polynomial_degree
degree of the polynomial smoother
Definition: fasp.h:497

AMG_param::nl_amli_krylov_type
SHORT nl_amli_krylov_type
type of Krylov method used by Nonlinear AMLI cycle
Definition: fasp.h:512

AMG_param::coarse_scaling
SHORT coarse_scaling
switch for scaling the coarse grid correction
Definition: fasp.h:503

AMG_param::amli_coef
REAL * amli_coef
coefficients of the polynomial used by AMLI cycle
Definition: fasp.h:509

AMG_param::AMG_type
SHORT AMG_type
type of AMG method
Definition: fasp.h:458

AMG_param::tol
REAL tol
stopping tolerance for AMG solver
Definition: fasp.h:467

AMG_param::coarse_solver
SHORT coarse_solver
coarse solver type
Definition: fasp.h:500

AMG_param::relaxation
REAL relaxation
relaxation parameter for Jacobi and SOR smoother
Definition: fasp.h:494

AMG_param::smoother
SHORT smoother
smoother type
Definition: fasp.h:482

AMG_param::amli_degree
SHORT amli_degree
degree of the polynomial used by AMLI cycle
Definition: fasp.h:506

AMG_param::SWZ_blksolver
INT SWZ_blksolver
type of Schwarz block solver
Definition: fasp.h:590

AMG_param::postsmooth_iter
SHORT postsmooth_iter
number of postsmoothers
Definition: fasp.h:491

AMG_param::SWZ_levels
INT SWZ_levels
number of levels that use the Schwarz smoother
Definition: fasp.h:578

AMG_param::presmooth_iter
SHORT presmooth_iter
number of presmoothers
Definition: fasp.h:488

AMG_param::smooth_order
SHORT smooth_order
smoother order
Definition: fasp.h:485

ILU_data
Data for ILU setup.
Definition: fasp.h:651

Mumps_data::job
INT job
work for MUMPS
Definition: fasp.h:615

SWZ_param
Parameters for Schwarz method.
Definition: fasp.h:430

SWZ_param::SWZ_blksolver
INT SWZ_blksolver
type of Schwarz block solver
Definition: fasp.h:445

dBSRmat
Block sparse row storage matrix of REAL type.
Definition: fasp_block.h:34

dBSRmat::NNZ
INT NNZ
number of nonzero sub-blocks in matrix A, NNZ
Definition: fasp_block.h:43

dBSRmat::val
REAL * val
Definition: fasp_block.h:57

dBSRmat::nb
INT nb
dimension of each sub-block
Definition: fasp_block.h:46

dBSRmat::ROW
INT ROW
number of rows of sub-blocks in matrix A, M
Definition: fasp_block.h:37

dCSRmat
Sparse matrix of REAL type in CSR format.
Definition: fasp.h:151

dCSRmat::val
REAL * val
nonzero entries of A
Definition: fasp.h:169

dCSRmat::row
INT row
number of rows of matrix A, m
Definition: fasp.h:154

dCSRmat::nnz
INT nnz
number of nonzero entries
Definition: fasp.h:160

dvector
Vector with n entries of REAL type.
Definition: fasp.h:354

dvector::val
REAL * val
actual vector entries
Definition: fasp.h:360

dvector::row
INT row
number of rows
Definition: fasp.h:357

ivector::val
INT * val
actual vector entries
Definition: fasp.h:374

precond_data_bsr
Data for preconditioners in dBSRmat format.
Definition: fasp_block.h:271

precond_data_bsr::mgl_data
AMG_data_bsr * mgl_data
AMG preconditioner data.
Definition: fasp_block.h:328

precond_data_bsr::max_levels
INT max_levels
max number of AMG levels
Definition: fasp_block.h:283

precond_data_bsr::maxit
INT maxit
max number of iterations of AMG preconditioner
Definition: fasp_block.h:280

precond_data
Data for preconditioners.
Definition: fasp.h:894

precond_data::mgl_data
AMG_data * mgl_data
AMG preconditioner data.
Definition: fasp.h:954

precond_data::max_levels
SHORT max_levels
max number of AMG levels
Definition: fasp.h:906

precond_data::maxit
INT maxit
max number of iterations of AMG preconditioner
Definition: fasp.h:903

precond
Preconditioner data and action.
Definition: fasp.h:1095

precond::data
void * data
data for preconditioner, void pointer
Definition: fasp.h:1098

precond::fct
void(* fct)(REAL *, REAL *, void *)
action for preconditioner, void function pointer
Definition: fasp.h:1101