1c4762a1bSJed Brown static char help[] = "Test LAPACK routine DSTEBZ() and DTEIN(). \n\n"; 2c4762a1bSJed Brown 3c4762a1bSJed Brown #include <petscmat.h> 4c4762a1bSJed Brown #include <petscblaslapack.h> 5c4762a1bSJed Brown 6c4762a1bSJed Brown extern PetscErrorCode CkEigenSolutions(PetscInt,Mat,PetscInt,PetscInt,PetscScalar*,Vec*,PetscReal*); 7c4762a1bSJed Brown 8c4762a1bSJed Brown int main(int argc,char **args) 9c4762a1bSJed Brown { 10c4762a1bSJed Brown PetscErrorCode ierr; 11c4762a1bSJed Brown #if defined(PETSC_USE_COMPLEX) || defined(PETSC_MISSING_LAPACK_STEBZ) || defined(PETSC_MISSING_LAPACK_STEIN) 12c4762a1bSJed Brown ierr = PetscInitialize(&argc,&args,(char*)0,help);if (ierr) return ierr; 13c4762a1bSJed Brown SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_SUP_SYS,"This example requires LAPACK routines dstebz and stien and real numbers"); 14c4762a1bSJed Brown #else 15c4762a1bSJed Brown PetscReal *work,tols[2]; 16c4762a1bSJed Brown PetscInt i,j; 17c4762a1bSJed Brown PetscBLASInt n,il=1,iu=5,*iblock,*isplit,*iwork,nevs,*ifail,cklvl=2; 18c4762a1bSJed Brown PetscMPIInt size; 19c4762a1bSJed Brown PetscBool flg; 20c4762a1bSJed Brown Vec *evecs; 21c4762a1bSJed Brown PetscScalar *evecs_array,*D,*E,*evals; 22c4762a1bSJed Brown Mat T; 23c4762a1bSJed Brown PetscReal vl=0.0,vu=4.0,tol= 1000*PETSC_MACHINE_EPSILON; 24c4762a1bSJed Brown PetscBLASInt nsplit,info; 25c4762a1bSJed Brown 26c4762a1bSJed Brown ierr = PetscInitialize(&argc,&args,(char*)0,help);if (ierr) return ierr; 275f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size)); 282c71b3e2SJacob Faibussowitsch PetscCheckFalse(size != 1,PETSC_COMM_WORLD, PETSC_ERR_WRONG_MPI_SIZE,"This is a uniprocessor example only!"); 29c4762a1bSJed Brown 30c4762a1bSJed Brown n = 100; 31c4762a1bSJed Brown nevs = iu - il; 325f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(3*n+1,&D)); 33c4762a1bSJed Brown E = D + n; 34c4762a1bSJed Brown evals = E + n; 355f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(5*n+1,&work)); 365f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(3*n+1,&iwork)); 375f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(3*n+1,&iblock)); 38c4762a1bSJed Brown isplit = iblock + n; 39c4762a1bSJed Brown 40c4762a1bSJed Brown /* Set symmetric tridiagonal matrix */ 41c4762a1bSJed Brown for (i=0; i<n; i++) { 42c4762a1bSJed Brown D[i] = 2.0; 43c4762a1bSJed Brown E[i] = 1.0; 44c4762a1bSJed Brown } 45c4762a1bSJed Brown 46c4762a1bSJed Brown /* Solve eigenvalue problem: A*evec = eval*evec */ 475f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF," LAPACKstebz_: compute %d eigenvalues...\n",nevs)); 48c4762a1bSJed Brown LAPACKstebz_("I","E",&n,&vl,&vu,&il,&iu,&tol,(PetscReal*)D,(PetscReal*)E,&nevs,&nsplit,(PetscReal*)evals,iblock,isplit,work,iwork,&info); 49*28b400f6SJacob Faibussowitsch PetscCheck(!info,PETSC_COMM_SELF,PETSC_ERR_USER,"LAPACKstebz_ fails. info %d",info); 50c4762a1bSJed Brown 515f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF," LAPACKstein_: compute %d found eigenvectors...\n",nevs)); 525f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(n*nevs,&evecs_array)); 535f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nevs,&ifail)); 54c4762a1bSJed Brown LAPACKstein_(&n,(PetscReal*)D,(PetscReal*)E,&nevs,(PetscReal*)evals,iblock,isplit,evecs_array,&n,work,iwork,ifail,&info); 55*28b400f6SJacob Faibussowitsch PetscCheck(!info,PETSC_COMM_SELF,PETSC_ERR_USER,"LAPACKstein_ fails. info %d",info); 56c4762a1bSJed Brown /* View evals */ 575f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsHasName(NULL,NULL, "-eig_view", &flg)); 58c4762a1bSJed Brown if (flg) { 595f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF," %d evals: \n",nevs)); 605f80ce2aSJacob Faibussowitsch for (i=0; i<nevs; i++) CHKERRQ(PetscPrintf(PETSC_COMM_SELF,"%" PetscInt_FMT " %g\n",i,(double)evals[i])); 61c4762a1bSJed Brown } 62c4762a1bSJed Brown 63c4762a1bSJed Brown /* Check residuals and orthogonality */ 645f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreate(PETSC_COMM_SELF,&T)); 655f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetSizes(T,PETSC_DECIDE,PETSC_DECIDE,n,n)); 665f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(T,MATSBAIJ)); 675f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetFromOptions(T)); 685f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetUp(T)); 69c4762a1bSJed Brown for (i=0; i<n; i++) { 705f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetValues(T,1,&i,1,&i,&D[i],INSERT_VALUES)); 71c4762a1bSJed Brown if (i != n-1) { 72c4762a1bSJed Brown j = i+1; 735f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetValues(T,1,&i,1,&j,&E[i],INSERT_VALUES)); 74c4762a1bSJed Brown } 75c4762a1bSJed Brown } 765f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyBegin(T,MAT_FINAL_ASSEMBLY)); 775f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyEnd(T,MAT_FINAL_ASSEMBLY)); 78c4762a1bSJed Brown 795f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nevs+1,&evecs)); 80c4762a1bSJed Brown for (i=0; i<nevs; i++) { 815f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreate(PETSC_COMM_SELF,&evecs[i])); 825f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetSizes(evecs[i],PETSC_DECIDE,n)); 835f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetFromOptions(evecs[i])); 845f80ce2aSJacob Faibussowitsch CHKERRQ(VecPlaceArray(evecs[i],evecs_array+i*n)); 85c4762a1bSJed Brown } 86c4762a1bSJed Brown 87c4762a1bSJed Brown tols[0] = 1.e-8; tols[1] = 1.e-8; 885f80ce2aSJacob Faibussowitsch CHKERRQ(CkEigenSolutions(cklvl,T,il-1,iu-1,evals,evecs,tols)); 89c4762a1bSJed Brown 90c4762a1bSJed Brown for (i=0; i<nevs; i++) { 915f80ce2aSJacob Faibussowitsch CHKERRQ(VecResetArray(evecs[i])); 92c4762a1bSJed Brown } 93c4762a1bSJed Brown 94c4762a1bSJed Brown /* free space */ 95c4762a1bSJed Brown 965f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&T)); 97c4762a1bSJed Brown 985f80ce2aSJacob Faibussowitsch for (i=0; i<nevs; i++) CHKERRQ(VecDestroy(&evecs[i])); 995f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(evecs)); 1005f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(D)); 1015f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(work)); 1025f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(iwork)); 1035f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(iblock)); 1045f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(evecs_array)); 1055f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(ifail)); 106c4762a1bSJed Brown ierr = PetscFinalize(); 107c4762a1bSJed Brown return ierr; 108c4762a1bSJed Brown #endif 109c4762a1bSJed Brown } 110c4762a1bSJed Brown /*------------------------------------------------ 111c4762a1bSJed Brown Check the accuracy of the eigen solution 112c4762a1bSJed Brown ----------------------------------------------- */ 113c4762a1bSJed Brown /* 114c4762a1bSJed Brown input: 115c4762a1bSJed Brown cklvl - check level: 116c4762a1bSJed Brown 1: check residual 117c4762a1bSJed Brown 2: 1 and check B-orthogonality locally 118c4762a1bSJed Brown A - matrix 119c4762a1bSJed Brown il,iu - lower and upper index bound of eigenvalues 120c4762a1bSJed Brown eval, evec - eigenvalues and eigenvectors stored in this process 121c4762a1bSJed Brown tols[0] - reporting tol_res: || A * evec[i] - eval[i]*evec[i] || 122c4762a1bSJed Brown tols[1] - reporting tol_orth: evec[i]^T*evec[j] - delta_ij 123c4762a1bSJed Brown */ 124c4762a1bSJed Brown #undef DEBUG_CkEigenSolutions 125c4762a1bSJed Brown PetscErrorCode CkEigenSolutions(PetscInt cklvl,Mat A,PetscInt il,PetscInt iu,PetscScalar *eval,Vec *evec,PetscReal *tols) 126c4762a1bSJed Brown { 127c4762a1bSJed Brown PetscInt ierr,i,j,nev; 128c4762a1bSJed Brown Vec vt1,vt2; /* tmp vectors */ 129c4762a1bSJed Brown PetscReal norm,norm_max; 130c4762a1bSJed Brown PetscScalar dot,tmp; 131c4762a1bSJed Brown PetscReal dot_max; 132c4762a1bSJed Brown 133c4762a1bSJed Brown PetscFunctionBegin; 134c4762a1bSJed Brown nev = iu - il; 135c4762a1bSJed Brown if (nev <= 0) PetscFunctionReturn(0); 136c4762a1bSJed Brown 1375f80ce2aSJacob Faibussowitsch CHKERRQ(VecDuplicate(evec[0],&vt1)); 1385f80ce2aSJacob Faibussowitsch CHKERRQ(VecDuplicate(evec[0],&vt2)); 139c4762a1bSJed Brown 140c4762a1bSJed Brown switch (cklvl) { 141c4762a1bSJed Brown case 2: 142c4762a1bSJed Brown dot_max = 0.0; 143c4762a1bSJed Brown for (i = il; i<iu; i++) { 1445f80ce2aSJacob Faibussowitsch CHKERRQ(VecCopy(evec[i], vt1)); 145c4762a1bSJed Brown for (j=il; j<iu; j++) { 1465f80ce2aSJacob Faibussowitsch CHKERRQ(VecDot(evec[j],vt1,&dot)); 147c4762a1bSJed Brown if (j == i) { 148c4762a1bSJed Brown dot = PetscAbsScalar(dot - (PetscScalar)1.0); 149c4762a1bSJed Brown } else { 150c4762a1bSJed Brown dot = PetscAbsScalar(dot); 151c4762a1bSJed Brown } 152c4762a1bSJed Brown if (PetscAbsScalar(dot) > dot_max) dot_max = PetscAbsScalar(dot); 153c4762a1bSJed Brown #if defined(DEBUG_CkEigenSolutions) 154c4762a1bSJed Brown if (dot > tols[1]) { 1555f80ce2aSJacob Faibussowitsch CHKERRQ(VecNorm(evec[i],NORM_INFINITY,&norm)); 1565f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF,"|delta(%d,%d)|: %g, norm: %d\n",i,j,(double)dot,(double)norm)); 157c4762a1bSJed Brown } 158c4762a1bSJed Brown #endif 159c4762a1bSJed Brown } 160c4762a1bSJed Brown } 1615f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF," max|(x_j^T*x_i) - delta_ji|: %g\n",(double)dot_max)); 162c4762a1bSJed Brown 163c4762a1bSJed Brown case 1: 164c4762a1bSJed Brown norm_max = 0.0; 165c4762a1bSJed Brown for (i = il; i< iu; i++) { 1665f80ce2aSJacob Faibussowitsch CHKERRQ(MatMult(A, evec[i], vt1)); 1675f80ce2aSJacob Faibussowitsch CHKERRQ(VecCopy(evec[i], vt2)); 168c4762a1bSJed Brown tmp = -eval[i]; 1695f80ce2aSJacob Faibussowitsch CHKERRQ(VecAXPY(vt1,tmp,vt2)); 1705f80ce2aSJacob Faibussowitsch CHKERRQ(VecNorm(vt1, NORM_INFINITY, &norm)); 171c4762a1bSJed Brown norm = PetscAbsReal(norm); 172c4762a1bSJed Brown if (norm > norm_max) norm_max = norm; 173c4762a1bSJed Brown #if defined(DEBUG_CkEigenSolutions) 174c4762a1bSJed Brown if (norm > tols[0]) { 1755f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF," residual violation: %d, resi: %g\n",i, norm)); 176c4762a1bSJed Brown } 177c4762a1bSJed Brown #endif 178c4762a1bSJed Brown } 1795f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF," max_resi: %g\n", (double)norm_max)); 180c4762a1bSJed Brown break; 181c4762a1bSJed Brown default: 1825f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF,"Error: cklvl=%d is not supported \n",cklvl)); 183c4762a1bSJed Brown } 184c4762a1bSJed Brown 1855f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&vt2)); 1865f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&vt1)); 187c4762a1bSJed Brown PetscFunctionReturn(0); 188c4762a1bSJed Brown } 189