1c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> 296c04dfeSSatish Balay 396c04dfeSSatish Balay #undef __FUNCT__ 496c04dfeSSatish Balay #define __FUNCT__ "MatGetMultiProcBlock_MPIAIJ" 53233f0ddSHong Zhang PetscErrorCode MatGetMultiProcBlock_MPIAIJ(Mat mat, MPI_Comm subComm, MatReuse scall,Mat *subMat) 696c04dfeSSatish Balay { 796c04dfeSSatish Balay PetscErrorCode ierr; 896c04dfeSSatish Balay Mat_MPIAIJ *aij = (Mat_MPIAIJ*)mat->data; 996c04dfeSSatish Balay Mat_SeqAIJ *aijB = (Mat_SeqAIJ*)aij->B->data; 1096c04dfeSSatish Balay PetscMPIInt commRank,subCommSize,subCommRank; 115d22bc9fSHong Zhang PetscMPIInt *commRankMap,subRank,rank,commsize; 1296c04dfeSSatish Balay PetscInt *garrayCMap,col,i,j,*nnz,newRow,newCol; 1396c04dfeSSatish Balay 1496c04dfeSSatish Balay PetscFunctionBegin; 15ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)mat),&commsize);CHKERRQ(ierr); 165d22bc9fSHong Zhang ierr = MPI_Comm_size(subComm,&subCommSize);CHKERRQ(ierr); 1796c04dfeSSatish Balay 1896c04dfeSSatish Balay /* create subMat object with the relavent layout */ 19ce1d8e51SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 2096c04dfeSSatish Balay ierr = MatCreate(subComm,subMat);CHKERRQ(ierr); 2196c04dfeSSatish Balay ierr = MatSetType(*subMat,MATMPIAIJ);CHKERRQ(ierr); 2296c04dfeSSatish Balay ierr = MatSetSizes(*subMat,mat->rmap->n,mat->cmap->n,PETSC_DECIDE,PETSC_DECIDE);CHKERRQ(ierr); 23*33d57670SJed Brown ierr = MatSetBlockSizesFromMats(*subMat,mat,mat);CHKERRQ(ierr); 24fc08c53fSHong Zhang 2596c04dfeSSatish Balay /* need to setup rmap and cmap before Preallocation */ 2696c04dfeSSatish Balay ierr = PetscLayoutSetUp((*subMat)->rmap);CHKERRQ(ierr); 2796c04dfeSSatish Balay ierr = PetscLayoutSetUp((*subMat)->cmap);CHKERRQ(ierr); 28ce1d8e51SHong Zhang } 2996c04dfeSSatish Balay 30ce1d8e51SHong Zhang /* create a map of comm_rank from subComm to comm - should commRankMap and garrayCMap be kept for reused? */ 31ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)mat),&commRank);CHKERRQ(ierr); 3296c04dfeSSatish Balay ierr = MPI_Comm_rank(subComm,&subCommRank);CHKERRQ(ierr); 33785e854fSJed Brown ierr = PetscMalloc1(subCommSize,&commRankMap);CHKERRQ(ierr); 3496c04dfeSSatish Balay ierr = MPI_Allgather(&commRank,1,MPI_INT,commRankMap,1,MPI_INT,subComm);CHKERRQ(ierr); 3596c04dfeSSatish Balay 3696c04dfeSSatish Balay /* Traverse garray and identify column indices [of offdiag mat] that 3796c04dfeSSatish Balay should be discarded. For the ones not discarded, store the newCol+1 3896c04dfeSSatish Balay value in garrayCMap */ 391795a4d1SJed Brown ierr = PetscCalloc1(aij->B->cmap->n,&garrayCMap);CHKERRQ(ierr); 4096c04dfeSSatish Balay for (i=0; i<aij->B->cmap->n; i++) { 4196c04dfeSSatish Balay col = aij->garray[i]; 4296c04dfeSSatish Balay for (subRank=0; subRank<subCommSize; subRank++) { 4396c04dfeSSatish Balay rank = commRankMap[subRank]; 4496c04dfeSSatish Balay if ((col >= mat->cmap->range[rank]) && (col < mat->cmap->range[rank+1])) { 4596c04dfeSSatish Balay garrayCMap[i] = (*subMat)->cmap->range[subRank] + col - mat->cmap->range[rank]+1; 4696c04dfeSSatish Balay break; 4796c04dfeSSatish Balay } 4896c04dfeSSatish Balay } 4996c04dfeSSatish Balay } 5096c04dfeSSatish Balay 51ce1d8e51SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 5296c04dfeSSatish Balay /* Now compute preallocation for the offdiag mat */ 531795a4d1SJed Brown ierr = PetscCalloc1(aij->B->rmap->n,&nnz);CHKERRQ(ierr); 5496c04dfeSSatish Balay for (i=0; i<aij->B->rmap->n; i++) { 5596c04dfeSSatish Balay for (j=aijB->i[i]; j<aijB->i[i+1]; j++) { 5696c04dfeSSatish Balay if (garrayCMap[aijB->j[j]]) nnz[i]++; 5796c04dfeSSatish Balay } 5896c04dfeSSatish Balay } 590298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(*(subMat),0,NULL,0,nnz);CHKERRQ(ierr); 6096c04dfeSSatish Balay 6196c04dfeSSatish Balay /* reuse diag block with the new submat */ 626bf464f9SBarry Smith ierr = MatDestroy(&((Mat_MPIAIJ*)((*subMat)->data))->A);CHKERRQ(ierr); 632205254eSKarl Rupp 6496c04dfeSSatish Balay ((Mat_MPIAIJ*)((*subMat)->data))->A = aij->A; 652205254eSKarl Rupp 6696c04dfeSSatish Balay ierr = PetscObjectReference((PetscObject)aij->A);CHKERRQ(ierr); 67ce1d8e51SHong Zhang } else if (((Mat_MPIAIJ*)(*subMat)->data)->A != aij->A) { 68ce1d8e51SHong Zhang PetscObject obj = (PetscObject)((Mat_MPIAIJ*)((*subMat)->data))->A; 692205254eSKarl Rupp 70ce1d8e51SHong Zhang ierr = PetscObjectReference((PetscObject)obj);CHKERRQ(ierr); 712205254eSKarl Rupp 72ce1d8e51SHong Zhang ((Mat_MPIAIJ*)((*subMat)->data))->A = aij->A; 732205254eSKarl Rupp 74ce1d8e51SHong Zhang ierr = PetscObjectReference((PetscObject)aij->A);CHKERRQ(ierr); 75ce1d8e51SHong Zhang } 7696c04dfeSSatish Balay 7796c04dfeSSatish Balay /* Now traverse aij->B and insert values into subMat */ 7896c04dfeSSatish Balay for (i=0; i<aij->B->rmap->n; i++) { 7996c04dfeSSatish Balay newRow = (*subMat)->rmap->range[subCommRank] + i; 8096c04dfeSSatish Balay for (j=aijB->i[i]; j<aijB->i[i+1]; j++) { 8196c04dfeSSatish Balay newCol = garrayCMap[aijB->j[j]]; 8296c04dfeSSatish Balay if (newCol) { 8396c04dfeSSatish Balay newCol--; /* remove the increment */ 8496c04dfeSSatish Balay ierr = MatSetValues(*subMat,1,&newRow,1,&newCol,(aijB->a+j),INSERT_VALUES);CHKERRQ(ierr); 8596c04dfeSSatish Balay } 8696c04dfeSSatish Balay } 8796c04dfeSSatish Balay } 8896c04dfeSSatish Balay 8996c04dfeSSatish Balay /* assemble the submat */ 9096c04dfeSSatish Balay ierr = MatAssemblyBegin(*subMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 9196c04dfeSSatish Balay ierr = MatAssemblyEnd(*subMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 9296c04dfeSSatish Balay 9396c04dfeSSatish Balay /* deallocate temporary data */ 9496c04dfeSSatish Balay ierr = PetscFree(commRankMap);CHKERRQ(ierr); 9596c04dfeSSatish Balay ierr = PetscFree(garrayCMap);CHKERRQ(ierr); 96ce1d8e51SHong Zhang if (scall == MAT_INITIAL_MATRIX) { 9796c04dfeSSatish Balay ierr = PetscFree(nnz);CHKERRQ(ierr); 98ce1d8e51SHong Zhang } 9996c04dfeSSatish Balay PetscFunctionReturn(0); 10096c04dfeSSatish Balay } 101