111320018SBarry Smith 2af0996ceSBarry Smith #include <petsc/private/snesimpl.h> /*I "petscsnes.h" I*/ 3b1f624c7SBarry Smith #include <petscdm.h> 411320018SBarry Smith 54b828684SBarry Smith /*@C 68d359177SBarry Smith SNESComputeJacobianDefault - Computes the Jacobian using finite differences. 711320018SBarry Smith 8c3339decSBarry Smith Collective 9fee21e36SBarry Smith 10c7afd0dbSLois Curfman McInnes Input Parameters: 11f6dfbefdSBarry Smith + snes - the `SNES` context 126b867d5aSJose E. Roman . x1 - compute Jacobian at this point 13f6dfbefdSBarry Smith - ctx - application's function context, as set with `SNESSetFunction()` 14c7afd0dbSLois Curfman McInnes 15c7afd0dbSLois Curfman McInnes Output Parameters: 16c7afd0dbSLois Curfman McInnes + J - Jacobian matrix (not altered in this routine) 17*dc4c0fb0SBarry Smith - B - newly computed Jacobian matrix to use with preconditioner (generally the same as `J`) 18c7afd0dbSLois Curfman McInnes 19f6dfbefdSBarry Smith Options Database Keys: 20f6dfbefdSBarry Smith + -snes_fd - Activates `SNESComputeJacobianDefault()` 21*dc4c0fb0SBarry Smith . -snes_fd_coloring - Activates a faster computation that uses a graph coloring of the matrix 2279f36460SBarry Smith . -snes_test_err - Square root of function error tolerance, default square root of machine 2377d8c4bbSBarry Smith epsilon (1.e-8 in double, 3.e-4 in single) 24f6dfbefdSBarry Smith - -mat_fd_type - Either wp or ds (see `MATMFFD_WP` or `MATMFFD_DS`) 25ad960d00SLois Curfman McInnes 26*dc4c0fb0SBarry Smith Level: intermediate 27*dc4c0fb0SBarry Smith 285f3c43d9SLois Curfman McInnes Notes: 295f3c43d9SLois Curfman McInnes This routine is slow and expensive, and is not currently optimized 305f3c43d9SLois Curfman McInnes to take advantage of sparsity in the problem. Although 31f6dfbefdSBarry Smith `SNESComputeJacobianDefault()` is not recommended for general use 325f3c43d9SLois Curfman McInnes in large-scale applications, It can be useful in checking the 335f3c43d9SLois Curfman McInnes correctness of a user-provided Jacobian. 3411320018SBarry Smith 3579f36460SBarry Smith An alternative routine that uses coloring to exploit matrix sparsity is 36f6dfbefdSBarry Smith `SNESComputeJacobianDefaultColor()`. 37b4fc646aSLois Curfman McInnes 38f6dfbefdSBarry Smith This routine ignores the maximum number of function evaluations set with `SNESSetTolerances()` and the function 39f6dfbefdSBarry Smith evaluations it performs are not counted in what is returned by of `SNESGetNumberFunctionEvals()`. 40f6dfbefdSBarry Smith 41f6dfbefdSBarry Smith This function can be provided to `SNESSetJacobian()` along with a dense matrix to hold the Jacobian 420df40c35SBarry Smith 43f6dfbefdSBarry Smith .seealso: `SNES`, `SNESSetJacobian()`, `SNESSetJacobian()`, `SNESComputeJacobianDefaultColor()`, `MatCreateSNESMF()` 4411320018SBarry Smith @*/ 45d71ae5a4SJacob Faibussowitsch PetscErrorCode SNESComputeJacobianDefault(SNES snes, Vec x1, Mat J, Mat B, void *ctx) 46d71ae5a4SJacob Faibussowitsch { 4788c956adSLois Curfman McInnes Vec j1a, j2a, x2; 480df40c35SBarry Smith PetscInt i, N, start, end, j, value, root, max_funcs = snes->max_funcs; 495edff71fSBarry Smith PetscScalar dx, *y, wscale; 505edff71fSBarry Smith const PetscScalar *xx; 5177d8c4bbSBarry Smith PetscReal amax, epsilon = PETSC_SQRT_MACHINE_EPSILON; 5279f36460SBarry Smith PetscReal dx_min = 1.e-16, dx_par = 1.e-1, unorm; 53bbb6d6a8SBarry Smith MPI_Comm comm; 54ace3abfcSBarry Smith PetscBool assembled, use_wp = PETSC_TRUE, flg; 5579f36460SBarry Smith const char *list[2] = {"ds", "wp"}; 5686c88abdSHong Zhang PetscMPIInt size; 5786c88abdSHong Zhang const PetscInt *ranges; 580df40c35SBarry Smith DM dm; 590df40c35SBarry Smith DMSNES dms; 600521c3abSLois Curfman McInnes 613a40ed3dSBarry Smith PetscFunctionBegin; 620df40c35SBarry Smith snes->max_funcs = PETSC_MAX_INT; 635d5a84c9SBarry Smith /* Since this Jacobian will possibly have "extra" nonzero locations just turn off errors for these locations */ 649566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE)); 659566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetReal(((PetscObject)snes)->options, ((PetscObject)snes)->prefix, "-snes_test_err", &epsilon, NULL)); 6623242f5aSBarry Smith 679566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)x1, &comm)); 689566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm, &size)); 699566063dSJacob Faibussowitsch PetscCall(MatAssembled(B, &assembled)); 701baa6e33SBarry Smith if (assembled) PetscCall(MatZeroEntries(B)); 71aa79bc6dSLois Curfman McInnes if (!snes->nvwork) { 72b1f624c7SBarry Smith if (snes->dm) { 739566063dSJacob Faibussowitsch PetscCall(DMGetGlobalVector(snes->dm, &j1a)); 749566063dSJacob Faibussowitsch PetscCall(DMGetGlobalVector(snes->dm, &j2a)); 759566063dSJacob Faibussowitsch PetscCall(DMGetGlobalVector(snes->dm, &x2)); 76b1f624c7SBarry Smith } else { 77aa79bc6dSLois Curfman McInnes snes->nvwork = 3; 789566063dSJacob Faibussowitsch PetscCall(VecDuplicateVecs(x1, snes->nvwork, &snes->vwork)); 799371c9d4SSatish Balay j1a = snes->vwork[0]; 809371c9d4SSatish Balay j2a = snes->vwork[1]; 819371c9d4SSatish Balay x2 = snes->vwork[2]; 82b1f624c7SBarry Smith } 83b1f624c7SBarry Smith } 8423242f5aSBarry Smith 859566063dSJacob Faibussowitsch PetscCall(VecGetSize(x1, &N)); 869566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRange(x1, &start, &end)); 879566063dSJacob Faibussowitsch PetscCall(SNESGetDM(snes, &dm)); 889566063dSJacob Faibussowitsch PetscCall(DMGetDMSNES(dm, &dms)); 890df40c35SBarry Smith if (dms->ops->computemffunction) { 909566063dSJacob Faibussowitsch PetscCall(SNESComputeMFFunction(snes, x1, j1a)); 910df40c35SBarry Smith } else { 929566063dSJacob Faibussowitsch PetscCall(SNESComputeFunction(snes, x1, j1a)); 930df40c35SBarry Smith } 94c005e166SLois Curfman McInnes 95d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)snes), ((PetscObject)snes)->prefix, "Differencing options", "SNES"); 969566063dSJacob Faibussowitsch PetscCall(PetscOptionsEList("-mat_fd_type", "Algorithm to compute difference parameter", "SNESComputeJacobianDefault", list, 2, "wp", &value, &flg)); 97d0609cedSBarry Smith PetscOptionsEnd(); 98f5af7f23SKarl Rupp if (flg && !value) use_wp = PETSC_FALSE; 99f5af7f23SKarl Rupp 10048a46eb9SPierre Jolivet if (use_wp) PetscCall(VecNorm(x1, NORM_2, &unorm)); 101c005e166SLois Curfman McInnes /* Compute Jacobian approximation, 1 column at a time. 10288c956adSLois Curfman McInnes x1 = current iterate, j1a = F(x1) 10388c956adSLois Curfman McInnes x2 = perturbed iterate, j2a = F(x2) 104c005e166SLois Curfman McInnes */ 10539e2f89bSBarry Smith for (i = 0; i < N; i++) { 1069566063dSJacob Faibussowitsch PetscCall(VecCopy(x1, x2)); 10723242f5aSBarry Smith if (i >= start && i < end) { 1089566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x1, &xx)); 1095620d6dcSBarry Smith if (use_wp) dx = PetscSqrtReal(1.0 + unorm); 110f5af7f23SKarl Rupp else dx = xx[i - start]; 1119566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x1, &xx)); 1126bd79f97SJed Brown if (PetscAbsScalar(dx) < dx_min) dx = (PetscRealPart(dx) < 0. ? -1. : 1.) * dx_par; 11339e2f89bSBarry Smith dx *= epsilon; 11474f6f00dSLois Curfman McInnes wscale = 1.0 / dx; 1159566063dSJacob Faibussowitsch PetscCall(VecSetValues(x2, 1, &i, &dx, ADD_VALUES)); 1166c783aadSBarry Smith } else { 117bbb6d6a8SBarry Smith wscale = 0.0; 118bbb6d6a8SBarry Smith } 1199566063dSJacob Faibussowitsch PetscCall(VecAssemblyBegin(x2)); 1209566063dSJacob Faibussowitsch PetscCall(VecAssemblyEnd(x2)); 1210df40c35SBarry Smith if (dms->ops->computemffunction) { 1229566063dSJacob Faibussowitsch PetscCall(SNESComputeMFFunction(snes, x2, j2a)); 1230df40c35SBarry Smith } else { 1249566063dSJacob Faibussowitsch PetscCall(SNESComputeFunction(snes, x2, j2a)); 1250df40c35SBarry Smith } 1269566063dSJacob Faibussowitsch PetscCall(VecAXPY(j2a, -1.0, j1a)); 12786c88abdSHong Zhang /* Communicate scale=1/dx_i to all processors */ 1289566063dSJacob Faibussowitsch PetscCall(VecGetOwnershipRanges(x1, &ranges)); 12986c88abdSHong Zhang root = size; 13086c88abdSHong Zhang for (j = size - 1; j > -1; j--) { 13186c88abdSHong Zhang root--; 13286c88abdSHong Zhang if (i >= ranges[j]) break; 13386c88abdSHong Zhang } 1349566063dSJacob Faibussowitsch PetscCallMPI(MPI_Bcast(&wscale, 1, MPIU_SCALAR, root, comm)); 1359566063dSJacob Faibussowitsch PetscCall(VecScale(j2a, wscale)); 1369371c9d4SSatish Balay PetscCall(VecNorm(j2a, NORM_INFINITY, &amax)); 1379371c9d4SSatish Balay amax *= 1.e-14; 1389566063dSJacob Faibussowitsch PetscCall(VecGetArray(j2a, &y)); 13923242f5aSBarry Smith for (j = start; j < end; j++) { 14048a46eb9SPierre Jolivet if (PetscAbsScalar(y[j - start]) > amax || j == i) PetscCall(MatSetValues(B, 1, &j, 1, &i, y + j - start, INSERT_VALUES)); 14123242f5aSBarry Smith } 1429566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(j2a, &y)); 14323242f5aSBarry Smith } 144b1f624c7SBarry Smith if (snes->dm) { 1459566063dSJacob Faibussowitsch PetscCall(DMRestoreGlobalVector(snes->dm, &j1a)); 1469566063dSJacob Faibussowitsch PetscCall(DMRestoreGlobalVector(snes->dm, &j2a)); 1479566063dSJacob Faibussowitsch PetscCall(DMRestoreGlobalVector(snes->dm, &x2)); 148b1f624c7SBarry Smith } 1499566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 1509566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 15194ab13aaSBarry Smith if (B != J) { 1529566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(J, MAT_FINAL_ASSEMBLY)); 1539566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(J, MAT_FINAL_ASSEMBLY)); 154f588057bSBarry Smith } 1550df40c35SBarry Smith snes->max_funcs = max_funcs; 1560df40c35SBarry Smith snes->nfuncs -= N; 1573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 15811320018SBarry Smith } 159