Lines Matching full:auto
204 const auto mcu = MatCUPMCast(m); in SetPreallocation_()
205 const auto nrows = m->rmap->n; in SetPreallocation_()
206 const auto ncols = m->cmap->n; in SetPreallocation_()
207 auto &lda = MatIMPLCast(m)->lda; in SetPreallocation_()
236 const auto nrows = m->rmap->n; in HostToDevice_()
237 const auto ncols = m->cmap->n; in HostToDevice_()
238 …const auto copy = m->offloadmask == PETSC_OFFLOAD_CPU || m->offloadmask == PETSC_OFFLOAD_UNALLOCA… in HostToDevice_()
245 const auto mcu = MatCUPMCast(m); in HostToDevice_()
253 const auto mimpl = MatIMPLCast(m); in HostToDevice_()
254 const auto lda = mimpl->lda; in HostToDevice_()
255 const auto src = mimpl->v; in HostToDevice_()
256 const auto dest = mcu->d_v; in HostToDevice_()
274 const auto nrows = m->rmap->n; in DeviceToHost_()
275 const auto ncols = m->cmap->n; in DeviceToHost_()
276 const auto copy = m->offloadmask == PETSC_OFFLOAD_GPU; in DeviceToHost_()
282 const auto mimpl = MatIMPLCast(m); in DeviceToHost_()
290 const auto lda = mimpl->lda; in DeviceToHost_()
291 const auto dest = mimpl->v; in DeviceToHost_()
292 const auto src = MatCUPMCast(m)->d_v; in DeviceToHost_()
350 const auto mcu = MatCUPMCast(A); in FactorPrepare()
375 const auto m = static_cast<cupmBlasInt_t>(A->rmap->n); in Factor()
376 const auto n = static_cast<cupmBlasInt_t>(A->cmap->n); in Factor()
386 const auto mcu = MatCUPMCast(A); in Factor()
387 const auto da = DeviceArrayReadWrite(dctx, A); in Factor()
388 const auto lda = static_cast<cupmBlasInt_t>(MatIMPLCast(A)->lda); in Factor()
415 const auto mcu = MatCUPMCast(A); in Solve()
416 const auto fact_info = mcu->d_fact_info; in Solve()
417 const auto fact_ipiv = mcu->d_fact_ipiv; in Solve()
425 constexpr auto op = transpose ? CUPMSOLVER_OP_T : CUPMSOLVER_OP_N; in Solve()
426 const auto da = DeviceArrayRead(dctx, A); in Solve()
427 const auto lda = static_cast<cupmBlasInt_t>(MatIMPLCast(A)->lda); in Solve()
460 const auto n = static_cast<cupmBlasInt_t>(A->rmap->n); in Factor()
471 const auto mcu = MatCUPMCast(A); in Factor()
472 const auto da = DeviceArrayReadWrite(dctx, A); in Factor()
473 const auto lda = static_cast<cupmBlasInt_t>(MatIMPLCast(A)->lda); in Factor()
515 const auto mcu = MatCUPMCast(A); in Solve()
516 const auto fact_info = mcu->d_fact_info; in Solve()
525 const auto da = DeviceArrayRead(dctx, A); in Solve()
526 const auto lda = static_cast<cupmBlasInt_t>(MatIMPLCast(A)->lda); in Solve()
559 const auto m = static_cast<cupmBlasInt_t>(A->rmap->n); in Factor()
560 const auto n = static_cast<cupmBlasInt_t>(A->cmap->n); in Factor()
561 const auto min = std::min(m, n); in Factor()
562 const auto mimpl = MatIMPLCast(A); in Factor()
573 const auto mcu = MatCUPMCast(A); in Factor()
574 const auto da = DeviceArrayReadWrite(dctx, A); in Factor()
575 const auto lda = static_cast<cupmBlasInt_t>(mimpl->lda); in Factor()
602 const auto mimpl = MatIMPLCast(A); in Solve()
603 const auto rank = static_cast<cupmBlasInt_t>(mimpl->rank); in Solve()
604 const auto mcu = MatCUPMCast(A); in Solve()
605 const auto fact_info = mcu->d_fact_info; in Solve()
606 const auto fact_tau = mcu->d_fact_tau; in Solve()
607 const auto fact_work = mcu->d_fact_work; in Solve()
608 const auto fact_lwork = mcu->d_fact_lwork; in Solve()
617 const auto da = DeviceArrayRead(dctx, A); in Solve()
618 const auto one = cupmScalarCast(1.0); in Solve()
619 const auto lda = static_cast<cupmBlasInt_t>(mimpl->lda); in Solve()
626 constexpr auto op = PetscDefined(USE_COMPLEX) ? CUPMSOLVER_OP_C : CUPMSOLVER_OP_T; in Solve()
644 const auto pobj_A = PetscObjectCast(A); in MatSolve_Factored_Dispatch_()
645 const auto m = static_cast<cupmBlasInt_t>(A->rmap->n); in MatSolve_Factored_Dispatch_()
646 const auto k = static_cast<cupmBlasInt_t>(A->cmap->n); in MatSolve_Factored_Dispatch_()
647 auto &workvec = MatCUPMCast(A)->workvec; in MatSolve_Factored_Dispatch_()
664 const auto xisdevice = xiscupm && PetscOffloadDevice(x->offloadmask); in MatSolve_Factored_Dispatch_()
665 const auto copy_mode = xisdevice ? cupmMemcpyDeviceToDevice : cupmMemcpyHostToDevice; in MatSolve_Factored_Dispatch_()
695 const auto copy_mode = yiscupm ? cupmMemcpyDeviceToDevice : cupmMemcpyDeviceToHost; in MatSolve_Factored_Dispatch_()
721 const auto m = static_cast<cupmBlasInt_t>(A->rmap->n); in MatMatSolve_Factored_Dispatch_()
722 const auto k = static_cast<cupmBlasInt_t>(A->cmap->n); in MatMatSolve_Factored_Dispatch_()
752 const auto bisdevice = biscupm && PetscOffloadDevice(B->offloadmask); in MatMatSolve_Factored_Dispatch_()
753 const auto copy_mode = bisdevice ? cupmMemcpyDeviceToDevice : cupmMemcpyHostToDevice; in MatMatSolve_Factored_Dispatch_()
785 const auto copy_mode = xiscupm ? cupmMemcpyDeviceToDevice : cupmMemcpyDeviceToHost; in MatMatSolve_Factored_Dispatch_()
807 const auto m = static_cast<cupmBlasInt_t>(A->rmap->n); in MatMultAddColumnRange_Dispatch_()
808 const auto n = static_cast<cupmBlasInt_t>(c_end - c_start); in MatMultAddColumnRange_Dispatch_()
809 const auto lda = static_cast<cupmBlasInt_t>(MatIMPLCast(A)->lda); in MatMultAddColumnRange_Dispatch_()
854 constexpr auto op = transpose ? (hermitian ? CUPMBLAS_OP_C : CUPMBLAS_OP_T) : CUPMBLAS_OP_N; in MatMultAddColumnRange_Dispatch_()
855 const auto one = cupmScalarCast(1.0); in MatMultAddColumnRange_Dispatch_()
856 const auto zero = cupmScalarCast(0.0); in MatMultAddColumnRange_Dispatch_()
857 const auto da = DeviceArrayRead(dctx, A); in MatMultAddColumnRange_Dispatch_()
858 const auto dxx = VecSeq_CUPM::DeviceArrayRead(dctx, x); in MatMultAddColumnRange_Dispatch_()
859 const auto dzz = VecSeq_CUPM::DeviceArrayReadWrite(dctx, z); in MatMultAddColumnRange_Dispatch_()
906 const auto B = *newmat; in Convert_Dispatch_()
907 const auto pobj = PetscObjectCast(B); in Convert_Dispatch_()
1030 if (const auto mcu = MatCUPMCast(A)) { in Reset()
1051 const auto mimpl = MatIMPLCast(A); in BindToCPU()
1052 const auto pobj = PetscObjectCast(A); in BindToCPU()
1068 if (auto &cvec = mimpl->cvec) { in BindToCPU()
1072 if (auto &cmat = mimpl->cmat) { in BindToCPU()
1134 if (const auto cmat = mimpl->cmat) PetscCall(MatBindToCPU(cmat, to_host)); in BindToCPU()
1160 constexpr auto hostmem = PetscMemTypeHost(mtype); in GetArray()
1161 constexpr auto read_access = PetscMemoryAccessRead(access); in GetArray()
1232 const auto mimpl = MatIMPLCast(A); in PlaceArray()
1233 const auto mcu = MatCUPMCast(A); in PlaceArray()
1253 const auto mimpl = MatIMPLCast(A); in ReplaceArray()
1254 const auto mcu = MatCUPMCast(A); in ReplaceArray()
1274 const auto mimpl = MatIMPLCast(A); in ResetArray()
1275 const auto mcu = MatCUPMCast(A); in ResetArray()
1319 const auto one = cupmScalarCast(1.0); in MatMatMult_Numeric_Dispatch()
1320 const auto zero = cupmScalarCast(0.0); in MatMatMult_Numeric_Dispatch()
1321 const auto da = DeviceArrayRead(dctx, A); in MatMatMult_Numeric_Dispatch()
1322 const auto db = DeviceArrayRead(dctx, B); in MatMatMult_Numeric_Dispatch()
1323 const auto dc = DeviceArrayWrite(dctx, C); in MatMatMult_Numeric_Dispatch()
1342 const auto m = A->rmap->n; in Copy()
1343 const auto n = A->cmap->n; in Copy()
1355 const auto va = DeviceArrayRead(dctx, A); in Copy()
1356 const auto vb = DeviceArrayWrite(dctx, B); in Copy()
1359 const auto lda_a = MatIMPLCast(A)->lda; in Copy()
1360 const auto lda_b = MatIMPLCast(B)->lda; in Copy()
1387 const auto va = DeviceArrayWrite(dctx, m); in ZeroEntries()
1388 const auto lda = MatIMPLCast(m)->lda; in ZeroEntries()
1389 const auto ma = m->rmap->n; in ZeroEntries()
1390 const auto na = m->cmap->n; in ZeroEntries()
1443 const auto nrows = rend - rstart; in make_submat_iterator()
1444 const auto ncols = cend - cstart; in make_submat_iterator()
1445 const auto dptr = thrust::device_pointer_cast(ptr); in make_submat_iterator()
1461 const auto m = A->rmap->n; in Conjugate()
1462 const auto n = A->cmap->n; in Conjugate()
1463 const auto N = m * n; in Conjugate()
1472 const auto da = DeviceArrayReadWrite(dctx, A); in Conjugate()
1473 const auto lda = MatIMPLCast(A)->lda; in Conjugate()
1480 const auto sub_mat = detail::make_submat_iterator(0, m, 0, n, lda, da.data()); in Conjugate()
1493 const auto aptr = thrust::device_pointer_cast(da.data()); in Conjugate()
1513 const auto m = A->rmap->n; in Scale()
1514 const auto n = A->cmap->n; in Scale()
1515 const auto N = m * n; in Scale()
1522 const auto da = DeviceArrayReadWrite(dctx, A); in Scale()
1523 const auto lda = MatIMPLCast(A)->lda; in Scale()
1531 const auto sub_mat = detail::make_submat_iterator(0, m, 0, n, lda, da.data()); in Scale()
1542 const auto cu_alpha = cupmScalarCast(alpha); in Scale()
1558 const auto m_x = X->rmap->n, m_y = Y->rmap->n; in AXPY()
1559 const auto n_x = X->cmap->n, n_y = Y->cmap->n; in AXPY()
1560 const auto N = m_x * n_x; in AXPY()
1568 const auto dx = DeviceArrayRead(dctx, X); in AXPY()
1569 const auto dy = DeviceArrayReadWrite(dctx, Y); in AXPY()
1570 const auto lda_x = MatIMPLCast(X)->lda; in AXPY()
1571 const auto lda_y = MatIMPLCast(Y)->lda; in AXPY()
1579 const auto sub_mat_y = detail::make_submat_iterator(0, m_y, 0, n_y, lda_y, dy.data()); in AXPY()
1580 const auto sub_mat_x = detail::make_submat_iterator(0, m_x, 0, n_x, lda_x, dx.data()); in AXPY()
1591 const auto cu_alpha = cupmScalarCast(alpha); in AXPY()
1607 …const auto hopt = (opt == MAT_COPY_VALUES && A->offloadmask != PETSC_OFFLOAD_CPU) ? MAT_DO… in Duplicate()
1632 const auto m = A->rmap->n; in SetRandom()
1633 const auto n = A->cmap->n; in SetRandom()
1638 const auto a = DeviceArrayWrite(dctx, A); in SetRandom()
1662 const auto offloadmask = A->offloadmask; in GetColumnVector()
1663 const auto n = A->rmap->n; in GetColumnVector()
1664 …const auto col_offset = [&](const PetscScalar *ptr) { return ptr + col * MatIMPLCast(A)->… in GetColumnVector()
1673 const auto x = VecSeq_CUPM::DeviceArrayWrite(dctx, v); in GetColumnVector()
1701 const auto mimpl = MatIMPLCast(A); in GetColumnVec()
1722 const auto mimpl = MatIMPLCast(A); in RestoreColumnVec()
1723 const auto cvec = mimpl->cvec; in RestoreColumnVec()
1761 const auto pobj = PetscObjectCast(fact); in GetFactor()
1783 const auto mimpl = MatIMPLCast(A); in InvertFactors()
1784 const auto mcu = MatCUPMCast(A); in InvertFactors()
1785 const auto n = static_cast<cupmBlasInt_t>(A->cmap->n); in InvertFactors()
1802 const auto da = DeviceArrayReadWrite(dctx, A); in InvertFactors()
1803 const auto lda = static_cast<cupmBlasInt_t>(mimpl->lda); in InvertFactors()
1835 const auto mimpl = MatIMPLCast(A); in GetSubMatrix()
1836 …const auto array_offset = [&](PetscScalar *ptr) { return ptr + rbegin + static_cast<std::s… in GetSubMatrix()
1837 const auto n = rend - rbegin; in GetSubMatrix()
1838 const auto m = cend - cbegin; in GetSubMatrix()
1839 auto &cmat = mimpl->cmat; in GetSubMatrix()
1852 const auto device_array = array_offset(MatCUPMCast(A)->d_v); in GetSubMatrix()
1862 if (const auto host_array = mimpl->v) { in GetSubMatrix()
1875 const auto mimpl = MatIMPLCast(A); in RestoreSubMatrix()
1876 const auto cmat = mimpl->cmat; in RestoreSubMatrix()
1877 const auto reset = static_cast<bool>(mimpl->v); in RestoreSubMatrix()
1940 for (auto ftype : util::make_array(MAT_FACTOR_LU, MAT_FACTOR_CHOLESKY, MAT_FACTOR_QR)) { in MatSolverTypeRegister_DENSECUPM()