Lines Matching refs:chunk_slice_map
19 PetscInt *chunk_slice_map; /* starting slice for each chunk, device pointer */ member
29 if ((*cudastruct)->chunk_slice_map) PetscCallCUDA(cudaFree((*cudastruct)->chunk_slice_map)); in MatSeqSELLCUDA_Destroy()
51 if (cudastruct->chunk_slice_map) PetscCallCUDA(cudaFree(cudastruct->chunk_slice_map)); in MatSeqSELLCUDACopyToGPU()
64 …CallCUDA(cudaMalloc((void **)&cudastruct->chunk_slice_map, a->totalchunks * sizeof(*cudastruct->ch… in MatSeqSELLCUDACopyToGPU()
65 …etscCallCUDA(cudaMemcpy(cudastruct->chunk_slice_map, a->chunk_slice_map, a->totalchunks * sizeof(*… in MatSeqSELLCUDACopyToGPU()
185 …ight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt *chunk_slice_map, const PetscI… in matmult_seqsell_tiled_kernel8() argument
199 start_slice = chunk_slice_map[cid]; /* starting slice at each iteration */ in matmult_seqsell_tiled_kernel8()
240 …ight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt *chunk_slice_map, const PetscI… in matmultadd_seqsell_tiled_kernel8() argument
254 start_slice = chunk_slice_map[cid]; /* starting slice at each iteration */ in matmultadd_seqsell_tiled_kernel8()
579 PetscInt chunksperblock, nchunks, *chunk_slice_map; in MatMult_SeqSELLCUDA() local
664 chunk_slice_map = cudastruct->chunk_slice_map; in MatMult_SeqSELLCUDA()
666 …nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMult_SeqSELLCUDA()
668 …nblocks, dim3(32, 4)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMult_SeqSELLCUDA()
670 …nblocks, dim3(32, 8)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMult_SeqSELLCUDA()
672 …blocks, dim3(32, 16)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMult_SeqSELLCUDA()
674 …blocks, dim3(32, 32)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMult_SeqSELLCUDA()
676 …nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMult_SeqSELLCUDA()
720 PetscInt chunksperblock, nchunks, *chunk_slice_map; in MatMultAdd_SeqSELLCUDA() local
760 chunk_slice_map = cudastruct->chunk_slice_map; in MatMultAdd_SeqSELLCUDA()
762 …nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
764 …nblocks, dim3(32, 4)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
766 …nblocks, dim3(32, 8)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
768 …blocks, dim3(32, 16)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
770 …blocks, dim3(32, 32)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
772 …nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
825 chunk_slice_map = cudastruct->chunk_slice_map; in MatMultAdd_SeqSELLCUDA()
827 …nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
829 …nblocks, dim3(32, 4)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
831 …nblocks, dim3(32, 8)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
833 …blocks, dim3(32, 16)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
835 …blocks, dim3(32, 32)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()
837 …nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map, acolidx, ava… in MatMultAdd_SeqSELLCUDA()