1cb23e90cSJeremy L Thompson // Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC. 2cb23e90cSJeremy L Thompson // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707. 3cb23e90cSJeremy L Thompson // All Rights reserved. See files LICENSE and NOTICE for details. 4cb23e90cSJeremy L Thompson // 5cb23e90cSJeremy L Thompson // This file is part of CEED, a collection of benchmarks, miniapps, software 6cb23e90cSJeremy L Thompson // libraries and APIs for efficient high-order finite element and spectral 7cb23e90cSJeremy L Thompson // element discretizations for exascale applications. For more information and 8cb23e90cSJeremy L Thompson // source code availability see http://github.com/ceed. 9cb23e90cSJeremy L Thompson // 10cb23e90cSJeremy L Thompson // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC, 11cb23e90cSJeremy L Thompson // a collaborative effort of two U.S. Department of Energy organizations (Office 12cb23e90cSJeremy L Thompson // of Science and the National Nuclear Security Administration) responsible for 13cb23e90cSJeremy L Thompson // the planning and preparation of a capable exascale ecosystem, including 14cb23e90cSJeremy L Thompson // software, applications, hardware, advanced system engineering and early 15cb23e90cSJeremy L Thompson // testbed platforms, in support of the nation's exascale computing imperative. 16cb23e90cSJeremy L Thompson 17ec3da8bcSJed Brown #include <ceed/ceed.h> 18ec3da8bcSJed Brown #include <ceed/backend.h> 19*6dbfb411Snbeams #include <string.h> 20*6dbfb411Snbeams #include <stdlib.h> 21cb23e90cSJeremy L Thompson #include "ceed-magma.h" 22cb23e90cSJeremy L Thompson 231d013790SJed Brown CEED_INTERN int CeedInit_Magma_Det(const char *resource, Ceed ceed) { 24cb23e90cSJeremy L Thompson int ierr; 25*6dbfb411Snbeams const int nrc = 18; // number of characters in resource 26*6dbfb411Snbeams if (strncmp(resource, "/gpu/cuda/magma/det", nrc) 27*6dbfb411Snbeams && strncmp(resource, "/gpu/hip/magma/det", nrc)) 28cb23e90cSJeremy L Thompson // LCOV_EXCL_START 29e15f9bd0SJeremy L Thompson return CeedError(ceed, CEED_ERROR_BACKEND, 30e15f9bd0SJeremy L Thompson "Magma backend cannot use resource: %s", resource); 31cb23e90cSJeremy L Thompson // LCOV_EXCL_STOP 32e15f9bd0SJeremy L Thompson ierr = CeedSetDeterministic(ceed, true); CeedChkBackend(ierr); 33cb23e90cSJeremy L Thompson 34*6dbfb411Snbeams Ceed_Magma *data; 35*6dbfb411Snbeams ierr = CeedCalloc(sizeof(Ceed_Magma), &data); CeedChkBackend(ierr); 36*6dbfb411Snbeams ierr = CeedSetData(ceed, data); CeedChkBackend(ierr); 37*6dbfb411Snbeams 38*6dbfb411Snbeams // get/set device ID 39*6dbfb411Snbeams const char *device_spec = strstr(resource, ":device_id="); 40*6dbfb411Snbeams const int deviceID = (device_spec) ? atoi(device_spec+11) : -1; 41*6dbfb411Snbeams 42*6dbfb411Snbeams int currentDeviceID; 43*6dbfb411Snbeams magma_getdevice(¤tDeviceID); 44*6dbfb411Snbeams if (deviceID >= 0 && currentDeviceID != deviceID) { 45*6dbfb411Snbeams magma_setdevice(deviceID); 46*6dbfb411Snbeams currentDeviceID = deviceID; 47*6dbfb411Snbeams } 48*6dbfb411Snbeams // create a queue that uses the null stream 49*6dbfb411Snbeams data->device = currentDeviceID; 50*6dbfb411Snbeams 51cb23e90cSJeremy L Thompson // Create reference CEED that implementation will be dispatched 52cb23e90cSJeremy L Thompson // through unless overridden 53cb23e90cSJeremy L Thompson Ceed ceedref; 54adb2481bSnbeams #ifdef HAVE_HIP 5540461fa4Snbeams CeedInit("/gpu/hip/magma", &ceedref); 56adb2481bSnbeams #else 5740461fa4Snbeams CeedInit("/gpu/cuda/magma", &ceedref); 58adb2481bSnbeams #endif 59e15f9bd0SJeremy L Thompson ierr = CeedSetDelegate(ceed, ceedref); CeedChkBackend(ierr); 60cb23e90cSJeremy L Thompson 61cb23e90cSJeremy L Thompson // Create reference CEED for restriction 62cb23e90cSJeremy L Thompson Ceed restrictionceedref; 63a31f51a5Snbeams #ifdef HAVE_HIP 64a31f51a5Snbeams CeedInit("/gpu/hip/ref", &restrictionceedref); 65a31f51a5Snbeams #else 66461525f5SNatalie Beams CeedInit("/gpu/cuda/ref", &restrictionceedref); 67a31f51a5Snbeams #endif 68cb23e90cSJeremy L Thompson ierr = CeedSetObjectDelegate(ceed, restrictionceedref, "ElemRestriction"); 69e15f9bd0SJeremy L Thompson CeedChkBackend(ierr); 70cb23e90cSJeremy L Thompson 71e15f9bd0SJeremy L Thompson return CEED_ERROR_SUCCESS; 72cb23e90cSJeremy L Thompson } 73cb23e90cSJeremy L Thompson 741d013790SJed Brown CEED_INTERN int CeedRegister_Magma_Det(void) { 75adb2481bSnbeams #ifdef HAVE_HIP 761d013790SJed Brown return CeedRegister("/gpu/hip/magma/det", CeedInit_Magma_Det, 125); 77adb2481bSnbeams #else 781d013790SJed Brown return CeedRegister("/gpu/cuda/magma/det", CeedInit_Magma_Det, 125); 79adb2481bSnbeams #endif 80cb23e90cSJeremy L Thompson } 81