xref: /libCEED/rust/libceed-sys/c-src/backends/magma/ceed-magma-det.c (revision 6dbfb411544a7a6bdd33f391c97c69cd9e1f444a)
1cb23e90cSJeremy L Thompson // Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
2cb23e90cSJeremy L Thompson // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
3cb23e90cSJeremy L Thompson // All Rights reserved. See files LICENSE and NOTICE for details.
4cb23e90cSJeremy L Thompson //
5cb23e90cSJeremy L Thompson // This file is part of CEED, a collection of benchmarks, miniapps, software
6cb23e90cSJeremy L Thompson // libraries and APIs for efficient high-order finite element and spectral
7cb23e90cSJeremy L Thompson // element discretizations for exascale applications. For more information and
8cb23e90cSJeremy L Thompson // source code availability see http://github.com/ceed.
9cb23e90cSJeremy L Thompson //
10cb23e90cSJeremy L Thompson // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
11cb23e90cSJeremy L Thompson // a collaborative effort of two U.S. Department of Energy organizations (Office
12cb23e90cSJeremy L Thompson // of Science and the National Nuclear Security Administration) responsible for
13cb23e90cSJeremy L Thompson // the planning and preparation of a capable exascale ecosystem, including
14cb23e90cSJeremy L Thompson // software, applications, hardware, advanced system engineering and early
15cb23e90cSJeremy L Thompson // testbed platforms, in support of the nation's exascale computing imperative.
16cb23e90cSJeremy L Thompson 
17ec3da8bcSJed Brown #include <ceed/ceed.h>
18ec3da8bcSJed Brown #include <ceed/backend.h>
19*6dbfb411Snbeams #include <string.h>
20*6dbfb411Snbeams #include <stdlib.h>
21cb23e90cSJeremy L Thompson #include "ceed-magma.h"
22cb23e90cSJeremy L Thompson 
231d013790SJed Brown CEED_INTERN int CeedInit_Magma_Det(const char *resource, Ceed ceed) {
24cb23e90cSJeremy L Thompson   int ierr;
25*6dbfb411Snbeams   const int nrc = 18; // number of characters in resource
26*6dbfb411Snbeams   if (strncmp(resource, "/gpu/cuda/magma/det", nrc)
27*6dbfb411Snbeams       && strncmp(resource, "/gpu/hip/magma/det", nrc))
28cb23e90cSJeremy L Thompson     // LCOV_EXCL_START
29e15f9bd0SJeremy L Thompson     return CeedError(ceed, CEED_ERROR_BACKEND,
30e15f9bd0SJeremy L Thompson                      "Magma backend cannot use resource: %s", resource);
31cb23e90cSJeremy L Thompson   // LCOV_EXCL_STOP
32e15f9bd0SJeremy L Thompson   ierr = CeedSetDeterministic(ceed, true); CeedChkBackend(ierr);
33cb23e90cSJeremy L Thompson 
34*6dbfb411Snbeams   Ceed_Magma *data;
35*6dbfb411Snbeams   ierr = CeedCalloc(sizeof(Ceed_Magma), &data); CeedChkBackend(ierr);
36*6dbfb411Snbeams   ierr = CeedSetData(ceed, data); CeedChkBackend(ierr);
37*6dbfb411Snbeams 
38*6dbfb411Snbeams   // get/set device ID
39*6dbfb411Snbeams   const char *device_spec = strstr(resource, ":device_id=");
40*6dbfb411Snbeams   const int deviceID = (device_spec) ? atoi(device_spec+11) : -1;
41*6dbfb411Snbeams 
42*6dbfb411Snbeams   int currentDeviceID;
43*6dbfb411Snbeams   magma_getdevice(&currentDeviceID);
44*6dbfb411Snbeams   if (deviceID >= 0 && currentDeviceID != deviceID) {
45*6dbfb411Snbeams     magma_setdevice(deviceID);
46*6dbfb411Snbeams     currentDeviceID = deviceID;
47*6dbfb411Snbeams   }
48*6dbfb411Snbeams   // create a queue that uses the null stream
49*6dbfb411Snbeams   data->device = currentDeviceID;
50*6dbfb411Snbeams 
51cb23e90cSJeremy L Thompson   // Create reference CEED that implementation will be dispatched
52cb23e90cSJeremy L Thompson   //   through unless overridden
53cb23e90cSJeremy L Thompson   Ceed ceedref;
54adb2481bSnbeams   #ifdef HAVE_HIP
5540461fa4Snbeams   CeedInit("/gpu/hip/magma", &ceedref);
56adb2481bSnbeams   #else
5740461fa4Snbeams   CeedInit("/gpu/cuda/magma", &ceedref);
58adb2481bSnbeams   #endif
59e15f9bd0SJeremy L Thompson   ierr = CeedSetDelegate(ceed, ceedref); CeedChkBackend(ierr);
60cb23e90cSJeremy L Thompson 
61cb23e90cSJeremy L Thompson   // Create reference CEED for restriction
62cb23e90cSJeremy L Thompson   Ceed restrictionceedref;
63a31f51a5Snbeams   #ifdef HAVE_HIP
64a31f51a5Snbeams   CeedInit("/gpu/hip/ref", &restrictionceedref);
65a31f51a5Snbeams   #else
66461525f5SNatalie Beams   CeedInit("/gpu/cuda/ref", &restrictionceedref);
67a31f51a5Snbeams   #endif
68cb23e90cSJeremy L Thompson   ierr = CeedSetObjectDelegate(ceed, restrictionceedref, "ElemRestriction");
69e15f9bd0SJeremy L Thompson   CeedChkBackend(ierr);
70cb23e90cSJeremy L Thompson 
71e15f9bd0SJeremy L Thompson   return CEED_ERROR_SUCCESS;
72cb23e90cSJeremy L Thompson }
73cb23e90cSJeremy L Thompson 
741d013790SJed Brown CEED_INTERN int CeedRegister_Magma_Det(void) {
75adb2481bSnbeams   #ifdef HAVE_HIP
761d013790SJed Brown   return CeedRegister("/gpu/hip/magma/det", CeedInit_Magma_Det, 125);
77adb2481bSnbeams   #else
781d013790SJed Brown   return CeedRegister("/gpu/cuda/magma/det", CeedInit_Magma_Det, 125);
79adb2481bSnbeams   #endif
80cb23e90cSJeremy L Thompson }
81