xref: /libCEED/rust/libceed-sys/c-src/backends/xsmm/ceed-xsmm.h (revision 80a9ef0545a39c00cdcaab1ca26f8053604f3120)
18d713cf6Sjeremylt // Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
28d713cf6Sjeremylt // Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
38d713cf6Sjeremylt // All Rights reserved. See files LICENSE and NOTICE for details.
48d713cf6Sjeremylt //
58d713cf6Sjeremylt // This file is part of CEED, a collection of benchmarks, miniapps, software
68d713cf6Sjeremylt // libraries and APIs for efficient high-order finite element and spectral
78d713cf6Sjeremylt // element discretizations for exascale applications. For more information and
88d713cf6Sjeremylt // source code availability see http://github.com/ceed.
98d713cf6Sjeremylt //
108d713cf6Sjeremylt // The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
118d713cf6Sjeremylt // a collaborative effort of two U.S. Department of Energy organizations (Office
128d713cf6Sjeremylt // of Science and the National Nuclear Security Administration) responsible for
138d713cf6Sjeremylt // the planning and preparation of a capable exascale ecosystem, including
148d713cf6Sjeremylt // software, applications, hardware, advanced system engineering and early
158d713cf6Sjeremylt // testbed platforms, in support of the nation's exascale computing imperative.
168d713cf6Sjeremylt 
173d576824SJeremy L Thompson #ifndef _ceed_xsmm_h
183d576824SJeremy L Thompson #define _ceed_xsmm_h
193d576824SJeremy L Thompson 
20ec3da8bcSJed Brown #include <ceed/ceed.h>
21ec3da8bcSJed Brown #include <ceed/backend.h>
22ec3da8bcSJed Brown #include <ceed/hash.h>
233d0fd664Sjeremylt #include <libxsmm.h>
248d713cf6Sjeremylt 
2520aaa365SJeremy L Thompson // Instantiate khash structs and methods
26*80a9ef05SNatalie Beams CeedHashIJKLMInit(f32, libxsmm_smmfunction)
27*80a9ef05SNatalie Beams CeedHashIJKLMInit(f64, libxsmm_dmmfunction)
2820aaa365SJeremy L Thompson 
293d0fd664Sjeremylt typedef struct {
30d1d35e2fSjeremylt   bool is_tensor;
3120aaa365SJeremy L Thompson   CeedInt P, Q, dim;
32*80a9ef05SNatalie Beams   khash_t(f32) *lookup_f32;
33*80a9ef05SNatalie Beams   khash_t(f64) *lookup_f64;
343d0fd664Sjeremylt } CeedTensorContract_Xsmm;
353d0fd664Sjeremylt 
36*80a9ef05SNatalie Beams CEED_INTERN int CeedTensorContractCreate_f32_Xsmm(CeedBasis basis,
37*80a9ef05SNatalie Beams     CeedTensorContract contract);
38*80a9ef05SNatalie Beams 
39*80a9ef05SNatalie Beams CEED_INTERN int CeedTensorContractCreate_f64_Xsmm(CeedBasis basis,
40c71e1dcdSjeremylt     CeedTensorContract contract);
413d576824SJeremy L Thompson 
423d576824SJeremy L Thompson #endif // _ceed_xsmm_h
43