Stokhos Package Browser (Single Doxygen Collection)  Version of the Day
Stokhos_Tpetra_ETI_Helpers_MP_Vector.hpp
Go to the documentation of this file.
1 // @HEADER
2 // ***********************************************************************
3 //
4 // Stokhos Package
5 // Copyright (2009) Sandia Corporation
6 //
7 // Under terms of Contract DE-AC04-94AL85000, there is a non-exclusive
8 // license for use of this work by or on behalf of the U.S. Government.
9 //
10 // Redistribution and use in source and binary forms, with or without
11 // modification, are permitted provided that the following conditions are
12 // met:
13 //
14 // 1. Redistributions of source code must retain the above copyright
15 // notice, this list of conditions and the following disclaimer.
16 //
17 // 2. Redistributions in binary form must reproduce the above copyright
18 // notice, this list of conditions and the following disclaimer in the
19 // documentation and/or other materials provided with the distribution.
20 //
21 // 3. Neither the name of the Corporation nor the names of the
22 // contributors may be used to endorse or promote products derived from
23 // this software without specific prior written permission.
24 //
25 // THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
26 // EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
28 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
29 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
30 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
31 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
32 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
33 // LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
34 // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
35 // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 //
37 // Questions? Contact Eric T. Phipps (etphipp@sandia.gov).
38 //
39 // ***********************************************************************
40 // @HEADER
41 
42 // MP::Vector includes
44 #include "TpetraCore_ETIHelperMacros.h"
45 
// Invoke INST_MACRO exactly once, passing Sacado::MP::Vector<STORAGE_T> as
// its first argument and forwarding the remaining three arguments unchanged.
//   INST_MACRO  function-like macro taking four arguments
//   STORAGE_T   storage type wrapped by Sacado::MP::Vector
//   LOCAL_ORD, GLOBAL_ORD, NODE_T  forwarded as given
#define INSTANTIATE_MP_VECTOR_STORAGE(INST_MACRO, STORAGE_T, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INST_MACRO(Sacado::MP::Vector<STORAGE_T>, LOCAL_ORD, GLOBAL_ORD, NODE_T)
48 
// Declare the alias SFS_<L_T>_<S_T>_<SIZE>_<DEV> for
// Stokhos::StaticFixedStorage<L_T, S_T, SIZE, DEV::execution_space> and hand
// that alias to INSTANTIATE_MP_VECTOR_STORAGE as the storage type.
// Mind the ordering: S_T precedes L_T in this macro's parameter list but
// follows it in the template argument list and in the generated alias name.
// (The callers in this file pass double for S_T and int for L_T.)
// The pasted arguments must each be a single token that can form part of an
// identifier, since they are glued together with ##.
#define INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T, SIZE, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  using SFS_ ## L_T ## _ ## S_T ## _ ## SIZE ## _ ## DEV = \
      Stokhos::StaticFixedStorage<L_T, S_T, SIZE, DEV::execution_space>; \
  INSTANTIATE_MP_VECTOR_STORAGE(INST_MACRO, \
                                SFS_ ## L_T ## _ ## S_T ## _ ## SIZE ## _ ## DEV, \
                                LOCAL_ORD, GLOBAL_ORD, NODE_T)
52 
// CPU flavour of the static-fixed-storage instantiation: expands to one
// INSTANTIATE_MP_VECTOR_SFS_SLND invocation per storage size listed below.
// The set of sizes depends on whether __MIC__ is defined.
#ifndef __MIC__
// For CPU with AVX instructions -- vector width = 4 (double precision).
// Sizes instantiated: 4, 8, 16, 32.
#define INSTANTIATE_MP_VECTOR_SFS_SLD_CPU(INST_MACRO, S_T, L_T, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T,  4, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T,  8, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T, 16, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T, 32, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T)
#else
// For MIC (Xeon Phi) -- vector width = 8 (double precision).
// Sizes instantiated: 8, 16, 32.
#define INSTANTIATE_MP_VECTOR_SFS_SLD_CPU(INST_MACRO, S_T, L_T, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T,  8, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T, 16, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T, 32, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T)
#endif
67 
// For CUDA GPU -- warp size = 32.
// GPU flavour of the static-fixed-storage instantiation: expands to one
// INSTANTIATE_MP_VECTOR_SFS_SLND invocation for size 16 and one for size 32.
#define INSTANTIATE_MP_VECTOR_SFS_SLD_GPU(INST_MACRO, S_T, L_T, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T, 16, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLND(INST_MACRO, S_T, L_T, 32, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T)
72 
// Declare the alias DS_<L>_<S>_<D> for Stokhos::DynamicStorage<L, S, D> and
// hand that alias to INSTANTIATE_MP_VECTOR_STORAGE as the storage type.
// As with the static-storage helper, S precedes L in the parameter list but
// follows it in the template argument list and in the alias name.
// The parts of the alias name are joined with single underscores only: an
// identifier containing a double underscore is reserved to the C++
// implementation, so the name must never contain "__".
#define INSTANTIATE_MP_VECTOR_DS_SLD(INSTMACRO, S, L, D, LO, GO, N) \
  using DS_ ## L ## _ ## S ## _ ## D = Stokhos::DynamicStorage<L, S, D>; \
  INSTANTIATE_MP_VECTOR_STORAGE(INSTMACRO, DS_ ## L ## _ ## S ## _ ## D, LO, GO, N)
76 
// CPU instantiation for a given device type DEV: forwards to
// INSTANTIATE_MP_VECTOR_SFS_SLD_CPU with S fixed to double and L fixed to int.
#define INSTANTIATE_MP_VECTOR_S_D_CPU(INST_MACRO, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLD_CPU(INST_MACRO, double, int, DEV, \
                                    LOCAL_ORD, GLOBAL_ORD, NODE_T)
// GPU instantiation for a given device type DEV: forwards to
// INSTANTIATE_MP_VECTOR_SFS_SLD_GPU with S fixed to double and L fixed to int.
#define INSTANTIATE_MP_VECTOR_S_D_GPU(INST_MACRO, DEV, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  INSTANTIATE_MP_VECTOR_SFS_SLD_GPU(INST_MACRO, double, int, DEV, \
                                    LOCAL_ORD, GLOBAL_ORD, NODE_T)
81 
82 // Disabling dynamic storage ETI -- we don't really need it
83 // INSTANTIATE_MP_VECTOR_DS_SLD(INSTMACRO, double, int, D, LO, GO, N)
84 
// CPU instantiation for a node type: declares the alias
// DFN_CPU_<LOCAL_ORD>_<GLOBAL_ORD>_<NODE_T> for
// Stokhos::DeviceForNode<NODE_T>::type and passes that alias as the device
// argument of INSTANTIATE_MP_VECTOR_S_D_CPU.
// The three arguments are pasted verbatim (unexpanded) into the alias name,
// so each must be a single identifier-like token.
#define INSTANTIATE_MP_VECTOR_S_CPU(INST_MACRO, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  using DFN_CPU_ ## LOCAL_ORD ## _ ## GLOBAL_ORD ## _ ## NODE_T = \
      Stokhos::DeviceForNode<NODE_T>::type; \
  INSTANTIATE_MP_VECTOR_S_D_CPU(INST_MACRO, \
                                DFN_CPU_ ## LOCAL_ORD ## _ ## GLOBAL_ORD ## _ ## NODE_T, \
                                LOCAL_ORD, GLOBAL_ORD, NODE_T)
// GPU instantiation for a node type: declares the alias
// DFN_GPU_<LOCAL_ORD>_<GLOBAL_ORD>_<NODE_T> for
// Stokhos::DeviceForNode<NODE_T>::type and passes that alias as the device
// argument of INSTANTIATE_MP_VECTOR_S_D_GPU.
// The three arguments are pasted verbatim (unexpanded) into the alias name,
// so each must be a single identifier-like token.
#define INSTANTIATE_MP_VECTOR_S_GPU(INST_MACRO, LOCAL_ORD, GLOBAL_ORD, NODE_T) \
  using DFN_GPU_ ## LOCAL_ORD ## _ ## GLOBAL_ORD ## _ ## NODE_T = \
      Stokhos::DeviceForNode<NODE_T>::type; \
  INSTANTIATE_MP_VECTOR_S_D_GPU(INST_MACRO, \
                                DFN_GPU_ ## LOCAL_ORD ## _ ## GLOBAL_ORD ## _ ## NODE_T, \
                                LOCAL_ORD, GLOBAL_ORD, NODE_T)
91 
// Serial-node entry point.  Expands to nothing unless both
// HAVE_TPETRACORE_TEUCHOSKOKKOSCOMPAT and HAVE_TPETRA_INST_SERIAL are defined.
#if !defined(HAVE_TPETRACORE_TEUCHOSKOKKOSCOMPAT) || !defined(HAVE_TPETRA_INST_SERIAL)
#define INSTANTIATE_TPETRA_MP_VECTOR_SERIAL(INST_MACRO)
#else
// Alias the ordinal types of Tpetra::Map<> under fixed names, then run the
// CPU helper for Kokkos_Compat_KokkosSerialWrapperNode.  The alias names are
// passed as single tokens because INSTANTIATE_MP_VECTOR_S_CPU pastes its
// ordinal arguments into an identifier.
#define INSTANTIATE_TPETRA_MP_VECTOR_SERIAL(INST_MACRO) \
  using default_local_ordinal_type = Tpetra::Map<>::local_ordinal_type; \
  using default_global_ordinal_type = Tpetra::Map<>::global_ordinal_type; \
  INSTANTIATE_MP_VECTOR_S_CPU(INST_MACRO, \
                              default_local_ordinal_type, \
                              default_global_ordinal_type, \
                              Kokkos_Compat_KokkosSerialWrapperNode)
#endif
100 
101 
// Threads-node entry point.  Expands to nothing unless both
// HAVE_TPETRACORE_TEUCHOSKOKKOSCOMPAT and HAVE_TPETRA_INST_PTHREAD are defined.
#if !defined(HAVE_TPETRACORE_TEUCHOSKOKKOSCOMPAT) || !defined(HAVE_TPETRA_INST_PTHREAD)
#define INSTANTIATE_TPETRA_MP_VECTOR_THREADS(INST_MACRO)
#else
// Alias the ordinal types of Tpetra::Map<> under fixed names, then run the
// CPU helper for Kokkos_Compat_KokkosThreadsWrapperNode.  The alias names are
// passed as single tokens because INSTANTIATE_MP_VECTOR_S_CPU pastes its
// ordinal arguments into an identifier.
#define INSTANTIATE_TPETRA_MP_VECTOR_THREADS(INST_MACRO) \
  using default_local_ordinal_type = Tpetra::Map<>::local_ordinal_type; \
  using default_global_ordinal_type = Tpetra::Map<>::global_ordinal_type; \
  INSTANTIATE_MP_VECTOR_S_CPU(INST_MACRO, \
                              default_local_ordinal_type, \
                              default_global_ordinal_type, \
                              Kokkos_Compat_KokkosThreadsWrapperNode)
#endif
110 
// OpenMP-node entry point.  Expands to nothing unless both
// HAVE_TPETRACORE_TEUCHOSKOKKOSCOMPAT and HAVE_TPETRA_INST_OPENMP are defined.
#if !defined(HAVE_TPETRACORE_TEUCHOSKOKKOSCOMPAT) || !defined(HAVE_TPETRA_INST_OPENMP)
#define INSTANTIATE_TPETRA_MP_VECTOR_OPENMP(INST_MACRO)
#else
// Alias the ordinal types of Tpetra::Map<> under fixed names, then run the
// CPU helper for Kokkos_Compat_KokkosOpenMPWrapperNode.  The alias names are
// passed as single tokens because INSTANTIATE_MP_VECTOR_S_CPU pastes its
// ordinal arguments into an identifier.
#define INSTANTIATE_TPETRA_MP_VECTOR_OPENMP(INST_MACRO) \
  using default_local_ordinal_type = Tpetra::Map<>::local_ordinal_type; \
  using default_global_ordinal_type = Tpetra::Map<>::global_ordinal_type; \
  INSTANTIATE_MP_VECTOR_S_CPU(INST_MACRO, \
                              default_local_ordinal_type, \
                              default_global_ordinal_type, \
                              Kokkos_Compat_KokkosOpenMPWrapperNode)
#endif
119 
// CUDA-node entry point.  Expands to nothing unless both
// HAVE_TPETRACORE_TEUCHOSKOKKOSCOMPAT and HAVE_TPETRA_INST_CUDA are defined.
#if !defined(HAVE_TPETRACORE_TEUCHOSKOKKOSCOMPAT) || !defined(HAVE_TPETRA_INST_CUDA)
#define INSTANTIATE_TPETRA_MP_VECTOR_CUDA(INST_MACRO)
#else
// Alias the ordinal types of Tpetra::Map<> under fixed names, then run the
// GPU helper for Kokkos_Compat_KokkosCudaWrapperNode.  The alias names are
// passed as single tokens because INSTANTIATE_MP_VECTOR_S_GPU pastes its
// ordinal arguments into an identifier.
#define INSTANTIATE_TPETRA_MP_VECTOR_CUDA(INST_MACRO) \
  using default_local_ordinal_type = Tpetra::Map<>::local_ordinal_type; \
  using default_global_ordinal_type = Tpetra::Map<>::global_ordinal_type; \
  INSTANTIATE_MP_VECTOR_S_GPU(INST_MACRO, \
                              default_local_ordinal_type, \
                              default_global_ordinal_type, \
                              Kokkos_Compat_KokkosCudaWrapperNode)
#endif
128 
// Expand INSTMACRO for every wrapper node type handled by this file, in the
// order Serial, Threads, OpenMP, CUDA.  Each per-node macro is defined as
// empty when its node is not enabled, so only the configured nodes contribute
// to the expansion.
// The Serial entry must be listed here: INSTANTIATE_TPETRA_MP_VECTOR_SERIAL
// is defined alongside the other per-node macros, and without this line it
// would never be expanded.
#define INSTANTIATE_TPETRA_MP_VECTOR_WRAPPER_NODES(INSTMACRO) \
  INSTANTIATE_TPETRA_MP_VECTOR_SERIAL(INSTMACRO) \
  INSTANTIATE_TPETRA_MP_VECTOR_THREADS(INSTMACRO) \
  INSTANTIATE_TPETRA_MP_VECTOR_OPENMP(INSTMACRO) \
  INSTANTIATE_TPETRA_MP_VECTOR_CUDA(INSTMACRO)
133 
// Top-level entry point: opens namespace Tpetra, expands
// TPETRA_ETI_MANGLING_TYPEDEFS() and then
// INSTANTIATE_TPETRA_MP_VECTOR_WRAPPER_NODES(INST_MACRO) inside it, and closes
// the namespace again.  Because the expansion contains a namespace
// definition, the macro has to be used at a scope where one is allowed.
#define INSTANTIATE_TPETRA_MP_VECTOR(INST_MACRO) \
  namespace Tpetra { \
    TPETRA_ETI_MANGLING_TYPEDEFS() \
    INSTANTIATE_TPETRA_MP_VECTOR_WRAPPER_NODES(INST_MACRO) \
  }