Tpetra parallel linear algebra
Version of the Day
Toggle main menu visibility
Loading...
Searching...
No Matches
core
src
Tpetra_Details_reallocDualViewIfNeeded.hpp
Go to the documentation of this file.
1
// @HEADER
2
// ***********************************************************************
3
//
4
// Tpetra: Templated Linear Algebra Services Package
5
// Copyright (2008) Sandia Corporation
6
//
7
// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
8
// the U.S. Government retains certain rights in this software.
9
//
10
// Redistribution and use in source and binary forms, with or without
11
// modification, are permitted provided that the following conditions are
12
// met:
13
//
14
// 1. Redistributions of source code must retain the above copyright
15
// notice, this list of conditions and the following disclaimer.
16
//
17
// 2. Redistributions in binary form must reproduce the above copyright
18
// notice, this list of conditions and the following disclaimer in the
19
// documentation and/or other materials provided with the distribution.
20
//
21
// 3. Neither the name of the Corporation nor the names of the
22
// contributors may be used to endorse or promote products derived from
23
// this software without specific prior written permission.
24
//
25
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
26
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
28
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
29
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
30
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
31
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
32
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
33
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
34
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
35
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36
//
37
// Questions? Contact Michael A. Heroux (maherou@sandia.gov)
38
//
39
// ************************************************************************
40
// @HEADER
41
42
#ifndef TPETRA_DETAILS_REALLOCDUALVIEWIFNEEDED_HPP
43
#define TPETRA_DETAILS_REALLOCDUALVIEWIFNEEDED_HPP
44
51
52
#include "
Tpetra_Details_Profiling.hpp
"
53
#include "Kokkos_DualView.hpp"
54
55
namespace
Tpetra
{
56
namespace
Details
{
57
81
template
<
class
ValueType,
class
DeviceType>
82
bool
83
reallocDualViewIfNeeded
(Kokkos::DualView<ValueType*, DeviceType>& dv,
84
const
size_t
newSize,
85
const
char
newLabel[],
86
const
size_t
tooBigFactor = 2,
87
const
bool
needFenceBeforeRealloc =
true
)
88
{
89
typedef
typename
DeviceType::execution_space
execution_space
;
90
typedef
Kokkos::DualView<ValueType*, DeviceType> dual_view_type;
91
typedef
Kokkos::pair<size_t, size_t> range_type;
92
93
// Profiling this matters, because GPU allocations can be expensive.
94
using
Tpetra::Details::ProfilingRegion
;
95
ProfilingRegion
region (
"Tpetra::Details::reallocDualViewIfNeeded"
);
96
97
const
size_t
curSize =
static_cast<
size_t
>
(dv.extent (0));
98
if
(curSize == newSize) {
99
return
false
;
// did not reallocate
100
}
101
else
if
(curSize < newSize) {
// too small; need to reallocate
102
if
(needFenceBeforeRealloc) {
103
execution_space
().fence ();
// keep this fence to respect needFenceBeforeRealloc
104
}
105
dv = dual_view_type ();
// free first, in order to save memory
106
// If current size is 0, the DualView's Views likely lack a label.
107
dv = dual_view_type (curSize == 0 ? newLabel : dv.d_view.label (), newSize);
108
return
true
;
// we did reallocate
109
}
110
else
{
111
if
(newSize == 0) {
// special case: realloc to 0 means always do it
112
if
(needFenceBeforeRealloc) {
113
execution_space
().fence ();
// keep this fence to respect needFenceBeforeRealloc
114
}
115
// If current size is 0, the DualView's Views likely lack a label.
116
dv = dual_view_type (curSize == 0 ? newLabel : dv.d_view.label (), 0);
117
return
true
;
// we did reallocate
118
}
119
// Instead of writing curSize >= tooBigFactor * newSize, express
120
// via division to avoid overflow (for very large right-hand side).
121
// We've already tested whether newSize == 0, so this is safe.
122
else
if
(curSize / newSize >= tooBigFactor) {
123
// The allocation is much too big, so free it and reallocate
124
// to the new, smaller size.
125
if
(needFenceBeforeRealloc) {
126
execution_space
().fence ();
// keep this fence to respect needFenceBeforeRealloc
127
}
128
dv = dual_view_type ();
// free first, in order to save memory
129
// If current size is 0, the DualView's Views likely lack a label.
130
dv = dual_view_type (curSize == 0 ? newLabel : dv.d_view.label (), newSize);
131
return
true
;
// we did reallocate
132
}
133
else
{
134
dv.d_view = Kokkos::subview (dv.d_view, range_type (0, newSize));
135
dv.h_view = Kokkos::subview (dv.h_view, range_type (0, newSize));
136
return
false
;
// we did not reallocate
137
}
138
}
139
}
140
142
template
<
class
ValueType,
class
DeviceType>
143
bool
144
reallocDualViewIfNeeded
(Kokkos::DualView<ValueType*, DeviceType>& exports,
145
const
size_t
newSize,
146
const
std::string& newLabel,
147
const
size_t
tooBigFactor = 2,
148
const
bool
needFenceBeforeRealloc =
true
)
149
{
150
return
reallocDualViewIfNeeded<ValueType, DeviceType>
(exports, newSize,
151
newLabel.c_str (),
152
tooBigFactor,
153
needFenceBeforeRealloc);
154
}
155
156
}
// namespace Details
157
}
// namespace Tpetra
158
159
#endif
// TPETRA_DETAILS_REALLOCDUALVIEWIFNEEDED_HPP
Tpetra_Details_Profiling.hpp
Declaration of Tpetra::Details::Profiling, a scope guard for Kokkos Profiling.
Tpetra::execution_space
Tpetra::Details::ProfilingRegion
Profile the given scope.
Definition
Tpetra_Details_Profiling.hpp:103
Tpetra::Details
Nonmember function that computes a residual Computes R = B - A * X.
Definition
Tpetra_KokkosRefactor_Details_MultiVectorLocalDeepCopy.hpp:51
Tpetra::Details::reallocDualViewIfNeeded
bool reallocDualViewIfNeeded(Kokkos::DualView< ValueType *, DeviceType > &dv, const size_t newSize, const char newLabel[], const size_t tooBigFactor=2, const bool needFenceBeforeRealloc=true)
Reallocate the DualView in/out argument, if needed.
Definition
Tpetra_Details_reallocDualViewIfNeeded.hpp:83
Tpetra
Namespace Tpetra contains the class and methods constituting the Tpetra library.
Generated by
1.17.0