-
Notifications
You must be signed in to change notification settings - Fork 722
/
Copy pathpipe_utils.hpp
271 lines (229 loc) · 9.57 KB
/
pipe_utils.hpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
//==============================================================
// Copyright Intel Corporation
//
// SPDX-License-Identifier: MIT
// =============================================================
#ifndef __PIPE_UTILS_HPP__
#define __PIPE_UTILS_HPP__
#include <sycl/sycl.hpp>
#include <sycl/ext/intel/fpga_extensions.hpp>
#include <utility>
/*
This header defines the following utilities for use with pipes in SYCL FPGA
designs.
1. PipeArray
Create a collection of pipes that can be indexed like an array.
template <class Id, // identifier for the pipe array
typename BaseTy, // type to write/read for each pipe
size_t min_depth, // minimum capacity of each pipe
size_t... dims // depth of each dimension in the array
// any number of dimensions are supported
>
struct PipeArray
Example usage:
class PipeArrayId;
constexpr int min_depth = 0;
constexpr int num_pipes = 4;
using MyPipeArray = PipeArray<PipeArrayId, int, min_depth, num_pipes>;
...
constexpr int pipe_idx = 1;
MyPipeArray::PipeAt<pipe_idx>::read();
2. PipeDuplicator
Fan-out a single pipe write to multiple pipe instances,
each of which will receive the same data.
A blocking write will perform a blocking write to each pipe.
A non-blocking write will perform a non-blocking write to each pipe,
and set success to true only if ALL writes were successful.
Note that the special case of 0 pipe instances is supported, which can
be useful as a stub for writes to pipes that are not needed in your particular
design.
template <class Id, // name of this PipeDuplicator
typename T, // data type to transfer
typename... Pipes // all pipes to send duplicated writes to
>
struct PipeDuplicator
Example usage:
class PipeID1;
class PipeID2;
using MyPipe1 = sycl::ext::intel::pipe<PipeID1, int>;
using MyPipe2 = sycl::ext::intel::pipe<PipeID2, int>;
class PipeDuplicatorID;
using MyPipeDuplicator = PipeDuplicator<PipeDuplicatorID, int, MyPipe1, MyPipe2>;
...
MyPipeDuplicator::write(1); // write the value 1 to both MyPipe1 and MyPipe2
*/
// =============================================================
// Internal Helper Functions/Structs
// =============================================================
namespace fpga_tools {
namespace detail {
// Templated classes for verifying dimensions when accessing elements in the
// pipe array.
template <size_t dim1, size_t... dims>
struct VerifierDimLayer {
template <size_t idx1, size_t... idxs>
struct VerifierIdxLayer {
static constexpr bool IsValid() {
return idx1 < dim1 &&
(VerifierDimLayer<dims...>::template VerifierIdxLayer<
idxs...>::IsValid());
}
};
};
template <size_t dim>
struct VerifierDimLayer<dim> {
template <size_t idx>
struct VerifierIdxLayer {
static constexpr bool IsValid() { return idx < dim; }
};
};
// Templated classes to perform 'currying' write to all pipes in the array
// Primary template, dummy
template <template <std::size_t...> class WriteFunc, typename BaseTy,
typename PartialSequence, typename... RemainingSequences>
struct write_currying {};
// Induction case
template <template <std::size_t...> class WriteFunc, typename BaseTy,
std::size_t... I, std::size_t... J, typename... RemainingSequences>
struct write_currying<WriteFunc, BaseTy, std::index_sequence<I...>,
std::index_sequence<J...>, RemainingSequences...> {
void operator()(const BaseTy &data, bool &success) const {
(write_currying<WriteFunc, BaseTy, std::index_sequence<I..., J>,
RemainingSequences...>()(data, success),
...);
}
};
// Base case
template <template <std::size_t...> class WriteFunc, typename BaseTy,
std::size_t... I>
struct write_currying<WriteFunc, BaseTy, std::index_sequence<I...>> {
void operator()(const BaseTy &data, bool &success) const {
WriteFunc<I...>()(data, success);
}
};
} // namespace detail
// =============================================================
// PipeArray
// =============================================================
template <class Id, // identifier for the pipe array
typename BaseTy, // type to write/read for each pipe
size_t min_depth, // minimum capacity of each pipe
size_t... dims // depth of each dimension in the array
// any number of dimensions are supported
>
struct PipeArray {
PipeArray() = delete; // ensure we cannot create an instance
template <size_t... idxs>
struct StructId; // the ID of each pipe in the array
// VerifyIndices checks that we only access pipe indicies that are in range
template <size_t... idxs>
struct VerifyIndices {
static_assert(sizeof...(idxs) == sizeof...(dims),
"Indexing into a PipeArray requires as many indices as "
"dimensions of the PipeArray.");
static_assert(fpga_tools::detail::VerifierDimLayer<dims...>::template
VerifierIdxLayer<idxs...>::IsValid(),
"Index out of bounds");
using VerifiedPipe =
sycl::ext::intel::pipe<StructId<idxs...>, BaseTy, min_depth>;
};
// helpers for accessing the dimensions of the pipe array
// usage:
// MyPipeArray::GetNumDims() - number of dimensions in this pipe array
// MyPipeArray::GetDimSize<3>() - size of dimension 3 in this pipe array
static constexpr size_t GetNumDims() { return (sizeof...(dims)); }
template <int dim_num>
static constexpr size_t GetDimSize() {
return std::get<dim_num>(dims...);
}
// PipeAt<idxs...> is used to reference a pipe at a particular index
template <size_t... idxs>
using PipeAt = typename VerifyIndices<idxs...>::VerifiedPipe;
// functor to impllement blocking write to all pipes in the array
template <std::size_t... I>
struct BlockingWriteFunc {
void operator()(const BaseTy &data, bool &success) const {
PipeAt<I...>::write(data);
}
};
// functor to impllement non-blocking write to all pipes in the array
template <std::size_t... I>
struct NonBlockingWriteFunc {
void operator()(const BaseTy &data, bool &success) const {
PipeAt<I...>::write(data, success);
}
};
// helper function for implementing write() call to all pipes in the array
template <template <std::size_t...> class WriteFunc,
typename... IndexSequences>
static void write_currying_helper(const BaseTy &data, bool &success,
IndexSequences...) {
fpga_tools::detail::write_currying<WriteFunc, BaseTy,
std::index_sequence<>, IndexSequences...>()(data, success);
}
// blocking write
// write the same data to all pipes in the array using blocking writes
static void write(const BaseTy &data) {
bool success; // temporary variable, ignored in BlockingWriteFunc
write_currying_helper<BlockingWriteFunc>(
data, success, std::make_index_sequence<dims>()...);
}
// non-blocking write
// write the same data to all pipes in the array using non-blocking writes
static void write(const BaseTy &data, bool &success) {
write_currying_helper<NonBlockingWriteFunc>(
data, success, std::make_index_sequence<dims>()...);
}
}; // end of struct PipeArray
// =============================================================
// PipeDuplicator
// =============================================================
// Connect a kernel that writes to a single pipe to multiple pipe instances,
// each of which will receive the same data.
// A blocking write will perform a blocking write to each pipe. A non-blocking
// write will perform a non-blocking write to each pipe, and set success to
// true only if ALL writes were successful.
// primary template, dummy
template <class Id, // name of this PipeDuplicator
typename T, // data type to transfer
typename... Pipes // all pipes to send duplicated writes to
>
struct PipeDuplicator {};
// recursive case, write to each pipe
template <class Id, // name of this PipeDuplicator
typename T, // data type to transfer
typename FirstPipe, // at least one output pipe
typename... RemainingPipes // additional copies of the output pipe
>
struct PipeDuplicator<Id, T, FirstPipe, RemainingPipes...> {
PipeDuplicator() = delete; // ensure we cannot create an instance
// Non-blocking write
static void write(const T &data, bool &success) {
bool local_success;
FirstPipe::write(data, local_success);
success = local_success;
PipeDuplicator<Id, T, RemainingPipes...>::write(data, local_success);
success &= local_success;
}
// Blocking write
static void write(const T &data) {
FirstPipe::write(data);
PipeDuplicator<Id, T, RemainingPipes...>::write(data);
}
};
// base case for recursion, no pipes to write to
// also useful as a 'null' pipe, writes don't do anything
template <class Id, // name of this PipeDuplicator
typename T // data type to transfer
>
struct PipeDuplicator<Id, T> {
PipeDuplicator() = delete; // ensure we cannot create an instance
// Non-blocking write
static void write(const T & /*data*/, bool &success) { success = true; }
// Blocking write
static void write(const T & /*data*/) {
// do nothing
}
};
} // namespace fpga_tools
#endif /* __PIPE_UTILS_HPP__ */