annotate liboffloadmic/runtime/offload_engine.h @ 136:4627f235cf2a

fix c-next example
author Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date Thu, 08 Nov 2018 14:11:56 +0900
parents 04ced10e8804
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
111
kono
parents:
diff changeset
1 /*
kono
parents:
diff changeset
2 Copyright (c) 2014-2016 Intel Corporation. All Rights Reserved.
kono
parents:
diff changeset
3
kono
parents:
diff changeset
4 Redistribution and use in source and binary forms, with or without
kono
parents:
diff changeset
5 modification, are permitted provided that the following conditions
kono
parents:
diff changeset
6 are met:
kono
parents:
diff changeset
7
kono
parents:
diff changeset
8 * Redistributions of source code must retain the above copyright
kono
parents:
diff changeset
9 notice, this list of conditions and the following disclaimer.
kono
parents:
diff changeset
10 * Redistributions in binary form must reproduce the above copyright
kono
parents:
diff changeset
11 notice, this list of conditions and the following disclaimer in the
kono
parents:
diff changeset
12 documentation and/or other materials provided with the distribution.
kono
parents:
diff changeset
13 * Neither the name of Intel Corporation nor the names of its
kono
parents:
diff changeset
14 contributors may be used to endorse or promote products derived
kono
parents:
diff changeset
15 from this software without specific prior written permission.
kono
parents:
diff changeset
16
kono
parents:
diff changeset
17 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
kono
parents:
diff changeset
18 "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
kono
parents:
diff changeset
19 LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
kono
parents:
diff changeset
20 A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
kono
parents:
diff changeset
21 HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
kono
parents:
diff changeset
22 SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
kono
parents:
diff changeset
23 LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
kono
parents:
diff changeset
24 DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
kono
parents:
diff changeset
25 THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
kono
parents:
diff changeset
26 (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
kono
parents:
diff changeset
27 OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
kono
parents:
diff changeset
28 */
kono
parents:
diff changeset
29
kono
parents:
diff changeset
30
kono
parents:
diff changeset
31 #ifndef OFFLOAD_ENGINE_H_INCLUDED
kono
parents:
diff changeset
32 #define OFFLOAD_ENGINE_H_INCLUDED
kono
parents:
diff changeset
33
kono
parents:
diff changeset
34 #include <limits.h>
kono
parents:
diff changeset
35 #include <bitset>
kono
parents:
diff changeset
36 #include <list>
kono
parents:
diff changeset
37 #include <set>
kono
parents:
diff changeset
38 #include <map>
kono
parents:
diff changeset
39 #include "offload_common.h"
kono
parents:
diff changeset
40 #include "coi/coi_client.h"
kono
parents:
diff changeset
41
kono
parents:
diff changeset
42 #define SIGNAL_HAS_COMPLETED ((OffloadDescriptor *)-1)
kono
parents:
diff changeset
43 const int64_t no_stream = -1;
kono
parents:
diff changeset
44
kono
parents:
diff changeset
// Half-open range of addresses [start, start + length).
class MemRange {
public:
    // Creates an empty range anchored at the null address.
    MemRange() : m_start(0), m_length(0) {}

    // Creates a range of len bytes that begins at addr.
    MemRange(const void *addr, uint64_t len) : m_start(addr), m_length(len) {}

    // First address covered by the range.
    const void* start() const { return m_start; }

    // Address one byte past the last covered address.
    const void* end() const {
        const char *first_byte = static_cast<const char*>(m_start);
        return first_byte + m_length;
    }

    // Number of bytes covered by the range.
    uint64_t length() const { return m_length; }

    // Returns true when this range and o share at least one address.
    // Ranges A[start, end) and B[start, end) intersect exactly when
    // A.start < B.end and A.end > B.start.
    bool overlaps(const MemRange &o) const {
        const bool begins_before_other_ends = start() < o.end();
        const bool ends_after_other_begins = end() > o.start();
        return begins_before_other_ends && ends_after_other_begins;
    }

    // Returns true when every address of o lies inside this range.
    bool contains(const MemRange &o) const {
        const bool covers_front = start() <= o.start();
        const bool covers_back = o.end() <= end();
        return covers_front && covers_back;
    }

private:
    const void* m_start;   // first address of the range
    uint64_t    m_length;  // size of the range in bytes
};
kono
parents:
diff changeset
79
kono
parents:
diff changeset
80 // Data associated with a pointer variable
kono
parents:
diff changeset
81 class PtrData {
kono
parents:
diff changeset
82 public:
kono
parents:
diff changeset
83 PtrData(const void *addr, uint64_t len) :
kono
parents:
diff changeset
84 cpu_addr(addr, len), cpu_buf(0),
kono
parents:
diff changeset
85 mic_addr(0), alloc_disp(0), mic_buf(0), mic_offset(0),
kono
parents:
diff changeset
86 ref_count(0), is_static(false), is_omp_associate(false)
kono
parents:
diff changeset
87 {}
kono
parents:
diff changeset
88
kono
parents:
diff changeset
89 //
kono
parents:
diff changeset
90 // Copy constructor
kono
parents:
diff changeset
91 //
kono
parents:
diff changeset
92 PtrData(const PtrData& ptr):
kono
parents:
diff changeset
93 cpu_addr(ptr.cpu_addr), cpu_buf(ptr.cpu_buf),
kono
parents:
diff changeset
94 mic_addr(ptr.mic_addr), alloc_disp(ptr.alloc_disp),
kono
parents:
diff changeset
95 mic_buf(ptr.mic_buf), mic_offset(ptr.mic_offset),
kono
parents:
diff changeset
96 ref_count(ptr.ref_count), is_static(ptr.is_static),
kono
parents:
diff changeset
97 is_omp_associate(ptr.is_omp_associate),
kono
parents:
diff changeset
98 var_alloc_type(0)
kono
parents:
diff changeset
99 {}
kono
parents:
diff changeset
100
kono
parents:
diff changeset
101 bool operator<(const PtrData &o) const {
kono
parents:
diff changeset
102 // Variables are sorted by the CPU start address.
kono
parents:
diff changeset
103 // Overlapping memory ranges are considered equal.
kono
parents:
diff changeset
104 return (cpu_addr.start() < o.cpu_addr.start()) &&
kono
parents:
diff changeset
105 !cpu_addr.overlaps(o.cpu_addr);
kono
parents:
diff changeset
106 }
kono
parents:
diff changeset
107
kono
parents:
diff changeset
108 long add_reference() {
kono
parents:
diff changeset
109 if (is_omp_associate || (is_static && !var_alloc_type)) {
kono
parents:
diff changeset
110 return LONG_MAX;
kono
parents:
diff changeset
111 }
kono
parents:
diff changeset
112 #ifndef TARGET_WINNT
kono
parents:
diff changeset
113 return __sync_fetch_and_add(&ref_count, 1);
kono
parents:
diff changeset
114 #else // TARGET_WINNT
kono
parents:
diff changeset
115 return _InterlockedIncrement(&ref_count) - 1;
kono
parents:
diff changeset
116 #endif // TARGET_WINNT
kono
parents:
diff changeset
117 }
kono
parents:
diff changeset
118
kono
parents:
diff changeset
119 long remove_reference() {
kono
parents:
diff changeset
120 if (is_omp_associate || (is_static && !var_alloc_type)) {
kono
parents:
diff changeset
121 return LONG_MAX;
kono
parents:
diff changeset
122 }
kono
parents:
diff changeset
123 #ifndef TARGET_WINNT
kono
parents:
diff changeset
124 return __sync_sub_and_fetch(&ref_count, 1);
kono
parents:
diff changeset
125 #else // TARGET_WINNT
kono
parents:
diff changeset
126 return _InterlockedDecrement(&ref_count);
kono
parents:
diff changeset
127 #endif // TARGET_WINNT
kono
parents:
diff changeset
128 }
kono
parents:
diff changeset
129
kono
parents:
diff changeset
130 long get_reference() const {
kono
parents:
diff changeset
131 if (is_omp_associate || (is_static && !var_alloc_type)) {
kono
parents:
diff changeset
132 return LONG_MAX;
kono
parents:
diff changeset
133 }
kono
parents:
diff changeset
134 return ref_count;
kono
parents:
diff changeset
135 }
kono
parents:
diff changeset
136
kono
parents:
diff changeset
137 public:
kono
parents:
diff changeset
138 // CPU address range
kono
parents:
diff changeset
139 const MemRange cpu_addr;
kono
parents:
diff changeset
140
kono
parents:
diff changeset
141 // CPU and MIC buffers
kono
parents:
diff changeset
142 COIBUFFER cpu_buf;
kono
parents:
diff changeset
143 COIBUFFER mic_buf;
kono
parents:
diff changeset
144
kono
parents:
diff changeset
145 // placeholder for buffer address on mic
kono
parents:
diff changeset
146 uint64_t mic_addr;
kono
parents:
diff changeset
147
kono
parents:
diff changeset
148 uint64_t alloc_disp;
kono
parents:
diff changeset
149
kono
parents:
diff changeset
150 // additional offset to pointer data on MIC for improving bandwidth for
kono
parents:
diff changeset
151 // data which is not 4K aligned
kono
parents:
diff changeset
152 uint32_t mic_offset;
kono
parents:
diff changeset
153
kono
parents:
diff changeset
154 // if true buffers are created from static memory
kono
parents:
diff changeset
155 bool is_static;
kono
parents:
diff changeset
156
kono
parents:
diff changeset
157 // true if MIC buffer created by omp_target_associate
kono
parents:
diff changeset
158 bool is_omp_associate;
kono
parents:
diff changeset
159
kono
parents:
diff changeset
160 bool var_alloc_type;
kono
parents:
diff changeset
161 mutex_t alloc_ptr_data_lock;
kono
parents:
diff changeset
162
kono
parents:
diff changeset
163 private:
kono
parents:
diff changeset
164 // reference count for the entry
kono
parents:
diff changeset
165 long ref_count;
kono
parents:
diff changeset
166 };
kono
parents:
diff changeset
167
kono
parents:
diff changeset
168 typedef std::list<PtrData*> PtrDataList;
kono
parents:
diff changeset
169
kono
parents:
diff changeset
170 class PtrDataTable {
kono
parents:
diff changeset
171 public:
kono
parents:
diff changeset
172 typedef std::set<PtrData> PtrSet;
kono
parents:
diff changeset
173
kono
parents:
diff changeset
174 PtrData* find_ptr_data(const void *ptr) {
kono
parents:
diff changeset
175 m_ptr_lock.lock();
kono
parents:
diff changeset
176 PtrSet::iterator res = list.find(PtrData(ptr, 0));
kono
parents:
diff changeset
177
kono
parents:
diff changeset
178 m_ptr_lock.unlock();
kono
parents:
diff changeset
179 if (res == list.end()) {
kono
parents:
diff changeset
180 return 0;
kono
parents:
diff changeset
181 }
kono
parents:
diff changeset
182 return const_cast<PtrData*>(res.operator->());
kono
parents:
diff changeset
183 }
kono
parents:
diff changeset
184
kono
parents:
diff changeset
185 PtrData* insert_ptr_data(const void *ptr, uint64_t len, bool &is_new) {
kono
parents:
diff changeset
186 m_ptr_lock.lock();
kono
parents:
diff changeset
187 std::pair<PtrSet::iterator, bool> res =
kono
parents:
diff changeset
188 list.insert(PtrData(ptr, len));
kono
parents:
diff changeset
189
kono
parents:
diff changeset
190 PtrData* ptr_data = const_cast<PtrData*>(res.first.operator->());
kono
parents:
diff changeset
191 m_ptr_lock.unlock();
kono
parents:
diff changeset
192
kono
parents:
diff changeset
193 is_new = res.second;
kono
parents:
diff changeset
194 if (is_new) {
kono
parents:
diff changeset
195 // It's necessary to lock as soon as possible.
kono
parents:
diff changeset
196 // unlock must be done at call site of insert_ptr_data at
kono
parents:
diff changeset
197 // branch for is_new
kono
parents:
diff changeset
198 ptr_data->alloc_ptr_data_lock.lock();
kono
parents:
diff changeset
199 }
kono
parents:
diff changeset
200 return ptr_data;
kono
parents:
diff changeset
201 }
kono
parents:
diff changeset
202
kono
parents:
diff changeset
203 void remove_ptr_data(const void *ptr) {
kono
parents:
diff changeset
204 m_ptr_lock.lock();
kono
parents:
diff changeset
205 list.erase(PtrData(ptr, 0));
kono
parents:
diff changeset
206 m_ptr_lock.unlock();
kono
parents:
diff changeset
207 }
kono
parents:
diff changeset
208 private:
kono
parents:
diff changeset
209
kono
parents:
diff changeset
210 PtrSet list;
kono
parents:
diff changeset
211 mutex_t m_ptr_lock;
kono
parents:
diff changeset
212 };
kono
parents:
diff changeset
213
kono
parents:
diff changeset
214 // Data associated with automatic variable
kono
parents:
diff changeset
215 class AutoData {
kono
parents:
diff changeset
216 public:
kono
parents:
diff changeset
217 AutoData(const void *addr, uint64_t len) :
kono
parents:
diff changeset
218 cpu_addr(addr, len), ref_count(0)
kono
parents:
diff changeset
219 {}
kono
parents:
diff changeset
220
kono
parents:
diff changeset
221 bool operator<(const AutoData &o) const {
kono
parents:
diff changeset
222 // Variables are sorted by the CPU start address.
kono
parents:
diff changeset
223 // Overlapping memory ranges are considered equal.
kono
parents:
diff changeset
224 return (cpu_addr.start() < o.cpu_addr.start()) &&
kono
parents:
diff changeset
225 !cpu_addr.overlaps(o.cpu_addr);
kono
parents:
diff changeset
226 }
kono
parents:
diff changeset
227
kono
parents:
diff changeset
228 long add_reference() {
kono
parents:
diff changeset
229 #ifndef TARGET_WINNT
kono
parents:
diff changeset
230 return __sync_fetch_and_add(&ref_count, 1);
kono
parents:
diff changeset
231 #else // TARGET_WINNT
kono
parents:
diff changeset
232 return _InterlockedIncrement(&ref_count) - 1;
kono
parents:
diff changeset
233 #endif // TARGET_WINNT
kono
parents:
diff changeset
234 }
kono
parents:
diff changeset
235
kono
parents:
diff changeset
236 long remove_reference() {
kono
parents:
diff changeset
237 #ifndef TARGET_WINNT
kono
parents:
diff changeset
238 return __sync_sub_and_fetch(&ref_count, 1);
kono
parents:
diff changeset
239 #else // TARGET_WINNT
kono
parents:
diff changeset
240 return _InterlockedDecrement(&ref_count);
kono
parents:
diff changeset
241 #endif // TARGET_WINNT
kono
parents:
diff changeset
242 }
kono
parents:
diff changeset
243
kono
parents:
diff changeset
244 long nullify_reference() {
kono
parents:
diff changeset
245 #ifndef TARGET_WINNT
kono
parents:
diff changeset
246 return __sync_lock_test_and_set(&ref_count, 0);
kono
parents:
diff changeset
247 #else // TARGET_WINNT
kono
parents:
diff changeset
248 return _InterlockedExchange(&ref_count,0);
kono
parents:
diff changeset
249 #endif // TARGET_WINNT
kono
parents:
diff changeset
250 }
kono
parents:
diff changeset
251
kono
parents:
diff changeset
252 long get_reference() const {
kono
parents:
diff changeset
253 return ref_count;
kono
parents:
diff changeset
254 }
kono
parents:
diff changeset
255
kono
parents:
diff changeset
256 public:
kono
parents:
diff changeset
257 // CPU address range
kono
parents:
diff changeset
258 const MemRange cpu_addr;
kono
parents:
diff changeset
259
kono
parents:
diff changeset
260 private:
kono
parents:
diff changeset
261 // reference count for the entry
kono
parents:
diff changeset
262 long ref_count;
kono
parents:
diff changeset
263 };
kono
parents:
diff changeset
264
kono
parents:
diff changeset
265 // Set of automatic variables
kono
parents:
diff changeset
266 typedef std::set<AutoData> AutoSet;
kono
parents:
diff changeset
267
kono
parents:
diff changeset
// Description of one target image. All pointers are stored as given;
// nothing is copied.
struct TargetImage
{
    // Records the library name, the image contents and their size, and the
    // file of origin together with the offset within that file.
    TargetImage(const char *_name, const void *_data, uint64_t _size,
                const char *_origin, uint64_t _offset) :
        name(_name),
        data(_data),
        size(_size),
        origin(_origin),
        offset(_offset)
    {}

    const char* name;    // library name

    const void* data;    // image contents
    uint64_t    size;    // size of the contents

    const char* origin;  // file of origin
    uint64_t    offset;  // offset within the file of origin
};
kono
parents:
diff changeset
288
kono
parents:
diff changeset
289 typedef std::list<TargetImage> TargetImageList;
kono
parents:
diff changeset
290
kono
parents:
diff changeset
291 // dynamic library and Image associated with lib
kono
parents:
diff changeset
292 struct DynLib
kono
parents:
diff changeset
293 {
kono
parents:
diff changeset
294 DynLib(const char *_name, const void *_data,
kono
parents:
diff changeset
295 COILIBRARY _lib) :
kono
parents:
diff changeset
296 name(_name), data(_data), lib(_lib)
kono
parents:
diff changeset
297 {}
kono
parents:
diff changeset
298 // library name
kono
parents:
diff changeset
299 const char* name;
kono
parents:
diff changeset
300
kono
parents:
diff changeset
301 // contents
kono
parents:
diff changeset
302 const void* data;
kono
parents:
diff changeset
303
kono
parents:
diff changeset
304 COILIBRARY lib;
kono
parents:
diff changeset
305 };
kono
parents:
diff changeset
306 typedef std::list<DynLib> DynLibList;
kono
parents:
diff changeset
307
kono
parents:
diff changeset
308 // Data associated with persistent auto objects
kono
parents:
diff changeset
309 struct PersistData
kono
parents:
diff changeset
310 {
kono
parents:
diff changeset
311 PersistData(const void *addr, uint64_t routine_num,
kono
parents:
diff changeset
312 uint64_t size, uint64_t thread) :
kono
parents:
diff changeset
313 stack_cpu_addr(addr), routine_id(routine_num), thread_id(thread)
kono
parents:
diff changeset
314 {
kono
parents:
diff changeset
315 stack_ptr_data = new PtrData(0, size);
kono
parents:
diff changeset
316 }
kono
parents:
diff changeset
317 // 1-st key value - beginning of the stack at CPU
kono
parents:
diff changeset
318 const void * stack_cpu_addr;
kono
parents:
diff changeset
319 // 2-nd key value - identifier of routine invocation at CPU
kono
parents:
diff changeset
320 uint64_t routine_id;
kono
parents:
diff changeset
321 // 3-rd key value - thread identifier
kono
parents:
diff changeset
322 uint64_t thread_id;
kono
parents:
diff changeset
323
kono
parents:
diff changeset
324 // corresponded PtrData; only stack_ptr_data->mic_buf is used
kono
parents:
diff changeset
325 PtrData * stack_ptr_data;
kono
parents:
diff changeset
326 // used to get offset of the variable in stack buffer
kono
parents:
diff changeset
327 char * cpu_stack_addr;
kono
parents:
diff changeset
328 };
kono
parents:
diff changeset
329
kono
parents:
diff changeset
330 typedef std::list<PersistData> PersistDataList;
kono
parents:
diff changeset
331
kono
parents:
diff changeset
332 // Data associated with stream
kono
parents:
diff changeset
333 struct Stream
kono
parents:
diff changeset
334 {
kono
parents:
diff changeset
335 Stream(int device, int num_of_cpus) :
kono
parents:
diff changeset
336 m_number_of_cpus(num_of_cpus), m_pipeline(0), m_last_offload(0),
kono
parents:
diff changeset
337 m_device(device)
kono
parents:
diff changeset
338 {}
kono
parents:
diff changeset
339 ~Stream() {
kono
parents:
diff changeset
340 if (m_pipeline) {
kono
parents:
diff changeset
341 COI::PipelineDestroy(m_pipeline);
kono
parents:
diff changeset
342 }
kono
parents:
diff changeset
343 }
kono
parents:
diff changeset
344
kono
parents:
diff changeset
345 COIPIPELINE get_pipeline(void) {
kono
parents:
diff changeset
346 return(m_pipeline);
kono
parents:
diff changeset
347 }
kono
parents:
diff changeset
348
kono
parents:
diff changeset
349 int get_device(void) {
kono
parents:
diff changeset
350 return(m_device);
kono
parents:
diff changeset
351 }
kono
parents:
diff changeset
352
kono
parents:
diff changeset
353 int get_cpu_number(void) {
kono
parents:
diff changeset
354 return(m_number_of_cpus);
kono
parents:
diff changeset
355 }
kono
parents:
diff changeset
356
kono
parents:
diff changeset
357 void set_pipeline(COIPIPELINE pipeline) {
kono
parents:
diff changeset
358 m_pipeline = pipeline;
kono
parents:
diff changeset
359 }
kono
parents:
diff changeset
360
kono
parents:
diff changeset
361 OffloadDescriptor* get_last_offload(void) {
kono
parents:
diff changeset
362 return(m_last_offload);
kono
parents:
diff changeset
363 }
kono
parents:
diff changeset
364
kono
parents:
diff changeset
365 void set_last_offload(OffloadDescriptor* last_offload) {
kono
parents:
diff changeset
366 m_last_offload = last_offload;
kono
parents:
diff changeset
367 }
kono
parents:
diff changeset
368
kono
parents:
diff changeset
369 static Stream* find_stream(uint64_t handle, bool remove);
kono
parents:
diff changeset
370
kono
parents:
diff changeset
371 static _Offload_stream add_stream(int device, int number_of_cpus) {
kono
parents:
diff changeset
372 _Offload_stream result;
kono
parents:
diff changeset
373 m_stream_lock.lock();
kono
parents:
diff changeset
374 result = ++m_streams_count;
kono
parents:
diff changeset
375 all_streams[m_streams_count] = new Stream(device, number_of_cpus);
kono
parents:
diff changeset
376 m_stream_lock.unlock();
kono
parents:
diff changeset
377 return(result);
kono
parents:
diff changeset
378 }
kono
parents:
diff changeset
379
kono
parents:
diff changeset
380 static uint64_t get_streams_count() {
kono
parents:
diff changeset
381 return m_streams_count;
kono
parents:
diff changeset
382 }
kono
parents:
diff changeset
383
kono
parents:
diff changeset
384 typedef std::map<uint64_t, Stream*> StreamMap;
kono
parents:
diff changeset
385
kono
parents:
diff changeset
386 static uint64_t m_streams_count;
kono
parents:
diff changeset
387 static StreamMap all_streams;
kono
parents:
diff changeset
388 static mutex_t m_stream_lock;
kono
parents:
diff changeset
389
kono
parents:
diff changeset
390 int m_device;
kono
parents:
diff changeset
391
kono
parents:
diff changeset
392 // number of cpus
kono
parents:
diff changeset
393 int m_number_of_cpus;
kono
parents:
diff changeset
394
kono
parents:
diff changeset
395 // The pipeline associated with the stream
kono
parents:
diff changeset
396 COIPIPELINE m_pipeline;
kono
parents:
diff changeset
397
kono
parents:
diff changeset
398 // The last offload occured via the stream
kono
parents:
diff changeset
399 OffloadDescriptor* m_last_offload;
kono
parents:
diff changeset
400
kono
parents:
diff changeset
401 // Cpus used by the stream
kono
parents:
diff changeset
402 std::bitset<COI_MAX_HW_THREADS> m_stream_cpus;
kono
parents:
diff changeset
403 };
kono
parents:
diff changeset
404
kono
parents:
diff changeset
405 typedef std::map<uint64_t, Stream*> StreamMap;
kono
parents:
diff changeset
406 typedef std::bitset<COI_MAX_HW_THREADS> micLcpuMask;
kono
parents:
diff changeset
407
kono
parents:
diff changeset
// Node of a doubly linked list of cpus used by streams; the list is kept
// ordered by count.
typedef struct CpuEl {
    // number of streams using the cpu
    uint64_t count;
    // neighbour whose count is the same or lesser
    struct CpuEl *prev;
    // neighbour whose count is the same or greater
    struct CpuEl *next;
} CpuEl;
kono
parents:
diff changeset
414
kono
parents:
diff changeset
415 // class representing a single engine
kono
parents:
diff changeset
416 struct Engine {
kono
parents:
diff changeset
417 friend void __offload_init_library_once(void);
kono
parents:
diff changeset
418 friend void __offload_fini_library(void);
kono
parents:
diff changeset
419
kono
parents:
diff changeset
420 #define CPU_INDEX(x) (x - m_cpus)
kono
parents:
diff changeset
421 #define check_result(res, tag, ...) \
kono
parents:
diff changeset
422 { \
kono
parents:
diff changeset
423 if (res == COI_PROCESS_DIED) { \
kono
parents:
diff changeset
424 fini_process(true); \
kono
parents:
diff changeset
425 exit(1); \
kono
parents:
diff changeset
426 } \
kono
parents:
diff changeset
427 if (res != COI_SUCCESS) { \
kono
parents:
diff changeset
428 __liboffload_error_support(tag, __VA_ARGS__); \
kono
parents:
diff changeset
429 exit(1); \
kono
parents:
diff changeset
430 } \
kono
parents:
diff changeset
431 }
kono
parents:
diff changeset
432
kono
parents:
diff changeset
433 int get_logical_index() const {
kono
parents:
diff changeset
434 return m_index;
kono
parents:
diff changeset
435 }
kono
parents:
diff changeset
436
kono
parents:
diff changeset
437 int get_physical_index() const {
kono
parents:
diff changeset
438 return m_physical_index;
kono
parents:
diff changeset
439 }
kono
parents:
diff changeset
440
kono
parents:
diff changeset
441 const COIPROCESS& get_process() const {
kono
parents:
diff changeset
442 return m_process;
kono
parents:
diff changeset
443 }
kono
parents:
diff changeset
444
kono
parents:
diff changeset
445 bool get_ready() {
kono
parents:
diff changeset
446 return m_ready;
kono
parents:
diff changeset
447 }
kono
parents:
diff changeset
448
kono
parents:
diff changeset
449 uint64_t get_thread_id(void);
kono
parents:
diff changeset
450
kono
parents:
diff changeset
451 // initialize device
kono
parents:
diff changeset
452 void init(void);
kono
parents:
diff changeset
453
kono
parents:
diff changeset
454 // unload library
kono
parents:
diff changeset
455 void unload_library(const void *data, const char *name);
kono
parents:
diff changeset
456
kono
parents:
diff changeset
457 // add new library
kono
parents:
diff changeset
458 void add_lib(const TargetImage &lib)
kono
parents:
diff changeset
459 {
kono
parents:
diff changeset
460 m_lock.lock();
kono
parents:
diff changeset
461 m_ready = false;
kono
parents:
diff changeset
462 m_images.push_back(lib);
kono
parents:
diff changeset
463 m_lock.unlock();
kono
parents:
diff changeset
464 }
kono
parents:
diff changeset
465
kono
parents:
diff changeset
466 COIRESULT compute(
kono
parents:
diff changeset
467 _Offload_stream stream,
kono
parents:
diff changeset
468 const std::list<COIBUFFER> &buffers,
kono
parents:
diff changeset
469 const void* data,
kono
parents:
diff changeset
470 uint16_t data_size,
kono
parents:
diff changeset
471 void* ret,
kono
parents:
diff changeset
472 uint16_t ret_size,
kono
parents:
diff changeset
473 uint32_t num_deps,
kono
parents:
diff changeset
474 const COIEVENT* deps,
kono
parents:
diff changeset
475 COIEVENT* event
kono
parents:
diff changeset
476 );
kono
parents:
diff changeset
477
kono
parents:
diff changeset
478 #ifdef MYO_SUPPORT
kono
parents:
diff changeset
479 // temporary workaround for blocking behavior for myoiLibInit/Fini calls
kono
parents:
diff changeset
480 void init_myo(COIEVENT *event) {
kono
parents:
diff changeset
481 COIRESULT res;
kono
parents:
diff changeset
482 res = COI::PipelineRunFunction(get_pipeline(),
kono
parents:
diff changeset
483 m_funcs[c_func_myo_init],
kono
parents:
diff changeset
484 0, 0, 0, 0, 0, 0, 0, 0, 0,
kono
parents:
diff changeset
485 event);
kono
parents:
diff changeset
486 check_result(res, c_pipeline_run_func, m_index, res);
kono
parents:
diff changeset
487 }
kono
parents:
diff changeset
488
kono
parents:
diff changeset
489 void fini_myo(COIEVENT *event) {
kono
parents:
diff changeset
490 COIRESULT res;
kono
parents:
diff changeset
491 res = COI::PipelineRunFunction(get_pipeline(),
kono
parents:
diff changeset
492 m_funcs[c_func_myo_fini],
kono
parents:
diff changeset
493 0, 0, 0, 0, 0, 0, 0, 0, 0,
kono
parents:
diff changeset
494 event);
kono
parents:
diff changeset
495 check_result(res, c_pipeline_run_func, m_index, res);
kono
parents:
diff changeset
496 }
kono
parents:
diff changeset
497 #endif // MYO_SUPPORT
kono
parents:
diff changeset
498
kono
parents:
diff changeset
499 //
kono
parents:
diff changeset
500 // Memory association table
kono
parents:
diff changeset
501 //
kono
parents:
diff changeset
502 PtrData* find_ptr_data(const void *ptr) {
kono
parents:
diff changeset
503 return m_ptr_set.find_ptr_data(ptr);
kono
parents:
diff changeset
504 }
kono
parents:
diff changeset
505
kono
parents:
diff changeset
506 PtrData* find_targetptr_data(const void *ptr) {
kono
parents:
diff changeset
507 return m_targetptr_set.find_ptr_data(ptr);
kono
parents:
diff changeset
508 }
kono
parents:
diff changeset
509
kono
parents:
diff changeset
510 PtrData* insert_ptr_data(const void *ptr, uint64_t len, bool &is_new) {
kono
parents:
diff changeset
511 return m_ptr_set.insert_ptr_data(ptr, len, is_new);
kono
parents:
diff changeset
512 }
kono
parents:
diff changeset
513
kono
parents:
diff changeset
514 PtrData* insert_targetptr_data(const void *ptr, uint64_t len,
kono
parents:
diff changeset
515 bool &is_new) {
kono
parents:
diff changeset
516 return m_targetptr_set.insert_ptr_data(ptr, len, is_new);
kono
parents:
diff changeset
517 }
kono
parents:
diff changeset
518
kono
parents:
diff changeset
519 void remove_ptr_data(const void *ptr) {
kono
parents:
diff changeset
520 m_ptr_set.remove_ptr_data(ptr);
kono
parents:
diff changeset
521 }
kono
parents:
diff changeset
522
kono
parents:
diff changeset
523 void remove_targetptr_data(const void *ptr) {
kono
parents:
diff changeset
524 m_targetptr_set.remove_ptr_data(ptr);
kono
parents:
diff changeset
525 }
kono
parents:
diff changeset
526
kono
parents:
diff changeset
527 //
kono
parents:
diff changeset
528 // Automatic variables
kono
parents:
diff changeset
529 //
kono
parents:
diff changeset
530 AutoData* find_auto_data(const void *ptr) {
kono
parents:
diff changeset
531 AutoSet &auto_vars = get_auto_vars();
kono
parents:
diff changeset
532 AutoSet::iterator res = auto_vars.find(AutoData(ptr, 0));
kono
parents:
diff changeset
533 if (res == auto_vars.end()) {
kono
parents:
diff changeset
534 return 0;
kono
parents:
diff changeset
535 }
kono
parents:
diff changeset
536 return const_cast<AutoData*>(res.operator->());
kono
parents:
diff changeset
537 }
kono
parents:
diff changeset
538
kono
parents:
diff changeset
539 AutoData* insert_auto_data(const void *ptr, uint64_t len) {
kono
parents:
diff changeset
540 AutoSet &auto_vars = get_auto_vars();
kono
parents:
diff changeset
541 std::pair<AutoSet::iterator, bool> res =
kono
parents:
diff changeset
542 auto_vars.insert(AutoData(ptr, len));
kono
parents:
diff changeset
543 return const_cast<AutoData*>(res.first.operator->());
kono
parents:
diff changeset
544 }
kono
parents:
diff changeset
545
kono
parents:
diff changeset
546 void remove_auto_data(const void *ptr) {
kono
parents:
diff changeset
547 get_auto_vars().erase(AutoData(ptr, 0));
kono
parents:
diff changeset
548 }
kono
parents:
diff changeset
549
kono
parents:
diff changeset
550 //
kono
parents:
diff changeset
551 // Signals
kono
parents:
diff changeset
552 //
kono
parents:
diff changeset
553 void add_signal(const void *signal, OffloadDescriptor *desc) {
kono
parents:
diff changeset
554 m_signal_lock.lock();
kono
parents:
diff changeset
555 m_signal_map[signal] = desc;
kono
parents:
diff changeset
556 m_signal_lock.unlock();
kono
parents:
diff changeset
557 }
kono
parents:
diff changeset
558
kono
parents:
diff changeset
559 OffloadDescriptor* find_signal(const void *signal, bool remove) {
kono
parents:
diff changeset
560 OffloadDescriptor *desc = 0;
kono
parents:
diff changeset
561
kono
parents:
diff changeset
562 m_signal_lock.lock();
kono
parents:
diff changeset
563 {
kono
parents:
diff changeset
564 SignalMap::iterator it = m_signal_map.find(signal);
kono
parents:
diff changeset
565 if (it != m_signal_map.end()) {
kono
parents:
diff changeset
566 desc = it->second;
kono
parents:
diff changeset
567 if (remove) {
kono
parents:
diff changeset
568 it->second = SIGNAL_HAS_COMPLETED;
kono
parents:
diff changeset
569 }
kono
parents:
diff changeset
570 }
kono
parents:
diff changeset
571 }
kono
parents:
diff changeset
572 m_signal_lock.unlock();
kono
parents:
diff changeset
573
kono
parents:
diff changeset
574 return desc;
kono
parents:
diff changeset
575 }
kono
parents:
diff changeset
576
kono
parents:
diff changeset
577 void complete_signaled_ofld(const void *signal) {
kono
parents:
diff changeset
578
kono
parents:
diff changeset
579 m_signal_lock.lock();
kono
parents:
diff changeset
580 {
kono
parents:
diff changeset
581 SignalMap::iterator it = m_signal_map.find(signal);
kono
parents:
diff changeset
582 if (it != m_signal_map.end()) {
kono
parents:
diff changeset
583 it->second = SIGNAL_HAS_COMPLETED;
kono
parents:
diff changeset
584 }
kono
parents:
diff changeset
585 }
kono
parents:
diff changeset
586 m_signal_lock.unlock();
kono
parents:
diff changeset
587 }
kono
parents:
diff changeset
588
kono
parents:
diff changeset
589 void stream_destroy(_Offload_stream handle);
kono
parents:
diff changeset
590
kono
parents:
diff changeset
591 void move_cpu_el_after(CpuEl* cpu_what, CpuEl* cpu_after);
kono
parents:
diff changeset
592 void print_stream_cpu_list(const char *);
kono
parents:
diff changeset
593
kono
parents:
diff changeset
594 COIPIPELINE get_pipeline(_Offload_stream stream);
kono
parents:
diff changeset
595
kono
parents:
diff changeset
596 StreamMap get_stream_map() {
kono
parents:
diff changeset
597 return m_stream_map;
kono
parents:
diff changeset
598 }
kono
parents:
diff changeset
599
kono
parents:
diff changeset
600 // stop device process
kono
parents:
diff changeset
601 void fini_process(bool verbose);
kono
parents:
diff changeset
602
kono
parents:
diff changeset
603 // list of stacks active at the engine
kono
parents:
diff changeset
604 PersistDataList m_persist_list;
kono
parents:
diff changeset
605
kono
parents:
diff changeset
606 private:
kono
parents:
diff changeset
607 Engine() : m_index(-1), m_physical_index(-1), m_process(0), m_ready(false),
kono
parents:
diff changeset
608 m_proc_number(0), m_assigned_cpus(0), m_cpus(0), m_cpu_head(0)
kono
parents:
diff changeset
609 {}
kono
parents:
diff changeset
610
kono
parents:
diff changeset
611 ~Engine() {
kono
parents:
diff changeset
612 m_ready = false;
kono
parents:
diff changeset
613 for (StreamMap::iterator it = m_stream_map.begin();
kono
parents:
diff changeset
614 it != m_stream_map.end(); it++) {
kono
parents:
diff changeset
615 Stream * stream = it->second;
kono
parents:
diff changeset
616 delete stream;
kono
parents:
diff changeset
617 }
kono
parents:
diff changeset
618 if (m_process != 0) {
kono
parents:
diff changeset
619 fini_process(false);
kono
parents:
diff changeset
620 }
kono
parents:
diff changeset
621 if (m_assigned_cpus) {
kono
parents:
diff changeset
622 delete m_assigned_cpus;
kono
parents:
diff changeset
623 }
kono
parents:
diff changeset
624 }
kono
parents:
diff changeset
625
kono
parents:
diff changeset
626 // set indexes
kono
parents:
diff changeset
627 void set_indexes(int logical_index, int physical_index) {
kono
parents:
diff changeset
628 m_index = logical_index;
kono
parents:
diff changeset
629 m_physical_index = physical_index;
kono
parents:
diff changeset
630 }
kono
parents:
diff changeset
631
kono
parents:
diff changeset
632 // set CPU mask
kono
parents:
diff changeset
633 void set_cpu_mask(micLcpuMask *cpu_mask)
kono
parents:
diff changeset
634 {
kono
parents:
diff changeset
635 m_assigned_cpus = cpu_mask;
kono
parents:
diff changeset
636 }
kono
parents:
diff changeset
637
kono
parents:
diff changeset
638 // start process on device
kono
parents:
diff changeset
639 void init_process();
kono
parents:
diff changeset
640
kono
parents:
diff changeset
641 void load_libraries(void);
kono
parents:
diff changeset
642 void init_ptr_data(void);
kono
parents:
diff changeset
643
kono
parents:
diff changeset
644 // performs library initialization on the device side
kono
parents:
diff changeset
645 pid_t init_device(void);
kono
parents:
diff changeset
646
kono
parents:
diff changeset
647 private:
kono
parents:
diff changeset
648 // get pipeline associated with a calling thread
kono
parents:
diff changeset
649 COIPIPELINE get_pipeline(void);
kono
parents:
diff changeset
650
kono
parents:
diff changeset
651 // get automatic vars set associated with the calling thread
kono
parents:
diff changeset
652 AutoSet& get_auto_vars(void);
kono
parents:
diff changeset
653
kono
parents:
diff changeset
654 // destructor for thread data
kono
parents:
diff changeset
655 static void destroy_thread_data(void *data);
kono
parents:
diff changeset
656
kono
parents:
diff changeset
657 private:
kono
parents:
diff changeset
658 typedef std::set<PtrData> PtrSet;
kono
parents:
diff changeset
659 typedef std::map<const void*, OffloadDescriptor*> SignalMap;
kono
parents:
diff changeset
660
kono
parents:
diff changeset
661 // device indexes
kono
parents:
diff changeset
662 int m_index;
kono
parents:
diff changeset
663 int m_physical_index;
kono
parents:
diff changeset
664
kono
parents:
diff changeset
665 // cpu mask
kono
parents:
diff changeset
666 micLcpuMask *m_assigned_cpus;
kono
parents:
diff changeset
667
kono
parents:
diff changeset
668 // number of COI pipes created for the engine
kono
parents:
diff changeset
669 long m_proc_number;
kono
parents:
diff changeset
670
kono
parents:
diff changeset
671 // process handle
kono
parents:
diff changeset
672 COIPROCESS m_process;
kono
parents:
diff changeset
673
kono
parents:
diff changeset
674 // If false, device either has not been initialized or new libraries
kono
parents:
diff changeset
675 // have been added.
kono
parents:
diff changeset
676 bool m_ready;
kono
parents:
diff changeset
677 mutex_t m_lock;
kono
parents:
diff changeset
678
kono
parents:
diff changeset
679 // List of libraries to be loaded
kono
parents:
diff changeset
680 TargetImageList m_images;
kono
parents:
diff changeset
681
kono
parents:
diff changeset
682 // var tables
kono
parents:
diff changeset
683 PtrDataTable m_ptr_set;
kono
parents:
diff changeset
684 PtrDataTable m_targetptr_set;
kono
parents:
diff changeset
685
kono
parents:
diff changeset
686 // signals
kono
parents:
diff changeset
687 SignalMap m_signal_map;
kono
parents:
diff changeset
688 mutex_t m_signal_lock;
kono
parents:
diff changeset
689
kono
parents:
diff changeset
690 // streams
kono
parents:
diff changeset
691 StreamMap m_stream_map;
kono
parents:
diff changeset
692 mutex_t m_stream_lock;
kono
parents:
diff changeset
693 int m_num_cores;
kono
parents:
diff changeset
694 int m_num_threads;
kono
parents:
diff changeset
695 CpuEl* m_cpus;
kono
parents:
diff changeset
696 CpuEl* m_cpu_head;
kono
parents:
diff changeset
697
kono
parents:
diff changeset
698 // List of dynamic libraries to be registered
kono
parents:
diff changeset
699 DynLibList m_dyn_libs;
kono
parents:
diff changeset
700
kono
parents:
diff changeset
701 // constants for accessing device function handles
kono
parents:
diff changeset
702 enum {
kono
parents:
diff changeset
703 c_func_compute = 0,
kono
parents:
diff changeset
704 #ifdef MYO_SUPPORT
kono
parents:
diff changeset
705 c_func_myo_init,
kono
parents:
diff changeset
706 c_func_myo_fini,
kono
parents:
diff changeset
707 #endif // MYO_SUPPORT
kono
parents:
diff changeset
708 c_func_init,
kono
parents:
diff changeset
709 c_func_var_table_size,
kono
parents:
diff changeset
710 c_func_var_table_copy,
kono
parents:
diff changeset
711 c_func_set_stream_affinity,
kono
parents:
diff changeset
712 c_funcs_total
kono
parents:
diff changeset
713 };
kono
parents:
diff changeset
714 static const char* m_func_names[c_funcs_total];
kono
parents:
diff changeset
715
kono
parents:
diff changeset
716 // device function handles
kono
parents:
diff changeset
717 COIFUNCTION m_funcs[c_funcs_total];
kono
parents:
diff changeset
718
kono
parents:
diff changeset
719 // int -> name mapping for device signals
kono
parents:
diff changeset
720 static const int c_signal_max = 32;
kono
parents:
diff changeset
721 static const char* c_signal_names[c_signal_max];
kono
parents:
diff changeset
722 };
kono
parents:
diff changeset
723
kono
parents:
diff changeset
724 #endif // OFFLOAD_ENGINE_H_INCLUDED