annotate gcc/omp-offload.c @ 120:f93fa5091070

fix conv1.c
author mir3636
date Thu, 08 Mar 2018 14:53:42 +0900
parents 04ced10e8804
children 84e7813d76e9
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
111
kono
parents:
diff changeset
1 /* Bits of OpenMP and OpenACC handling that is specific to device offloading
kono
parents:
diff changeset
2 and a lowering pass for OpenACC device directives.
kono
parents:
diff changeset
3
kono
parents:
diff changeset
4 Copyright (C) 2005-2017 Free Software Foundation, Inc.
kono
parents:
diff changeset
5
kono
parents:
diff changeset
6 This file is part of GCC.
kono
parents:
diff changeset
7
kono
parents:
diff changeset
8 GCC is free software; you can redistribute it and/or modify it under
kono
parents:
diff changeset
9 the terms of the GNU General Public License as published by the Free
kono
parents:
diff changeset
10 Software Foundation; either version 3, or (at your option) any later
kono
parents:
diff changeset
11 version.
kono
parents:
diff changeset
12
kono
parents:
diff changeset
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
kono
parents:
diff changeset
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
kono
parents:
diff changeset
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
kono
parents:
diff changeset
16 for more details.
kono
parents:
diff changeset
17
kono
parents:
diff changeset
18 You should have received a copy of the GNU General Public License
kono
parents:
diff changeset
19 along with GCC; see the file COPYING3. If not see
kono
parents:
diff changeset
20 <http://www.gnu.org/licenses/>. */
kono
parents:
diff changeset
21
kono
parents:
diff changeset
22 #include "config.h"
kono
parents:
diff changeset
23 #include "system.h"
kono
parents:
diff changeset
24 #include "coretypes.h"
kono
parents:
diff changeset
25 #include "backend.h"
kono
parents:
diff changeset
26 #include "target.h"
kono
parents:
diff changeset
27 #include "tree.h"
kono
parents:
diff changeset
28 #include "gimple.h"
kono
parents:
diff changeset
29 #include "tree-pass.h"
kono
parents:
diff changeset
30 #include "ssa.h"
kono
parents:
diff changeset
31 #include "cgraph.h"
kono
parents:
diff changeset
32 #include "pretty-print.h"
kono
parents:
diff changeset
33 #include "diagnostic-core.h"
kono
parents:
diff changeset
34 #include "fold-const.h"
kono
parents:
diff changeset
35 #include "internal-fn.h"
kono
parents:
diff changeset
36 #include "langhooks.h"
kono
parents:
diff changeset
37 #include "gimplify.h"
kono
parents:
diff changeset
38 #include "gimple-iterator.h"
kono
parents:
diff changeset
39 #include "gimplify-me.h"
kono
parents:
diff changeset
40 #include "gimple-walk.h"
kono
parents:
diff changeset
41 #include "tree-cfg.h"
kono
parents:
diff changeset
42 #include "tree-into-ssa.h"
kono
parents:
diff changeset
43 #include "tree-nested.h"
kono
parents:
diff changeset
44 #include "stor-layout.h"
kono
parents:
diff changeset
45 #include "common/common-target.h"
kono
parents:
diff changeset
46 #include "omp-general.h"
kono
parents:
diff changeset
47 #include "omp-offload.h"
kono
parents:
diff changeset
48 #include "lto-section-names.h"
kono
parents:
diff changeset
49 #include "gomp-constants.h"
kono
parents:
diff changeset
50 #include "gimple-pretty-print.h"
kono
parents:
diff changeset
51 #include "intl.h"
kono
parents:
diff changeset
52 #include "stringpool.h"
kono
parents:
diff changeset
53 #include "attribs.h"
kono
parents:
diff changeset
54 #include "cfgloop.h"
kono
parents:
diff changeset
55
kono
parents:
diff changeset
56 /* Describe the OpenACC looping structure of a function. The entire
kono
parents:
diff changeset
57 function is held in a 'NULL' loop. */
kono
parents:
diff changeset
58
kono
parents:
diff changeset
59 struct oacc_loop
kono
parents:
diff changeset
60 {
kono
parents:
diff changeset
61 oacc_loop *parent; /* Containing loop. */
kono
parents:
diff changeset
62
kono
parents:
diff changeset
63 oacc_loop *child; /* First inner loop. */
kono
parents:
diff changeset
64
kono
parents:
diff changeset
65 oacc_loop *sibling; /* Next loop within same parent. */
kono
parents:
diff changeset
66
kono
parents:
diff changeset
67 location_t loc; /* Location of the loop start. */
kono
parents:
diff changeset
68
kono
parents:
diff changeset
69 gcall *marker; /* Initial head marker. */
kono
parents:
diff changeset
70
kono
parents:
diff changeset
71 gcall *heads[GOMP_DIM_MAX]; /* Head marker functions. */
kono
parents:
diff changeset
72 gcall *tails[GOMP_DIM_MAX]; /* Tail marker functions. */
kono
parents:
diff changeset
73
kono
parents:
diff changeset
74 tree routine; /* Pseudo-loop enclosing a routine. */
kono
parents:
diff changeset
75
kono
parents:
diff changeset
76 unsigned mask; /* Partitioning mask. */
kono
parents:
diff changeset
77 unsigned e_mask; /* Partitioning of element loops (when tiling). */
kono
parents:
diff changeset
78 unsigned inner; /* Partitioning of inner loops. */
kono
parents:
diff changeset
79 unsigned flags; /* Partitioning flags. */
kono
parents:
diff changeset
80 vec<gcall *> ifns; /* Contained loop abstraction functions. */
kono
parents:
diff changeset
81 tree chunk_size; /* Chunk size. */
kono
parents:
diff changeset
82 gcall *head_end; /* Final marker of head sequence. */
kono
parents:
diff changeset
83 };
kono
parents:
diff changeset
84
kono
parents:
diff changeset
85 /* Holds offload tables with decls. */
kono
parents:
diff changeset
86 vec<tree, va_gc> *offload_funcs, *offload_vars;
kono
parents:
diff changeset
87
kono
parents:
diff changeset
88 /* Return level at which oacc routine may spawn a partitioned loop, or
kono
parents:
diff changeset
89 -1 if it is not a routine (i.e. is an offload fn). */
kono
parents:
diff changeset
90
kono
parents:
diff changeset
91 static int
kono
parents:
diff changeset
92 oacc_fn_attrib_level (tree attr)
kono
parents:
diff changeset
93 {
kono
parents:
diff changeset
94 tree pos = TREE_VALUE (attr);
kono
parents:
diff changeset
95
kono
parents:
diff changeset
96 if (!TREE_PURPOSE (pos))
kono
parents:
diff changeset
97 return -1;
kono
parents:
diff changeset
98
kono
parents:
diff changeset
99 int ix = 0;
kono
parents:
diff changeset
100 for (ix = 0; ix != GOMP_DIM_MAX;
kono
parents:
diff changeset
101 ix++, pos = TREE_CHAIN (pos))
kono
parents:
diff changeset
102 if (!integer_zerop (TREE_PURPOSE (pos)))
kono
parents:
diff changeset
103 break;
kono
parents:
diff changeset
104
kono
parents:
diff changeset
105 return ix;
kono
parents:
diff changeset
106 }
kono
parents:
diff changeset
107
kono
parents:
diff changeset
108 /* Helper function for omp_finish_file routine. Takes decls from V_DECLS and
kono
parents:
diff changeset
109 adds their addresses and sizes to constructor-vector V_CTOR. */
kono
parents:
diff changeset
110
kono
parents:
diff changeset
111 static void
kono
parents:
diff changeset
112 add_decls_addresses_to_decl_constructor (vec<tree, va_gc> *v_decls,
kono
parents:
diff changeset
113 vec<constructor_elt, va_gc> *v_ctor)
kono
parents:
diff changeset
114 {
kono
parents:
diff changeset
115 unsigned len = vec_safe_length (v_decls);
kono
parents:
diff changeset
116 for (unsigned i = 0; i < len; i++)
kono
parents:
diff changeset
117 {
kono
parents:
diff changeset
118 tree it = (*v_decls)[i];
kono
parents:
diff changeset
119 bool is_var = VAR_P (it);
kono
parents:
diff changeset
120 bool is_link_var
kono
parents:
diff changeset
121 = is_var
kono
parents:
diff changeset
122 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
123 && DECL_HAS_VALUE_EXPR_P (it)
kono
parents:
diff changeset
124 #endif
kono
parents:
diff changeset
125 && lookup_attribute ("omp declare target link", DECL_ATTRIBUTES (it));
kono
parents:
diff changeset
126
kono
parents:
diff changeset
127 tree size = NULL_TREE;
kono
parents:
diff changeset
128 if (is_var)
kono
parents:
diff changeset
129 size = fold_convert (const_ptr_type_node, DECL_SIZE_UNIT (it));
kono
parents:
diff changeset
130
kono
parents:
diff changeset
131 tree addr;
kono
parents:
diff changeset
132 if (!is_link_var)
kono
parents:
diff changeset
133 addr = build_fold_addr_expr (it);
kono
parents:
diff changeset
134 else
kono
parents:
diff changeset
135 {
kono
parents:
diff changeset
136 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
137 /* For "omp declare target link" vars add address of the pointer to
kono
parents:
diff changeset
138 the target table, instead of address of the var. */
kono
parents:
diff changeset
139 tree value_expr = DECL_VALUE_EXPR (it);
kono
parents:
diff changeset
140 tree link_ptr_decl = TREE_OPERAND (value_expr, 0);
kono
parents:
diff changeset
141 varpool_node::finalize_decl (link_ptr_decl);
kono
parents:
diff changeset
142 addr = build_fold_addr_expr (link_ptr_decl);
kono
parents:
diff changeset
143 #else
kono
parents:
diff changeset
144 addr = build_fold_addr_expr (it);
kono
parents:
diff changeset
145 #endif
kono
parents:
diff changeset
146
kono
parents:
diff changeset
147 /* Most significant bit of the size marks "omp declare target link"
kono
parents:
diff changeset
148 vars in host and target tables. */
kono
parents:
diff changeset
149 unsigned HOST_WIDE_INT isize = tree_to_uhwi (size);
kono
parents:
diff changeset
150 isize |= 1ULL << (int_size_in_bytes (const_ptr_type_node)
kono
parents:
diff changeset
151 * BITS_PER_UNIT - 1);
kono
parents:
diff changeset
152 size = wide_int_to_tree (const_ptr_type_node, isize);
kono
parents:
diff changeset
153 }
kono
parents:
diff changeset
154
kono
parents:
diff changeset
155 CONSTRUCTOR_APPEND_ELT (v_ctor, NULL_TREE, addr);
kono
parents:
diff changeset
156 if (is_var)
kono
parents:
diff changeset
157 CONSTRUCTOR_APPEND_ELT (v_ctor, NULL_TREE, size);
kono
parents:
diff changeset
158 }
kono
parents:
diff changeset
159 }
kono
parents:
diff changeset
160
kono
parents:
diff changeset
161 /* Create new symbols containing (address, size) pairs for global variables,
kono
parents:
diff changeset
162 marked with "omp declare target" attribute, as well as addresses for the
kono
parents:
diff changeset
163 functions, which are outlined offloading regions. */
kono
parents:
diff changeset
164 void
kono
parents:
diff changeset
165 omp_finish_file (void)
kono
parents:
diff changeset
166 {
kono
parents:
diff changeset
167 unsigned num_funcs = vec_safe_length (offload_funcs);
kono
parents:
diff changeset
168 unsigned num_vars = vec_safe_length (offload_vars);
kono
parents:
diff changeset
169
kono
parents:
diff changeset
170 if (num_funcs == 0 && num_vars == 0)
kono
parents:
diff changeset
171 return;
kono
parents:
diff changeset
172
kono
parents:
diff changeset
173 if (targetm_common.have_named_sections)
kono
parents:
diff changeset
174 {
kono
parents:
diff changeset
175 vec<constructor_elt, va_gc> *v_f, *v_v;
kono
parents:
diff changeset
176 vec_alloc (v_f, num_funcs);
kono
parents:
diff changeset
177 vec_alloc (v_v, num_vars * 2);
kono
parents:
diff changeset
178
kono
parents:
diff changeset
179 add_decls_addresses_to_decl_constructor (offload_funcs, v_f);
kono
parents:
diff changeset
180 add_decls_addresses_to_decl_constructor (offload_vars, v_v);
kono
parents:
diff changeset
181
kono
parents:
diff changeset
182 tree vars_decl_type = build_array_type_nelts (pointer_sized_int_node,
kono
parents:
diff changeset
183 num_vars * 2);
kono
parents:
diff changeset
184 tree funcs_decl_type = build_array_type_nelts (pointer_sized_int_node,
kono
parents:
diff changeset
185 num_funcs);
kono
parents:
diff changeset
186 SET_TYPE_ALIGN (vars_decl_type, TYPE_ALIGN (pointer_sized_int_node));
kono
parents:
diff changeset
187 SET_TYPE_ALIGN (funcs_decl_type, TYPE_ALIGN (pointer_sized_int_node));
kono
parents:
diff changeset
188 tree ctor_v = build_constructor (vars_decl_type, v_v);
kono
parents:
diff changeset
189 tree ctor_f = build_constructor (funcs_decl_type, v_f);
kono
parents:
diff changeset
190 TREE_CONSTANT (ctor_v) = TREE_CONSTANT (ctor_f) = 1;
kono
parents:
diff changeset
191 TREE_STATIC (ctor_v) = TREE_STATIC (ctor_f) = 1;
kono
parents:
diff changeset
192 tree funcs_decl = build_decl (UNKNOWN_LOCATION, VAR_DECL,
kono
parents:
diff changeset
193 get_identifier (".offload_func_table"),
kono
parents:
diff changeset
194 funcs_decl_type);
kono
parents:
diff changeset
195 tree vars_decl = build_decl (UNKNOWN_LOCATION, VAR_DECL,
kono
parents:
diff changeset
196 get_identifier (".offload_var_table"),
kono
parents:
diff changeset
197 vars_decl_type);
kono
parents:
diff changeset
198 TREE_STATIC (funcs_decl) = TREE_STATIC (vars_decl) = 1;
kono
parents:
diff changeset
199 /* Do not align tables more than TYPE_ALIGN (pointer_sized_int_node),
kono
parents:
diff changeset
200 otherwise a joint table in a binary will contain padding between
kono
parents:
diff changeset
201 tables from multiple object files. */
kono
parents:
diff changeset
202 DECL_USER_ALIGN (funcs_decl) = DECL_USER_ALIGN (vars_decl) = 1;
kono
parents:
diff changeset
203 SET_DECL_ALIGN (funcs_decl, TYPE_ALIGN (funcs_decl_type));
kono
parents:
diff changeset
204 SET_DECL_ALIGN (vars_decl, TYPE_ALIGN (vars_decl_type));
kono
parents:
diff changeset
205 DECL_INITIAL (funcs_decl) = ctor_f;
kono
parents:
diff changeset
206 DECL_INITIAL (vars_decl) = ctor_v;
kono
parents:
diff changeset
207 set_decl_section_name (funcs_decl, OFFLOAD_FUNC_TABLE_SECTION_NAME);
kono
parents:
diff changeset
208 set_decl_section_name (vars_decl, OFFLOAD_VAR_TABLE_SECTION_NAME);
kono
parents:
diff changeset
209
kono
parents:
diff changeset
210 varpool_node::finalize_decl (vars_decl);
kono
parents:
diff changeset
211 varpool_node::finalize_decl (funcs_decl);
kono
parents:
diff changeset
212 }
kono
parents:
diff changeset
213 else
kono
parents:
diff changeset
214 {
kono
parents:
diff changeset
215 for (unsigned i = 0; i < num_funcs; i++)
kono
parents:
diff changeset
216 {
kono
parents:
diff changeset
217 tree it = (*offload_funcs)[i];
kono
parents:
diff changeset
218 targetm.record_offload_symbol (it);
kono
parents:
diff changeset
219 }
kono
parents:
diff changeset
220 for (unsigned i = 0; i < num_vars; i++)
kono
parents:
diff changeset
221 {
kono
parents:
diff changeset
222 tree it = (*offload_vars)[i];
kono
parents:
diff changeset
223 targetm.record_offload_symbol (it);
kono
parents:
diff changeset
224 }
kono
parents:
diff changeset
225 }
kono
parents:
diff changeset
226 }
kono
parents:
diff changeset
227
kono
parents:
diff changeset
228 /* Call dim_pos (POS == true) or dim_size (POS == false) builtins for
kono
parents:
diff changeset
229 axis DIM. Return a tmp var holding the result. */
kono
parents:
diff changeset
230
kono
parents:
diff changeset
231 static tree
kono
parents:
diff changeset
232 oacc_dim_call (bool pos, int dim, gimple_seq *seq)
kono
parents:
diff changeset
233 {
kono
parents:
diff changeset
234 tree arg = build_int_cst (unsigned_type_node, dim);
kono
parents:
diff changeset
235 tree size = create_tmp_var (integer_type_node);
kono
parents:
diff changeset
236 enum internal_fn fn = pos ? IFN_GOACC_DIM_POS : IFN_GOACC_DIM_SIZE;
kono
parents:
diff changeset
237 gimple *call = gimple_build_call_internal (fn, 1, arg);
kono
parents:
diff changeset
238
kono
parents:
diff changeset
239 gimple_call_set_lhs (call, size);
kono
parents:
diff changeset
240 gimple_seq_add_stmt (seq, call);
kono
parents:
diff changeset
241
kono
parents:
diff changeset
242 return size;
kono
parents:
diff changeset
243 }
kono
parents:
diff changeset
244
kono
parents:
diff changeset
245 /* Find the number of threads (POS = false), or thread number (POS =
kono
parents:
diff changeset
246 true) for an OpenACC region partitioned as MASK. Setup code
kono
parents:
diff changeset
247 required for the calculation is added to SEQ. */
kono
parents:
diff changeset
248
kono
parents:
diff changeset
249 static tree
kono
parents:
diff changeset
250 oacc_thread_numbers (bool pos, int mask, gimple_seq *seq)
kono
parents:
diff changeset
251 {
kono
parents:
diff changeset
252 tree res = pos ? NULL_TREE : build_int_cst (unsigned_type_node, 1);
kono
parents:
diff changeset
253 unsigned ix;
kono
parents:
diff changeset
254
kono
parents:
diff changeset
255 /* Start at gang level, and examine relevant dimension indices. */
kono
parents:
diff changeset
256 for (ix = GOMP_DIM_GANG; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
257 if (GOMP_DIM_MASK (ix) & mask)
kono
parents:
diff changeset
258 {
kono
parents:
diff changeset
259 if (res)
kono
parents:
diff changeset
260 {
kono
parents:
diff changeset
261 /* We had an outer index, so scale that by the size of
kono
parents:
diff changeset
262 this dimension. */
kono
parents:
diff changeset
263 tree n = oacc_dim_call (false, ix, seq);
kono
parents:
diff changeset
264 res = fold_build2 (MULT_EXPR, integer_type_node, res, n);
kono
parents:
diff changeset
265 }
kono
parents:
diff changeset
266 if (pos)
kono
parents:
diff changeset
267 {
kono
parents:
diff changeset
268 /* Determine index in this dimension. */
kono
parents:
diff changeset
269 tree id = oacc_dim_call (true, ix, seq);
kono
parents:
diff changeset
270 if (res)
kono
parents:
diff changeset
271 res = fold_build2 (PLUS_EXPR, integer_type_node, res, id);
kono
parents:
diff changeset
272 else
kono
parents:
diff changeset
273 res = id;
kono
parents:
diff changeset
274 }
kono
parents:
diff changeset
275 }
kono
parents:
diff changeset
276
kono
parents:
diff changeset
277 if (res == NULL_TREE)
kono
parents:
diff changeset
278 res = integer_zero_node;
kono
parents:
diff changeset
279
kono
parents:
diff changeset
280 return res;
kono
parents:
diff changeset
281 }
kono
parents:
diff changeset
282
kono
parents:
diff changeset
283 /* Transform IFN_GOACC_LOOP calls to actual code. See
kono
parents:
diff changeset
284 expand_oacc_for for where these are generated. At the vector
kono
parents:
diff changeset
285 level, we stride loops, such that each member of a warp will
kono
parents:
diff changeset
286 operate on adjacent iterations. At the worker and gang level,
kono
parents:
diff changeset
287 each gang/warp executes a set of contiguous iterations. Chunking
kono
parents:
diff changeset
288 can override this such that each iteration engine executes a
kono
parents:
diff changeset
289 contiguous chunk, and then moves on to stride to the next chunk. */
kono
parents:
diff changeset
290
kono
parents:
diff changeset
291 static void
kono
parents:
diff changeset
292 oacc_xform_loop (gcall *call)
kono
parents:
diff changeset
293 {
kono
parents:
diff changeset
294 gimple_stmt_iterator gsi = gsi_for_stmt (call);
kono
parents:
diff changeset
295 enum ifn_goacc_loop_kind code
kono
parents:
diff changeset
296 = (enum ifn_goacc_loop_kind) TREE_INT_CST_LOW (gimple_call_arg (call, 0));
kono
parents:
diff changeset
297 tree dir = gimple_call_arg (call, 1);
kono
parents:
diff changeset
298 tree range = gimple_call_arg (call, 2);
kono
parents:
diff changeset
299 tree step = gimple_call_arg (call, 3);
kono
parents:
diff changeset
300 tree chunk_size = NULL_TREE;
kono
parents:
diff changeset
301 unsigned mask = (unsigned) TREE_INT_CST_LOW (gimple_call_arg (call, 5));
kono
parents:
diff changeset
302 tree lhs = gimple_call_lhs (call);
kono
parents:
diff changeset
303 tree type = TREE_TYPE (lhs);
kono
parents:
diff changeset
304 tree diff_type = TREE_TYPE (range);
kono
parents:
diff changeset
305 tree r = NULL_TREE;
kono
parents:
diff changeset
306 gimple_seq seq = NULL;
kono
parents:
diff changeset
307 bool chunking = false, striding = true;
kono
parents:
diff changeset
308 unsigned outer_mask = mask & (~mask + 1); // Outermost partitioning
kono
parents:
diff changeset
309 unsigned inner_mask = mask & ~outer_mask; // Inner partitioning (if any)
kono
parents:
diff changeset
310
kono
parents:
diff changeset
311 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
312 chunk_size = gimple_call_arg (call, 4);
kono
parents:
diff changeset
313 if (integer_minus_onep (chunk_size) /* Force static allocation. */
kono
parents:
diff changeset
314 || integer_zerop (chunk_size)) /* Default (also static). */
kono
parents:
diff changeset
315 {
kono
parents:
diff changeset
316 /* If we're at the gang level, we want each to execute a
kono
parents:
diff changeset
317 contiguous run of iterations. Otherwise we want each element
kono
parents:
diff changeset
318 to stride. */
kono
parents:
diff changeset
319 striding = !(outer_mask & GOMP_DIM_MASK (GOMP_DIM_GANG));
kono
parents:
diff changeset
320 chunking = false;
kono
parents:
diff changeset
321 }
kono
parents:
diff changeset
322 else
kono
parents:
diff changeset
323 {
kono
parents:
diff changeset
324 /* Chunk of size 1 is striding. */
kono
parents:
diff changeset
325 striding = integer_onep (chunk_size);
kono
parents:
diff changeset
326 chunking = !striding;
kono
parents:
diff changeset
327 }
kono
parents:
diff changeset
328 #endif
kono
parents:
diff changeset
329
kono
parents:
diff changeset
330 /* striding=true, chunking=true
kono
parents:
diff changeset
331 -> invalid.
kono
parents:
diff changeset
332 striding=true, chunking=false
kono
parents:
diff changeset
333 -> chunks=1
kono
parents:
diff changeset
334 striding=false,chunking=true
kono
parents:
diff changeset
335 -> chunks=ceil (range/(chunksize*threads*step))
kono
parents:
diff changeset
336 striding=false,chunking=false
kono
parents:
diff changeset
337 -> chunk_size=ceil(range/(threads*step)),chunks=1 */
kono
parents:
diff changeset
338 push_gimplify_context (true);
kono
parents:
diff changeset
339
kono
parents:
diff changeset
340 switch (code)
kono
parents:
diff changeset
341 {
kono
parents:
diff changeset
342 default: gcc_unreachable ();
kono
parents:
diff changeset
343
kono
parents:
diff changeset
344 case IFN_GOACC_LOOP_CHUNKS:
kono
parents:
diff changeset
345 if (!chunking)
kono
parents:
diff changeset
346 r = build_int_cst (type, 1);
kono
parents:
diff changeset
347 else
kono
parents:
diff changeset
348 {
kono
parents:
diff changeset
349 /* chunk_max
kono
parents:
diff changeset
350 = (range - dir) / (chunks * step * num_threads) + dir */
kono
parents:
diff changeset
351 tree per = oacc_thread_numbers (false, mask, &seq);
kono
parents:
diff changeset
352 per = fold_convert (type, per);
kono
parents:
diff changeset
353 chunk_size = fold_convert (type, chunk_size);
kono
parents:
diff changeset
354 per = fold_build2 (MULT_EXPR, type, per, chunk_size);
kono
parents:
diff changeset
355 per = fold_build2 (MULT_EXPR, type, per, step);
kono
parents:
diff changeset
356 r = build2 (MINUS_EXPR, type, range, dir);
kono
parents:
diff changeset
357 r = build2 (PLUS_EXPR, type, r, per);
kono
parents:
diff changeset
358 r = build2 (TRUNC_DIV_EXPR, type, r, per);
kono
parents:
diff changeset
359 }
kono
parents:
diff changeset
360 break;
kono
parents:
diff changeset
361
kono
parents:
diff changeset
362 case IFN_GOACC_LOOP_STEP:
kono
parents:
diff changeset
363 {
kono
parents:
diff changeset
364 /* If striding, step by the entire compute volume, otherwise
kono
parents:
diff changeset
365 step by the inner volume. */
kono
parents:
diff changeset
366 unsigned volume = striding ? mask : inner_mask;
kono
parents:
diff changeset
367
kono
parents:
diff changeset
368 r = oacc_thread_numbers (false, volume, &seq);
kono
parents:
diff changeset
369 r = build2 (MULT_EXPR, type, fold_convert (type, r), step);
kono
parents:
diff changeset
370 }
kono
parents:
diff changeset
371 break;
kono
parents:
diff changeset
372
kono
parents:
diff changeset
373 case IFN_GOACC_LOOP_OFFSET:
kono
parents:
diff changeset
374 /* Enable vectorization on non-SIMT targets. */
kono
parents:
diff changeset
375 if (!targetm.simt.vf
kono
parents:
diff changeset
376 && outer_mask == GOMP_DIM_MASK (GOMP_DIM_VECTOR)
kono
parents:
diff changeset
377 /* If not -fno-tree-loop-vectorize, hint that we want to vectorize
kono
parents:
diff changeset
378 the loop. */
kono
parents:
diff changeset
379 && (flag_tree_loop_vectorize
kono
parents:
diff changeset
380 || !global_options_set.x_flag_tree_loop_vectorize))
kono
parents:
diff changeset
381 {
kono
parents:
diff changeset
382 basic_block bb = gsi_bb (gsi);
kono
parents:
diff changeset
383 struct loop *parent = bb->loop_father;
kono
parents:
diff changeset
384 struct loop *body = parent->inner;
kono
parents:
diff changeset
385
kono
parents:
diff changeset
386 parent->force_vectorize = true;
kono
parents:
diff changeset
387 parent->safelen = INT_MAX;
kono
parents:
diff changeset
388
kono
parents:
diff changeset
389 /* "Chunking loops" may have inner loops. */
kono
parents:
diff changeset
390 if (parent->inner)
kono
parents:
diff changeset
391 {
kono
parents:
diff changeset
392 body->force_vectorize = true;
kono
parents:
diff changeset
393 body->safelen = INT_MAX;
kono
parents:
diff changeset
394 }
kono
parents:
diff changeset
395
kono
parents:
diff changeset
396 cfun->has_force_vectorize_loops = true;
kono
parents:
diff changeset
397 }
kono
parents:
diff changeset
398 if (striding)
kono
parents:
diff changeset
399 {
kono
parents:
diff changeset
400 r = oacc_thread_numbers (true, mask, &seq);
kono
parents:
diff changeset
401 r = fold_convert (diff_type, r);
kono
parents:
diff changeset
402 }
kono
parents:
diff changeset
403 else
kono
parents:
diff changeset
404 {
kono
parents:
diff changeset
405 tree inner_size = oacc_thread_numbers (false, inner_mask, &seq);
kono
parents:
diff changeset
406 tree outer_size = oacc_thread_numbers (false, outer_mask, &seq);
kono
parents:
diff changeset
407 tree volume = fold_build2 (MULT_EXPR, TREE_TYPE (inner_size),
kono
parents:
diff changeset
408 inner_size, outer_size);
kono
parents:
diff changeset
409
kono
parents:
diff changeset
410 volume = fold_convert (diff_type, volume);
kono
parents:
diff changeset
411 if (chunking)
kono
parents:
diff changeset
412 chunk_size = fold_convert (diff_type, chunk_size);
kono
parents:
diff changeset
413 else
kono
parents:
diff changeset
414 {
kono
parents:
diff changeset
415 tree per = fold_build2 (MULT_EXPR, diff_type, volume, step);
kono
parents:
diff changeset
416
kono
parents:
diff changeset
417 chunk_size = build2 (MINUS_EXPR, diff_type, range, dir);
kono
parents:
diff changeset
418 chunk_size = build2 (PLUS_EXPR, diff_type, chunk_size, per);
kono
parents:
diff changeset
419 chunk_size = build2 (TRUNC_DIV_EXPR, diff_type, chunk_size, per);
kono
parents:
diff changeset
420 }
kono
parents:
diff changeset
421
kono
parents:
diff changeset
422 tree span = build2 (MULT_EXPR, diff_type, chunk_size,
kono
parents:
diff changeset
423 fold_convert (diff_type, inner_size));
kono
parents:
diff changeset
424 r = oacc_thread_numbers (true, outer_mask, &seq);
kono
parents:
diff changeset
425 r = fold_convert (diff_type, r);
kono
parents:
diff changeset
426 r = build2 (MULT_EXPR, diff_type, r, span);
kono
parents:
diff changeset
427
kono
parents:
diff changeset
428 tree inner = oacc_thread_numbers (true, inner_mask, &seq);
kono
parents:
diff changeset
429 inner = fold_convert (diff_type, inner);
kono
parents:
diff changeset
430 r = fold_build2 (PLUS_EXPR, diff_type, r, inner);
kono
parents:
diff changeset
431
kono
parents:
diff changeset
432 if (chunking)
kono
parents:
diff changeset
433 {
kono
parents:
diff changeset
434 tree chunk = fold_convert (diff_type, gimple_call_arg (call, 6));
kono
parents:
diff changeset
435 tree per
kono
parents:
diff changeset
436 = fold_build2 (MULT_EXPR, diff_type, volume, chunk_size);
kono
parents:
diff changeset
437 per = build2 (MULT_EXPR, diff_type, per, chunk);
kono
parents:
diff changeset
438
kono
parents:
diff changeset
439 r = build2 (PLUS_EXPR, diff_type, r, per);
kono
parents:
diff changeset
440 }
kono
parents:
diff changeset
441 }
kono
parents:
diff changeset
442 r = fold_build2 (MULT_EXPR, diff_type, r, step);
kono
parents:
diff changeset
443 if (type != diff_type)
kono
parents:
diff changeset
444 r = fold_convert (type, r);
kono
parents:
diff changeset
445 break;
kono
parents:
diff changeset
446
kono
parents:
diff changeset
447 case IFN_GOACC_LOOP_BOUND:
kono
parents:
diff changeset
448 if (striding)
kono
parents:
diff changeset
449 r = range;
kono
parents:
diff changeset
450 else
kono
parents:
diff changeset
451 {
kono
parents:
diff changeset
452 tree inner_size = oacc_thread_numbers (false, inner_mask, &seq);
kono
parents:
diff changeset
453 tree outer_size = oacc_thread_numbers (false, outer_mask, &seq);
kono
parents:
diff changeset
454 tree volume = fold_build2 (MULT_EXPR, TREE_TYPE (inner_size),
kono
parents:
diff changeset
455 inner_size, outer_size);
kono
parents:
diff changeset
456
kono
parents:
diff changeset
457 volume = fold_convert (diff_type, volume);
kono
parents:
diff changeset
458 if (chunking)
kono
parents:
diff changeset
459 chunk_size = fold_convert (diff_type, chunk_size);
kono
parents:
diff changeset
460 else
kono
parents:
diff changeset
461 {
kono
parents:
diff changeset
462 tree per = fold_build2 (MULT_EXPR, diff_type, volume, step);
kono
parents:
diff changeset
463
kono
parents:
diff changeset
464 chunk_size = build2 (MINUS_EXPR, diff_type, range, dir);
kono
parents:
diff changeset
465 chunk_size = build2 (PLUS_EXPR, diff_type, chunk_size, per);
kono
parents:
diff changeset
466 chunk_size = build2 (TRUNC_DIV_EXPR, diff_type, chunk_size, per);
kono
parents:
diff changeset
467 }
kono
parents:
diff changeset
468
kono
parents:
diff changeset
469 tree span = build2 (MULT_EXPR, diff_type, chunk_size,
kono
parents:
diff changeset
470 fold_convert (diff_type, inner_size));
kono
parents:
diff changeset
471
kono
parents:
diff changeset
472 r = fold_build2 (MULT_EXPR, diff_type, span, step);
kono
parents:
diff changeset
473
kono
parents:
diff changeset
474 tree offset = gimple_call_arg (call, 6);
kono
parents:
diff changeset
475 r = build2 (PLUS_EXPR, diff_type, r,
kono
parents:
diff changeset
476 fold_convert (diff_type, offset));
kono
parents:
diff changeset
477 r = build2 (integer_onep (dir) ? MIN_EXPR : MAX_EXPR,
kono
parents:
diff changeset
478 diff_type, r, range);
kono
parents:
diff changeset
479 }
kono
parents:
diff changeset
480 if (diff_type != type)
kono
parents:
diff changeset
481 r = fold_convert (type, r);
kono
parents:
diff changeset
482 break;
kono
parents:
diff changeset
483 }
kono
parents:
diff changeset
484
kono
parents:
diff changeset
485 gimplify_assign (lhs, r, &seq);
kono
parents:
diff changeset
486
kono
parents:
diff changeset
487 pop_gimplify_context (NULL);
kono
parents:
diff changeset
488
kono
parents:
diff changeset
489 gsi_replace_with_seq (&gsi, seq, true);
kono
parents:
diff changeset
490 }
kono
parents:
diff changeset
491
kono
parents:
diff changeset
492 /* Transform a GOACC_TILE call. Determines the element loop span for
kono
parents:
diff changeset
493 the specified loop of the nest. This is 1 if we're not tiling.
kono
parents:
diff changeset
494
kono
parents:
diff changeset
495 GOACC_TILE (collapse_count, loop_no, tile_arg, gwv_tile, gwv_element); */
kono
parents:
diff changeset
496
kono
parents:
diff changeset
497 static void
kono
parents:
diff changeset
498 oacc_xform_tile (gcall *call)
kono
parents:
diff changeset
499 {
kono
parents:
diff changeset
500 gimple_stmt_iterator gsi = gsi_for_stmt (call);
kono
parents:
diff changeset
501 unsigned collapse = tree_to_uhwi (gimple_call_arg (call, 0));
kono
parents:
diff changeset
502 /* Inner loops have higher loop_nos. */
kono
parents:
diff changeset
503 unsigned loop_no = tree_to_uhwi (gimple_call_arg (call, 1));
kono
parents:
diff changeset
504 tree tile_size = gimple_call_arg (call, 2);
kono
parents:
diff changeset
505 unsigned e_mask = tree_to_uhwi (gimple_call_arg (call, 4));
kono
parents:
diff changeset
506 tree lhs = gimple_call_lhs (call);
kono
parents:
diff changeset
507 tree type = TREE_TYPE (lhs);
kono
parents:
diff changeset
508 gimple_seq seq = NULL;
kono
parents:
diff changeset
509 tree span = build_int_cst (type, 1);
kono
parents:
diff changeset
510
kono
parents:
diff changeset
511 gcc_assert (!(e_mask
kono
parents:
diff changeset
512 & ~(GOMP_DIM_MASK (GOMP_DIM_VECTOR)
kono
parents:
diff changeset
513 | GOMP_DIM_MASK (GOMP_DIM_WORKER))));
kono
parents:
diff changeset
514 push_gimplify_context (!seen_error ());
kono
parents:
diff changeset
515
kono
parents:
diff changeset
516 #ifndef ACCEL_COMPILER
kono
parents:
diff changeset
517 /* Partitioning disabled on host compilers. */
kono
parents:
diff changeset
518 e_mask = 0;
kono
parents:
diff changeset
519 #endif
kono
parents:
diff changeset
520 if (!e_mask)
kono
parents:
diff changeset
521 /* Not paritioning. */
kono
parents:
diff changeset
522 span = integer_one_node;
kono
parents:
diff changeset
523 else if (!integer_zerop (tile_size))
kono
parents:
diff changeset
524 /* User explicitly specified size. */
kono
parents:
diff changeset
525 span = tile_size;
kono
parents:
diff changeset
526 else
kono
parents:
diff changeset
527 {
kono
parents:
diff changeset
528 /* Pick a size based on the paritioning of the element loop and
kono
parents:
diff changeset
529 the number of loop nests. */
kono
parents:
diff changeset
530 tree first_size = NULL_TREE;
kono
parents:
diff changeset
531 tree second_size = NULL_TREE;
kono
parents:
diff changeset
532
kono
parents:
diff changeset
533 if (e_mask & GOMP_DIM_MASK (GOMP_DIM_VECTOR))
kono
parents:
diff changeset
534 first_size = oacc_dim_call (false, GOMP_DIM_VECTOR, &seq);
kono
parents:
diff changeset
535 if (e_mask & GOMP_DIM_MASK (GOMP_DIM_WORKER))
kono
parents:
diff changeset
536 second_size = oacc_dim_call (false, GOMP_DIM_WORKER, &seq);
kono
parents:
diff changeset
537
kono
parents:
diff changeset
538 if (!first_size)
kono
parents:
diff changeset
539 {
kono
parents:
diff changeset
540 first_size = second_size;
kono
parents:
diff changeset
541 second_size = NULL_TREE;
kono
parents:
diff changeset
542 }
kono
parents:
diff changeset
543
kono
parents:
diff changeset
544 if (loop_no + 1 == collapse)
kono
parents:
diff changeset
545 {
kono
parents:
diff changeset
546 span = first_size;
kono
parents:
diff changeset
547 if (!loop_no && second_size)
kono
parents:
diff changeset
548 span = fold_build2 (MULT_EXPR, TREE_TYPE (span),
kono
parents:
diff changeset
549 span, second_size);
kono
parents:
diff changeset
550 }
kono
parents:
diff changeset
551 else if (loop_no + 2 == collapse)
kono
parents:
diff changeset
552 span = second_size;
kono
parents:
diff changeset
553 else
kono
parents:
diff changeset
554 span = NULL_TREE;
kono
parents:
diff changeset
555
kono
parents:
diff changeset
556 if (!span)
kono
parents:
diff changeset
557 /* There's no obvious element size for this loop. Options
kono
parents:
diff changeset
558 are 1, first_size or some non-unity constant (32 is my
kono
parents:
diff changeset
559 favourite). We should gather some statistics. */
kono
parents:
diff changeset
560 span = first_size;
kono
parents:
diff changeset
561 }
kono
parents:
diff changeset
562
kono
parents:
diff changeset
563 span = fold_convert (type, span);
kono
parents:
diff changeset
564 gimplify_assign (lhs, span, &seq);
kono
parents:
diff changeset
565
kono
parents:
diff changeset
566 pop_gimplify_context (NULL);
kono
parents:
diff changeset
567
kono
parents:
diff changeset
568 gsi_replace_with_seq (&gsi, seq, true);
kono
parents:
diff changeset
569 }
kono
parents:
diff changeset
570
kono
parents:
diff changeset
571 /* Default partitioned and minimum partitioned dimensions. */
kono
parents:
diff changeset
572
kono
parents:
diff changeset
573 static int oacc_default_dims[GOMP_DIM_MAX];
kono
parents:
diff changeset
574 static int oacc_min_dims[GOMP_DIM_MAX];
kono
parents:
diff changeset
575
kono
parents:
diff changeset
576 /* Parse the default dimension parameter. This is a set of
kono
parents:
diff changeset
577 :-separated optional compute dimensions. Each specified dimension
kono
parents:
diff changeset
578 is a positive integer. When device type support is added, it is
kono
parents:
diff changeset
579 planned to be a comma separated list of such compute dimensions,
kono
parents:
diff changeset
580 with all but the first prefixed by the colon-terminated device
kono
parents:
diff changeset
581 type. */
kono
parents:
diff changeset
582
kono
parents:
diff changeset
583 static void
kono
parents:
diff changeset
584 oacc_parse_default_dims (const char *dims)
kono
parents:
diff changeset
585 {
kono
parents:
diff changeset
586 int ix;
kono
parents:
diff changeset
587
kono
parents:
diff changeset
588 for (ix = GOMP_DIM_MAX; ix--;)
kono
parents:
diff changeset
589 {
kono
parents:
diff changeset
590 oacc_default_dims[ix] = -1;
kono
parents:
diff changeset
591 oacc_min_dims[ix] = 1;
kono
parents:
diff changeset
592 }
kono
parents:
diff changeset
593
kono
parents:
diff changeset
594 #ifndef ACCEL_COMPILER
kono
parents:
diff changeset
595 /* Cannot be overridden on the host. */
kono
parents:
diff changeset
596 dims = NULL;
kono
parents:
diff changeset
597 #endif
kono
parents:
diff changeset
598 if (dims)
kono
parents:
diff changeset
599 {
kono
parents:
diff changeset
600 const char *pos = dims;
kono
parents:
diff changeset
601
kono
parents:
diff changeset
602 for (ix = 0; *pos && ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
603 {
kono
parents:
diff changeset
604 if (ix)
kono
parents:
diff changeset
605 {
kono
parents:
diff changeset
606 if (*pos != ':')
kono
parents:
diff changeset
607 goto malformed;
kono
parents:
diff changeset
608 pos++;
kono
parents:
diff changeset
609 }
kono
parents:
diff changeset
610
kono
parents:
diff changeset
611 if (*pos != ':')
kono
parents:
diff changeset
612 {
kono
parents:
diff changeset
613 long val;
kono
parents:
diff changeset
614 const char *eptr;
kono
parents:
diff changeset
615
kono
parents:
diff changeset
616 errno = 0;
kono
parents:
diff changeset
617 val = strtol (pos, CONST_CAST (char **, &eptr), 10);
kono
parents:
diff changeset
618 if (errno || val <= 0 || (int) val != val)
kono
parents:
diff changeset
619 goto malformed;
kono
parents:
diff changeset
620 pos = eptr;
kono
parents:
diff changeset
621 oacc_default_dims[ix] = (int) val;
kono
parents:
diff changeset
622 }
kono
parents:
diff changeset
623 }
kono
parents:
diff changeset
624 if (*pos)
kono
parents:
diff changeset
625 {
kono
parents:
diff changeset
626 malformed:
kono
parents:
diff changeset
627 error_at (UNKNOWN_LOCATION,
kono
parents:
diff changeset
628 "-fopenacc-dim operand is malformed at '%s'", pos);
kono
parents:
diff changeset
629 }
kono
parents:
diff changeset
630 }
kono
parents:
diff changeset
631
kono
parents:
diff changeset
632 /* Allow the backend to validate the dimensions. */
kono
parents:
diff changeset
633 targetm.goacc.validate_dims (NULL_TREE, oacc_default_dims, -1);
kono
parents:
diff changeset
634 targetm.goacc.validate_dims (NULL_TREE, oacc_min_dims, -2);
kono
parents:
diff changeset
635 }
kono
parents:
diff changeset
636
kono
parents:
diff changeset
637 /* Validate and update the dimensions for offloaded FN. ATTRS is the
kono
parents:
diff changeset
638 raw attribute. DIMS is an array of dimensions, which is filled in.
kono
parents:
diff changeset
639 LEVEL is the partitioning level of a routine, or -1 for an offload
kono
parents:
diff changeset
640 region itself. USED is the mask of partitioned execution in the
kono
parents:
diff changeset
641 function. */
kono
parents:
diff changeset
642
kono
parents:
diff changeset
643 static void
kono
parents:
diff changeset
644 oacc_validate_dims (tree fn, tree attrs, int *dims, int level, unsigned used)
kono
parents:
diff changeset
645 {
kono
parents:
diff changeset
646 tree purpose[GOMP_DIM_MAX];
kono
parents:
diff changeset
647 unsigned ix;
kono
parents:
diff changeset
648 tree pos = TREE_VALUE (attrs);
kono
parents:
diff changeset
649
kono
parents:
diff changeset
650 /* Make sure the attribute creator attached the dimension
kono
parents:
diff changeset
651 information. */
kono
parents:
diff changeset
652 gcc_assert (pos);
kono
parents:
diff changeset
653
kono
parents:
diff changeset
654 for (ix = 0; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
655 {
kono
parents:
diff changeset
656 purpose[ix] = TREE_PURPOSE (pos);
kono
parents:
diff changeset
657 tree val = TREE_VALUE (pos);
kono
parents:
diff changeset
658 dims[ix] = val ? TREE_INT_CST_LOW (val) : -1;
kono
parents:
diff changeset
659 pos = TREE_CHAIN (pos);
kono
parents:
diff changeset
660 }
kono
parents:
diff changeset
661
kono
parents:
diff changeset
662 bool changed = targetm.goacc.validate_dims (fn, dims, level);
kono
parents:
diff changeset
663
kono
parents:
diff changeset
664 /* Default anything left to 1 or a partitioned default. */
kono
parents:
diff changeset
665 for (ix = 0; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
666 if (dims[ix] < 0)
kono
parents:
diff changeset
667 {
kono
parents:
diff changeset
668 /* The OpenACC spec says 'If the [num_gangs] clause is not
kono
parents:
diff changeset
669 specified, an implementation-defined default will be used;
kono
parents:
diff changeset
670 the default may depend on the code within the construct.'
kono
parents:
diff changeset
671 (2.5.6). Thus an implementation is free to choose
kono
parents:
diff changeset
672 non-unity default for a parallel region that doesn't have
kono
parents:
diff changeset
673 any gang-partitioned loops. However, it appears that there
kono
parents:
diff changeset
674 is a sufficient body of user code that expects non-gang
kono
parents:
diff changeset
675 partitioned regions to not execute in gang-redundant mode.
kono
parents:
diff changeset
676 So we (a) don't warn about the non-portability and (b) pick
kono
parents:
diff changeset
677 the minimum permissible dimension size when there is no
kono
parents:
diff changeset
678 partitioned execution. Otherwise we pick the global
kono
parents:
diff changeset
679 default for the dimension, which the user can control. The
kono
parents:
diff changeset
680 same wording and logic applies to num_workers and
kono
parents:
diff changeset
681 vector_length, however the worker- or vector- single
kono
parents:
diff changeset
682 execution doesn't have the same impact as gang-redundant
kono
parents:
diff changeset
683 execution. (If the minimum gang-level partioning is not 1,
kono
parents:
diff changeset
684 the target is probably too confusing.) */
kono
parents:
diff changeset
685 dims[ix] = (used & GOMP_DIM_MASK (ix)
kono
parents:
diff changeset
686 ? oacc_default_dims[ix] : oacc_min_dims[ix]);
kono
parents:
diff changeset
687 changed = true;
kono
parents:
diff changeset
688 }
kono
parents:
diff changeset
689
kono
parents:
diff changeset
690 if (changed)
kono
parents:
diff changeset
691 {
kono
parents:
diff changeset
692 /* Replace the attribute with new values. */
kono
parents:
diff changeset
693 pos = NULL_TREE;
kono
parents:
diff changeset
694 for (ix = GOMP_DIM_MAX; ix--;)
kono
parents:
diff changeset
695 pos = tree_cons (purpose[ix],
kono
parents:
diff changeset
696 build_int_cst (integer_type_node, dims[ix]), pos);
kono
parents:
diff changeset
697 oacc_replace_fn_attrib (fn, pos);
kono
parents:
diff changeset
698 }
kono
parents:
diff changeset
699 }
kono
parents:
diff changeset
700
kono
parents:
diff changeset
701 /* Create an empty OpenACC loop structure at LOC. */
kono
parents:
diff changeset
702
kono
parents:
diff changeset
703 static oacc_loop *
kono
parents:
diff changeset
704 new_oacc_loop_raw (oacc_loop *parent, location_t loc)
kono
parents:
diff changeset
705 {
kono
parents:
diff changeset
706 oacc_loop *loop = XCNEW (oacc_loop);
kono
parents:
diff changeset
707
kono
parents:
diff changeset
708 loop->parent = parent;
kono
parents:
diff changeset
709
kono
parents:
diff changeset
710 if (parent)
kono
parents:
diff changeset
711 {
kono
parents:
diff changeset
712 loop->sibling = parent->child;
kono
parents:
diff changeset
713 parent->child = loop;
kono
parents:
diff changeset
714 }
kono
parents:
diff changeset
715
kono
parents:
diff changeset
716 loop->loc = loc;
kono
parents:
diff changeset
717 return loop;
kono
parents:
diff changeset
718 }
kono
parents:
diff changeset
719
kono
parents:
diff changeset
720 /* Create an outermost, dummy OpenACC loop for offloaded function
kono
parents:
diff changeset
721 DECL. */
kono
parents:
diff changeset
722
kono
parents:
diff changeset
723 static oacc_loop *
kono
parents:
diff changeset
724 new_oacc_loop_outer (tree decl)
kono
parents:
diff changeset
725 {
kono
parents:
diff changeset
726 return new_oacc_loop_raw (NULL, DECL_SOURCE_LOCATION (decl));
kono
parents:
diff changeset
727 }
kono
parents:
diff changeset
728
kono
parents:
diff changeset
729 /* Start a new OpenACC loop structure beginning at head marker HEAD.
kono
parents:
diff changeset
730 Link into PARENT loop. Return the new loop. */
kono
parents:
diff changeset
731
kono
parents:
diff changeset
732 static oacc_loop *
kono
parents:
diff changeset
733 new_oacc_loop (oacc_loop *parent, gcall *marker)
kono
parents:
diff changeset
734 {
kono
parents:
diff changeset
735 oacc_loop *loop = new_oacc_loop_raw (parent, gimple_location (marker));
kono
parents:
diff changeset
736
kono
parents:
diff changeset
737 loop->marker = marker;
kono
parents:
diff changeset
738
kono
parents:
diff changeset
739 /* TODO: This is where device_type flattening would occur for the loop
kono
parents:
diff changeset
740 flags. */
kono
parents:
diff changeset
741
kono
parents:
diff changeset
742 loop->flags = TREE_INT_CST_LOW (gimple_call_arg (marker, 3));
kono
parents:
diff changeset
743
kono
parents:
diff changeset
744 tree chunk_size = integer_zero_node;
kono
parents:
diff changeset
745 if (loop->flags & OLF_GANG_STATIC)
kono
parents:
diff changeset
746 chunk_size = gimple_call_arg (marker, 4);
kono
parents:
diff changeset
747 loop->chunk_size = chunk_size;
kono
parents:
diff changeset
748
kono
parents:
diff changeset
749 return loop;
kono
parents:
diff changeset
750 }
kono
parents:
diff changeset
751
kono
parents:
diff changeset
752 /* Create a dummy loop encompassing a call to a openACC routine.
kono
parents:
diff changeset
753 Extract the routine's partitioning requirements. */
kono
parents:
diff changeset
754
kono
parents:
diff changeset
755 static void
kono
parents:
diff changeset
756 new_oacc_loop_routine (oacc_loop *parent, gcall *call, tree decl, tree attrs)
kono
parents:
diff changeset
757 {
kono
parents:
diff changeset
758 oacc_loop *loop = new_oacc_loop_raw (parent, gimple_location (call));
kono
parents:
diff changeset
759 int level = oacc_fn_attrib_level (attrs);
kono
parents:
diff changeset
760
kono
parents:
diff changeset
761 gcc_assert (level >= 0);
kono
parents:
diff changeset
762
kono
parents:
diff changeset
763 loop->marker = call;
kono
parents:
diff changeset
764 loop->routine = decl;
kono
parents:
diff changeset
765 loop->mask = ((GOMP_DIM_MASK (GOMP_DIM_MAX) - 1)
kono
parents:
diff changeset
766 ^ (GOMP_DIM_MASK (level) - 1));
kono
parents:
diff changeset
767 }
kono
parents:
diff changeset
768
kono
parents:
diff changeset
769 /* Finish off the current OpenACC loop ending at tail marker TAIL.
kono
parents:
diff changeset
770 Return the parent loop. */
kono
parents:
diff changeset
771
kono
parents:
diff changeset
772 static oacc_loop *
kono
parents:
diff changeset
773 finish_oacc_loop (oacc_loop *loop)
kono
parents:
diff changeset
774 {
kono
parents:
diff changeset
775 /* If the loop has been collapsed, don't partition it. */
kono
parents:
diff changeset
776 if (loop->ifns.is_empty ())
kono
parents:
diff changeset
777 loop->mask = loop->flags = 0;
kono
parents:
diff changeset
778 return loop->parent;
kono
parents:
diff changeset
779 }
kono
parents:
diff changeset
780
kono
parents:
diff changeset
781 /* Free all OpenACC loop structures within LOOP (inclusive). */
kono
parents:
diff changeset
782
kono
parents:
diff changeset
783 static void
kono
parents:
diff changeset
784 free_oacc_loop (oacc_loop *loop)
kono
parents:
diff changeset
785 {
kono
parents:
diff changeset
786 if (loop->sibling)
kono
parents:
diff changeset
787 free_oacc_loop (loop->sibling);
kono
parents:
diff changeset
788 if (loop->child)
kono
parents:
diff changeset
789 free_oacc_loop (loop->child);
kono
parents:
diff changeset
790
kono
parents:
diff changeset
791 loop->ifns.release ();
kono
parents:
diff changeset
792 free (loop);
kono
parents:
diff changeset
793 }
kono
parents:
diff changeset
794
kono
parents:
diff changeset
795 /* Dump out the OpenACC loop head or tail beginning at FROM. */
kono
parents:
diff changeset
796
kono
parents:
diff changeset
797 static void
kono
parents:
diff changeset
798 dump_oacc_loop_part (FILE *file, gcall *from, int depth,
kono
parents:
diff changeset
799 const char *title, int level)
kono
parents:
diff changeset
800 {
kono
parents:
diff changeset
801 enum ifn_unique_kind kind
kono
parents:
diff changeset
802 = (enum ifn_unique_kind) TREE_INT_CST_LOW (gimple_call_arg (from, 0));
kono
parents:
diff changeset
803
kono
parents:
diff changeset
804 fprintf (file, "%*s%s-%d:\n", depth * 2, "", title, level);
kono
parents:
diff changeset
805 for (gimple_stmt_iterator gsi = gsi_for_stmt (from);;)
kono
parents:
diff changeset
806 {
kono
parents:
diff changeset
807 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
808
kono
parents:
diff changeset
809 if (gimple_call_internal_p (stmt, IFN_UNIQUE))
kono
parents:
diff changeset
810 {
kono
parents:
diff changeset
811 enum ifn_unique_kind k
kono
parents:
diff changeset
812 = ((enum ifn_unique_kind) TREE_INT_CST_LOW
kono
parents:
diff changeset
813 (gimple_call_arg (stmt, 0)));
kono
parents:
diff changeset
814
kono
parents:
diff changeset
815 if (k == kind && stmt != from)
kono
parents:
diff changeset
816 break;
kono
parents:
diff changeset
817 }
kono
parents:
diff changeset
818 print_gimple_stmt (file, stmt, depth * 2 + 2);
kono
parents:
diff changeset
819
kono
parents:
diff changeset
820 gsi_next (&gsi);
kono
parents:
diff changeset
821 while (gsi_end_p (gsi))
kono
parents:
diff changeset
822 gsi = gsi_start_bb (single_succ (gsi_bb (gsi)));
kono
parents:
diff changeset
823 }
kono
parents:
diff changeset
824 }
kono
parents:
diff changeset
825
kono
parents:
diff changeset
826 /* Dump OpenACC loops LOOP, its siblings and its children. */
kono
parents:
diff changeset
827
kono
parents:
diff changeset
828 static void
kono
parents:
diff changeset
829 dump_oacc_loop (FILE *file, oacc_loop *loop, int depth)
kono
parents:
diff changeset
830 {
kono
parents:
diff changeset
831 int ix;
kono
parents:
diff changeset
832
kono
parents:
diff changeset
833 fprintf (file, "%*sLoop %x(%x) %s:%u\n", depth * 2, "",
kono
parents:
diff changeset
834 loop->flags, loop->mask,
kono
parents:
diff changeset
835 LOCATION_FILE (loop->loc), LOCATION_LINE (loop->loc));
kono
parents:
diff changeset
836
kono
parents:
diff changeset
837 if (loop->marker)
kono
parents:
diff changeset
838 print_gimple_stmt (file, loop->marker, depth * 2);
kono
parents:
diff changeset
839
kono
parents:
diff changeset
840 if (loop->routine)
kono
parents:
diff changeset
841 fprintf (file, "%*sRoutine %s:%u:%s\n",
kono
parents:
diff changeset
842 depth * 2, "", DECL_SOURCE_FILE (loop->routine),
kono
parents:
diff changeset
843 DECL_SOURCE_LINE (loop->routine),
kono
parents:
diff changeset
844 IDENTIFIER_POINTER (DECL_NAME (loop->routine)));
kono
parents:
diff changeset
845
kono
parents:
diff changeset
846 for (ix = GOMP_DIM_GANG; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
847 if (loop->heads[ix])
kono
parents:
diff changeset
848 dump_oacc_loop_part (file, loop->heads[ix], depth, "Head", ix);
kono
parents:
diff changeset
849 for (ix = GOMP_DIM_MAX; ix--;)
kono
parents:
diff changeset
850 if (loop->tails[ix])
kono
parents:
diff changeset
851 dump_oacc_loop_part (file, loop->tails[ix], depth, "Tail", ix);
kono
parents:
diff changeset
852
kono
parents:
diff changeset
853 if (loop->child)
kono
parents:
diff changeset
854 dump_oacc_loop (file, loop->child, depth + 1);
kono
parents:
diff changeset
855 if (loop->sibling)
kono
parents:
diff changeset
856 dump_oacc_loop (file, loop->sibling, depth);
kono
parents:
diff changeset
857 }
kono
parents:
diff changeset
858
kono
parents:
diff changeset
859 void debug_oacc_loop (oacc_loop *);
kono
parents:
diff changeset
860
kono
parents:
diff changeset
861 /* Dump loops to stderr. */
kono
parents:
diff changeset
862
kono
parents:
diff changeset
863 DEBUG_FUNCTION void
kono
parents:
diff changeset
864 debug_oacc_loop (oacc_loop *loop)
kono
parents:
diff changeset
865 {
kono
parents:
diff changeset
866 dump_oacc_loop (stderr, loop, 0);
kono
parents:
diff changeset
867 }
kono
parents:
diff changeset
868
kono
parents:
diff changeset
869 /* DFS walk of basic blocks BB onwards, creating OpenACC loop
kono
parents:
diff changeset
870 structures as we go. By construction these loops are properly
kono
parents:
diff changeset
871 nested. */
kono
parents:
diff changeset
872
kono
parents:
diff changeset
873 static void
kono
parents:
diff changeset
874 oacc_loop_discover_walk (oacc_loop *loop, basic_block bb)
kono
parents:
diff changeset
875 {
kono
parents:
diff changeset
876 int marker = 0;
kono
parents:
diff changeset
877 int remaining = 0;
kono
parents:
diff changeset
878
kono
parents:
diff changeset
879 if (bb->flags & BB_VISITED)
kono
parents:
diff changeset
880 return;
kono
parents:
diff changeset
881
kono
parents:
diff changeset
882 follow:
kono
parents:
diff changeset
883 bb->flags |= BB_VISITED;
kono
parents:
diff changeset
884
kono
parents:
diff changeset
885 /* Scan for loop markers. */
kono
parents:
diff changeset
886 for (gimple_stmt_iterator gsi = gsi_start_bb (bb); !gsi_end_p (gsi);
kono
parents:
diff changeset
887 gsi_next (&gsi))
kono
parents:
diff changeset
888 {
kono
parents:
diff changeset
889 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
890
kono
parents:
diff changeset
891 if (!is_gimple_call (stmt))
kono
parents:
diff changeset
892 continue;
kono
parents:
diff changeset
893
kono
parents:
diff changeset
894 gcall *call = as_a <gcall *> (stmt);
kono
parents:
diff changeset
895
kono
parents:
diff changeset
896 /* If this is a routine, make a dummy loop for it. */
kono
parents:
diff changeset
897 if (tree decl = gimple_call_fndecl (call))
kono
parents:
diff changeset
898 if (tree attrs = oacc_get_fn_attrib (decl))
kono
parents:
diff changeset
899 {
kono
parents:
diff changeset
900 gcc_assert (!marker);
kono
parents:
diff changeset
901 new_oacc_loop_routine (loop, call, decl, attrs);
kono
parents:
diff changeset
902 }
kono
parents:
diff changeset
903
kono
parents:
diff changeset
904 if (!gimple_call_internal_p (call))
kono
parents:
diff changeset
905 continue;
kono
parents:
diff changeset
906
kono
parents:
diff changeset
907 switch (gimple_call_internal_fn (call))
kono
parents:
diff changeset
908 {
kono
parents:
diff changeset
909 default:
kono
parents:
diff changeset
910 break;
kono
parents:
diff changeset
911
kono
parents:
diff changeset
912 case IFN_GOACC_LOOP:
kono
parents:
diff changeset
913 case IFN_GOACC_TILE:
kono
parents:
diff changeset
914 /* Record the abstraction function, so we can manipulate it
kono
parents:
diff changeset
915 later. */
kono
parents:
diff changeset
916 loop->ifns.safe_push (call);
kono
parents:
diff changeset
917 break;
kono
parents:
diff changeset
918
kono
parents:
diff changeset
919 case IFN_UNIQUE:
kono
parents:
diff changeset
920 enum ifn_unique_kind kind
kono
parents:
diff changeset
921 = (enum ifn_unique_kind) (TREE_INT_CST_LOW
kono
parents:
diff changeset
922 (gimple_call_arg (call, 0)));
kono
parents:
diff changeset
923 if (kind == IFN_UNIQUE_OACC_HEAD_MARK
kono
parents:
diff changeset
924 || kind == IFN_UNIQUE_OACC_TAIL_MARK)
kono
parents:
diff changeset
925 {
kono
parents:
diff changeset
926 if (gimple_call_num_args (call) == 2)
kono
parents:
diff changeset
927 {
kono
parents:
diff changeset
928 gcc_assert (marker && !remaining);
kono
parents:
diff changeset
929 marker = 0;
kono
parents:
diff changeset
930 if (kind == IFN_UNIQUE_OACC_TAIL_MARK)
kono
parents:
diff changeset
931 loop = finish_oacc_loop (loop);
kono
parents:
diff changeset
932 else
kono
parents:
diff changeset
933 loop->head_end = call;
kono
parents:
diff changeset
934 }
kono
parents:
diff changeset
935 else
kono
parents:
diff changeset
936 {
kono
parents:
diff changeset
937 int count = TREE_INT_CST_LOW (gimple_call_arg (call, 2));
kono
parents:
diff changeset
938
kono
parents:
diff changeset
939 if (!marker)
kono
parents:
diff changeset
940 {
kono
parents:
diff changeset
941 if (kind == IFN_UNIQUE_OACC_HEAD_MARK)
kono
parents:
diff changeset
942 loop = new_oacc_loop (loop, call);
kono
parents:
diff changeset
943 remaining = count;
kono
parents:
diff changeset
944 }
kono
parents:
diff changeset
945 gcc_assert (count == remaining);
kono
parents:
diff changeset
946 if (remaining)
kono
parents:
diff changeset
947 {
kono
parents:
diff changeset
948 remaining--;
kono
parents:
diff changeset
949 if (kind == IFN_UNIQUE_OACC_HEAD_MARK)
kono
parents:
diff changeset
950 loop->heads[marker] = call;
kono
parents:
diff changeset
951 else
kono
parents:
diff changeset
952 loop->tails[remaining] = call;
kono
parents:
diff changeset
953 }
kono
parents:
diff changeset
954 marker++;
kono
parents:
diff changeset
955 }
kono
parents:
diff changeset
956 }
kono
parents:
diff changeset
957 }
kono
parents:
diff changeset
958 }
kono
parents:
diff changeset
959 if (remaining || marker)
kono
parents:
diff changeset
960 {
kono
parents:
diff changeset
961 bb = single_succ (bb);
kono
parents:
diff changeset
962 gcc_assert (single_pred_p (bb) && !(bb->flags & BB_VISITED));
kono
parents:
diff changeset
963 goto follow;
kono
parents:
diff changeset
964 }
kono
parents:
diff changeset
965
kono
parents:
diff changeset
966 /* Walk successor blocks. */
kono
parents:
diff changeset
967 edge e;
kono
parents:
diff changeset
968 edge_iterator ei;
kono
parents:
diff changeset
969
kono
parents:
diff changeset
970 FOR_EACH_EDGE (e, ei, bb->succs)
kono
parents:
diff changeset
971 oacc_loop_discover_walk (loop, e->dest);
kono
parents:
diff changeset
972 }
kono
parents:
diff changeset
973
kono
parents:
diff changeset
974 /* LOOP is the first sibling. Reverse the order in place and return
kono
parents:
diff changeset
975 the new first sibling. Recurse to child loops. */
kono
parents:
diff changeset
976
kono
parents:
diff changeset
977 static oacc_loop *
kono
parents:
diff changeset
978 oacc_loop_sibling_nreverse (oacc_loop *loop)
kono
parents:
diff changeset
979 {
kono
parents:
diff changeset
980 oacc_loop *last = NULL;
kono
parents:
diff changeset
981 do
kono
parents:
diff changeset
982 {
kono
parents:
diff changeset
983 if (loop->child)
kono
parents:
diff changeset
984 loop->child = oacc_loop_sibling_nreverse (loop->child);
kono
parents:
diff changeset
985
kono
parents:
diff changeset
986 oacc_loop *next = loop->sibling;
kono
parents:
diff changeset
987 loop->sibling = last;
kono
parents:
diff changeset
988 last = loop;
kono
parents:
diff changeset
989 loop = next;
kono
parents:
diff changeset
990 }
kono
parents:
diff changeset
991 while (loop);
kono
parents:
diff changeset
992
kono
parents:
diff changeset
993 return last;
kono
parents:
diff changeset
994 }
kono
parents:
diff changeset
995
kono
parents:
diff changeset
996 /* Discover the OpenACC loops marked up by HEAD and TAIL markers for
kono
parents:
diff changeset
997 the current function. */
kono
parents:
diff changeset
998
kono
parents:
diff changeset
999 static oacc_loop *
kono
parents:
diff changeset
1000 oacc_loop_discovery ()
kono
parents:
diff changeset
1001 {
kono
parents:
diff changeset
1002 /* Clear basic block flags, in particular BB_VISITED which we're going to use
kono
parents:
diff changeset
1003 in the following. */
kono
parents:
diff changeset
1004 clear_bb_flags ();
kono
parents:
diff changeset
1005
kono
parents:
diff changeset
1006 oacc_loop *top = new_oacc_loop_outer (current_function_decl);
kono
parents:
diff changeset
1007 oacc_loop_discover_walk (top, ENTRY_BLOCK_PTR_FOR_FN (cfun));
kono
parents:
diff changeset
1008
kono
parents:
diff changeset
1009 /* The siblings were constructed in reverse order, reverse them so
kono
parents:
diff changeset
1010 that diagnostics come out in an unsurprising order. */
kono
parents:
diff changeset
1011 top = oacc_loop_sibling_nreverse (top);
kono
parents:
diff changeset
1012
kono
parents:
diff changeset
1013 return top;
kono
parents:
diff changeset
1014 }
kono
parents:
diff changeset
1015
kono
parents:
diff changeset
1016 /* Transform the abstract internal function markers starting at FROM
kono
parents:
diff changeset
1017 to be for partitioning level LEVEL. Stop when we meet another HEAD
kono
parents:
diff changeset
1018 or TAIL marker. */
kono
parents:
diff changeset
1019
kono
parents:
diff changeset
1020 static void
kono
parents:
diff changeset
1021 oacc_loop_xform_head_tail (gcall *from, int level)
kono
parents:
diff changeset
1022 {
kono
parents:
diff changeset
1023 enum ifn_unique_kind kind
kono
parents:
diff changeset
1024 = (enum ifn_unique_kind) TREE_INT_CST_LOW (gimple_call_arg (from, 0));
kono
parents:
diff changeset
1025 tree replacement = build_int_cst (unsigned_type_node, level);
kono
parents:
diff changeset
1026
kono
parents:
diff changeset
1027 for (gimple_stmt_iterator gsi = gsi_for_stmt (from);;)
kono
parents:
diff changeset
1028 {
kono
parents:
diff changeset
1029 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
1030
kono
parents:
diff changeset
1031 if (gimple_call_internal_p (stmt, IFN_UNIQUE))
kono
parents:
diff changeset
1032 {
kono
parents:
diff changeset
1033 enum ifn_unique_kind k
kono
parents:
diff changeset
1034 = ((enum ifn_unique_kind)
kono
parents:
diff changeset
1035 TREE_INT_CST_LOW (gimple_call_arg (stmt, 0)));
kono
parents:
diff changeset
1036
kono
parents:
diff changeset
1037 if (k == IFN_UNIQUE_OACC_FORK || k == IFN_UNIQUE_OACC_JOIN)
kono
parents:
diff changeset
1038 *gimple_call_arg_ptr (stmt, 2) = replacement;
kono
parents:
diff changeset
1039 else if (k == kind && stmt != from)
kono
parents:
diff changeset
1040 break;
kono
parents:
diff changeset
1041 }
kono
parents:
diff changeset
1042 else if (gimple_call_internal_p (stmt, IFN_GOACC_REDUCTION))
kono
parents:
diff changeset
1043 *gimple_call_arg_ptr (stmt, 3) = replacement;
kono
parents:
diff changeset
1044
kono
parents:
diff changeset
1045 gsi_next (&gsi);
kono
parents:
diff changeset
1046 while (gsi_end_p (gsi))
kono
parents:
diff changeset
1047 gsi = gsi_start_bb (single_succ (gsi_bb (gsi)));
kono
parents:
diff changeset
1048 }
kono
parents:
diff changeset
1049 }
kono
parents:
diff changeset
1050
kono
parents:
diff changeset
1051 /* Process the discovered OpenACC loops, setting the correct
kono
parents:
diff changeset
1052 partitioning level etc. */
kono
parents:
diff changeset
1053
kono
parents:
diff changeset
1054 static void
kono
parents:
diff changeset
1055 oacc_loop_process (oacc_loop *loop)
kono
parents:
diff changeset
1056 {
kono
parents:
diff changeset
1057 if (loop->child)
kono
parents:
diff changeset
1058 oacc_loop_process (loop->child);
kono
parents:
diff changeset
1059
kono
parents:
diff changeset
1060 if (loop->mask && !loop->routine)
kono
parents:
diff changeset
1061 {
kono
parents:
diff changeset
1062 int ix;
kono
parents:
diff changeset
1063 tree mask_arg = build_int_cst (unsigned_type_node, loop->mask);
kono
parents:
diff changeset
1064 tree e_mask_arg = build_int_cst (unsigned_type_node, loop->e_mask);
kono
parents:
diff changeset
1065 tree chunk_arg = loop->chunk_size;
kono
parents:
diff changeset
1066 gcall *call;
kono
parents:
diff changeset
1067
kono
parents:
diff changeset
1068 for (ix = 0; loop->ifns.iterate (ix, &call); ix++)
kono
parents:
diff changeset
1069 switch (gimple_call_internal_fn (call))
kono
parents:
diff changeset
1070 {
kono
parents:
diff changeset
1071 case IFN_GOACC_LOOP:
kono
parents:
diff changeset
1072 {
kono
parents:
diff changeset
1073 bool is_e = gimple_call_arg (call, 5) == integer_minus_one_node;
kono
parents:
diff changeset
1074 gimple_call_set_arg (call, 5, is_e ? e_mask_arg : mask_arg);
kono
parents:
diff changeset
1075 if (!is_e)
kono
parents:
diff changeset
1076 gimple_call_set_arg (call, 4, chunk_arg);
kono
parents:
diff changeset
1077 }
kono
parents:
diff changeset
1078 break;
kono
parents:
diff changeset
1079
kono
parents:
diff changeset
1080 case IFN_GOACC_TILE:
kono
parents:
diff changeset
1081 gimple_call_set_arg (call, 3, mask_arg);
kono
parents:
diff changeset
1082 gimple_call_set_arg (call, 4, e_mask_arg);
kono
parents:
diff changeset
1083 break;
kono
parents:
diff changeset
1084
kono
parents:
diff changeset
1085 default:
kono
parents:
diff changeset
1086 gcc_unreachable ();
kono
parents:
diff changeset
1087 }
kono
parents:
diff changeset
1088
kono
parents:
diff changeset
1089 unsigned dim = GOMP_DIM_GANG;
kono
parents:
diff changeset
1090 unsigned mask = loop->mask | loop->e_mask;
kono
parents:
diff changeset
1091 for (ix = 0; ix != GOMP_DIM_MAX && mask; ix++)
kono
parents:
diff changeset
1092 {
kono
parents:
diff changeset
1093 while (!(GOMP_DIM_MASK (dim) & mask))
kono
parents:
diff changeset
1094 dim++;
kono
parents:
diff changeset
1095
kono
parents:
diff changeset
1096 oacc_loop_xform_head_tail (loop->heads[ix], dim);
kono
parents:
diff changeset
1097 oacc_loop_xform_head_tail (loop->tails[ix], dim);
kono
parents:
diff changeset
1098
kono
parents:
diff changeset
1099 mask ^= GOMP_DIM_MASK (dim);
kono
parents:
diff changeset
1100 }
kono
parents:
diff changeset
1101 }
kono
parents:
diff changeset
1102
kono
parents:
diff changeset
1103 if (loop->sibling)
kono
parents:
diff changeset
1104 oacc_loop_process (loop->sibling);
kono
parents:
diff changeset
1105 }
kono
parents:
diff changeset
1106
kono
parents:
diff changeset
1107 /* Walk the OpenACC loop heirarchy checking and assigning the
kono
parents:
diff changeset
1108 programmer-specified partitionings. OUTER_MASK is the partitioning
kono
parents:
diff changeset
1109 this loop is contained within. Return mask of partitioning
kono
parents:
diff changeset
1110 encountered. If any auto loops are discovered, set GOMP_DIM_MAX
kono
parents:
diff changeset
1111 bit. */
kono
parents:
diff changeset
1112
kono
parents:
diff changeset
1113 static unsigned
kono
parents:
diff changeset
1114 oacc_loop_fixed_partitions (oacc_loop *loop, unsigned outer_mask)
kono
parents:
diff changeset
1115 {
kono
parents:
diff changeset
1116 unsigned this_mask = loop->mask;
kono
parents:
diff changeset
1117 unsigned mask_all = 0;
kono
parents:
diff changeset
1118 bool noisy = true;
kono
parents:
diff changeset
1119
kono
parents:
diff changeset
1120 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
1121 /* When device_type is supported, we want the device compiler to be
kono
parents:
diff changeset
1122 noisy, if the loop parameters are device_type-specific. */
kono
parents:
diff changeset
1123 noisy = false;
kono
parents:
diff changeset
1124 #endif
kono
parents:
diff changeset
1125
kono
parents:
diff changeset
1126 if (!loop->routine)
kono
parents:
diff changeset
1127 {
kono
parents:
diff changeset
1128 bool auto_par = (loop->flags & OLF_AUTO) != 0;
kono
parents:
diff changeset
1129 bool seq_par = (loop->flags & OLF_SEQ) != 0;
kono
parents:
diff changeset
1130 bool tiling = (loop->flags & OLF_TILE) != 0;
kono
parents:
diff changeset
1131
kono
parents:
diff changeset
1132 this_mask = ((loop->flags >> OLF_DIM_BASE)
kono
parents:
diff changeset
1133 & (GOMP_DIM_MASK (GOMP_DIM_MAX) - 1));
kono
parents:
diff changeset
1134
kono
parents:
diff changeset
1135 /* Apply auto partitioning if this is a non-partitioned regular
kono
parents:
diff changeset
1136 loop, or (no more than) single axis tiled loop. */
kono
parents:
diff changeset
1137 bool maybe_auto
kono
parents:
diff changeset
1138 = !seq_par && this_mask == (tiling ? this_mask & -this_mask : 0);
kono
parents:
diff changeset
1139
kono
parents:
diff changeset
1140 if ((this_mask != 0) + auto_par + seq_par > 1)
kono
parents:
diff changeset
1141 {
kono
parents:
diff changeset
1142 if (noisy)
kono
parents:
diff changeset
1143 error_at (loop->loc,
kono
parents:
diff changeset
1144 seq_par
kono
parents:
diff changeset
1145 ? G_("%<seq%> overrides other OpenACC loop specifiers")
kono
parents:
diff changeset
1146 : G_("%<auto%> conflicts with other OpenACC loop "
kono
parents:
diff changeset
1147 "specifiers"));
kono
parents:
diff changeset
1148 maybe_auto = false;
kono
parents:
diff changeset
1149 loop->flags &= ~OLF_AUTO;
kono
parents:
diff changeset
1150 if (seq_par)
kono
parents:
diff changeset
1151 {
kono
parents:
diff changeset
1152 loop->flags
kono
parents:
diff changeset
1153 &= ~((GOMP_DIM_MASK (GOMP_DIM_MAX) - 1) << OLF_DIM_BASE);
kono
parents:
diff changeset
1154 this_mask = 0;
kono
parents:
diff changeset
1155 }
kono
parents:
diff changeset
1156 }
kono
parents:
diff changeset
1157
kono
parents:
diff changeset
1158 if (maybe_auto && (loop->flags & OLF_INDEPENDENT))
kono
parents:
diff changeset
1159 {
kono
parents:
diff changeset
1160 loop->flags |= OLF_AUTO;
kono
parents:
diff changeset
1161 mask_all |= GOMP_DIM_MASK (GOMP_DIM_MAX);
kono
parents:
diff changeset
1162 }
kono
parents:
diff changeset
1163 }
kono
parents:
diff changeset
1164
kono
parents:
diff changeset
1165 if (this_mask & outer_mask)
kono
parents:
diff changeset
1166 {
kono
parents:
diff changeset
1167 const oacc_loop *outer;
kono
parents:
diff changeset
1168 for (outer = loop->parent; outer; outer = outer->parent)
kono
parents:
diff changeset
1169 if ((outer->mask | outer->e_mask) & this_mask)
kono
parents:
diff changeset
1170 break;
kono
parents:
diff changeset
1171
kono
parents:
diff changeset
1172 if (noisy)
kono
parents:
diff changeset
1173 {
kono
parents:
diff changeset
1174 if (outer)
kono
parents:
diff changeset
1175 {
kono
parents:
diff changeset
1176 error_at (loop->loc,
kono
parents:
diff changeset
1177 loop->routine
kono
parents:
diff changeset
1178 ? G_("routine call uses same OpenACC parallelism"
kono
parents:
diff changeset
1179 " as containing loop")
kono
parents:
diff changeset
1180 : G_("inner loop uses same OpenACC parallelism"
kono
parents:
diff changeset
1181 " as containing loop"));
kono
parents:
diff changeset
1182 inform (outer->loc, "containing loop here");
kono
parents:
diff changeset
1183 }
kono
parents:
diff changeset
1184 else
kono
parents:
diff changeset
1185 error_at (loop->loc,
kono
parents:
diff changeset
1186 loop->routine
kono
parents:
diff changeset
1187 ? G_("routine call uses OpenACC parallelism disallowed"
kono
parents:
diff changeset
1188 " by containing routine")
kono
parents:
diff changeset
1189 : G_("loop uses OpenACC parallelism disallowed"
kono
parents:
diff changeset
1190 " by containing routine"));
kono
parents:
diff changeset
1191
kono
parents:
diff changeset
1192 if (loop->routine)
kono
parents:
diff changeset
1193 inform (DECL_SOURCE_LOCATION (loop->routine),
kono
parents:
diff changeset
1194 "routine %qD declared here", loop->routine);
kono
parents:
diff changeset
1195 }
kono
parents:
diff changeset
1196 this_mask &= ~outer_mask;
kono
parents:
diff changeset
1197 }
kono
parents:
diff changeset
1198 else
kono
parents:
diff changeset
1199 {
kono
parents:
diff changeset
1200 unsigned outermost = least_bit_hwi (this_mask);
kono
parents:
diff changeset
1201
kono
parents:
diff changeset
1202 if (outermost && outermost <= outer_mask)
kono
parents:
diff changeset
1203 {
kono
parents:
diff changeset
1204 if (noisy)
kono
parents:
diff changeset
1205 {
kono
parents:
diff changeset
1206 error_at (loop->loc,
kono
parents:
diff changeset
1207 "incorrectly nested OpenACC loop parallelism");
kono
parents:
diff changeset
1208
kono
parents:
diff changeset
1209 const oacc_loop *outer;
kono
parents:
diff changeset
1210 for (outer = loop->parent;
kono
parents:
diff changeset
1211 outer->flags && outer->flags < outermost;
kono
parents:
diff changeset
1212 outer = outer->parent)
kono
parents:
diff changeset
1213 continue;
kono
parents:
diff changeset
1214 inform (outer->loc, "containing loop here");
kono
parents:
diff changeset
1215 }
kono
parents:
diff changeset
1216
kono
parents:
diff changeset
1217 this_mask &= ~outermost;
kono
parents:
diff changeset
1218 }
kono
parents:
diff changeset
1219 }
kono
parents:
diff changeset
1220
kono
parents:
diff changeset
1221 mask_all |= this_mask;
kono
parents:
diff changeset
1222
kono
parents:
diff changeset
1223 if (loop->flags & OLF_TILE)
kono
parents:
diff changeset
1224 {
kono
parents:
diff changeset
1225 /* When tiling, vector goes to the element loop, and failing
kono
parents:
diff changeset
1226 that we put worker there. The std doesn't contemplate
kono
parents:
diff changeset
1227 specifying all three. We choose to put worker and vector on
kono
parents:
diff changeset
1228 the element loops in that case. */
kono
parents:
diff changeset
1229 unsigned this_e_mask = this_mask & GOMP_DIM_MASK (GOMP_DIM_VECTOR);
kono
parents:
diff changeset
1230 if (!this_e_mask || this_mask & GOMP_DIM_MASK (GOMP_DIM_GANG))
kono
parents:
diff changeset
1231 this_e_mask |= this_mask & GOMP_DIM_MASK (GOMP_DIM_WORKER);
kono
parents:
diff changeset
1232
kono
parents:
diff changeset
1233 loop->e_mask = this_e_mask;
kono
parents:
diff changeset
1234 this_mask ^= this_e_mask;
kono
parents:
diff changeset
1235 }
kono
parents:
diff changeset
1236
kono
parents:
diff changeset
1237 loop->mask = this_mask;
kono
parents:
diff changeset
1238
kono
parents:
diff changeset
1239 if (dump_file)
kono
parents:
diff changeset
1240 fprintf (dump_file, "Loop %s:%d user specified %d & %d\n",
kono
parents:
diff changeset
1241 LOCATION_FILE (loop->loc), LOCATION_LINE (loop->loc),
kono
parents:
diff changeset
1242 loop->mask, loop->e_mask);
kono
parents:
diff changeset
1243
kono
parents:
diff changeset
1244 if (loop->child)
kono
parents:
diff changeset
1245 {
kono
parents:
diff changeset
1246 unsigned tmp_mask = outer_mask | this_mask | loop->e_mask;
kono
parents:
diff changeset
1247 loop->inner = oacc_loop_fixed_partitions (loop->child, tmp_mask);
kono
parents:
diff changeset
1248 mask_all |= loop->inner;
kono
parents:
diff changeset
1249 }
kono
parents:
diff changeset
1250
kono
parents:
diff changeset
1251 if (loop->sibling)
kono
parents:
diff changeset
1252 mask_all |= oacc_loop_fixed_partitions (loop->sibling, outer_mask);
kono
parents:
diff changeset
1253
kono
parents:
diff changeset
1254 return mask_all;
kono
parents:
diff changeset
1255 }
kono
parents:
diff changeset
1256
kono
parents:
diff changeset
1257 /* Walk the OpenACC loop heirarchy to assign auto-partitioned loops.
kono
parents:
diff changeset
1258 OUTER_MASK is the partitioning this loop is contained within.
kono
parents:
diff changeset
1259 OUTER_ASSIGN is true if an outer loop is being auto-partitioned.
kono
parents:
diff changeset
1260 Return the cumulative partitioning used by this loop, siblings and
kono
parents:
diff changeset
1261 children. */
kono
parents:
diff changeset
1262
kono
parents:
diff changeset
1263 static unsigned
kono
parents:
diff changeset
1264 oacc_loop_auto_partitions (oacc_loop *loop, unsigned outer_mask,
kono
parents:
diff changeset
1265 bool outer_assign)
kono
parents:
diff changeset
1266 {
kono
parents:
diff changeset
1267 bool assign = (loop->flags & OLF_AUTO) && (loop->flags & OLF_INDEPENDENT);
kono
parents:
diff changeset
1268 bool noisy = true;
kono
parents:
diff changeset
1269 bool tiling = loop->flags & OLF_TILE;
kono
parents:
diff changeset
1270
kono
parents:
diff changeset
1271 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
1272 /* When device_type is supported, we want the device compiler to be
kono
parents:
diff changeset
1273 noisy, if the loop parameters are device_type-specific. */
kono
parents:
diff changeset
1274 noisy = false;
kono
parents:
diff changeset
1275 #endif
kono
parents:
diff changeset
1276
kono
parents:
diff changeset
1277 if (assign && (!outer_assign || loop->inner))
kono
parents:
diff changeset
1278 {
kono
parents:
diff changeset
1279 /* Allocate outermost and non-innermost loops at the outermost
kono
parents:
diff changeset
1280 non-innermost available level. */
kono
parents:
diff changeset
1281 unsigned this_mask = GOMP_DIM_MASK (GOMP_DIM_GANG);
kono
parents:
diff changeset
1282
kono
parents:
diff changeset
1283 /* Find the first outermost available partition. */
kono
parents:
diff changeset
1284 while (this_mask <= outer_mask)
kono
parents:
diff changeset
1285 this_mask <<= 1;
kono
parents:
diff changeset
1286
kono
parents:
diff changeset
1287 /* Grab two axes if tiling, and we've not assigned anything */
kono
parents:
diff changeset
1288 if (tiling && !(loop->mask | loop->e_mask))
kono
parents:
diff changeset
1289 this_mask |= this_mask << 1;
kono
parents:
diff changeset
1290
kono
parents:
diff changeset
1291 /* Prohibit the innermost partitioning at the moment. */
kono
parents:
diff changeset
1292 this_mask &= GOMP_DIM_MASK (GOMP_DIM_MAX - 1) - 1;
kono
parents:
diff changeset
1293
kono
parents:
diff changeset
1294 /* Don't use any dimension explicitly claimed by an inner loop. */
kono
parents:
diff changeset
1295 this_mask &= ~loop->inner;
kono
parents:
diff changeset
1296
kono
parents:
diff changeset
1297 if (tiling && !loop->e_mask)
kono
parents:
diff changeset
1298 {
kono
parents:
diff changeset
1299 /* If we got two axes, allocate the inner one to the element
kono
parents:
diff changeset
1300 loop. */
kono
parents:
diff changeset
1301 loop->e_mask = this_mask & (this_mask << 1);
kono
parents:
diff changeset
1302 this_mask ^= loop->e_mask;
kono
parents:
diff changeset
1303 }
kono
parents:
diff changeset
1304
kono
parents:
diff changeset
1305 loop->mask |= this_mask;
kono
parents:
diff changeset
1306 }
kono
parents:
diff changeset
1307
kono
parents:
diff changeset
1308 if (loop->child)
kono
parents:
diff changeset
1309 {
kono
parents:
diff changeset
1310 unsigned tmp_mask = outer_mask | loop->mask | loop->e_mask;
kono
parents:
diff changeset
1311 loop->inner = oacc_loop_auto_partitions (loop->child, tmp_mask,
kono
parents:
diff changeset
1312 outer_assign | assign);
kono
parents:
diff changeset
1313 }
kono
parents:
diff changeset
1314
kono
parents:
diff changeset
1315 if (assign && (!loop->mask || (tiling && !loop->e_mask) || !outer_assign))
kono
parents:
diff changeset
1316 {
kono
parents:
diff changeset
1317 /* Allocate the loop at the innermost available level. Note
kono
parents:
diff changeset
1318 that we do this even if we already assigned this loop the
kono
parents:
diff changeset
1319 outermost available level above. That way we'll partition
kono
parents:
diff changeset
1320 this along 2 axes, if they are available. */
kono
parents:
diff changeset
1321 unsigned this_mask = 0;
kono
parents:
diff changeset
1322
kono
parents:
diff changeset
1323 /* Determine the outermost partitioning used within this loop. */
kono
parents:
diff changeset
1324 this_mask = loop->inner | GOMP_DIM_MASK (GOMP_DIM_MAX);
kono
parents:
diff changeset
1325 this_mask = least_bit_hwi (this_mask);
kono
parents:
diff changeset
1326
kono
parents:
diff changeset
1327 /* Pick the partitioning just inside that one. */
kono
parents:
diff changeset
1328 this_mask >>= 1;
kono
parents:
diff changeset
1329
kono
parents:
diff changeset
1330 /* And avoid picking one use by an outer loop. */
kono
parents:
diff changeset
1331 this_mask &= ~outer_mask;
kono
parents:
diff changeset
1332
kono
parents:
diff changeset
1333 /* If tiling and we failed completely above, grab the next one
kono
parents:
diff changeset
1334 too. Making sure it doesn't hit an outer loop. */
kono
parents:
diff changeset
1335 if (tiling)
kono
parents:
diff changeset
1336 {
kono
parents:
diff changeset
1337 this_mask &= ~(loop->e_mask | loop->mask);
kono
parents:
diff changeset
1338 unsigned tile_mask = ((this_mask >> 1)
kono
parents:
diff changeset
1339 & ~(outer_mask | loop->e_mask | loop->mask));
kono
parents:
diff changeset
1340
kono
parents:
diff changeset
1341 if (tile_mask || loop->mask)
kono
parents:
diff changeset
1342 {
kono
parents:
diff changeset
1343 loop->e_mask |= this_mask;
kono
parents:
diff changeset
1344 this_mask = tile_mask;
kono
parents:
diff changeset
1345 }
kono
parents:
diff changeset
1346 if (!loop->e_mask && noisy)
kono
parents:
diff changeset
1347 warning_at (loop->loc, 0,
kono
parents:
diff changeset
1348 "insufficient partitioning available"
kono
parents:
diff changeset
1349 " to parallelize element loop");
kono
parents:
diff changeset
1350 }
kono
parents:
diff changeset
1351
kono
parents:
diff changeset
1352 loop->mask |= this_mask;
kono
parents:
diff changeset
1353 if (!loop->mask && noisy)
kono
parents:
diff changeset
1354 warning_at (loop->loc, 0,
kono
parents:
diff changeset
1355 tiling
kono
parents:
diff changeset
1356 ? G_("insufficient partitioning available"
kono
parents:
diff changeset
1357 " to parallelize tile loop")
kono
parents:
diff changeset
1358 : G_("insufficient partitioning available"
kono
parents:
diff changeset
1359 " to parallelize loop"));
kono
parents:
diff changeset
1360 }
kono
parents:
diff changeset
1361
kono
parents:
diff changeset
1362 if (assign && dump_file)
kono
parents:
diff changeset
1363 fprintf (dump_file, "Auto loop %s:%d assigned %d & %d\n",
kono
parents:
diff changeset
1364 LOCATION_FILE (loop->loc), LOCATION_LINE (loop->loc),
kono
parents:
diff changeset
1365 loop->mask, loop->e_mask);
kono
parents:
diff changeset
1366
kono
parents:
diff changeset
1367 unsigned inner_mask = 0;
kono
parents:
diff changeset
1368
kono
parents:
diff changeset
1369 if (loop->sibling)
kono
parents:
diff changeset
1370 inner_mask |= oacc_loop_auto_partitions (loop->sibling,
kono
parents:
diff changeset
1371 outer_mask, outer_assign);
kono
parents:
diff changeset
1372
kono
parents:
diff changeset
1373 inner_mask |= loop->inner | loop->mask | loop->e_mask;
kono
parents:
diff changeset
1374
kono
parents:
diff changeset
1375 return inner_mask;
kono
parents:
diff changeset
1376 }
kono
parents:
diff changeset
1377
kono
parents:
diff changeset
1378 /* Walk the OpenACC loop heirarchy to check and assign partitioning
kono
parents:
diff changeset
1379 axes. Return mask of partitioning. */
kono
parents:
diff changeset
1380
kono
parents:
diff changeset
1381 static unsigned
kono
parents:
diff changeset
1382 oacc_loop_partition (oacc_loop *loop, unsigned outer_mask)
kono
parents:
diff changeset
1383 {
kono
parents:
diff changeset
1384 unsigned mask_all = oacc_loop_fixed_partitions (loop, outer_mask);
kono
parents:
diff changeset
1385
kono
parents:
diff changeset
1386 if (mask_all & GOMP_DIM_MASK (GOMP_DIM_MAX))
kono
parents:
diff changeset
1387 {
kono
parents:
diff changeset
1388 mask_all ^= GOMP_DIM_MASK (GOMP_DIM_MAX);
kono
parents:
diff changeset
1389 mask_all |= oacc_loop_auto_partitions (loop, outer_mask, false);
kono
parents:
diff changeset
1390 }
kono
parents:
diff changeset
1391 return mask_all;
kono
parents:
diff changeset
1392 }
kono
parents:
diff changeset
1393
kono
parents:
diff changeset
1394 /* Default fork/join early expander. Delete the function calls if
kono
parents:
diff changeset
1395 there is no RTL expander. */
kono
parents:
diff changeset
1396
kono
parents:
diff changeset
1397 bool
kono
parents:
diff changeset
1398 default_goacc_fork_join (gcall *ARG_UNUSED (call),
kono
parents:
diff changeset
1399 const int *ARG_UNUSED (dims), bool is_fork)
kono
parents:
diff changeset
1400 {
kono
parents:
diff changeset
1401 if (is_fork)
kono
parents:
diff changeset
1402 return targetm.have_oacc_fork ();
kono
parents:
diff changeset
1403 else
kono
parents:
diff changeset
1404 return targetm.have_oacc_join ();
kono
parents:
diff changeset
1405 }
kono
parents:
diff changeset
1406
kono
parents:
diff changeset
1407 /* Default goacc.reduction early expander.
kono
parents:
diff changeset
1408
kono
parents:
diff changeset
1409 LHS-opt = IFN_REDUCTION (KIND, RES_PTR, VAR, LEVEL, OP, OFFSET)
kono
parents:
diff changeset
1410 If RES_PTR is not integer-zerop:
kono
parents:
diff changeset
1411 SETUP - emit 'LHS = *RES_PTR', LHS = NULL
kono
parents:
diff changeset
1412 TEARDOWN - emit '*RES_PTR = VAR'
kono
parents:
diff changeset
1413 If LHS is not NULL
kono
parents:
diff changeset
1414 emit 'LHS = VAR' */
kono
parents:
diff changeset
1415
kono
parents:
diff changeset
1416 void
kono
parents:
diff changeset
1417 default_goacc_reduction (gcall *call)
kono
parents:
diff changeset
1418 {
kono
parents:
diff changeset
1419 unsigned code = (unsigned)TREE_INT_CST_LOW (gimple_call_arg (call, 0));
kono
parents:
diff changeset
1420 gimple_stmt_iterator gsi = gsi_for_stmt (call);
kono
parents:
diff changeset
1421 tree lhs = gimple_call_lhs (call);
kono
parents:
diff changeset
1422 tree var = gimple_call_arg (call, 2);
kono
parents:
diff changeset
1423 gimple_seq seq = NULL;
kono
parents:
diff changeset
1424
kono
parents:
diff changeset
1425 if (code == IFN_GOACC_REDUCTION_SETUP
kono
parents:
diff changeset
1426 || code == IFN_GOACC_REDUCTION_TEARDOWN)
kono
parents:
diff changeset
1427 {
kono
parents:
diff changeset
1428 /* Setup and Teardown need to copy from/to the receiver object,
kono
parents:
diff changeset
1429 if there is one. */
kono
parents:
diff changeset
1430 tree ref_to_res = gimple_call_arg (call, 1);
kono
parents:
diff changeset
1431
kono
parents:
diff changeset
1432 if (!integer_zerop (ref_to_res))
kono
parents:
diff changeset
1433 {
kono
parents:
diff changeset
1434 tree dst = build_simple_mem_ref (ref_to_res);
kono
parents:
diff changeset
1435 tree src = var;
kono
parents:
diff changeset
1436
kono
parents:
diff changeset
1437 if (code == IFN_GOACC_REDUCTION_SETUP)
kono
parents:
diff changeset
1438 {
kono
parents:
diff changeset
1439 src = dst;
kono
parents:
diff changeset
1440 dst = lhs;
kono
parents:
diff changeset
1441 lhs = NULL;
kono
parents:
diff changeset
1442 }
kono
parents:
diff changeset
1443 gimple_seq_add_stmt (&seq, gimple_build_assign (dst, src));
kono
parents:
diff changeset
1444 }
kono
parents:
diff changeset
1445 }
kono
parents:
diff changeset
1446
kono
parents:
diff changeset
1447 /* Copy VAR to LHS, if there is an LHS. */
kono
parents:
diff changeset
1448 if (lhs)
kono
parents:
diff changeset
1449 gimple_seq_add_stmt (&seq, gimple_build_assign (lhs, var));
kono
parents:
diff changeset
1450
kono
parents:
diff changeset
1451 gsi_replace_with_seq (&gsi, seq, true);
kono
parents:
diff changeset
1452 }
kono
parents:
diff changeset
1453
kono
parents:
diff changeset
1454 /* Main entry point for oacc transformations which run on the device
kono
parents:
diff changeset
1455 compiler after LTO, so we know what the target device is at this
kono
parents:
diff changeset
1456 point (including the host fallback). */
kono
parents:
diff changeset
1457
kono
parents:
diff changeset
1458 static unsigned int
kono
parents:
diff changeset
1459 execute_oacc_device_lower ()
kono
parents:
diff changeset
1460 {
kono
parents:
diff changeset
1461 tree attrs = oacc_get_fn_attrib (current_function_decl);
kono
parents:
diff changeset
1462
kono
parents:
diff changeset
1463 if (!attrs)
kono
parents:
diff changeset
1464 /* Not an offloaded function. */
kono
parents:
diff changeset
1465 return 0;
kono
parents:
diff changeset
1466
kono
parents:
diff changeset
1467 /* Parse the default dim argument exactly once. */
kono
parents:
diff changeset
1468 if ((const void *)flag_openacc_dims != &flag_openacc_dims)
kono
parents:
diff changeset
1469 {
kono
parents:
diff changeset
1470 oacc_parse_default_dims (flag_openacc_dims);
kono
parents:
diff changeset
1471 flag_openacc_dims = (char *)&flag_openacc_dims;
kono
parents:
diff changeset
1472 }
kono
parents:
diff changeset
1473
kono
parents:
diff changeset
1474 bool is_oacc_kernels
kono
parents:
diff changeset
1475 = (lookup_attribute ("oacc kernels",
kono
parents:
diff changeset
1476 DECL_ATTRIBUTES (current_function_decl)) != NULL);
kono
parents:
diff changeset
1477 bool is_oacc_kernels_parallelized
kono
parents:
diff changeset
1478 = (lookup_attribute ("oacc kernels parallelized",
kono
parents:
diff changeset
1479 DECL_ATTRIBUTES (current_function_decl)) != NULL);
kono
parents:
diff changeset
1480
kono
parents:
diff changeset
1481 /* Unparallelized OpenACC kernels constructs must get launched as 1 x 1 x 1
kono
parents:
diff changeset
1482 kernels, so remove the parallelism dimensions function attributes
kono
parents:
diff changeset
1483 potentially set earlier on. */
kono
parents:
diff changeset
1484 if (is_oacc_kernels && !is_oacc_kernels_parallelized)
kono
parents:
diff changeset
1485 {
kono
parents:
diff changeset
1486 oacc_set_fn_attrib (current_function_decl, NULL, NULL);
kono
parents:
diff changeset
1487 attrs = oacc_get_fn_attrib (current_function_decl);
kono
parents:
diff changeset
1488 }
kono
parents:
diff changeset
1489
kono
parents:
diff changeset
1490 /* Discover, partition and process the loops. */
kono
parents:
diff changeset
1491 oacc_loop *loops = oacc_loop_discovery ();
kono
parents:
diff changeset
1492 int fn_level = oacc_fn_attrib_level (attrs);
kono
parents:
diff changeset
1493
kono
parents:
diff changeset
1494 if (dump_file)
kono
parents:
diff changeset
1495 {
kono
parents:
diff changeset
1496 if (fn_level >= 0)
kono
parents:
diff changeset
1497 fprintf (dump_file, "Function is OpenACC routine level %d\n",
kono
parents:
diff changeset
1498 fn_level);
kono
parents:
diff changeset
1499 else if (is_oacc_kernels)
kono
parents:
diff changeset
1500 fprintf (dump_file, "Function is %s OpenACC kernels offload\n",
kono
parents:
diff changeset
1501 (is_oacc_kernels_parallelized
kono
parents:
diff changeset
1502 ? "parallelized" : "unparallelized"));
kono
parents:
diff changeset
1503 else
kono
parents:
diff changeset
1504 fprintf (dump_file, "Function is OpenACC parallel offload\n");
kono
parents:
diff changeset
1505 }
kono
parents:
diff changeset
1506
kono
parents:
diff changeset
1507 unsigned outer_mask = fn_level >= 0 ? GOMP_DIM_MASK (fn_level) - 1 : 0;
kono
parents:
diff changeset
1508 unsigned used_mask = oacc_loop_partition (loops, outer_mask);
kono
parents:
diff changeset
1509 /* OpenACC kernels constructs are special: they currently don't use the
kono
parents:
diff changeset
1510 generic oacc_loop infrastructure and attribute/dimension processing. */
kono
parents:
diff changeset
1511 if (is_oacc_kernels && is_oacc_kernels_parallelized)
kono
parents:
diff changeset
1512 {
kono
parents:
diff changeset
1513 /* Parallelized OpenACC kernels constructs use gang parallelism. See
kono
parents:
diff changeset
1514 also tree-parloops.c:create_parallel_loop. */
kono
parents:
diff changeset
1515 used_mask |= GOMP_DIM_MASK (GOMP_DIM_GANG);
kono
parents:
diff changeset
1516 }
kono
parents:
diff changeset
1517
kono
parents:
diff changeset
1518 int dims[GOMP_DIM_MAX];
kono
parents:
diff changeset
1519 oacc_validate_dims (current_function_decl, attrs, dims, fn_level, used_mask);
kono
parents:
diff changeset
1520
kono
parents:
diff changeset
1521 if (dump_file)
kono
parents:
diff changeset
1522 {
kono
parents:
diff changeset
1523 const char *comma = "Compute dimensions [";
kono
parents:
diff changeset
1524 for (int ix = 0; ix != GOMP_DIM_MAX; ix++, comma = ", ")
kono
parents:
diff changeset
1525 fprintf (dump_file, "%s%d", comma, dims[ix]);
kono
parents:
diff changeset
1526 fprintf (dump_file, "]\n");
kono
parents:
diff changeset
1527 }
kono
parents:
diff changeset
1528
kono
parents:
diff changeset
1529 oacc_loop_process (loops);
kono
parents:
diff changeset
1530 if (dump_file)
kono
parents:
diff changeset
1531 {
kono
parents:
diff changeset
1532 fprintf (dump_file, "OpenACC loops\n");
kono
parents:
diff changeset
1533 dump_oacc_loop (dump_file, loops, 0);
kono
parents:
diff changeset
1534 fprintf (dump_file, "\n");
kono
parents:
diff changeset
1535 }
kono
parents:
diff changeset
1536
kono
parents:
diff changeset
1537 /* Offloaded targets may introduce new basic blocks, which require
kono
parents:
diff changeset
1538 dominance information to update SSA. */
kono
parents:
diff changeset
1539 calculate_dominance_info (CDI_DOMINATORS);
kono
parents:
diff changeset
1540
kono
parents:
diff changeset
1541 /* Now lower internal loop functions to target-specific code
kono
parents:
diff changeset
1542 sequences. */
kono
parents:
diff changeset
1543 basic_block bb;
kono
parents:
diff changeset
1544 FOR_ALL_BB_FN (bb, cfun)
kono
parents:
diff changeset
1545 for (gimple_stmt_iterator gsi = gsi_start_bb (bb); !gsi_end_p (gsi);)
kono
parents:
diff changeset
1546 {
kono
parents:
diff changeset
1547 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
1548 if (!is_gimple_call (stmt))
kono
parents:
diff changeset
1549 {
kono
parents:
diff changeset
1550 gsi_next (&gsi);
kono
parents:
diff changeset
1551 continue;
kono
parents:
diff changeset
1552 }
kono
parents:
diff changeset
1553
kono
parents:
diff changeset
1554 gcall *call = as_a <gcall *> (stmt);
kono
parents:
diff changeset
1555 if (!gimple_call_internal_p (call))
kono
parents:
diff changeset
1556 {
kono
parents:
diff changeset
1557 gsi_next (&gsi);
kono
parents:
diff changeset
1558 continue;
kono
parents:
diff changeset
1559 }
kono
parents:
diff changeset
1560
kono
parents:
diff changeset
1561 /* Rewind to allow rescan. */
kono
parents:
diff changeset
1562 gsi_prev (&gsi);
kono
parents:
diff changeset
1563 bool rescan = false, remove = false;
kono
parents:
diff changeset
1564 enum internal_fn ifn_code = gimple_call_internal_fn (call);
kono
parents:
diff changeset
1565
kono
parents:
diff changeset
1566 switch (ifn_code)
kono
parents:
diff changeset
1567 {
kono
parents:
diff changeset
1568 default: break;
kono
parents:
diff changeset
1569
kono
parents:
diff changeset
1570 case IFN_GOACC_TILE:
kono
parents:
diff changeset
1571 oacc_xform_tile (call);
kono
parents:
diff changeset
1572 rescan = true;
kono
parents:
diff changeset
1573 break;
kono
parents:
diff changeset
1574
kono
parents:
diff changeset
1575 case IFN_GOACC_LOOP:
kono
parents:
diff changeset
1576 oacc_xform_loop (call);
kono
parents:
diff changeset
1577 rescan = true;
kono
parents:
diff changeset
1578 break;
kono
parents:
diff changeset
1579
kono
parents:
diff changeset
1580 case IFN_GOACC_REDUCTION:
kono
parents:
diff changeset
1581 /* Mark the function for SSA renaming. */
kono
parents:
diff changeset
1582 mark_virtual_operands_for_renaming (cfun);
kono
parents:
diff changeset
1583
kono
parents:
diff changeset
1584 /* If the level is -1, this ended up being an unused
kono
parents:
diff changeset
1585 axis. Handle as a default. */
kono
parents:
diff changeset
1586 if (integer_minus_onep (gimple_call_arg (call, 3)))
kono
parents:
diff changeset
1587 default_goacc_reduction (call);
kono
parents:
diff changeset
1588 else
kono
parents:
diff changeset
1589 targetm.goacc.reduction (call);
kono
parents:
diff changeset
1590 rescan = true;
kono
parents:
diff changeset
1591 break;
kono
parents:
diff changeset
1592
kono
parents:
diff changeset
1593 case IFN_UNIQUE:
kono
parents:
diff changeset
1594 {
kono
parents:
diff changeset
1595 enum ifn_unique_kind kind
kono
parents:
diff changeset
1596 = ((enum ifn_unique_kind)
kono
parents:
diff changeset
1597 TREE_INT_CST_LOW (gimple_call_arg (call, 0)));
kono
parents:
diff changeset
1598
kono
parents:
diff changeset
1599 switch (kind)
kono
parents:
diff changeset
1600 {
kono
parents:
diff changeset
1601 default:
kono
parents:
diff changeset
1602 break;
kono
parents:
diff changeset
1603
kono
parents:
diff changeset
1604 case IFN_UNIQUE_OACC_FORK:
kono
parents:
diff changeset
1605 case IFN_UNIQUE_OACC_JOIN:
kono
parents:
diff changeset
1606 if (integer_minus_onep (gimple_call_arg (call, 2)))
kono
parents:
diff changeset
1607 remove = true;
kono
parents:
diff changeset
1608 else if (!targetm.goacc.fork_join
kono
parents:
diff changeset
1609 (call, dims, kind == IFN_UNIQUE_OACC_FORK))
kono
parents:
diff changeset
1610 remove = true;
kono
parents:
diff changeset
1611 break;
kono
parents:
diff changeset
1612
kono
parents:
diff changeset
1613 case IFN_UNIQUE_OACC_HEAD_MARK:
kono
parents:
diff changeset
1614 case IFN_UNIQUE_OACC_TAIL_MARK:
kono
parents:
diff changeset
1615 remove = true;
kono
parents:
diff changeset
1616 break;
kono
parents:
diff changeset
1617 }
kono
parents:
diff changeset
1618 break;
kono
parents:
diff changeset
1619 }
kono
parents:
diff changeset
1620 }
kono
parents:
diff changeset
1621
kono
parents:
diff changeset
1622 if (gsi_end_p (gsi))
kono
parents:
diff changeset
1623 /* We rewound past the beginning of the BB. */
kono
parents:
diff changeset
1624 gsi = gsi_start_bb (bb);
kono
parents:
diff changeset
1625 else
kono
parents:
diff changeset
1626 /* Undo the rewind. */
kono
parents:
diff changeset
1627 gsi_next (&gsi);
kono
parents:
diff changeset
1628
kono
parents:
diff changeset
1629 if (remove)
kono
parents:
diff changeset
1630 {
kono
parents:
diff changeset
1631 if (gimple_vdef (call))
kono
parents:
diff changeset
1632 replace_uses_by (gimple_vdef (call), gimple_vuse (call));
kono
parents:
diff changeset
1633 if (gimple_call_lhs (call))
kono
parents:
diff changeset
1634 {
kono
parents:
diff changeset
1635 /* Propagate the data dependency var. */
kono
parents:
diff changeset
1636 gimple *ass = gimple_build_assign (gimple_call_lhs (call),
kono
parents:
diff changeset
1637 gimple_call_arg (call, 1));
kono
parents:
diff changeset
1638 gsi_replace (&gsi, ass, false);
kono
parents:
diff changeset
1639 }
kono
parents:
diff changeset
1640 else
kono
parents:
diff changeset
1641 gsi_remove (&gsi, true);
kono
parents:
diff changeset
1642 }
kono
parents:
diff changeset
1643 else if (!rescan)
kono
parents:
diff changeset
1644 /* If not rescanning, advance over the call. */
kono
parents:
diff changeset
1645 gsi_next (&gsi);
kono
parents:
diff changeset
1646 }
kono
parents:
diff changeset
1647
kono
parents:
diff changeset
1648 free_oacc_loop (loops);
kono
parents:
diff changeset
1649
kono
parents:
diff changeset
1650 return 0;
kono
parents:
diff changeset
1651 }
kono
parents:
diff changeset
1652
kono
parents:
diff changeset
1653 /* Default launch dimension validator. Force everything to 1. A
kono
parents:
diff changeset
1654 backend that wants to provide larger dimensions must override this
kono
parents:
diff changeset
1655 hook. */
kono
parents:
diff changeset
1656
kono
parents:
diff changeset
1657 bool
kono
parents:
diff changeset
1658 default_goacc_validate_dims (tree ARG_UNUSED (decl), int *dims,
kono
parents:
diff changeset
1659 int ARG_UNUSED (fn_level))
kono
parents:
diff changeset
1660 {
kono
parents:
diff changeset
1661 bool changed = false;
kono
parents:
diff changeset
1662
kono
parents:
diff changeset
1663 for (unsigned ix = 0; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
1664 {
kono
parents:
diff changeset
1665 if (dims[ix] != 1)
kono
parents:
diff changeset
1666 {
kono
parents:
diff changeset
1667 dims[ix] = 1;
kono
parents:
diff changeset
1668 changed = true;
kono
parents:
diff changeset
1669 }
kono
parents:
diff changeset
1670 }
kono
parents:
diff changeset
1671
kono
parents:
diff changeset
1672 return changed;
kono
parents:
diff changeset
1673 }
kono
parents:
diff changeset
1674
kono
parents:
diff changeset
1675 /* Default dimension bound is unknown on accelerator and 1 on host. */
kono
parents:
diff changeset
1676
kono
parents:
diff changeset
1677 int
kono
parents:
diff changeset
1678 default_goacc_dim_limit (int ARG_UNUSED (axis))
kono
parents:
diff changeset
1679 {
kono
parents:
diff changeset
1680 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
1681 return 0;
kono
parents:
diff changeset
1682 #else
kono
parents:
diff changeset
1683 return 1;
kono
parents:
diff changeset
1684 #endif
kono
parents:
diff changeset
1685 }
kono
parents:
diff changeset
1686
kono
parents:
diff changeset
1687 namespace {
kono
parents:
diff changeset
1688
kono
parents:
diff changeset
1689 const pass_data pass_data_oacc_device_lower =
kono
parents:
diff changeset
1690 {
kono
parents:
diff changeset
1691 GIMPLE_PASS, /* type */
kono
parents:
diff changeset
1692 "oaccdevlow", /* name */
kono
parents:
diff changeset
1693 OPTGROUP_OMP, /* optinfo_flags */
kono
parents:
diff changeset
1694 TV_NONE, /* tv_id */
kono
parents:
diff changeset
1695 PROP_cfg, /* properties_required */
kono
parents:
diff changeset
1696 0 /* Possibly PROP_gimple_eomp. */, /* properties_provided */
kono
parents:
diff changeset
1697 0, /* properties_destroyed */
kono
parents:
diff changeset
1698 0, /* todo_flags_start */
kono
parents:
diff changeset
1699 TODO_update_ssa | TODO_cleanup_cfg, /* todo_flags_finish */
kono
parents:
diff changeset
1700 };
kono
parents:
diff changeset
1701
kono
parents:
diff changeset
1702 class pass_oacc_device_lower : public gimple_opt_pass
kono
parents:
diff changeset
1703 {
kono
parents:
diff changeset
1704 public:
kono
parents:
diff changeset
1705 pass_oacc_device_lower (gcc::context *ctxt)
kono
parents:
diff changeset
1706 : gimple_opt_pass (pass_data_oacc_device_lower, ctxt)
kono
parents:
diff changeset
1707 {}
kono
parents:
diff changeset
1708
kono
parents:
diff changeset
1709 /* opt_pass methods: */
kono
parents:
diff changeset
1710 virtual bool gate (function *) { return flag_openacc; };
kono
parents:
diff changeset
1711
kono
parents:
diff changeset
1712 virtual unsigned int execute (function *)
kono
parents:
diff changeset
1713 {
kono
parents:
diff changeset
1714 return execute_oacc_device_lower ();
kono
parents:
diff changeset
1715 }
kono
parents:
diff changeset
1716
kono
parents:
diff changeset
1717 }; // class pass_oacc_device_lower
kono
parents:
diff changeset
1718
kono
parents:
diff changeset
1719 } // anon namespace
kono
parents:
diff changeset
1720
kono
parents:
diff changeset
1721 gimple_opt_pass *
kono
parents:
diff changeset
1722 make_pass_oacc_device_lower (gcc::context *ctxt)
kono
parents:
diff changeset
1723 {
kono
parents:
diff changeset
1724 return new pass_oacc_device_lower (ctxt);
kono
parents:
diff changeset
1725 }
kono
parents:
diff changeset
1726
kono
parents:
diff changeset
1727
kono
parents:
diff changeset
1728 /* Rewrite GOMP_SIMT_ENTER_ALLOC call given by GSI and remove the preceding
kono
parents:
diff changeset
1729 GOMP_SIMT_ENTER call identifying the privatized variables, which are
kono
parents:
diff changeset
1730 turned to structure fields and receive a DECL_VALUE_EXPR accordingly.
kono
parents:
diff changeset
1731 Set *REGIMPLIFY to true, except if no privatized variables were seen. */
kono
parents:
diff changeset
1732
kono
parents:
diff changeset
1733 static void
kono
parents:
diff changeset
1734 ompdevlow_adjust_simt_enter (gimple_stmt_iterator *gsi, bool *regimplify)
kono
parents:
diff changeset
1735 {
kono
parents:
diff changeset
1736 gimple *alloc_stmt = gsi_stmt (*gsi);
kono
parents:
diff changeset
1737 tree simtrec = gimple_call_lhs (alloc_stmt);
kono
parents:
diff changeset
1738 tree simduid = gimple_call_arg (alloc_stmt, 0);
kono
parents:
diff changeset
1739 gimple *enter_stmt = SSA_NAME_DEF_STMT (simduid);
kono
parents:
diff changeset
1740 gcc_assert (gimple_call_internal_p (enter_stmt, IFN_GOMP_SIMT_ENTER));
kono
parents:
diff changeset
1741 tree rectype = lang_hooks.types.make_type (RECORD_TYPE);
kono
parents:
diff changeset
1742 TYPE_ARTIFICIAL (rectype) = TYPE_NAMELESS (rectype) = 1;
kono
parents:
diff changeset
1743 TREE_ADDRESSABLE (rectype) = 1;
kono
parents:
diff changeset
1744 TREE_TYPE (simtrec) = build_pointer_type (rectype);
kono
parents:
diff changeset
1745 for (unsigned i = 1; i < gimple_call_num_args (enter_stmt); i++)
kono
parents:
diff changeset
1746 {
kono
parents:
diff changeset
1747 tree *argp = gimple_call_arg_ptr (enter_stmt, i);
kono
parents:
diff changeset
1748 if (*argp == null_pointer_node)
kono
parents:
diff changeset
1749 continue;
kono
parents:
diff changeset
1750 gcc_assert (TREE_CODE (*argp) == ADDR_EXPR
kono
parents:
diff changeset
1751 && VAR_P (TREE_OPERAND (*argp, 0)));
kono
parents:
diff changeset
1752 tree var = TREE_OPERAND (*argp, 0);
kono
parents:
diff changeset
1753
kono
parents:
diff changeset
1754 tree field = build_decl (DECL_SOURCE_LOCATION (var), FIELD_DECL,
kono
parents:
diff changeset
1755 DECL_NAME (var), TREE_TYPE (var));
kono
parents:
diff changeset
1756 SET_DECL_ALIGN (field, DECL_ALIGN (var));
kono
parents:
diff changeset
1757 DECL_USER_ALIGN (field) = DECL_USER_ALIGN (var);
kono
parents:
diff changeset
1758 TREE_THIS_VOLATILE (field) = TREE_THIS_VOLATILE (var);
kono
parents:
diff changeset
1759
kono
parents:
diff changeset
1760 insert_field_into_struct (rectype, field);
kono
parents:
diff changeset
1761
kono
parents:
diff changeset
1762 tree t = build_simple_mem_ref (simtrec);
kono
parents:
diff changeset
1763 t = build3 (COMPONENT_REF, TREE_TYPE (var), t, field, NULL);
kono
parents:
diff changeset
1764 TREE_THIS_VOLATILE (t) = TREE_THIS_VOLATILE (var);
kono
parents:
diff changeset
1765 SET_DECL_VALUE_EXPR (var, t);
kono
parents:
diff changeset
1766 DECL_HAS_VALUE_EXPR_P (var) = 1;
kono
parents:
diff changeset
1767 *regimplify = true;
kono
parents:
diff changeset
1768 }
kono
parents:
diff changeset
1769 layout_type (rectype);
kono
parents:
diff changeset
1770 tree size = TYPE_SIZE_UNIT (rectype);
kono
parents:
diff changeset
1771 tree align = build_int_cst (TREE_TYPE (size), TYPE_ALIGN_UNIT (rectype));
kono
parents:
diff changeset
1772
kono
parents:
diff changeset
1773 alloc_stmt
kono
parents:
diff changeset
1774 = gimple_build_call_internal (IFN_GOMP_SIMT_ENTER_ALLOC, 2, size, align);
kono
parents:
diff changeset
1775 gimple_call_set_lhs (alloc_stmt, simtrec);
kono
parents:
diff changeset
1776 gsi_replace (gsi, alloc_stmt, false);
kono
parents:
diff changeset
1777 gimple_stmt_iterator enter_gsi = gsi_for_stmt (enter_stmt);
kono
parents:
diff changeset
1778 enter_stmt = gimple_build_assign (simduid, gimple_call_arg (enter_stmt, 0));
kono
parents:
diff changeset
1779 gsi_replace (&enter_gsi, enter_stmt, false);
kono
parents:
diff changeset
1780
kono
parents:
diff changeset
1781 use_operand_p use;
kono
parents:
diff changeset
1782 gimple *exit_stmt;
kono
parents:
diff changeset
1783 if (single_imm_use (simtrec, &use, &exit_stmt))
kono
parents:
diff changeset
1784 {
kono
parents:
diff changeset
1785 gcc_assert (gimple_call_internal_p (exit_stmt, IFN_GOMP_SIMT_EXIT));
kono
parents:
diff changeset
1786 gimple_stmt_iterator exit_gsi = gsi_for_stmt (exit_stmt);
kono
parents:
diff changeset
1787 tree clobber = build_constructor (rectype, NULL);
kono
parents:
diff changeset
1788 TREE_THIS_VOLATILE (clobber) = 1;
kono
parents:
diff changeset
1789 exit_stmt = gimple_build_assign (build_simple_mem_ref (simtrec), clobber);
kono
parents:
diff changeset
1790 gsi_insert_before (&exit_gsi, exit_stmt, GSI_SAME_STMT);
kono
parents:
diff changeset
1791 }
kono
parents:
diff changeset
1792 else
kono
parents:
diff changeset
1793 gcc_checking_assert (has_zero_uses (simtrec));
kono
parents:
diff changeset
1794 }
kono
parents:
diff changeset
1795
kono
parents:
diff changeset
1796 /* Callback for walk_gimple_stmt used to scan for SIMT-privatized variables. */
kono
parents:
diff changeset
1797
kono
parents:
diff changeset
1798 static tree
kono
parents:
diff changeset
1799 find_simtpriv_var_op (tree *tp, int *walk_subtrees, void *)
kono
parents:
diff changeset
1800 {
kono
parents:
diff changeset
1801 tree t = *tp;
kono
parents:
diff changeset
1802
kono
parents:
diff changeset
1803 if (VAR_P (t)
kono
parents:
diff changeset
1804 && DECL_HAS_VALUE_EXPR_P (t)
kono
parents:
diff changeset
1805 && lookup_attribute ("omp simt private", DECL_ATTRIBUTES (t)))
kono
parents:
diff changeset
1806 {
kono
parents:
diff changeset
1807 *walk_subtrees = 0;
kono
parents:
diff changeset
1808 return t;
kono
parents:
diff changeset
1809 }
kono
parents:
diff changeset
1810 return NULL_TREE;
kono
parents:
diff changeset
1811 }
kono
parents:
diff changeset
1812
kono
parents:
diff changeset
1813 /* Cleanup uses of SIMT placeholder internal functions: on non-SIMT targets,
kono
parents:
diff changeset
1814 VF is 1 and LANE is 0; on SIMT targets, VF is folded to a constant, and
kono
parents:
diff changeset
1815 LANE is kept to be expanded to RTL later on. Also cleanup all other SIMT
kono
parents:
diff changeset
1816 internal functions on non-SIMT targets, and likewise some SIMD internal
kono
parents:
diff changeset
1817 functions on SIMT targets. */
kono
parents:
diff changeset
1818
kono
parents:
diff changeset
1819 static unsigned int
kono
parents:
diff changeset
1820 execute_omp_device_lower ()
kono
parents:
diff changeset
1821 {
kono
parents:
diff changeset
1822 int vf = targetm.simt.vf ? targetm.simt.vf () : 1;
kono
parents:
diff changeset
1823 bool regimplify = false;
kono
parents:
diff changeset
1824 basic_block bb;
kono
parents:
diff changeset
1825 gimple_stmt_iterator gsi;
kono
parents:
diff changeset
1826 FOR_EACH_BB_FN (bb, cfun)
kono
parents:
diff changeset
1827 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
kono
parents:
diff changeset
1828 {
kono
parents:
diff changeset
1829 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
1830 if (!is_gimple_call (stmt) || !gimple_call_internal_p (stmt))
kono
parents:
diff changeset
1831 continue;
kono
parents:
diff changeset
1832 tree lhs = gimple_call_lhs (stmt), rhs = NULL_TREE;
kono
parents:
diff changeset
1833 tree type = lhs ? TREE_TYPE (lhs) : integer_type_node;
kono
parents:
diff changeset
1834 switch (gimple_call_internal_fn (stmt))
kono
parents:
diff changeset
1835 {
kono
parents:
diff changeset
1836 case IFN_GOMP_USE_SIMT:
kono
parents:
diff changeset
1837 rhs = vf == 1 ? integer_zero_node : integer_one_node;
kono
parents:
diff changeset
1838 break;
kono
parents:
diff changeset
1839 case IFN_GOMP_SIMT_ENTER:
kono
parents:
diff changeset
1840 rhs = vf == 1 ? gimple_call_arg (stmt, 0) : NULL_TREE;
kono
parents:
diff changeset
1841 goto simtreg_enter_exit;
kono
parents:
diff changeset
1842 case IFN_GOMP_SIMT_ENTER_ALLOC:
kono
parents:
diff changeset
1843 if (vf != 1)
kono
parents:
diff changeset
1844 ompdevlow_adjust_simt_enter (&gsi, &regimplify);
kono
parents:
diff changeset
1845 rhs = vf == 1 ? null_pointer_node : NULL_TREE;
kono
parents:
diff changeset
1846 goto simtreg_enter_exit;
kono
parents:
diff changeset
1847 case IFN_GOMP_SIMT_EXIT:
kono
parents:
diff changeset
1848 simtreg_enter_exit:
kono
parents:
diff changeset
1849 if (vf != 1)
kono
parents:
diff changeset
1850 continue;
kono
parents:
diff changeset
1851 unlink_stmt_vdef (stmt);
kono
parents:
diff changeset
1852 break;
kono
parents:
diff changeset
1853 case IFN_GOMP_SIMT_LANE:
kono
parents:
diff changeset
1854 case IFN_GOMP_SIMT_LAST_LANE:
kono
parents:
diff changeset
1855 rhs = vf == 1 ? build_zero_cst (type) : NULL_TREE;
kono
parents:
diff changeset
1856 break;
kono
parents:
diff changeset
1857 case IFN_GOMP_SIMT_VF:
kono
parents:
diff changeset
1858 rhs = build_int_cst (type, vf);
kono
parents:
diff changeset
1859 break;
kono
parents:
diff changeset
1860 case IFN_GOMP_SIMT_ORDERED_PRED:
kono
parents:
diff changeset
1861 rhs = vf == 1 ? integer_zero_node : NULL_TREE;
kono
parents:
diff changeset
1862 if (rhs || !lhs)
kono
parents:
diff changeset
1863 unlink_stmt_vdef (stmt);
kono
parents:
diff changeset
1864 break;
kono
parents:
diff changeset
1865 case IFN_GOMP_SIMT_VOTE_ANY:
kono
parents:
diff changeset
1866 case IFN_GOMP_SIMT_XCHG_BFLY:
kono
parents:
diff changeset
1867 case IFN_GOMP_SIMT_XCHG_IDX:
kono
parents:
diff changeset
1868 rhs = vf == 1 ? gimple_call_arg (stmt, 0) : NULL_TREE;
kono
parents:
diff changeset
1869 break;
kono
parents:
diff changeset
1870 case IFN_GOMP_SIMD_LANE:
kono
parents:
diff changeset
1871 case IFN_GOMP_SIMD_LAST_LANE:
kono
parents:
diff changeset
1872 rhs = vf != 1 ? build_zero_cst (type) : NULL_TREE;
kono
parents:
diff changeset
1873 break;
kono
parents:
diff changeset
1874 case IFN_GOMP_SIMD_VF:
kono
parents:
diff changeset
1875 rhs = vf != 1 ? build_one_cst (type) : NULL_TREE;
kono
parents:
diff changeset
1876 break;
kono
parents:
diff changeset
1877 default:
kono
parents:
diff changeset
1878 continue;
kono
parents:
diff changeset
1879 }
kono
parents:
diff changeset
1880 if (lhs && !rhs)
kono
parents:
diff changeset
1881 continue;
kono
parents:
diff changeset
1882 stmt = lhs ? gimple_build_assign (lhs, rhs) : gimple_build_nop ();
kono
parents:
diff changeset
1883 gsi_replace (&gsi, stmt, false);
kono
parents:
diff changeset
1884 }
kono
parents:
diff changeset
1885 if (regimplify)
kono
parents:
diff changeset
1886 FOR_EACH_BB_REVERSE_FN (bb, cfun)
kono
parents:
diff changeset
1887 for (gsi = gsi_last_bb (bb); !gsi_end_p (gsi); gsi_prev (&gsi))
kono
parents:
diff changeset
1888 if (walk_gimple_stmt (&gsi, NULL, find_simtpriv_var_op, NULL))
kono
parents:
diff changeset
1889 {
kono
parents:
diff changeset
1890 if (gimple_clobber_p (gsi_stmt (gsi)))
kono
parents:
diff changeset
1891 gsi_remove (&gsi, true);
kono
parents:
diff changeset
1892 else
kono
parents:
diff changeset
1893 gimple_regimplify_operands (gsi_stmt (gsi), &gsi);
kono
parents:
diff changeset
1894 }
kono
parents:
diff changeset
1895 if (vf != 1)
kono
parents:
diff changeset
1896 cfun->has_force_vectorize_loops = false;
kono
parents:
diff changeset
1897 return 0;
kono
parents:
diff changeset
1898 }
kono
parents:
diff changeset
1899
kono
parents:
diff changeset
1900 namespace {
kono
parents:
diff changeset
1901
kono
parents:
diff changeset
1902 const pass_data pass_data_omp_device_lower =
kono
parents:
diff changeset
1903 {
kono
parents:
diff changeset
1904 GIMPLE_PASS, /* type */
kono
parents:
diff changeset
1905 "ompdevlow", /* name */
kono
parents:
diff changeset
1906 OPTGROUP_OMP, /* optinfo_flags */
kono
parents:
diff changeset
1907 TV_NONE, /* tv_id */
kono
parents:
diff changeset
1908 PROP_cfg, /* properties_required */
kono
parents:
diff changeset
1909 PROP_gimple_lomp_dev, /* properties_provided */
kono
parents:
diff changeset
1910 0, /* properties_destroyed */
kono
parents:
diff changeset
1911 0, /* todo_flags_start */
kono
parents:
diff changeset
1912 TODO_update_ssa, /* todo_flags_finish */
kono
parents:
diff changeset
1913 };
kono
parents:
diff changeset
1914
kono
parents:
diff changeset
1915 class pass_omp_device_lower : public gimple_opt_pass
kono
parents:
diff changeset
1916 {
kono
parents:
diff changeset
1917 public:
kono
parents:
diff changeset
1918 pass_omp_device_lower (gcc::context *ctxt)
kono
parents:
diff changeset
1919 : gimple_opt_pass (pass_data_omp_device_lower, ctxt)
kono
parents:
diff changeset
1920 {}
kono
parents:
diff changeset
1921
kono
parents:
diff changeset
1922 /* opt_pass methods: */
kono
parents:
diff changeset
1923 virtual bool gate (function *fun)
kono
parents:
diff changeset
1924 {
kono
parents:
diff changeset
1925 return !(fun->curr_properties & PROP_gimple_lomp_dev);
kono
parents:
diff changeset
1926 }
kono
parents:
diff changeset
1927 virtual unsigned int execute (function *)
kono
parents:
diff changeset
1928 {
kono
parents:
diff changeset
1929 return execute_omp_device_lower ();
kono
parents:
diff changeset
1930 }
kono
parents:
diff changeset
1931
kono
parents:
diff changeset
1932 }; // class pass_expand_omp_ssa
kono
parents:
diff changeset
1933
kono
parents:
diff changeset
1934 } // anon namespace
kono
parents:
diff changeset
1935
kono
parents:
diff changeset
1936 gimple_opt_pass *
kono
parents:
diff changeset
1937 make_pass_omp_device_lower (gcc::context *ctxt)
kono
parents:
diff changeset
1938 {
kono
parents:
diff changeset
1939 return new pass_omp_device_lower (ctxt);
kono
parents:
diff changeset
1940 }
kono
parents:
diff changeset
1941
kono
parents:
diff changeset
1942 /* "omp declare target link" handling pass. */
kono
parents:
diff changeset
1943
kono
parents:
diff changeset
1944 namespace {
kono
parents:
diff changeset
1945
kono
parents:
diff changeset
1946 const pass_data pass_data_omp_target_link =
kono
parents:
diff changeset
1947 {
kono
parents:
diff changeset
1948 GIMPLE_PASS, /* type */
kono
parents:
diff changeset
1949 "omptargetlink", /* name */
kono
parents:
diff changeset
1950 OPTGROUP_OMP, /* optinfo_flags */
kono
parents:
diff changeset
1951 TV_NONE, /* tv_id */
kono
parents:
diff changeset
1952 PROP_ssa, /* properties_required */
kono
parents:
diff changeset
1953 0, /* properties_provided */
kono
parents:
diff changeset
1954 0, /* properties_destroyed */
kono
parents:
diff changeset
1955 0, /* todo_flags_start */
kono
parents:
diff changeset
1956 TODO_update_ssa, /* todo_flags_finish */
kono
parents:
diff changeset
1957 };
kono
parents:
diff changeset
1958
kono
parents:
diff changeset
1959 class pass_omp_target_link : public gimple_opt_pass
kono
parents:
diff changeset
1960 {
kono
parents:
diff changeset
1961 public:
kono
parents:
diff changeset
1962 pass_omp_target_link (gcc::context *ctxt)
kono
parents:
diff changeset
1963 : gimple_opt_pass (pass_data_omp_target_link, ctxt)
kono
parents:
diff changeset
1964 {}
kono
parents:
diff changeset
1965
kono
parents:
diff changeset
1966 /* opt_pass methods: */
kono
parents:
diff changeset
1967 virtual bool gate (function *fun)
kono
parents:
diff changeset
1968 {
kono
parents:
diff changeset
1969 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
1970 tree attrs = DECL_ATTRIBUTES (fun->decl);
kono
parents:
diff changeset
1971 return lookup_attribute ("omp declare target", attrs)
kono
parents:
diff changeset
1972 || lookup_attribute ("omp target entrypoint", attrs);
kono
parents:
diff changeset
1973 #else
kono
parents:
diff changeset
1974 (void) fun;
kono
parents:
diff changeset
1975 return false;
kono
parents:
diff changeset
1976 #endif
kono
parents:
diff changeset
1977 }
kono
parents:
diff changeset
1978
kono
parents:
diff changeset
1979 virtual unsigned execute (function *);
kono
parents:
diff changeset
1980 };
kono
parents:
diff changeset
1981
kono
parents:
diff changeset
1982 /* Callback for walk_gimple_stmt used to scan for link var operands. */
kono
parents:
diff changeset
1983
kono
parents:
diff changeset
1984 static tree
kono
parents:
diff changeset
1985 find_link_var_op (tree *tp, int *walk_subtrees, void *)
kono
parents:
diff changeset
1986 {
kono
parents:
diff changeset
1987 tree t = *tp;
kono
parents:
diff changeset
1988
kono
parents:
diff changeset
1989 if (VAR_P (t)
kono
parents:
diff changeset
1990 && DECL_HAS_VALUE_EXPR_P (t)
kono
parents:
diff changeset
1991 && is_global_var (t)
kono
parents:
diff changeset
1992 && lookup_attribute ("omp declare target link", DECL_ATTRIBUTES (t)))
kono
parents:
diff changeset
1993 {
kono
parents:
diff changeset
1994 *walk_subtrees = 0;
kono
parents:
diff changeset
1995 return t;
kono
parents:
diff changeset
1996 }
kono
parents:
diff changeset
1997
kono
parents:
diff changeset
1998 return NULL_TREE;
kono
parents:
diff changeset
1999 }
kono
parents:
diff changeset
2000
kono
parents:
diff changeset
2001 unsigned
kono
parents:
diff changeset
2002 pass_omp_target_link::execute (function *fun)
kono
parents:
diff changeset
2003 {
kono
parents:
diff changeset
2004 basic_block bb;
kono
parents:
diff changeset
2005 FOR_EACH_BB_FN (bb, fun)
kono
parents:
diff changeset
2006 {
kono
parents:
diff changeset
2007 gimple_stmt_iterator gsi;
kono
parents:
diff changeset
2008 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
kono
parents:
diff changeset
2009 if (walk_gimple_stmt (&gsi, NULL, find_link_var_op, NULL))
kono
parents:
diff changeset
2010 gimple_regimplify_operands (gsi_stmt (gsi), &gsi);
kono
parents:
diff changeset
2011 }
kono
parents:
diff changeset
2012
kono
parents:
diff changeset
2013 return 0;
kono
parents:
diff changeset
2014 }
kono
parents:
diff changeset
2015
kono
parents:
diff changeset
2016 } // anon namespace
kono
parents:
diff changeset
2017
kono
parents:
diff changeset
2018 gimple_opt_pass *
kono
parents:
diff changeset
2019 make_pass_omp_target_link (gcc::context *ctxt)
kono
parents:
diff changeset
2020 {
kono
parents:
diff changeset
2021 return new pass_omp_target_link (ctxt);
kono
parents:
diff changeset
2022 }