annotate gcc/omp-offload.c @ 158:494b0b89df80 default tip

...
author Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date Mon, 25 May 2020 18:13:55 +0900
parents 1830386684a0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
111
kono
parents:
diff changeset
1 /* Bits of OpenMP and OpenACC handling that is specific to device offloading
kono
parents:
diff changeset
2 and a lowering pass for OpenACC device directives.
kono
parents:
diff changeset
3
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
4 Copyright (C) 2005-2020 Free Software Foundation, Inc.
111
kono
parents:
diff changeset
5
kono
parents:
diff changeset
6 This file is part of GCC.
kono
parents:
diff changeset
7
kono
parents:
diff changeset
8 GCC is free software; you can redistribute it and/or modify it under
kono
parents:
diff changeset
9 the terms of the GNU General Public License as published by the Free
kono
parents:
diff changeset
10 Software Foundation; either version 3, or (at your option) any later
kono
parents:
diff changeset
11 version.
kono
parents:
diff changeset
12
kono
parents:
diff changeset
13 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
kono
parents:
diff changeset
14 WARRANTY; without even the implied warranty of MERCHANTABILITY or
kono
parents:
diff changeset
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
kono
parents:
diff changeset
16 for more details.
kono
parents:
diff changeset
17
kono
parents:
diff changeset
18 You should have received a copy of the GNU General Public License
kono
parents:
diff changeset
19 along with GCC; see the file COPYING3. If not see
kono
parents:
diff changeset
20 <http://www.gnu.org/licenses/>. */
kono
parents:
diff changeset
21
kono
parents:
diff changeset
22 #include "config.h"
kono
parents:
diff changeset
23 #include "system.h"
kono
parents:
diff changeset
24 #include "coretypes.h"
kono
parents:
diff changeset
25 #include "backend.h"
kono
parents:
diff changeset
26 #include "target.h"
kono
parents:
diff changeset
27 #include "tree.h"
kono
parents:
diff changeset
28 #include "gimple.h"
kono
parents:
diff changeset
29 #include "tree-pass.h"
kono
parents:
diff changeset
30 #include "ssa.h"
kono
parents:
diff changeset
31 #include "cgraph.h"
kono
parents:
diff changeset
32 #include "pretty-print.h"
kono
parents:
diff changeset
33 #include "diagnostic-core.h"
kono
parents:
diff changeset
34 #include "fold-const.h"
kono
parents:
diff changeset
35 #include "internal-fn.h"
kono
parents:
diff changeset
36 #include "langhooks.h"
kono
parents:
diff changeset
37 #include "gimplify.h"
kono
parents:
diff changeset
38 #include "gimple-iterator.h"
kono
parents:
diff changeset
39 #include "gimplify-me.h"
kono
parents:
diff changeset
40 #include "gimple-walk.h"
kono
parents:
diff changeset
41 #include "tree-cfg.h"
kono
parents:
diff changeset
42 #include "tree-into-ssa.h"
kono
parents:
diff changeset
43 #include "tree-nested.h"
kono
parents:
diff changeset
44 #include "stor-layout.h"
kono
parents:
diff changeset
45 #include "common/common-target.h"
kono
parents:
diff changeset
46 #include "omp-general.h"
kono
parents:
diff changeset
47 #include "omp-offload.h"
kono
parents:
diff changeset
48 #include "lto-section-names.h"
kono
parents:
diff changeset
49 #include "gomp-constants.h"
kono
parents:
diff changeset
50 #include "gimple-pretty-print.h"
kono
parents:
diff changeset
51 #include "intl.h"
kono
parents:
diff changeset
52 #include "stringpool.h"
kono
parents:
diff changeset
53 #include "attribs.h"
kono
parents:
diff changeset
54 #include "cfgloop.h"
kono
parents:
diff changeset
55
kono
parents:
diff changeset
56 /* Describe the OpenACC looping structure of a function. The entire
kono
parents:
diff changeset
57 function is held in a 'NULL' loop. */
kono
parents:
diff changeset
58
kono
parents:
diff changeset
59 struct oacc_loop
kono
parents:
diff changeset
60 {
kono
parents:
diff changeset
61 oacc_loop *parent; /* Containing loop. */
kono
parents:
diff changeset
62
kono
parents:
diff changeset
63 oacc_loop *child; /* First inner loop. */
kono
parents:
diff changeset
64
kono
parents:
diff changeset
65 oacc_loop *sibling; /* Next loop within same parent. */
kono
parents:
diff changeset
66
kono
parents:
diff changeset
67 location_t loc; /* Location of the loop start. */
kono
parents:
diff changeset
68
kono
parents:
diff changeset
69 gcall *marker; /* Initial head marker. */
kono
parents:
diff changeset
70
kono
parents:
diff changeset
71 gcall *heads[GOMP_DIM_MAX]; /* Head marker functions. */
kono
parents:
diff changeset
72 gcall *tails[GOMP_DIM_MAX]; /* Tail marker functions. */
kono
parents:
diff changeset
73
kono
parents:
diff changeset
74 tree routine; /* Pseudo-loop enclosing a routine. */
kono
parents:
diff changeset
75
kono
parents:
diff changeset
76 unsigned mask; /* Partitioning mask. */
kono
parents:
diff changeset
77 unsigned e_mask; /* Partitioning of element loops (when tiling). */
kono
parents:
diff changeset
78 unsigned inner; /* Partitioning of inner loops. */
kono
parents:
diff changeset
79 unsigned flags; /* Partitioning flags. */
kono
parents:
diff changeset
80 vec<gcall *> ifns; /* Contained loop abstraction functions. */
kono
parents:
diff changeset
81 tree chunk_size; /* Chunk size. */
kono
parents:
diff changeset
82 gcall *head_end; /* Final marker of head sequence. */
kono
parents:
diff changeset
83 };
kono
parents:
diff changeset
84
kono
parents:
diff changeset
85 /* Holds offload tables with decls. */
kono
parents:
diff changeset
86 vec<tree, va_gc> *offload_funcs, *offload_vars;
kono
parents:
diff changeset
87
kono
parents:
diff changeset
88 /* Return level at which oacc routine may spawn a partitioned loop, or
kono
parents:
diff changeset
89 -1 if it is not a routine (i.e. is an offload fn). */
kono
parents:
diff changeset
90
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
91 int
111
kono
parents:
diff changeset
92 oacc_fn_attrib_level (tree attr)
kono
parents:
diff changeset
93 {
kono
parents:
diff changeset
94 tree pos = TREE_VALUE (attr);
kono
parents:
diff changeset
95
kono
parents:
diff changeset
96 if (!TREE_PURPOSE (pos))
kono
parents:
diff changeset
97 return -1;
kono
parents:
diff changeset
98
kono
parents:
diff changeset
99 int ix = 0;
kono
parents:
diff changeset
100 for (ix = 0; ix != GOMP_DIM_MAX;
kono
parents:
diff changeset
101 ix++, pos = TREE_CHAIN (pos))
kono
parents:
diff changeset
102 if (!integer_zerop (TREE_PURPOSE (pos)))
kono
parents:
diff changeset
103 break;
kono
parents:
diff changeset
104
kono
parents:
diff changeset
105 return ix;
kono
parents:
diff changeset
106 }
kono
parents:
diff changeset
107
kono
parents:
diff changeset
108 /* Helper function for omp_finish_file routine. Takes decls from V_DECLS and
kono
parents:
diff changeset
109 adds their addresses and sizes to constructor-vector V_CTOR. */
kono
parents:
diff changeset
110
kono
parents:
diff changeset
111 static void
kono
parents:
diff changeset
112 add_decls_addresses_to_decl_constructor (vec<tree, va_gc> *v_decls,
kono
parents:
diff changeset
113 vec<constructor_elt, va_gc> *v_ctor)
kono
parents:
diff changeset
114 {
kono
parents:
diff changeset
115 unsigned len = vec_safe_length (v_decls);
kono
parents:
diff changeset
116 for (unsigned i = 0; i < len; i++)
kono
parents:
diff changeset
117 {
kono
parents:
diff changeset
118 tree it = (*v_decls)[i];
kono
parents:
diff changeset
119 bool is_var = VAR_P (it);
kono
parents:
diff changeset
120 bool is_link_var
kono
parents:
diff changeset
121 = is_var
kono
parents:
diff changeset
122 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
123 && DECL_HAS_VALUE_EXPR_P (it)
kono
parents:
diff changeset
124 #endif
kono
parents:
diff changeset
125 && lookup_attribute ("omp declare target link", DECL_ATTRIBUTES (it));
kono
parents:
diff changeset
126
kono
parents:
diff changeset
127 tree size = NULL_TREE;
kono
parents:
diff changeset
128 if (is_var)
kono
parents:
diff changeset
129 size = fold_convert (const_ptr_type_node, DECL_SIZE_UNIT (it));
kono
parents:
diff changeset
130
kono
parents:
diff changeset
131 tree addr;
kono
parents:
diff changeset
132 if (!is_link_var)
kono
parents:
diff changeset
133 addr = build_fold_addr_expr (it);
kono
parents:
diff changeset
134 else
kono
parents:
diff changeset
135 {
kono
parents:
diff changeset
136 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
137 /* For "omp declare target link" vars add address of the pointer to
kono
parents:
diff changeset
138 the target table, instead of address of the var. */
kono
parents:
diff changeset
139 tree value_expr = DECL_VALUE_EXPR (it);
kono
parents:
diff changeset
140 tree link_ptr_decl = TREE_OPERAND (value_expr, 0);
kono
parents:
diff changeset
141 varpool_node::finalize_decl (link_ptr_decl);
kono
parents:
diff changeset
142 addr = build_fold_addr_expr (link_ptr_decl);
kono
parents:
diff changeset
143 #else
kono
parents:
diff changeset
144 addr = build_fold_addr_expr (it);
kono
parents:
diff changeset
145 #endif
kono
parents:
diff changeset
146
kono
parents:
diff changeset
147 /* Most significant bit of the size marks "omp declare target link"
kono
parents:
diff changeset
148 vars in host and target tables. */
kono
parents:
diff changeset
149 unsigned HOST_WIDE_INT isize = tree_to_uhwi (size);
kono
parents:
diff changeset
150 isize |= 1ULL << (int_size_in_bytes (const_ptr_type_node)
kono
parents:
diff changeset
151 * BITS_PER_UNIT - 1);
kono
parents:
diff changeset
152 size = wide_int_to_tree (const_ptr_type_node, isize);
kono
parents:
diff changeset
153 }
kono
parents:
diff changeset
154
kono
parents:
diff changeset
155 CONSTRUCTOR_APPEND_ELT (v_ctor, NULL_TREE, addr);
kono
parents:
diff changeset
156 if (is_var)
kono
parents:
diff changeset
157 CONSTRUCTOR_APPEND_ELT (v_ctor, NULL_TREE, size);
kono
parents:
diff changeset
158 }
kono
parents:
diff changeset
159 }
kono
parents:
diff changeset
160
kono
parents:
diff changeset
161 /* Create new symbols containing (address, size) pairs for global variables,
kono
parents:
diff changeset
162 marked with "omp declare target" attribute, as well as addresses for the
kono
parents:
diff changeset
163 functions, which are outlined offloading regions. */
kono
parents:
diff changeset
164 void
kono
parents:
diff changeset
165 omp_finish_file (void)
kono
parents:
diff changeset
166 {
kono
parents:
diff changeset
167 unsigned num_funcs = vec_safe_length (offload_funcs);
kono
parents:
diff changeset
168 unsigned num_vars = vec_safe_length (offload_vars);
kono
parents:
diff changeset
169
kono
parents:
diff changeset
170 if (num_funcs == 0 && num_vars == 0)
kono
parents:
diff changeset
171 return;
kono
parents:
diff changeset
172
kono
parents:
diff changeset
173 if (targetm_common.have_named_sections)
kono
parents:
diff changeset
174 {
kono
parents:
diff changeset
175 vec<constructor_elt, va_gc> *v_f, *v_v;
kono
parents:
diff changeset
176 vec_alloc (v_f, num_funcs);
kono
parents:
diff changeset
177 vec_alloc (v_v, num_vars * 2);
kono
parents:
diff changeset
178
kono
parents:
diff changeset
179 add_decls_addresses_to_decl_constructor (offload_funcs, v_f);
kono
parents:
diff changeset
180 add_decls_addresses_to_decl_constructor (offload_vars, v_v);
kono
parents:
diff changeset
181
kono
parents:
diff changeset
182 tree vars_decl_type = build_array_type_nelts (pointer_sized_int_node,
kono
parents:
diff changeset
183 num_vars * 2);
kono
parents:
diff changeset
184 tree funcs_decl_type = build_array_type_nelts (pointer_sized_int_node,
kono
parents:
diff changeset
185 num_funcs);
kono
parents:
diff changeset
186 SET_TYPE_ALIGN (vars_decl_type, TYPE_ALIGN (pointer_sized_int_node));
kono
parents:
diff changeset
187 SET_TYPE_ALIGN (funcs_decl_type, TYPE_ALIGN (pointer_sized_int_node));
kono
parents:
diff changeset
188 tree ctor_v = build_constructor (vars_decl_type, v_v);
kono
parents:
diff changeset
189 tree ctor_f = build_constructor (funcs_decl_type, v_f);
kono
parents:
diff changeset
190 TREE_CONSTANT (ctor_v) = TREE_CONSTANT (ctor_f) = 1;
kono
parents:
diff changeset
191 TREE_STATIC (ctor_v) = TREE_STATIC (ctor_f) = 1;
kono
parents:
diff changeset
192 tree funcs_decl = build_decl (UNKNOWN_LOCATION, VAR_DECL,
kono
parents:
diff changeset
193 get_identifier (".offload_func_table"),
kono
parents:
diff changeset
194 funcs_decl_type);
kono
parents:
diff changeset
195 tree vars_decl = build_decl (UNKNOWN_LOCATION, VAR_DECL,
kono
parents:
diff changeset
196 get_identifier (".offload_var_table"),
kono
parents:
diff changeset
197 vars_decl_type);
kono
parents:
diff changeset
198 TREE_STATIC (funcs_decl) = TREE_STATIC (vars_decl) = 1;
kono
parents:
diff changeset
199 /* Do not align tables more than TYPE_ALIGN (pointer_sized_int_node),
kono
parents:
diff changeset
200 otherwise a joint table in a binary will contain padding between
kono
parents:
diff changeset
201 tables from multiple object files. */
kono
parents:
diff changeset
202 DECL_USER_ALIGN (funcs_decl) = DECL_USER_ALIGN (vars_decl) = 1;
kono
parents:
diff changeset
203 SET_DECL_ALIGN (funcs_decl, TYPE_ALIGN (funcs_decl_type));
kono
parents:
diff changeset
204 SET_DECL_ALIGN (vars_decl, TYPE_ALIGN (vars_decl_type));
kono
parents:
diff changeset
205 DECL_INITIAL (funcs_decl) = ctor_f;
kono
parents:
diff changeset
206 DECL_INITIAL (vars_decl) = ctor_v;
kono
parents:
diff changeset
207 set_decl_section_name (funcs_decl, OFFLOAD_FUNC_TABLE_SECTION_NAME);
kono
parents:
diff changeset
208 set_decl_section_name (vars_decl, OFFLOAD_VAR_TABLE_SECTION_NAME);
kono
parents:
diff changeset
209
kono
parents:
diff changeset
210 varpool_node::finalize_decl (vars_decl);
kono
parents:
diff changeset
211 varpool_node::finalize_decl (funcs_decl);
kono
parents:
diff changeset
212 }
kono
parents:
diff changeset
213 else
kono
parents:
diff changeset
214 {
kono
parents:
diff changeset
215 for (unsigned i = 0; i < num_funcs; i++)
kono
parents:
diff changeset
216 {
kono
parents:
diff changeset
217 tree it = (*offload_funcs)[i];
kono
parents:
diff changeset
218 targetm.record_offload_symbol (it);
kono
parents:
diff changeset
219 }
kono
parents:
diff changeset
220 for (unsigned i = 0; i < num_vars; i++)
kono
parents:
diff changeset
221 {
kono
parents:
diff changeset
222 tree it = (*offload_vars)[i];
kono
parents:
diff changeset
223 targetm.record_offload_symbol (it);
kono
parents:
diff changeset
224 }
kono
parents:
diff changeset
225 }
kono
parents:
diff changeset
226 }
kono
parents:
diff changeset
227
kono
parents:
diff changeset
228 /* Call dim_pos (POS == true) or dim_size (POS == false) builtins for
kono
parents:
diff changeset
229 axis DIM. Return a tmp var holding the result. */
kono
parents:
diff changeset
230
kono
parents:
diff changeset
231 static tree
kono
parents:
diff changeset
232 oacc_dim_call (bool pos, int dim, gimple_seq *seq)
kono
parents:
diff changeset
233 {
kono
parents:
diff changeset
234 tree arg = build_int_cst (unsigned_type_node, dim);
kono
parents:
diff changeset
235 tree size = create_tmp_var (integer_type_node);
kono
parents:
diff changeset
236 enum internal_fn fn = pos ? IFN_GOACC_DIM_POS : IFN_GOACC_DIM_SIZE;
kono
parents:
diff changeset
237 gimple *call = gimple_build_call_internal (fn, 1, arg);
kono
parents:
diff changeset
238
kono
parents:
diff changeset
239 gimple_call_set_lhs (call, size);
kono
parents:
diff changeset
240 gimple_seq_add_stmt (seq, call);
kono
parents:
diff changeset
241
kono
parents:
diff changeset
242 return size;
kono
parents:
diff changeset
243 }
kono
parents:
diff changeset
244
kono
parents:
diff changeset
245 /* Find the number of threads (POS = false), or thread number (POS =
kono
parents:
diff changeset
246 true) for an OpenACC region partitioned as MASK. Setup code
kono
parents:
diff changeset
247 required for the calculation is added to SEQ. */
kono
parents:
diff changeset
248
kono
parents:
diff changeset
249 static tree
kono
parents:
diff changeset
250 oacc_thread_numbers (bool pos, int mask, gimple_seq *seq)
kono
parents:
diff changeset
251 {
kono
parents:
diff changeset
252 tree res = pos ? NULL_TREE : build_int_cst (unsigned_type_node, 1);
kono
parents:
diff changeset
253 unsigned ix;
kono
parents:
diff changeset
254
kono
parents:
diff changeset
255 /* Start at gang level, and examine relevant dimension indices. */
kono
parents:
diff changeset
256 for (ix = GOMP_DIM_GANG; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
257 if (GOMP_DIM_MASK (ix) & mask)
kono
parents:
diff changeset
258 {
kono
parents:
diff changeset
259 if (res)
kono
parents:
diff changeset
260 {
kono
parents:
diff changeset
261 /* We had an outer index, so scale that by the size of
kono
parents:
diff changeset
262 this dimension. */
kono
parents:
diff changeset
263 tree n = oacc_dim_call (false, ix, seq);
kono
parents:
diff changeset
264 res = fold_build2 (MULT_EXPR, integer_type_node, res, n);
kono
parents:
diff changeset
265 }
kono
parents:
diff changeset
266 if (pos)
kono
parents:
diff changeset
267 {
kono
parents:
diff changeset
268 /* Determine index in this dimension. */
kono
parents:
diff changeset
269 tree id = oacc_dim_call (true, ix, seq);
kono
parents:
diff changeset
270 if (res)
kono
parents:
diff changeset
271 res = fold_build2 (PLUS_EXPR, integer_type_node, res, id);
kono
parents:
diff changeset
272 else
kono
parents:
diff changeset
273 res = id;
kono
parents:
diff changeset
274 }
kono
parents:
diff changeset
275 }
kono
parents:
diff changeset
276
kono
parents:
diff changeset
277 if (res == NULL_TREE)
kono
parents:
diff changeset
278 res = integer_zero_node;
kono
parents:
diff changeset
279
kono
parents:
diff changeset
280 return res;
kono
parents:
diff changeset
281 }
kono
parents:
diff changeset
282
kono
parents:
diff changeset
283 /* Transform IFN_GOACC_LOOP calls to actual code. See
kono
parents:
diff changeset
284 expand_oacc_for for where these are generated. At the vector
kono
parents:
diff changeset
285 level, we stride loops, such that each member of a warp will
kono
parents:
diff changeset
286 operate on adjacent iterations. At the worker and gang level,
kono
parents:
diff changeset
287 each gang/warp executes a set of contiguous iterations. Chunking
kono
parents:
diff changeset
288 can override this such that each iteration engine executes a
kono
parents:
diff changeset
289 contiguous chunk, and then moves on to stride to the next chunk. */
kono
parents:
diff changeset
290
kono
parents:
diff changeset
291 static void
kono
parents:
diff changeset
292 oacc_xform_loop (gcall *call)
kono
parents:
diff changeset
293 {
kono
parents:
diff changeset
294 gimple_stmt_iterator gsi = gsi_for_stmt (call);
kono
parents:
diff changeset
295 enum ifn_goacc_loop_kind code
kono
parents:
diff changeset
296 = (enum ifn_goacc_loop_kind) TREE_INT_CST_LOW (gimple_call_arg (call, 0));
kono
parents:
diff changeset
297 tree dir = gimple_call_arg (call, 1);
kono
parents:
diff changeset
298 tree range = gimple_call_arg (call, 2);
kono
parents:
diff changeset
299 tree step = gimple_call_arg (call, 3);
kono
parents:
diff changeset
300 tree chunk_size = NULL_TREE;
kono
parents:
diff changeset
301 unsigned mask = (unsigned) TREE_INT_CST_LOW (gimple_call_arg (call, 5));
kono
parents:
diff changeset
302 tree lhs = gimple_call_lhs (call);
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
303 tree type = NULL_TREE;
111
kono
parents:
diff changeset
304 tree diff_type = TREE_TYPE (range);
kono
parents:
diff changeset
305 tree r = NULL_TREE;
kono
parents:
diff changeset
306 gimple_seq seq = NULL;
kono
parents:
diff changeset
307 bool chunking = false, striding = true;
kono
parents:
diff changeset
308 unsigned outer_mask = mask & (~mask + 1); // Outermost partitioning
kono
parents:
diff changeset
309 unsigned inner_mask = mask & ~outer_mask; // Inner partitioning (if any)
kono
parents:
diff changeset
310
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
311 /* Skip lowering if return value of IFN_GOACC_LOOP call is not used. */
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
312 if (!lhs)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
313 {
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
314 gsi_replace_with_seq (&gsi, seq, true);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
315 return;
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
316 }
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
317
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
318 type = TREE_TYPE (lhs);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
319
111
kono
parents:
diff changeset
320 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
321 chunk_size = gimple_call_arg (call, 4);
kono
parents:
diff changeset
322 if (integer_minus_onep (chunk_size) /* Force static allocation. */
kono
parents:
diff changeset
323 || integer_zerop (chunk_size)) /* Default (also static). */
kono
parents:
diff changeset
324 {
kono
parents:
diff changeset
325 /* If we're at the gang level, we want each to execute a
kono
parents:
diff changeset
326 contiguous run of iterations. Otherwise we want each element
kono
parents:
diff changeset
327 to stride. */
kono
parents:
diff changeset
328 striding = !(outer_mask & GOMP_DIM_MASK (GOMP_DIM_GANG));
kono
parents:
diff changeset
329 chunking = false;
kono
parents:
diff changeset
330 }
kono
parents:
diff changeset
331 else
kono
parents:
diff changeset
332 {
kono
parents:
diff changeset
333 /* Chunk of size 1 is striding. */
kono
parents:
diff changeset
334 striding = integer_onep (chunk_size);
kono
parents:
diff changeset
335 chunking = !striding;
kono
parents:
diff changeset
336 }
kono
parents:
diff changeset
337 #endif
kono
parents:
diff changeset
338
kono
parents:
diff changeset
339 /* striding=true, chunking=true
kono
parents:
diff changeset
340 -> invalid.
kono
parents:
diff changeset
341 striding=true, chunking=false
kono
parents:
diff changeset
342 -> chunks=1
kono
parents:
diff changeset
343 striding=false,chunking=true
kono
parents:
diff changeset
344 -> chunks=ceil (range/(chunksize*threads*step))
kono
parents:
diff changeset
345 striding=false,chunking=false
kono
parents:
diff changeset
346 -> chunk_size=ceil(range/(threads*step)),chunks=1 */
kono
parents:
diff changeset
347 push_gimplify_context (true);
kono
parents:
diff changeset
348
kono
parents:
diff changeset
349 switch (code)
kono
parents:
diff changeset
350 {
kono
parents:
diff changeset
351 default: gcc_unreachable ();
kono
parents:
diff changeset
352
kono
parents:
diff changeset
353 case IFN_GOACC_LOOP_CHUNKS:
kono
parents:
diff changeset
354 if (!chunking)
kono
parents:
diff changeset
355 r = build_int_cst (type, 1);
kono
parents:
diff changeset
356 else
kono
parents:
diff changeset
357 {
kono
parents:
diff changeset
358 /* chunk_max
kono
parents:
diff changeset
359 = (range - dir) / (chunks * step * num_threads) + dir */
kono
parents:
diff changeset
360 tree per = oacc_thread_numbers (false, mask, &seq);
kono
parents:
diff changeset
361 per = fold_convert (type, per);
kono
parents:
diff changeset
362 chunk_size = fold_convert (type, chunk_size);
kono
parents:
diff changeset
363 per = fold_build2 (MULT_EXPR, type, per, chunk_size);
kono
parents:
diff changeset
364 per = fold_build2 (MULT_EXPR, type, per, step);
kono
parents:
diff changeset
365 r = build2 (MINUS_EXPR, type, range, dir);
kono
parents:
diff changeset
366 r = build2 (PLUS_EXPR, type, r, per);
kono
parents:
diff changeset
367 r = build2 (TRUNC_DIV_EXPR, type, r, per);
kono
parents:
diff changeset
368 }
kono
parents:
diff changeset
369 break;
kono
parents:
diff changeset
370
kono
parents:
diff changeset
371 case IFN_GOACC_LOOP_STEP:
kono
parents:
diff changeset
372 {
kono
parents:
diff changeset
373 /* If striding, step by the entire compute volume, otherwise
kono
parents:
diff changeset
374 step by the inner volume. */
kono
parents:
diff changeset
375 unsigned volume = striding ? mask : inner_mask;
kono
parents:
diff changeset
376
kono
parents:
diff changeset
377 r = oacc_thread_numbers (false, volume, &seq);
kono
parents:
diff changeset
378 r = build2 (MULT_EXPR, type, fold_convert (type, r), step);
kono
parents:
diff changeset
379 }
kono
parents:
diff changeset
380 break;
kono
parents:
diff changeset
381
kono
parents:
diff changeset
382 case IFN_GOACC_LOOP_OFFSET:
kono
parents:
diff changeset
383 /* Enable vectorization on non-SIMT targets. */
kono
parents:
diff changeset
384 if (!targetm.simt.vf
kono
parents:
diff changeset
385 && outer_mask == GOMP_DIM_MASK (GOMP_DIM_VECTOR)
kono
parents:
diff changeset
386 /* If not -fno-tree-loop-vectorize, hint that we want to vectorize
kono
parents:
diff changeset
387 the loop. */
kono
parents:
diff changeset
388 && (flag_tree_loop_vectorize
kono
parents:
diff changeset
389 || !global_options_set.x_flag_tree_loop_vectorize))
kono
parents:
diff changeset
390 {
kono
parents:
diff changeset
391 basic_block bb = gsi_bb (gsi);
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
392 class loop *parent = bb->loop_father;
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
393 class loop *body = parent->inner;
111
kono
parents:
diff changeset
394
kono
parents:
diff changeset
395 parent->force_vectorize = true;
kono
parents:
diff changeset
396 parent->safelen = INT_MAX;
kono
parents:
diff changeset
397
kono
parents:
diff changeset
398 /* "Chunking loops" may have inner loops. */
kono
parents:
diff changeset
399 if (parent->inner)
kono
parents:
diff changeset
400 {
kono
parents:
diff changeset
401 body->force_vectorize = true;
kono
parents:
diff changeset
402 body->safelen = INT_MAX;
kono
parents:
diff changeset
403 }
kono
parents:
diff changeset
404
kono
parents:
diff changeset
405 cfun->has_force_vectorize_loops = true;
kono
parents:
diff changeset
406 }
kono
parents:
diff changeset
407 if (striding)
kono
parents:
diff changeset
408 {
kono
parents:
diff changeset
409 r = oacc_thread_numbers (true, mask, &seq);
kono
parents:
diff changeset
410 r = fold_convert (diff_type, r);
kono
parents:
diff changeset
411 }
kono
parents:
diff changeset
412 else
kono
parents:
diff changeset
413 {
kono
parents:
diff changeset
414 tree inner_size = oacc_thread_numbers (false, inner_mask, &seq);
kono
parents:
diff changeset
415 tree outer_size = oacc_thread_numbers (false, outer_mask, &seq);
kono
parents:
diff changeset
416 tree volume = fold_build2 (MULT_EXPR, TREE_TYPE (inner_size),
kono
parents:
diff changeset
417 inner_size, outer_size);
kono
parents:
diff changeset
418
kono
parents:
diff changeset
419 volume = fold_convert (diff_type, volume);
kono
parents:
diff changeset
420 if (chunking)
kono
parents:
diff changeset
421 chunk_size = fold_convert (diff_type, chunk_size);
kono
parents:
diff changeset
422 else
kono
parents:
diff changeset
423 {
kono
parents:
diff changeset
424 tree per = fold_build2 (MULT_EXPR, diff_type, volume, step);
kono
parents:
diff changeset
425
kono
parents:
diff changeset
426 chunk_size = build2 (MINUS_EXPR, diff_type, range, dir);
kono
parents:
diff changeset
427 chunk_size = build2 (PLUS_EXPR, diff_type, chunk_size, per);
kono
parents:
diff changeset
428 chunk_size = build2 (TRUNC_DIV_EXPR, diff_type, chunk_size, per);
kono
parents:
diff changeset
429 }
kono
parents:
diff changeset
430
kono
parents:
diff changeset
431 tree span = build2 (MULT_EXPR, diff_type, chunk_size,
kono
parents:
diff changeset
432 fold_convert (diff_type, inner_size));
kono
parents:
diff changeset
433 r = oacc_thread_numbers (true, outer_mask, &seq);
kono
parents:
diff changeset
434 r = fold_convert (diff_type, r);
kono
parents:
diff changeset
435 r = build2 (MULT_EXPR, diff_type, r, span);
kono
parents:
diff changeset
436
kono
parents:
diff changeset
437 tree inner = oacc_thread_numbers (true, inner_mask, &seq);
kono
parents:
diff changeset
438 inner = fold_convert (diff_type, inner);
kono
parents:
diff changeset
439 r = fold_build2 (PLUS_EXPR, diff_type, r, inner);
kono
parents:
diff changeset
440
kono
parents:
diff changeset
441 if (chunking)
kono
parents:
diff changeset
442 {
kono
parents:
diff changeset
443 tree chunk = fold_convert (diff_type, gimple_call_arg (call, 6));
kono
parents:
diff changeset
444 tree per
kono
parents:
diff changeset
445 = fold_build2 (MULT_EXPR, diff_type, volume, chunk_size);
kono
parents:
diff changeset
446 per = build2 (MULT_EXPR, diff_type, per, chunk);
kono
parents:
diff changeset
447
kono
parents:
diff changeset
448 r = build2 (PLUS_EXPR, diff_type, r, per);
kono
parents:
diff changeset
449 }
kono
parents:
diff changeset
450 }
kono
parents:
diff changeset
451 r = fold_build2 (MULT_EXPR, diff_type, r, step);
kono
parents:
diff changeset
452 if (type != diff_type)
kono
parents:
diff changeset
453 r = fold_convert (type, r);
kono
parents:
diff changeset
454 break;
kono
parents:
diff changeset
455
kono
parents:
diff changeset
456 case IFN_GOACC_LOOP_BOUND:
kono
parents:
diff changeset
457 if (striding)
kono
parents:
diff changeset
458 r = range;
kono
parents:
diff changeset
459 else
kono
parents:
diff changeset
460 {
kono
parents:
diff changeset
461 tree inner_size = oacc_thread_numbers (false, inner_mask, &seq);
kono
parents:
diff changeset
462 tree outer_size = oacc_thread_numbers (false, outer_mask, &seq);
kono
parents:
diff changeset
463 tree volume = fold_build2 (MULT_EXPR, TREE_TYPE (inner_size),
kono
parents:
diff changeset
464 inner_size, outer_size);
kono
parents:
diff changeset
465
kono
parents:
diff changeset
466 volume = fold_convert (diff_type, volume);
kono
parents:
diff changeset
467 if (chunking)
kono
parents:
diff changeset
468 chunk_size = fold_convert (diff_type, chunk_size);
kono
parents:
diff changeset
469 else
kono
parents:
diff changeset
470 {
kono
parents:
diff changeset
471 tree per = fold_build2 (MULT_EXPR, diff_type, volume, step);
kono
parents:
diff changeset
472
kono
parents:
diff changeset
473 chunk_size = build2 (MINUS_EXPR, diff_type, range, dir);
kono
parents:
diff changeset
474 chunk_size = build2 (PLUS_EXPR, diff_type, chunk_size, per);
kono
parents:
diff changeset
475 chunk_size = build2 (TRUNC_DIV_EXPR, diff_type, chunk_size, per);
kono
parents:
diff changeset
476 }
kono
parents:
diff changeset
477
kono
parents:
diff changeset
478 tree span = build2 (MULT_EXPR, diff_type, chunk_size,
kono
parents:
diff changeset
479 fold_convert (diff_type, inner_size));
kono
parents:
diff changeset
480
kono
parents:
diff changeset
481 r = fold_build2 (MULT_EXPR, diff_type, span, step);
kono
parents:
diff changeset
482
kono
parents:
diff changeset
483 tree offset = gimple_call_arg (call, 6);
kono
parents:
diff changeset
484 r = build2 (PLUS_EXPR, diff_type, r,
kono
parents:
diff changeset
485 fold_convert (diff_type, offset));
kono
parents:
diff changeset
486 r = build2 (integer_onep (dir) ? MIN_EXPR : MAX_EXPR,
kono
parents:
diff changeset
487 diff_type, r, range);
kono
parents:
diff changeset
488 }
kono
parents:
diff changeset
489 if (diff_type != type)
kono
parents:
diff changeset
490 r = fold_convert (type, r);
kono
parents:
diff changeset
491 break;
kono
parents:
diff changeset
492 }
kono
parents:
diff changeset
493
kono
parents:
diff changeset
494 gimplify_assign (lhs, r, &seq);
kono
parents:
diff changeset
495
kono
parents:
diff changeset
496 pop_gimplify_context (NULL);
kono
parents:
diff changeset
497
kono
parents:
diff changeset
498 gsi_replace_with_seq (&gsi, seq, true);
kono
parents:
diff changeset
499 }
kono
parents:
diff changeset
500
kono
parents:
diff changeset
501 /* Transform a GOACC_TILE call. Determines the element loop span for
kono
parents:
diff changeset
502 the specified loop of the nest. This is 1 if we're not tiling.
kono
parents:
diff changeset
503
kono
parents:
diff changeset
504 GOACC_TILE (collapse_count, loop_no, tile_arg, gwv_tile, gwv_element); */
kono
parents:
diff changeset
505
kono
parents:
diff changeset
506 static void
kono
parents:
diff changeset
507 oacc_xform_tile (gcall *call)
kono
parents:
diff changeset
508 {
kono
parents:
diff changeset
509 gimple_stmt_iterator gsi = gsi_for_stmt (call);
kono
parents:
diff changeset
510 unsigned collapse = tree_to_uhwi (gimple_call_arg (call, 0));
kono
parents:
diff changeset
511 /* Inner loops have higher loop_nos. */
kono
parents:
diff changeset
512 unsigned loop_no = tree_to_uhwi (gimple_call_arg (call, 1));
kono
parents:
diff changeset
513 tree tile_size = gimple_call_arg (call, 2);
kono
parents:
diff changeset
514 unsigned e_mask = tree_to_uhwi (gimple_call_arg (call, 4));
kono
parents:
diff changeset
515 tree lhs = gimple_call_lhs (call);
kono
parents:
diff changeset
516 tree type = TREE_TYPE (lhs);
kono
parents:
diff changeset
517 gimple_seq seq = NULL;
kono
parents:
diff changeset
518 tree span = build_int_cst (type, 1);
kono
parents:
diff changeset
519
kono
parents:
diff changeset
520 gcc_assert (!(e_mask
kono
parents:
diff changeset
521 & ~(GOMP_DIM_MASK (GOMP_DIM_VECTOR)
kono
parents:
diff changeset
522 | GOMP_DIM_MASK (GOMP_DIM_WORKER))));
kono
parents:
diff changeset
523 push_gimplify_context (!seen_error ());
kono
parents:
diff changeset
524
kono
parents:
diff changeset
525 #ifndef ACCEL_COMPILER
kono
parents:
diff changeset
526 /* Partitioning disabled on host compilers. */
kono
parents:
diff changeset
527 e_mask = 0;
kono
parents:
diff changeset
528 #endif
kono
parents:
diff changeset
529 if (!e_mask)
kono
parents:
diff changeset
530 /* Not partitioning. */
kono
parents:
diff changeset
531 span = integer_one_node;
kono
parents:
diff changeset
532 else if (!integer_zerop (tile_size))
kono
parents:
diff changeset
533 /* User explicitly specified size. */
kono
parents:
diff changeset
534 span = tile_size;
kono
parents:
diff changeset
535 else
kono
parents:
diff changeset
536 {
kono
parents:
diff changeset
537 /* Pick a size based on the partitioning of the element loop and
kono
parents:
diff changeset
538 the number of loop nests. */
kono
parents:
diff changeset
539 tree first_size = NULL_TREE;
kono
parents:
diff changeset
540 tree second_size = NULL_TREE;
kono
parents:
diff changeset
541
kono
parents:
diff changeset
542 if (e_mask & GOMP_DIM_MASK (GOMP_DIM_VECTOR))
kono
parents:
diff changeset
543 first_size = oacc_dim_call (false, GOMP_DIM_VECTOR, &seq);
kono
parents:
diff changeset
544 if (e_mask & GOMP_DIM_MASK (GOMP_DIM_WORKER))
kono
parents:
diff changeset
545 second_size = oacc_dim_call (false, GOMP_DIM_WORKER, &seq);
kono
parents:
diff changeset
546
kono
parents:
diff changeset
547 if (!first_size)
kono
parents:
diff changeset
548 {
kono
parents:
diff changeset
549 first_size = second_size;
kono
parents:
diff changeset
550 second_size = NULL_TREE;
kono
parents:
diff changeset
551 }
kono
parents:
diff changeset
552
kono
parents:
diff changeset
553 if (loop_no + 1 == collapse)
kono
parents:
diff changeset
554 {
kono
parents:
diff changeset
555 span = first_size;
kono
parents:
diff changeset
556 if (!loop_no && second_size)
kono
parents:
diff changeset
557 span = fold_build2 (MULT_EXPR, TREE_TYPE (span),
kono
parents:
diff changeset
558 span, second_size);
kono
parents:
diff changeset
559 }
kono
parents:
diff changeset
560 else if (loop_no + 2 == collapse)
kono
parents:
diff changeset
561 span = second_size;
kono
parents:
diff changeset
562 else
kono
parents:
diff changeset
563 span = NULL_TREE;
kono
parents:
diff changeset
564
kono
parents:
diff changeset
565 if (!span)
kono
parents:
diff changeset
566 /* There's no obvious element size for this loop. Options
kono
parents:
diff changeset
567 are 1, first_size or some non-unity constant (32 is my
kono
parents:
diff changeset
568 favourite). We should gather some statistics. */
kono
parents:
diff changeset
569 span = first_size;
kono
parents:
diff changeset
570 }
kono
parents:
diff changeset
571
kono
parents:
diff changeset
572 span = fold_convert (type, span);
kono
parents:
diff changeset
573 gimplify_assign (lhs, span, &seq);
kono
parents:
diff changeset
574
kono
parents:
diff changeset
575 pop_gimplify_context (NULL);
kono
parents:
diff changeset
576
kono
parents:
diff changeset
577 gsi_replace_with_seq (&gsi, seq, true);
kono
parents:
diff changeset
578 }
kono
parents:
diff changeset
579
kono
parents:
diff changeset
580 /* Default partitioned and minimum partitioned dimensions. */
kono
parents:
diff changeset
581
kono
parents:
diff changeset
582 static int oacc_default_dims[GOMP_DIM_MAX];
kono
parents:
diff changeset
583 static int oacc_min_dims[GOMP_DIM_MAX];
kono
parents:
diff changeset
584
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
585 int
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
586 oacc_get_default_dim (int dim)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
587 {
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
588 gcc_assert (0 <= dim && dim < GOMP_DIM_MAX);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
589 return oacc_default_dims[dim];
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
590 }
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
591
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
592 int
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
593 oacc_get_min_dim (int dim)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
594 {
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
595 gcc_assert (0 <= dim && dim < GOMP_DIM_MAX);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
596 return oacc_min_dims[dim];
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
597 }
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
598
111
kono
parents:
diff changeset
599 /* Parse the default dimension parameter. This is a set of
kono
parents:
diff changeset
600 :-separated optional compute dimensions. Each specified dimension
kono
parents:
diff changeset
601 is a positive integer. When device type support is added, it is
kono
parents:
diff changeset
602 planned to be a comma separated list of such compute dimensions,
kono
parents:
diff changeset
603 with all but the first prefixed by the colon-terminated device
kono
parents:
diff changeset
604 type. */
kono
parents:
diff changeset
605
kono
parents:
diff changeset
606 static void
kono
parents:
diff changeset
607 oacc_parse_default_dims (const char *dims)
kono
parents:
diff changeset
608 {
kono
parents:
diff changeset
609 int ix;
kono
parents:
diff changeset
610
kono
parents:
diff changeset
611 for (ix = GOMP_DIM_MAX; ix--;)
kono
parents:
diff changeset
612 {
kono
parents:
diff changeset
613 oacc_default_dims[ix] = -1;
kono
parents:
diff changeset
614 oacc_min_dims[ix] = 1;
kono
parents:
diff changeset
615 }
kono
parents:
diff changeset
616
kono
parents:
diff changeset
617 #ifndef ACCEL_COMPILER
kono
parents:
diff changeset
618 /* Cannot be overridden on the host. */
kono
parents:
diff changeset
619 dims = NULL;
kono
parents:
diff changeset
620 #endif
kono
parents:
diff changeset
621 if (dims)
kono
parents:
diff changeset
622 {
kono
parents:
diff changeset
623 const char *pos = dims;
kono
parents:
diff changeset
624
kono
parents:
diff changeset
625 for (ix = 0; *pos && ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
626 {
kono
parents:
diff changeset
627 if (ix)
kono
parents:
diff changeset
628 {
kono
parents:
diff changeset
629 if (*pos != ':')
kono
parents:
diff changeset
630 goto malformed;
kono
parents:
diff changeset
631 pos++;
kono
parents:
diff changeset
632 }
kono
parents:
diff changeset
633
kono
parents:
diff changeset
634 if (*pos != ':')
kono
parents:
diff changeset
635 {
kono
parents:
diff changeset
636 long val;
kono
parents:
diff changeset
637 const char *eptr;
kono
parents:
diff changeset
638
kono
parents:
diff changeset
639 errno = 0;
kono
parents:
diff changeset
640 val = strtol (pos, CONST_CAST (char **, &eptr), 10);
kono
parents:
diff changeset
641 if (errno || val <= 0 || (int) val != val)
kono
parents:
diff changeset
642 goto malformed;
kono
parents:
diff changeset
643 pos = eptr;
kono
parents:
diff changeset
644 oacc_default_dims[ix] = (int) val;
kono
parents:
diff changeset
645 }
kono
parents:
diff changeset
646 }
kono
parents:
diff changeset
647 if (*pos)
kono
parents:
diff changeset
648 {
kono
parents:
diff changeset
649 malformed:
kono
parents:
diff changeset
650 error_at (UNKNOWN_LOCATION,
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
651 "%<-fopenacc-dim%> operand is malformed at %qs", pos);
111
kono
parents:
diff changeset
652 }
kono
parents:
diff changeset
653 }
kono
parents:
diff changeset
654
kono
parents:
diff changeset
655 /* Allow the backend to validate the dimensions. */
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
656 targetm.goacc.validate_dims (NULL_TREE, oacc_default_dims, -1, 0);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
657 targetm.goacc.validate_dims (NULL_TREE, oacc_min_dims, -2, 0);
111
kono
parents:
diff changeset
658 }
kono
parents:
diff changeset
659
kono
parents:
diff changeset
660 /* Validate and update the dimensions for offloaded FN. ATTRS is the
kono
parents:
diff changeset
661 raw attribute. DIMS is an array of dimensions, which is filled in.
kono
parents:
diff changeset
662 LEVEL is the partitioning level of a routine, or -1 for an offload
kono
parents:
diff changeset
663 region itself. USED is the mask of partitioned execution in the
kono
parents:
diff changeset
664 function. */
kono
parents:
diff changeset
665
kono
parents:
diff changeset
666 static void
kono
parents:
diff changeset
667 oacc_validate_dims (tree fn, tree attrs, int *dims, int level, unsigned used)
kono
parents:
diff changeset
668 {
kono
parents:
diff changeset
669 tree purpose[GOMP_DIM_MAX];
kono
parents:
diff changeset
670 unsigned ix;
kono
parents:
diff changeset
671 tree pos = TREE_VALUE (attrs);
kono
parents:
diff changeset
672
kono
parents:
diff changeset
673 /* Make sure the attribute creator attached the dimension
kono
parents:
diff changeset
674 information. */
kono
parents:
diff changeset
675 gcc_assert (pos);
kono
parents:
diff changeset
676
kono
parents:
diff changeset
677 for (ix = 0; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
678 {
kono
parents:
diff changeset
679 purpose[ix] = TREE_PURPOSE (pos);
kono
parents:
diff changeset
680 tree val = TREE_VALUE (pos);
kono
parents:
diff changeset
681 dims[ix] = val ? TREE_INT_CST_LOW (val) : -1;
kono
parents:
diff changeset
682 pos = TREE_CHAIN (pos);
kono
parents:
diff changeset
683 }
kono
parents:
diff changeset
684
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
685 bool changed = targetm.goacc.validate_dims (fn, dims, level, used);
111
kono
parents:
diff changeset
686
kono
parents:
diff changeset
687 /* Default anything left to 1 or a partitioned default. */
kono
parents:
diff changeset
688 for (ix = 0; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
689 if (dims[ix] < 0)
kono
parents:
diff changeset
690 {
kono
parents:
diff changeset
691 /* The OpenACC spec says 'If the [num_gangs] clause is not
kono
parents:
diff changeset
692 specified, an implementation-defined default will be used;
kono
parents:
diff changeset
693 the default may depend on the code within the construct.'
kono
parents:
diff changeset
694 (2.5.6). Thus an implementation is free to choose
kono
parents:
diff changeset
695 non-unity default for a parallel region that doesn't have
kono
parents:
diff changeset
696 any gang-partitioned loops. However, it appears that there
kono
parents:
diff changeset
697 is a sufficient body of user code that expects non-gang
kono
parents:
diff changeset
698 partitioned regions to not execute in gang-redundant mode.
kono
parents:
diff changeset
699 So we (a) don't warn about the non-portability and (b) pick
kono
parents:
diff changeset
700 the minimum permissible dimension size when there is no
kono
parents:
diff changeset
701 partitioned execution. Otherwise we pick the global
kono
parents:
diff changeset
702 default for the dimension, which the user can control. The
kono
parents:
diff changeset
703 same wording and logic applies to num_workers and
kono
parents:
diff changeset
704 vector_length, however the worker- or vector- single
kono
parents:
diff changeset
705 execution doesn't have the same impact as gang-redundant
kono
parents:
diff changeset
706 execution. (If the minimum gang-level partitioning is not 1,
kono
parents:
diff changeset
707 the target is probably too confusing.) */
kono
parents:
diff changeset
708 dims[ix] = (used & GOMP_DIM_MASK (ix)
kono
parents:
diff changeset
709 ? oacc_default_dims[ix] : oacc_min_dims[ix]);
kono
parents:
diff changeset
710 changed = true;
kono
parents:
diff changeset
711 }
kono
parents:
diff changeset
712
kono
parents:
diff changeset
713 if (changed)
kono
parents:
diff changeset
714 {
kono
parents:
diff changeset
715 /* Replace the attribute with new values. */
kono
parents:
diff changeset
716 pos = NULL_TREE;
kono
parents:
diff changeset
717 for (ix = GOMP_DIM_MAX; ix--;)
kono
parents:
diff changeset
718 pos = tree_cons (purpose[ix],
kono
parents:
diff changeset
719 build_int_cst (integer_type_node, dims[ix]), pos);
kono
parents:
diff changeset
720 oacc_replace_fn_attrib (fn, pos);
kono
parents:
diff changeset
721 }
kono
parents:
diff changeset
722 }
kono
parents:
diff changeset
723
kono
parents:
diff changeset
724 /* Create an empty OpenACC loop structure at LOC. */
kono
parents:
diff changeset
725
kono
parents:
diff changeset
726 static oacc_loop *
kono
parents:
diff changeset
727 new_oacc_loop_raw (oacc_loop *parent, location_t loc)
kono
parents:
diff changeset
728 {
kono
parents:
diff changeset
729 oacc_loop *loop = XCNEW (oacc_loop);
kono
parents:
diff changeset
730
kono
parents:
diff changeset
731 loop->parent = parent;
kono
parents:
diff changeset
732
kono
parents:
diff changeset
733 if (parent)
kono
parents:
diff changeset
734 {
kono
parents:
diff changeset
735 loop->sibling = parent->child;
kono
parents:
diff changeset
736 parent->child = loop;
kono
parents:
diff changeset
737 }
kono
parents:
diff changeset
738
kono
parents:
diff changeset
739 loop->loc = loc;
kono
parents:
diff changeset
740 return loop;
kono
parents:
diff changeset
741 }
kono
parents:
diff changeset
742
kono
parents:
diff changeset
743 /* Create an outermost, dummy OpenACC loop for offloaded function
kono
parents:
diff changeset
744 DECL. */
kono
parents:
diff changeset
745
kono
parents:
diff changeset
746 static oacc_loop *
kono
parents:
diff changeset
747 new_oacc_loop_outer (tree decl)
kono
parents:
diff changeset
748 {
kono
parents:
diff changeset
749 return new_oacc_loop_raw (NULL, DECL_SOURCE_LOCATION (decl));
kono
parents:
diff changeset
750 }
kono
parents:
diff changeset
751
kono
parents:
diff changeset
752 /* Start a new OpenACC loop structure beginning at head marker MARKER.
kono
parents:
diff changeset
753 Link into PARENT loop. Return the new loop. */
kono
parents:
diff changeset
754
kono
parents:
diff changeset
755 static oacc_loop *
kono
parents:
diff changeset
756 new_oacc_loop (oacc_loop *parent, gcall *marker)
kono
parents:
diff changeset
757 {
kono
parents:
diff changeset
758 oacc_loop *loop = new_oacc_loop_raw (parent, gimple_location (marker));
kono
parents:
diff changeset
759
kono
parents:
diff changeset
760 loop->marker = marker;
kono
parents:
diff changeset
761
kono
parents:
diff changeset
762 /* TODO: This is where device_type flattening would occur for the loop
kono
parents:
diff changeset
763 flags. */
kono
parents:
diff changeset
764
kono
parents:
diff changeset
765 loop->flags = TREE_INT_CST_LOW (gimple_call_arg (marker, 3));
kono
parents:
diff changeset
766
kono
parents:
diff changeset
767 tree chunk_size = integer_zero_node;
kono
parents:
diff changeset
768 if (loop->flags & OLF_GANG_STATIC)
kono
parents:
diff changeset
769 chunk_size = gimple_call_arg (marker, 4);
kono
parents:
diff changeset
770 loop->chunk_size = chunk_size;
kono
parents:
diff changeset
771
kono
parents:
diff changeset
772 return loop;
kono
parents:
diff changeset
773 }
kono
parents:
diff changeset
774
kono
parents:
diff changeset
775 /* Create a dummy loop encompassing a call to an OpenACC routine.
kono
parents:
diff changeset
776 Extract the routine's partitioning requirements. */
kono
parents:
diff changeset
777
kono
parents:
diff changeset
778 static void
kono
parents:
diff changeset
779 new_oacc_loop_routine (oacc_loop *parent, gcall *call, tree decl, tree attrs)
kono
parents:
diff changeset
780 {
kono
parents:
diff changeset
781 oacc_loop *loop = new_oacc_loop_raw (parent, gimple_location (call));
kono
parents:
diff changeset
782 int level = oacc_fn_attrib_level (attrs);
kono
parents:
diff changeset
783
kono
parents:
diff changeset
784 gcc_assert (level >= 0);
kono
parents:
diff changeset
785
kono
parents:
diff changeset
786 loop->marker = call;
kono
parents:
diff changeset
787 loop->routine = decl;
kono
parents:
diff changeset
788 loop->mask = ((GOMP_DIM_MASK (GOMP_DIM_MAX) - 1)
kono
parents:
diff changeset
789 ^ (GOMP_DIM_MASK (level) - 1));
kono
parents:
diff changeset
790 }
kono
parents:
diff changeset
791
kono
parents:
diff changeset
792 /* Finish off the current OpenACC loop LOOP once its tail has been seen.
kono
parents:
diff changeset
793 Return the parent loop. */
kono
parents:
diff changeset
794
kono
parents:
diff changeset
795 static oacc_loop *
kono
parents:
diff changeset
796 finish_oacc_loop (oacc_loop *loop)
kono
parents:
diff changeset
797 {
kono
parents:
diff changeset
798 /* If the loop has been collapsed, don't partition it. */
kono
parents:
diff changeset
799 if (loop->ifns.is_empty ())
kono
parents:
diff changeset
800 loop->mask = loop->flags = 0;
kono
parents:
diff changeset
801 return loop->parent;
kono
parents:
diff changeset
802 }
kono
parents:
diff changeset
803
kono
parents:
diff changeset
804 /* Free all OpenACC loop structures within LOOP (inclusive). */
kono
parents:
diff changeset
805
kono
parents:
diff changeset
806 static void
kono
parents:
diff changeset
807 free_oacc_loop (oacc_loop *loop)
kono
parents:
diff changeset
808 {
kono
parents:
diff changeset
809 if (loop->sibling)
kono
parents:
diff changeset
810 free_oacc_loop (loop->sibling);
kono
parents:
diff changeset
811 if (loop->child)
kono
parents:
diff changeset
812 free_oacc_loop (loop->child);
kono
parents:
diff changeset
813
kono
parents:
diff changeset
814 loop->ifns.release ();
kono
parents:
diff changeset
815 free (loop);
kono
parents:
diff changeset
816 }
kono
parents:
diff changeset
817
kono
parents:
diff changeset
818 /* Dump out the OpenACC loop head or tail beginning at FROM. */
kono
parents:
diff changeset
819
kono
parents:
diff changeset
820 static void
kono
parents:
diff changeset
821 dump_oacc_loop_part (FILE *file, gcall *from, int depth,
kono
parents:
diff changeset
822 const char *title, int level)
kono
parents:
diff changeset
823 {
kono
parents:
diff changeset
824 enum ifn_unique_kind kind
kono
parents:
diff changeset
825 = (enum ifn_unique_kind) TREE_INT_CST_LOW (gimple_call_arg (from, 0));
kono
parents:
diff changeset
826
kono
parents:
diff changeset
827 fprintf (file, "%*s%s-%d:\n", depth * 2, "", title, level);
kono
parents:
diff changeset
828 for (gimple_stmt_iterator gsi = gsi_for_stmt (from);;)
kono
parents:
diff changeset
829 {
kono
parents:
diff changeset
830 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
831
kono
parents:
diff changeset
832 if (gimple_call_internal_p (stmt, IFN_UNIQUE))
kono
parents:
diff changeset
833 {
kono
parents:
diff changeset
834 enum ifn_unique_kind k
kono
parents:
diff changeset
835 = ((enum ifn_unique_kind) TREE_INT_CST_LOW
kono
parents:
diff changeset
836 (gimple_call_arg (stmt, 0)));
kono
parents:
diff changeset
837
kono
parents:
diff changeset
838 if (k == kind && stmt != from)
kono
parents:
diff changeset
839 break;
kono
parents:
diff changeset
840 }
kono
parents:
diff changeset
841 print_gimple_stmt (file, stmt, depth * 2 + 2);
kono
parents:
diff changeset
842
kono
parents:
diff changeset
843 gsi_next (&gsi);
kono
parents:
diff changeset
844 while (gsi_end_p (gsi))
kono
parents:
diff changeset
845 gsi = gsi_start_bb (single_succ (gsi_bb (gsi)));
kono
parents:
diff changeset
846 }
kono
parents:
diff changeset
847 }
kono
parents:
diff changeset
848
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
849 /* Dump OpenACC loop LOOP, its children, and its siblings. */
111
kono
parents:
diff changeset
850
kono
parents:
diff changeset
851 static void
kono
parents:
diff changeset
852 dump_oacc_loop (FILE *file, oacc_loop *loop, int depth)
kono
parents:
diff changeset
853 {
kono
parents:
diff changeset
854 int ix;
kono
parents:
diff changeset
855
kono
parents:
diff changeset
856 fprintf (file, "%*sLoop %x(%x) %s:%u\n", depth * 2, "",
kono
parents:
diff changeset
857 loop->flags, loop->mask,
kono
parents:
diff changeset
858 LOCATION_FILE (loop->loc), LOCATION_LINE (loop->loc));
kono
parents:
diff changeset
859
kono
parents:
diff changeset
860 if (loop->marker)
kono
parents:
diff changeset
861 print_gimple_stmt (file, loop->marker, depth * 2);
kono
parents:
diff changeset
862
kono
parents:
diff changeset
863 if (loop->routine)
kono
parents:
diff changeset
864 fprintf (file, "%*sRoutine %s:%u:%s\n",
kono
parents:
diff changeset
865 depth * 2, "", DECL_SOURCE_FILE (loop->routine),
kono
parents:
diff changeset
866 DECL_SOURCE_LINE (loop->routine),
kono
parents:
diff changeset
867 IDENTIFIER_POINTER (DECL_NAME (loop->routine)));
kono
parents:
diff changeset
868
kono
parents:
diff changeset
869 for (ix = GOMP_DIM_GANG; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
870 if (loop->heads[ix])
kono
parents:
diff changeset
871 dump_oacc_loop_part (file, loop->heads[ix], depth, "Head", ix);
kono
parents:
diff changeset
872 for (ix = GOMP_DIM_MAX; ix--;)
kono
parents:
diff changeset
873 if (loop->tails[ix])
kono
parents:
diff changeset
874 dump_oacc_loop_part (file, loop->tails[ix], depth, "Tail", ix);
kono
parents:
diff changeset
875
kono
parents:
diff changeset
876 if (loop->child)
kono
parents:
diff changeset
877 dump_oacc_loop (file, loop->child, depth + 1);
kono
parents:
diff changeset
878 if (loop->sibling)
kono
parents:
diff changeset
879 dump_oacc_loop (file, loop->sibling, depth);
kono
parents:
diff changeset
880 }
kono
parents:
diff changeset
881
kono
parents:
diff changeset
882 void debug_oacc_loop (oacc_loop *);
kono
parents:
diff changeset
883
kono
parents:
diff changeset
884 /* Dump loops to stderr. */
kono
parents:
diff changeset
885
kono
parents:
diff changeset
886 DEBUG_FUNCTION void
kono
parents:
diff changeset
887 debug_oacc_loop (oacc_loop *loop)
kono
parents:
diff changeset
888 {
kono
parents:
diff changeset
889 dump_oacc_loop (stderr, loop, 0);
kono
parents:
diff changeset
890 }
kono
parents:
diff changeset
891
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
892 /* Provide diagnostics on OpenACC loop LOOP, its children, and its
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
893 siblings. */
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
894
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
895 static void
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
896 inform_oacc_loop (const oacc_loop *loop)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
897 {
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
898 const char *gang
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
899 = loop->mask & GOMP_DIM_MASK (GOMP_DIM_GANG) ? " gang" : "";
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
900 const char *worker
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
901 = loop->mask & GOMP_DIM_MASK (GOMP_DIM_WORKER) ? " worker" : "";
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
902 const char *vector
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
903 = loop->mask & GOMP_DIM_MASK (GOMP_DIM_VECTOR) ? " vector" : "";
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
904 const char *seq = loop->mask == 0 ? " seq" : "";
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
905 const dump_user_location_t loc
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
906 = dump_user_location_t::from_location_t (loop->loc);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
907 dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, loc,
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
908 "assigned OpenACC%s%s%s%s loop parallelism\n", gang, worker,
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
909 vector, seq);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
910
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
911 if (loop->child)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
912 inform_oacc_loop (loop->child);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
913 if (loop->sibling)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
914 inform_oacc_loop (loop->sibling);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
915 }
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
916
111
kono
parents:
diff changeset
917 /* DFS walk of basic blocks BB onwards, creating OpenACC loop
kono
parents:
diff changeset
918 structures as we go. By construction these loops are properly
kono
parents:
diff changeset
919 nested. */
kono
parents:
diff changeset
920
kono
parents:
diff changeset
921 static void
kono
parents:
diff changeset
922 oacc_loop_discover_walk (oacc_loop *loop, basic_block bb)
kono
parents:
diff changeset
923 {
kono
parents:
diff changeset
924 int marker = 0;
kono
parents:
diff changeset
925 int remaining = 0;
kono
parents:
diff changeset
926
kono
parents:
diff changeset
927 if (bb->flags & BB_VISITED)
kono
parents:
diff changeset
928 return;
kono
parents:
diff changeset
929
kono
parents:
diff changeset
930 follow:
kono
parents:
diff changeset
931 bb->flags |= BB_VISITED;
kono
parents:
diff changeset
932
kono
parents:
diff changeset
933 /* Scan for loop markers. */
kono
parents:
diff changeset
934 for (gimple_stmt_iterator gsi = gsi_start_bb (bb); !gsi_end_p (gsi);
kono
parents:
diff changeset
935 gsi_next (&gsi))
kono
parents:
diff changeset
936 {
kono
parents:
diff changeset
937 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
938
kono
parents:
diff changeset
939 if (!is_gimple_call (stmt))
kono
parents:
diff changeset
940 continue;
kono
parents:
diff changeset
941
kono
parents:
diff changeset
942 gcall *call = as_a <gcall *> (stmt);
kono
parents:
diff changeset
943
kono
parents:
diff changeset
944 /* If this is a routine, make a dummy loop for it. */
kono
parents:
diff changeset
945 if (tree decl = gimple_call_fndecl (call))
kono
parents:
diff changeset
946 if (tree attrs = oacc_get_fn_attrib (decl))
kono
parents:
diff changeset
947 {
kono
parents:
diff changeset
948 gcc_assert (!marker);
kono
parents:
diff changeset
949 new_oacc_loop_routine (loop, call, decl, attrs);
kono
parents:
diff changeset
950 }
kono
parents:
diff changeset
951
kono
parents:
diff changeset
952 if (!gimple_call_internal_p (call))
kono
parents:
diff changeset
953 continue;
kono
parents:
diff changeset
954
kono
parents:
diff changeset
955 switch (gimple_call_internal_fn (call))
kono
parents:
diff changeset
956 {
kono
parents:
diff changeset
957 default:
kono
parents:
diff changeset
958 break;
kono
parents:
diff changeset
959
kono
parents:
diff changeset
960 case IFN_GOACC_LOOP:
kono
parents:
diff changeset
961 case IFN_GOACC_TILE:
kono
parents:
diff changeset
962 /* Record the abstraction function, so we can manipulate it
kono
parents:
diff changeset
963 later. */
kono
parents:
diff changeset
964 loop->ifns.safe_push (call);
kono
parents:
diff changeset
965 break;
kono
parents:
diff changeset
966
kono
parents:
diff changeset
967 case IFN_UNIQUE:
kono
parents:
diff changeset
968 enum ifn_unique_kind kind
kono
parents:
diff changeset
969 = (enum ifn_unique_kind) (TREE_INT_CST_LOW
kono
parents:
diff changeset
970 (gimple_call_arg (call, 0)));
kono
parents:
diff changeset
971 if (kind == IFN_UNIQUE_OACC_HEAD_MARK
kono
parents:
diff changeset
972 || kind == IFN_UNIQUE_OACC_TAIL_MARK)
kono
parents:
diff changeset
973 {
kono
parents:
diff changeset
974 if (gimple_call_num_args (call) == 2)
kono
parents:
diff changeset
975 {
kono
parents:
diff changeset
976 gcc_assert (marker && !remaining);
kono
parents:
diff changeset
977 marker = 0;
kono
parents:
diff changeset
978 if (kind == IFN_UNIQUE_OACC_TAIL_MARK)
kono
parents:
diff changeset
979 loop = finish_oacc_loop (loop);
kono
parents:
diff changeset
980 else
kono
parents:
diff changeset
981 loop->head_end = call;
kono
parents:
diff changeset
982 }
kono
parents:
diff changeset
983 else
kono
parents:
diff changeset
984 {
kono
parents:
diff changeset
985 int count = TREE_INT_CST_LOW (gimple_call_arg (call, 2));
kono
parents:
diff changeset
986
kono
parents:
diff changeset
987 if (!marker)
kono
parents:
diff changeset
988 {
kono
parents:
diff changeset
989 if (kind == IFN_UNIQUE_OACC_HEAD_MARK)
kono
parents:
diff changeset
990 loop = new_oacc_loop (loop, call);
kono
parents:
diff changeset
991 remaining = count;
kono
parents:
diff changeset
992 }
kono
parents:
diff changeset
993 gcc_assert (count == remaining);
kono
parents:
diff changeset
994 if (remaining)
kono
parents:
diff changeset
995 {
kono
parents:
diff changeset
996 remaining--;
kono
parents:
diff changeset
997 if (kind == IFN_UNIQUE_OACC_HEAD_MARK)
kono
parents:
diff changeset
998 loop->heads[marker] = call;
kono
parents:
diff changeset
999 else
kono
parents:
diff changeset
1000 loop->tails[remaining] = call;
kono
parents:
diff changeset
1001 }
kono
parents:
diff changeset
1002 marker++;
kono
parents:
diff changeset
1003 }
kono
parents:
diff changeset
1004 }
kono
parents:
diff changeset
1005 }
kono
parents:
diff changeset
1006 }
kono
parents:
diff changeset
1007 if (remaining || marker)
kono
parents:
diff changeset
1008 {
kono
parents:
diff changeset
1009 bb = single_succ (bb);
kono
parents:
diff changeset
1010 gcc_assert (single_pred_p (bb) && !(bb->flags & BB_VISITED));
kono
parents:
diff changeset
1011 goto follow;
kono
parents:
diff changeset
1012 }
kono
parents:
diff changeset
1013
kono
parents:
diff changeset
1014 /* Walk successor blocks. */
kono
parents:
diff changeset
1015 edge e;
kono
parents:
diff changeset
1016 edge_iterator ei;
kono
parents:
diff changeset
1017
kono
parents:
diff changeset
1018 FOR_EACH_EDGE (e, ei, bb->succs)
kono
parents:
diff changeset
1019 oacc_loop_discover_walk (loop, e->dest);
kono
parents:
diff changeset
1020 }
kono
parents:
diff changeset
1021
kono
parents:
diff changeset
1022 /* LOOP is the first sibling. Reverse the order in place and return
kono
parents:
diff changeset
1023 the new first sibling. Recurse to child loops. */
kono
parents:
diff changeset
1024
kono
parents:
diff changeset
1025 static oacc_loop *
kono
parents:
diff changeset
1026 oacc_loop_sibling_nreverse (oacc_loop *loop)
kono
parents:
diff changeset
1027 {
kono
parents:
diff changeset
1028 oacc_loop *last = NULL;
kono
parents:
diff changeset
1029 do
kono
parents:
diff changeset
1030 {
kono
parents:
diff changeset
1031 if (loop->child)
kono
parents:
diff changeset
1032 loop->child = oacc_loop_sibling_nreverse (loop->child);
kono
parents:
diff changeset
1033
kono
parents:
diff changeset
1034 oacc_loop *next = loop->sibling;
kono
parents:
diff changeset
1035 loop->sibling = last;
kono
parents:
diff changeset
1036 last = loop;
kono
parents:
diff changeset
1037 loop = next;
kono
parents:
diff changeset
1038 }
kono
parents:
diff changeset
1039 while (loop);
kono
parents:
diff changeset
1040
kono
parents:
diff changeset
1041 return last;
kono
parents:
diff changeset
1042 }
kono
parents:
diff changeset
1043
kono
parents:
diff changeset
1044 /* Discover the OpenACC loops marked up by HEAD and TAIL markers for
kono
parents:
diff changeset
1045 the current function. */
kono
parents:
diff changeset
1046
kono
parents:
diff changeset
1047 static oacc_loop *
kono
parents:
diff changeset
1048 oacc_loop_discovery ()
kono
parents:
diff changeset
1049 {
kono
parents:
diff changeset
1050 /* Clear basic block flags, in particular BB_VISITED which we're going to use
kono
parents:
diff changeset
1051 in the following. */
kono
parents:
diff changeset
1052 clear_bb_flags ();
kono
parents:
diff changeset
1053
kono
parents:
diff changeset
1054 oacc_loop *top = new_oacc_loop_outer (current_function_decl);
kono
parents:
diff changeset
1055 oacc_loop_discover_walk (top, ENTRY_BLOCK_PTR_FOR_FN (cfun));
kono
parents:
diff changeset
1056
kono
parents:
diff changeset
1057 /* The siblings were constructed in reverse order, reverse them so
kono
parents:
diff changeset
1058 that diagnostics come out in an unsurprising order. */
kono
parents:
diff changeset
1059 top = oacc_loop_sibling_nreverse (top);
kono
parents:
diff changeset
1060
kono
parents:
diff changeset
1061 return top;
kono
parents:
diff changeset
1062 }
kono
parents:
diff changeset
1063
kono
parents:
diff changeset
1064 /* Transform the abstract internal function markers starting at FROM
kono
parents:
diff changeset
1065 to be for partitioning level LEVEL. Stop when we meet another HEAD
kono
parents:
diff changeset
1066 or TAIL marker. */
kono
parents:
diff changeset
1067
kono
parents:
diff changeset
1068 static void
kono
parents:
diff changeset
1069 oacc_loop_xform_head_tail (gcall *from, int level)
kono
parents:
diff changeset
1070 {
kono
parents:
diff changeset
1071 enum ifn_unique_kind kind
kono
parents:
diff changeset
1072 = (enum ifn_unique_kind) TREE_INT_CST_LOW (gimple_call_arg (from, 0));
kono
parents:
diff changeset
1073 tree replacement = build_int_cst (unsigned_type_node, level);
kono
parents:
diff changeset
1074
kono
parents:
diff changeset
1075 for (gimple_stmt_iterator gsi = gsi_for_stmt (from);;)
kono
parents:
diff changeset
1076 {
kono
parents:
diff changeset
1077 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
1078
kono
parents:
diff changeset
1079 if (gimple_call_internal_p (stmt, IFN_UNIQUE))
kono
parents:
diff changeset
1080 {
kono
parents:
diff changeset
1081 enum ifn_unique_kind k
kono
parents:
diff changeset
1082 = ((enum ifn_unique_kind)
kono
parents:
diff changeset
1083 TREE_INT_CST_LOW (gimple_call_arg (stmt, 0)));
kono
parents:
diff changeset
1084
kono
parents:
diff changeset
1085 if (k == IFN_UNIQUE_OACC_FORK || k == IFN_UNIQUE_OACC_JOIN)
kono
parents:
diff changeset
1086 *gimple_call_arg_ptr (stmt, 2) = replacement;
kono
parents:
diff changeset
1087 else if (k == kind && stmt != from)
kono
parents:
diff changeset
1088 break;
kono
parents:
diff changeset
1089 }
kono
parents:
diff changeset
1090 else if (gimple_call_internal_p (stmt, IFN_GOACC_REDUCTION))
kono
parents:
diff changeset
1091 *gimple_call_arg_ptr (stmt, 3) = replacement;
kono
parents:
diff changeset
1092
kono
parents:
diff changeset
1093 gsi_next (&gsi);
kono
parents:
diff changeset
1094 while (gsi_end_p (gsi))
kono
parents:
diff changeset
1095 gsi = gsi_start_bb (single_succ (gsi_bb (gsi)));
kono
parents:
diff changeset
1096 }
kono
parents:
diff changeset
1097 }
kono
parents:
diff changeset
1098
kono
parents:
diff changeset
1099 /* Process the discovered OpenACC loops, setting the correct
kono
parents:
diff changeset
1100 partitioning level etc. */
kono
parents:
diff changeset
1101
kono
parents:
diff changeset
1102 static void
kono
parents:
diff changeset
1103 oacc_loop_process (oacc_loop *loop)
kono
parents:
diff changeset
1104 {
kono
parents:
diff changeset
1105 if (loop->child)
kono
parents:
diff changeset
1106 oacc_loop_process (loop->child);
kono
parents:
diff changeset
1107
kono
parents:
diff changeset
1108 if (loop->mask && !loop->routine)
kono
parents:
diff changeset
1109 {
kono
parents:
diff changeset
1110 int ix;
kono
parents:
diff changeset
1111 tree mask_arg = build_int_cst (unsigned_type_node, loop->mask);
kono
parents:
diff changeset
1112 tree e_mask_arg = build_int_cst (unsigned_type_node, loop->e_mask);
kono
parents:
diff changeset
1113 tree chunk_arg = loop->chunk_size;
kono
parents:
diff changeset
1114 gcall *call;
kono
parents:
diff changeset
1115
kono
parents:
diff changeset
1116 for (ix = 0; loop->ifns.iterate (ix, &call); ix++)
kono
parents:
diff changeset
1117 switch (gimple_call_internal_fn (call))
kono
parents:
diff changeset
1118 {
kono
parents:
diff changeset
1119 case IFN_GOACC_LOOP:
kono
parents:
diff changeset
1120 {
kono
parents:
diff changeset
1121 bool is_e = gimple_call_arg (call, 5) == integer_minus_one_node;
kono
parents:
diff changeset
1122 gimple_call_set_arg (call, 5, is_e ? e_mask_arg : mask_arg);
kono
parents:
diff changeset
1123 if (!is_e)
kono
parents:
diff changeset
1124 gimple_call_set_arg (call, 4, chunk_arg);
kono
parents:
diff changeset
1125 }
kono
parents:
diff changeset
1126 break;
kono
parents:
diff changeset
1127
kono
parents:
diff changeset
1128 case IFN_GOACC_TILE:
kono
parents:
diff changeset
1129 gimple_call_set_arg (call, 3, mask_arg);
kono
parents:
diff changeset
1130 gimple_call_set_arg (call, 4, e_mask_arg);
kono
parents:
diff changeset
1131 break;
kono
parents:
diff changeset
1132
kono
parents:
diff changeset
1133 default:
kono
parents:
diff changeset
1134 gcc_unreachable ();
kono
parents:
diff changeset
1135 }
kono
parents:
diff changeset
1136
kono
parents:
diff changeset
1137 unsigned dim = GOMP_DIM_GANG;
kono
parents:
diff changeset
1138 unsigned mask = loop->mask | loop->e_mask;
kono
parents:
diff changeset
1139 for (ix = 0; ix != GOMP_DIM_MAX && mask; ix++)
kono
parents:
diff changeset
1140 {
kono
parents:
diff changeset
1141 while (!(GOMP_DIM_MASK (dim) & mask))
kono
parents:
diff changeset
1142 dim++;
kono
parents:
diff changeset
1143
kono
parents:
diff changeset
1144 oacc_loop_xform_head_tail (loop->heads[ix], dim);
kono
parents:
diff changeset
1145 oacc_loop_xform_head_tail (loop->tails[ix], dim);
kono
parents:
diff changeset
1146
kono
parents:
diff changeset
1147 mask ^= GOMP_DIM_MASK (dim);
kono
parents:
diff changeset
1148 }
kono
parents:
diff changeset
1149 }
kono
parents:
diff changeset
1150
kono
parents:
diff changeset
1151 if (loop->sibling)
kono
parents:
diff changeset
1152 oacc_loop_process (loop->sibling);
kono
parents:
diff changeset
1153 }
kono
parents:
diff changeset
1154
kono
parents:
diff changeset
1155 /* Walk the OpenACC loop heirarchy checking and assigning the
kono
parents:
diff changeset
1156 programmer-specified partitionings. OUTER_MASK is the partitioning
kono
parents:
diff changeset
1157 this loop is contained within. Return mask of partitioning
kono
parents:
diff changeset
1158 encountered. If any auto loops are discovered, set GOMP_DIM_MAX
kono
parents:
diff changeset
1159 bit. */
kono
parents:
diff changeset
1160
kono
parents:
diff changeset
1161 static unsigned
kono
parents:
diff changeset
1162 oacc_loop_fixed_partitions (oacc_loop *loop, unsigned outer_mask)
kono
parents:
diff changeset
1163 {
kono
parents:
diff changeset
1164 unsigned this_mask = loop->mask;
kono
parents:
diff changeset
1165 unsigned mask_all = 0;
kono
parents:
diff changeset
1166 bool noisy = true;
kono
parents:
diff changeset
1167
kono
parents:
diff changeset
1168 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
1169 /* When device_type is supported, we want the device compiler to be
kono
parents:
diff changeset
1170 noisy, if the loop parameters are device_type-specific. */
kono
parents:
diff changeset
1171 noisy = false;
kono
parents:
diff changeset
1172 #endif
kono
parents:
diff changeset
1173
kono
parents:
diff changeset
1174 if (!loop->routine)
kono
parents:
diff changeset
1175 {
kono
parents:
diff changeset
1176 bool auto_par = (loop->flags & OLF_AUTO) != 0;
kono
parents:
diff changeset
1177 bool seq_par = (loop->flags & OLF_SEQ) != 0;
kono
parents:
diff changeset
1178 bool tiling = (loop->flags & OLF_TILE) != 0;
kono
parents:
diff changeset
1179
kono
parents:
diff changeset
1180 this_mask = ((loop->flags >> OLF_DIM_BASE)
kono
parents:
diff changeset
1181 & (GOMP_DIM_MASK (GOMP_DIM_MAX) - 1));
kono
parents:
diff changeset
1182
kono
parents:
diff changeset
1183 /* Apply auto partitioning if this is a non-partitioned regular
kono
parents:
diff changeset
1184 loop, or (no more than) single axis tiled loop. */
kono
parents:
diff changeset
1185 bool maybe_auto
kono
parents:
diff changeset
1186 = !seq_par && this_mask == (tiling ? this_mask & -this_mask : 0);
kono
parents:
diff changeset
1187
kono
parents:
diff changeset
1188 if ((this_mask != 0) + auto_par + seq_par > 1)
kono
parents:
diff changeset
1189 {
kono
parents:
diff changeset
1190 if (noisy)
kono
parents:
diff changeset
1191 error_at (loop->loc,
kono
parents:
diff changeset
1192 seq_par
kono
parents:
diff changeset
1193 ? G_("%<seq%> overrides other OpenACC loop specifiers")
kono
parents:
diff changeset
1194 : G_("%<auto%> conflicts with other OpenACC loop "
kono
parents:
diff changeset
1195 "specifiers"));
kono
parents:
diff changeset
1196 maybe_auto = false;
kono
parents:
diff changeset
1197 loop->flags &= ~OLF_AUTO;
kono
parents:
diff changeset
1198 if (seq_par)
kono
parents:
diff changeset
1199 {
kono
parents:
diff changeset
1200 loop->flags
kono
parents:
diff changeset
1201 &= ~((GOMP_DIM_MASK (GOMP_DIM_MAX) - 1) << OLF_DIM_BASE);
kono
parents:
diff changeset
1202 this_mask = 0;
kono
parents:
diff changeset
1203 }
kono
parents:
diff changeset
1204 }
kono
parents:
diff changeset
1205
kono
parents:
diff changeset
1206 if (maybe_auto && (loop->flags & OLF_INDEPENDENT))
kono
parents:
diff changeset
1207 {
kono
parents:
diff changeset
1208 loop->flags |= OLF_AUTO;
kono
parents:
diff changeset
1209 mask_all |= GOMP_DIM_MASK (GOMP_DIM_MAX);
kono
parents:
diff changeset
1210 }
kono
parents:
diff changeset
1211 }
kono
parents:
diff changeset
1212
kono
parents:
diff changeset
1213 if (this_mask & outer_mask)
kono
parents:
diff changeset
1214 {
kono
parents:
diff changeset
1215 const oacc_loop *outer;
kono
parents:
diff changeset
1216 for (outer = loop->parent; outer; outer = outer->parent)
kono
parents:
diff changeset
1217 if ((outer->mask | outer->e_mask) & this_mask)
kono
parents:
diff changeset
1218 break;
kono
parents:
diff changeset
1219
kono
parents:
diff changeset
1220 if (noisy)
kono
parents:
diff changeset
1221 {
kono
parents:
diff changeset
1222 if (outer)
kono
parents:
diff changeset
1223 {
kono
parents:
diff changeset
1224 error_at (loop->loc,
kono
parents:
diff changeset
1225 loop->routine
kono
parents:
diff changeset
1226 ? G_("routine call uses same OpenACC parallelism"
kono
parents:
diff changeset
1227 " as containing loop")
kono
parents:
diff changeset
1228 : G_("inner loop uses same OpenACC parallelism"
kono
parents:
diff changeset
1229 " as containing loop"));
kono
parents:
diff changeset
1230 inform (outer->loc, "containing loop here");
kono
parents:
diff changeset
1231 }
kono
parents:
diff changeset
1232 else
kono
parents:
diff changeset
1233 error_at (loop->loc,
kono
parents:
diff changeset
1234 loop->routine
kono
parents:
diff changeset
1235 ? G_("routine call uses OpenACC parallelism disallowed"
kono
parents:
diff changeset
1236 " by containing routine")
kono
parents:
diff changeset
1237 : G_("loop uses OpenACC parallelism disallowed"
kono
parents:
diff changeset
1238 " by containing routine"));
kono
parents:
diff changeset
1239
kono
parents:
diff changeset
1240 if (loop->routine)
kono
parents:
diff changeset
1241 inform (DECL_SOURCE_LOCATION (loop->routine),
kono
parents:
diff changeset
1242 "routine %qD declared here", loop->routine);
kono
parents:
diff changeset
1243 }
kono
parents:
diff changeset
1244 this_mask &= ~outer_mask;
kono
parents:
diff changeset
1245 }
kono
parents:
diff changeset
1246 else
kono
parents:
diff changeset
1247 {
kono
parents:
diff changeset
1248 unsigned outermost = least_bit_hwi (this_mask);
kono
parents:
diff changeset
1249
kono
parents:
diff changeset
1250 if (outermost && outermost <= outer_mask)
kono
parents:
diff changeset
1251 {
kono
parents:
diff changeset
1252 if (noisy)
kono
parents:
diff changeset
1253 {
kono
parents:
diff changeset
1254 error_at (loop->loc,
kono
parents:
diff changeset
1255 "incorrectly nested OpenACC loop parallelism");
kono
parents:
diff changeset
1256
kono
parents:
diff changeset
1257 const oacc_loop *outer;
kono
parents:
diff changeset
1258 for (outer = loop->parent;
kono
parents:
diff changeset
1259 outer->flags && outer->flags < outermost;
kono
parents:
diff changeset
1260 outer = outer->parent)
kono
parents:
diff changeset
1261 continue;
kono
parents:
diff changeset
1262 inform (outer->loc, "containing loop here");
kono
parents:
diff changeset
1263 }
kono
parents:
diff changeset
1264
kono
parents:
diff changeset
1265 this_mask &= ~outermost;
kono
parents:
diff changeset
1266 }
kono
parents:
diff changeset
1267 }
kono
parents:
diff changeset
1268
kono
parents:
diff changeset
1269 mask_all |= this_mask;
kono
parents:
diff changeset
1270
kono
parents:
diff changeset
1271 if (loop->flags & OLF_TILE)
kono
parents:
diff changeset
1272 {
kono
parents:
diff changeset
1273 /* When tiling, vector goes to the element loop, and failing
kono
parents:
diff changeset
1274 that we put worker there. The std doesn't contemplate
kono
parents:
diff changeset
1275 specifying all three. We choose to put worker and vector on
kono
parents:
diff changeset
1276 the element loops in that case. */
kono
parents:
diff changeset
1277 unsigned this_e_mask = this_mask & GOMP_DIM_MASK (GOMP_DIM_VECTOR);
kono
parents:
diff changeset
1278 if (!this_e_mask || this_mask & GOMP_DIM_MASK (GOMP_DIM_GANG))
kono
parents:
diff changeset
1279 this_e_mask |= this_mask & GOMP_DIM_MASK (GOMP_DIM_WORKER);
kono
parents:
diff changeset
1280
kono
parents:
diff changeset
1281 loop->e_mask = this_e_mask;
kono
parents:
diff changeset
1282 this_mask ^= this_e_mask;
kono
parents:
diff changeset
1283 }
kono
parents:
diff changeset
1284
kono
parents:
diff changeset
1285 loop->mask = this_mask;
kono
parents:
diff changeset
1286
kono
parents:
diff changeset
1287 if (dump_file)
kono
parents:
diff changeset
1288 fprintf (dump_file, "Loop %s:%d user specified %d & %d\n",
kono
parents:
diff changeset
1289 LOCATION_FILE (loop->loc), LOCATION_LINE (loop->loc),
kono
parents:
diff changeset
1290 loop->mask, loop->e_mask);
kono
parents:
diff changeset
1291
kono
parents:
diff changeset
1292 if (loop->child)
kono
parents:
diff changeset
1293 {
kono
parents:
diff changeset
1294 unsigned tmp_mask = outer_mask | this_mask | loop->e_mask;
kono
parents:
diff changeset
1295 loop->inner = oacc_loop_fixed_partitions (loop->child, tmp_mask);
kono
parents:
diff changeset
1296 mask_all |= loop->inner;
kono
parents:
diff changeset
1297 }
kono
parents:
diff changeset
1298
kono
parents:
diff changeset
1299 if (loop->sibling)
kono
parents:
diff changeset
1300 mask_all |= oacc_loop_fixed_partitions (loop->sibling, outer_mask);
kono
parents:
diff changeset
1301
kono
parents:
diff changeset
1302 return mask_all;
kono
parents:
diff changeset
1303 }
kono
parents:
diff changeset
1304
kono
parents:
diff changeset
1305 /* Walk the OpenACC loop heirarchy to assign auto-partitioned loops.
kono
parents:
diff changeset
1306 OUTER_MASK is the partitioning this loop is contained within.
kono
parents:
diff changeset
1307 OUTER_ASSIGN is true if an outer loop is being auto-partitioned.
kono
parents:
diff changeset
1308 Return the cumulative partitioning used by this loop, siblings and
kono
parents:
diff changeset
1309 children. */
kono
parents:
diff changeset
1310
kono
parents:
diff changeset
1311 static unsigned
kono
parents:
diff changeset
1312 oacc_loop_auto_partitions (oacc_loop *loop, unsigned outer_mask,
kono
parents:
diff changeset
1313 bool outer_assign)
kono
parents:
diff changeset
1314 {
kono
parents:
diff changeset
1315 bool assign = (loop->flags & OLF_AUTO) && (loop->flags & OLF_INDEPENDENT);
kono
parents:
diff changeset
1316 bool noisy = true;
kono
parents:
diff changeset
1317 bool tiling = loop->flags & OLF_TILE;
kono
parents:
diff changeset
1318
kono
parents:
diff changeset
1319 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
1320 /* When device_type is supported, we want the device compiler to be
kono
parents:
diff changeset
1321 noisy, if the loop parameters are device_type-specific. */
kono
parents:
diff changeset
1322 noisy = false;
kono
parents:
diff changeset
1323 #endif
kono
parents:
diff changeset
1324
kono
parents:
diff changeset
1325 if (assign && (!outer_assign || loop->inner))
kono
parents:
diff changeset
1326 {
kono
parents:
diff changeset
1327 /* Allocate outermost and non-innermost loops at the outermost
kono
parents:
diff changeset
1328 non-innermost available level. */
kono
parents:
diff changeset
1329 unsigned this_mask = GOMP_DIM_MASK (GOMP_DIM_GANG);
kono
parents:
diff changeset
1330
kono
parents:
diff changeset
1331 /* Find the first outermost available partition. */
kono
parents:
diff changeset
1332 while (this_mask <= outer_mask)
kono
parents:
diff changeset
1333 this_mask <<= 1;
kono
parents:
diff changeset
1334
kono
parents:
diff changeset
1335 /* Grab two axes if tiling, and we've not assigned anything */
kono
parents:
diff changeset
1336 if (tiling && !(loop->mask | loop->e_mask))
kono
parents:
diff changeset
1337 this_mask |= this_mask << 1;
kono
parents:
diff changeset
1338
kono
parents:
diff changeset
1339 /* Prohibit the innermost partitioning at the moment. */
kono
parents:
diff changeset
1340 this_mask &= GOMP_DIM_MASK (GOMP_DIM_MAX - 1) - 1;
kono
parents:
diff changeset
1341
kono
parents:
diff changeset
1342 /* Don't use any dimension explicitly claimed by an inner loop. */
kono
parents:
diff changeset
1343 this_mask &= ~loop->inner;
kono
parents:
diff changeset
1344
kono
parents:
diff changeset
1345 if (tiling && !loop->e_mask)
kono
parents:
diff changeset
1346 {
kono
parents:
diff changeset
1347 /* If we got two axes, allocate the inner one to the element
kono
parents:
diff changeset
1348 loop. */
kono
parents:
diff changeset
1349 loop->e_mask = this_mask & (this_mask << 1);
kono
parents:
diff changeset
1350 this_mask ^= loop->e_mask;
kono
parents:
diff changeset
1351 }
kono
parents:
diff changeset
1352
kono
parents:
diff changeset
1353 loop->mask |= this_mask;
kono
parents:
diff changeset
1354 }
kono
parents:
diff changeset
1355
kono
parents:
diff changeset
1356 if (loop->child)
kono
parents:
diff changeset
1357 {
kono
parents:
diff changeset
1358 unsigned tmp_mask = outer_mask | loop->mask | loop->e_mask;
kono
parents:
diff changeset
1359 loop->inner = oacc_loop_auto_partitions (loop->child, tmp_mask,
kono
parents:
diff changeset
1360 outer_assign | assign);
kono
parents:
diff changeset
1361 }
kono
parents:
diff changeset
1362
kono
parents:
diff changeset
1363 if (assign && (!loop->mask || (tiling && !loop->e_mask) || !outer_assign))
kono
parents:
diff changeset
1364 {
kono
parents:
diff changeset
1365 /* Allocate the loop at the innermost available level. Note
kono
parents:
diff changeset
1366 that we do this even if we already assigned this loop the
kono
parents:
diff changeset
1367 outermost available level above. That way we'll partition
kono
parents:
diff changeset
1368 this along 2 axes, if they are available. */
kono
parents:
diff changeset
1369 unsigned this_mask = 0;
kono
parents:
diff changeset
1370
kono
parents:
diff changeset
1371 /* Determine the outermost partitioning used within this loop. */
kono
parents:
diff changeset
1372 this_mask = loop->inner | GOMP_DIM_MASK (GOMP_DIM_MAX);
kono
parents:
diff changeset
1373 this_mask = least_bit_hwi (this_mask);
kono
parents:
diff changeset
1374
kono
parents:
diff changeset
1375 /* Pick the partitioning just inside that one. */
kono
parents:
diff changeset
1376 this_mask >>= 1;
kono
parents:
diff changeset
1377
kono
parents:
diff changeset
1378 /* And avoid picking one use by an outer loop. */
kono
parents:
diff changeset
1379 this_mask &= ~outer_mask;
kono
parents:
diff changeset
1380
kono
parents:
diff changeset
1381 /* If tiling and we failed completely above, grab the next one
kono
parents:
diff changeset
1382 too. Making sure it doesn't hit an outer loop. */
kono
parents:
diff changeset
1383 if (tiling)
kono
parents:
diff changeset
1384 {
kono
parents:
diff changeset
1385 this_mask &= ~(loop->e_mask | loop->mask);
kono
parents:
diff changeset
1386 unsigned tile_mask = ((this_mask >> 1)
kono
parents:
diff changeset
1387 & ~(outer_mask | loop->e_mask | loop->mask));
kono
parents:
diff changeset
1388
kono
parents:
diff changeset
1389 if (tile_mask || loop->mask)
kono
parents:
diff changeset
1390 {
kono
parents:
diff changeset
1391 loop->e_mask |= this_mask;
kono
parents:
diff changeset
1392 this_mask = tile_mask;
kono
parents:
diff changeset
1393 }
kono
parents:
diff changeset
1394 if (!loop->e_mask && noisy)
kono
parents:
diff changeset
1395 warning_at (loop->loc, 0,
kono
parents:
diff changeset
1396 "insufficient partitioning available"
kono
parents:
diff changeset
1397 " to parallelize element loop");
kono
parents:
diff changeset
1398 }
kono
parents:
diff changeset
1399
kono
parents:
diff changeset
1400 loop->mask |= this_mask;
kono
parents:
diff changeset
1401 if (!loop->mask && noisy)
kono
parents:
diff changeset
1402 warning_at (loop->loc, 0,
kono
parents:
diff changeset
1403 tiling
kono
parents:
diff changeset
1404 ? G_("insufficient partitioning available"
kono
parents:
diff changeset
1405 " to parallelize tile loop")
kono
parents:
diff changeset
1406 : G_("insufficient partitioning available"
kono
parents:
diff changeset
1407 " to parallelize loop"));
kono
parents:
diff changeset
1408 }
kono
parents:
diff changeset
1409
kono
parents:
diff changeset
1410 if (assign && dump_file)
kono
parents:
diff changeset
1411 fprintf (dump_file, "Auto loop %s:%d assigned %d & %d\n",
kono
parents:
diff changeset
1412 LOCATION_FILE (loop->loc), LOCATION_LINE (loop->loc),
kono
parents:
diff changeset
1413 loop->mask, loop->e_mask);
kono
parents:
diff changeset
1414
kono
parents:
diff changeset
1415 unsigned inner_mask = 0;
kono
parents:
diff changeset
1416
kono
parents:
diff changeset
1417 if (loop->sibling)
kono
parents:
diff changeset
1418 inner_mask |= oacc_loop_auto_partitions (loop->sibling,
kono
parents:
diff changeset
1419 outer_mask, outer_assign);
kono
parents:
diff changeset
1420
kono
parents:
diff changeset
1421 inner_mask |= loop->inner | loop->mask | loop->e_mask;
kono
parents:
diff changeset
1422
kono
parents:
diff changeset
1423 return inner_mask;
kono
parents:
diff changeset
1424 }
kono
parents:
diff changeset
1425
kono
parents:
diff changeset
1426 /* Walk the OpenACC loop heirarchy to check and assign partitioning
kono
parents:
diff changeset
1427 axes. Return mask of partitioning. */
kono
parents:
diff changeset
1428
kono
parents:
diff changeset
1429 static unsigned
kono
parents:
diff changeset
1430 oacc_loop_partition (oacc_loop *loop, unsigned outer_mask)
kono
parents:
diff changeset
1431 {
kono
parents:
diff changeset
1432 unsigned mask_all = oacc_loop_fixed_partitions (loop, outer_mask);
kono
parents:
diff changeset
1433
kono
parents:
diff changeset
1434 if (mask_all & GOMP_DIM_MASK (GOMP_DIM_MAX))
kono
parents:
diff changeset
1435 {
kono
parents:
diff changeset
1436 mask_all ^= GOMP_DIM_MASK (GOMP_DIM_MAX);
kono
parents:
diff changeset
1437 mask_all |= oacc_loop_auto_partitions (loop, outer_mask, false);
kono
parents:
diff changeset
1438 }
kono
parents:
diff changeset
1439 return mask_all;
kono
parents:
diff changeset
1440 }
kono
parents:
diff changeset
1441
kono
parents:
diff changeset
1442 /* Default fork/join early expander. Delete the function calls if
kono
parents:
diff changeset
1443 there is no RTL expander. */
kono
parents:
diff changeset
1444
kono
parents:
diff changeset
1445 bool
kono
parents:
diff changeset
1446 default_goacc_fork_join (gcall *ARG_UNUSED (call),
kono
parents:
diff changeset
1447 const int *ARG_UNUSED (dims), bool is_fork)
kono
parents:
diff changeset
1448 {
kono
parents:
diff changeset
1449 if (is_fork)
kono
parents:
diff changeset
1450 return targetm.have_oacc_fork ();
kono
parents:
diff changeset
1451 else
kono
parents:
diff changeset
1452 return targetm.have_oacc_join ();
kono
parents:
diff changeset
1453 }
kono
parents:
diff changeset
1454
kono
parents:
diff changeset
1455 /* Default goacc.reduction early expander.
kono
parents:
diff changeset
1456
kono
parents:
diff changeset
1457 LHS-opt = IFN_REDUCTION (KIND, RES_PTR, VAR, LEVEL, OP, OFFSET)
kono
parents:
diff changeset
1458 If RES_PTR is not integer-zerop:
kono
parents:
diff changeset
1459 SETUP - emit 'LHS = *RES_PTR', LHS = NULL
kono
parents:
diff changeset
1460 TEARDOWN - emit '*RES_PTR = VAR'
kono
parents:
diff changeset
1461 If LHS is not NULL
kono
parents:
diff changeset
1462 emit 'LHS = VAR' */
kono
parents:
diff changeset
1463
kono
parents:
diff changeset
1464 void
kono
parents:
diff changeset
1465 default_goacc_reduction (gcall *call)
kono
parents:
diff changeset
1466 {
kono
parents:
diff changeset
1467 unsigned code = (unsigned)TREE_INT_CST_LOW (gimple_call_arg (call, 0));
kono
parents:
diff changeset
1468 gimple_stmt_iterator gsi = gsi_for_stmt (call);
kono
parents:
diff changeset
1469 tree lhs = gimple_call_lhs (call);
kono
parents:
diff changeset
1470 tree var = gimple_call_arg (call, 2);
kono
parents:
diff changeset
1471 gimple_seq seq = NULL;
kono
parents:
diff changeset
1472
kono
parents:
diff changeset
1473 if (code == IFN_GOACC_REDUCTION_SETUP
kono
parents:
diff changeset
1474 || code == IFN_GOACC_REDUCTION_TEARDOWN)
kono
parents:
diff changeset
1475 {
kono
parents:
diff changeset
1476 /* Setup and Teardown need to copy from/to the receiver object,
kono
parents:
diff changeset
1477 if there is one. */
kono
parents:
diff changeset
1478 tree ref_to_res = gimple_call_arg (call, 1);
kono
parents:
diff changeset
1479
kono
parents:
diff changeset
1480 if (!integer_zerop (ref_to_res))
kono
parents:
diff changeset
1481 {
kono
parents:
diff changeset
1482 tree dst = build_simple_mem_ref (ref_to_res);
kono
parents:
diff changeset
1483 tree src = var;
kono
parents:
diff changeset
1484
kono
parents:
diff changeset
1485 if (code == IFN_GOACC_REDUCTION_SETUP)
kono
parents:
diff changeset
1486 {
kono
parents:
diff changeset
1487 src = dst;
kono
parents:
diff changeset
1488 dst = lhs;
kono
parents:
diff changeset
1489 lhs = NULL;
kono
parents:
diff changeset
1490 }
kono
parents:
diff changeset
1491 gimple_seq_add_stmt (&seq, gimple_build_assign (dst, src));
kono
parents:
diff changeset
1492 }
kono
parents:
diff changeset
1493 }
kono
parents:
diff changeset
1494
kono
parents:
diff changeset
1495 /* Copy VAR to LHS, if there is an LHS. */
kono
parents:
diff changeset
1496 if (lhs)
kono
parents:
diff changeset
1497 gimple_seq_add_stmt (&seq, gimple_build_assign (lhs, var));
kono
parents:
diff changeset
1498
kono
parents:
diff changeset
1499 gsi_replace_with_seq (&gsi, seq, true);
kono
parents:
diff changeset
1500 }
kono
parents:
diff changeset
1501
kono
parents:
diff changeset
1502 /* Main entry point for oacc transformations which run on the device
kono
parents:
diff changeset
1503 compiler after LTO, so we know what the target device is at this
kono
parents:
diff changeset
1504 point (including the host fallback). */
kono
parents:
diff changeset
1505
kono
parents:
diff changeset
1506 static unsigned int
kono
parents:
diff changeset
1507 execute_oacc_device_lower ()
kono
parents:
diff changeset
1508 {
kono
parents:
diff changeset
1509 tree attrs = oacc_get_fn_attrib (current_function_decl);
kono
parents:
diff changeset
1510
kono
parents:
diff changeset
1511 if (!attrs)
kono
parents:
diff changeset
1512 /* Not an offloaded function. */
kono
parents:
diff changeset
1513 return 0;
kono
parents:
diff changeset
1514
kono
parents:
diff changeset
1515 /* Parse the default dim argument exactly once. */
kono
parents:
diff changeset
1516 if ((const void *)flag_openacc_dims != &flag_openacc_dims)
kono
parents:
diff changeset
1517 {
kono
parents:
diff changeset
1518 oacc_parse_default_dims (flag_openacc_dims);
kono
parents:
diff changeset
1519 flag_openacc_dims = (char *)&flag_openacc_dims;
kono
parents:
diff changeset
1520 }
kono
parents:
diff changeset
1521
kono
parents:
diff changeset
1522 bool is_oacc_kernels
kono
parents:
diff changeset
1523 = (lookup_attribute ("oacc kernels",
kono
parents:
diff changeset
1524 DECL_ATTRIBUTES (current_function_decl)) != NULL);
kono
parents:
diff changeset
1525 bool is_oacc_kernels_parallelized
kono
parents:
diff changeset
1526 = (lookup_attribute ("oacc kernels parallelized",
kono
parents:
diff changeset
1527 DECL_ATTRIBUTES (current_function_decl)) != NULL);
kono
parents:
diff changeset
1528
kono
parents:
diff changeset
1529 /* Unparallelized OpenACC kernels constructs must get launched as 1 x 1 x 1
kono
parents:
diff changeset
1530 kernels, so remove the parallelism dimensions function attributes
kono
parents:
diff changeset
1531 potentially set earlier on. */
kono
parents:
diff changeset
1532 if (is_oacc_kernels && !is_oacc_kernels_parallelized)
kono
parents:
diff changeset
1533 {
kono
parents:
diff changeset
1534 oacc_set_fn_attrib (current_function_decl, NULL, NULL);
kono
parents:
diff changeset
1535 attrs = oacc_get_fn_attrib (current_function_decl);
kono
parents:
diff changeset
1536 }
kono
parents:
diff changeset
1537
kono
parents:
diff changeset
1538 /* Discover, partition and process the loops. */
kono
parents:
diff changeset
1539 oacc_loop *loops = oacc_loop_discovery ();
kono
parents:
diff changeset
1540 int fn_level = oacc_fn_attrib_level (attrs);
kono
parents:
diff changeset
1541
kono
parents:
diff changeset
1542 if (dump_file)
kono
parents:
diff changeset
1543 {
kono
parents:
diff changeset
1544 if (fn_level >= 0)
kono
parents:
diff changeset
1545 fprintf (dump_file, "Function is OpenACC routine level %d\n",
kono
parents:
diff changeset
1546 fn_level);
kono
parents:
diff changeset
1547 else if (is_oacc_kernels)
kono
parents:
diff changeset
1548 fprintf (dump_file, "Function is %s OpenACC kernels offload\n",
kono
parents:
diff changeset
1549 (is_oacc_kernels_parallelized
kono
parents:
diff changeset
1550 ? "parallelized" : "unparallelized"));
kono
parents:
diff changeset
1551 else
kono
parents:
diff changeset
1552 fprintf (dump_file, "Function is OpenACC parallel offload\n");
kono
parents:
diff changeset
1553 }
kono
parents:
diff changeset
1554
kono
parents:
diff changeset
1555 unsigned outer_mask = fn_level >= 0 ? GOMP_DIM_MASK (fn_level) - 1 : 0;
kono
parents:
diff changeset
1556 unsigned used_mask = oacc_loop_partition (loops, outer_mask);
kono
parents:
diff changeset
1557 /* OpenACC kernels constructs are special: they currently don't use the
kono
parents:
diff changeset
1558 generic oacc_loop infrastructure and attribute/dimension processing. */
kono
parents:
diff changeset
1559 if (is_oacc_kernels && is_oacc_kernels_parallelized)
kono
parents:
diff changeset
1560 {
kono
parents:
diff changeset
1561 /* Parallelized OpenACC kernels constructs use gang parallelism. See
kono
parents:
diff changeset
1562 also tree-parloops.c:create_parallel_loop. */
kono
parents:
diff changeset
1563 used_mask |= GOMP_DIM_MASK (GOMP_DIM_GANG);
kono
parents:
diff changeset
1564 }
kono
parents:
diff changeset
1565
kono
parents:
diff changeset
1566 int dims[GOMP_DIM_MAX];
kono
parents:
diff changeset
1567 oacc_validate_dims (current_function_decl, attrs, dims, fn_level, used_mask);
kono
parents:
diff changeset
1568
kono
parents:
diff changeset
1569 if (dump_file)
kono
parents:
diff changeset
1570 {
kono
parents:
diff changeset
1571 const char *comma = "Compute dimensions [";
kono
parents:
diff changeset
1572 for (int ix = 0; ix != GOMP_DIM_MAX; ix++, comma = ", ")
kono
parents:
diff changeset
1573 fprintf (dump_file, "%s%d", comma, dims[ix]);
kono
parents:
diff changeset
1574 fprintf (dump_file, "]\n");
kono
parents:
diff changeset
1575 }
kono
parents:
diff changeset
1576
kono
parents:
diff changeset
1577 oacc_loop_process (loops);
kono
parents:
diff changeset
1578 if (dump_file)
kono
parents:
diff changeset
1579 {
kono
parents:
diff changeset
1580 fprintf (dump_file, "OpenACC loops\n");
kono
parents:
diff changeset
1581 dump_oacc_loop (dump_file, loops, 0);
kono
parents:
diff changeset
1582 fprintf (dump_file, "\n");
kono
parents:
diff changeset
1583 }
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1584 if (dump_enabled_p ())
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1585 {
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1586 oacc_loop *l = loops;
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1587 /* OpenACC kernels constructs are special: they currently don't use the
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1588 generic oacc_loop infrastructure. */
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1589 if (is_oacc_kernels)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1590 {
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1591 /* Create a fake oacc_loop for diagnostic purposes. */
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1592 l = new_oacc_loop_raw (NULL,
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1593 DECL_SOURCE_LOCATION (current_function_decl));
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1594 l->mask = used_mask;
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1595 }
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1596 else
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1597 {
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1598 /* Skip the outermost, dummy OpenACC loop */
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1599 l = l->child;
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1600 }
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1601 if (l)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1602 inform_oacc_loop (l);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1603 if (is_oacc_kernels)
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1604 free_oacc_loop (l);
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1605 }
111
kono
parents:
diff changeset
1606
kono
parents:
diff changeset
1607 /* Offloaded targets may introduce new basic blocks, which require
kono
parents:
diff changeset
1608 dominance information to update SSA. */
kono
parents:
diff changeset
1609 calculate_dominance_info (CDI_DOMINATORS);
kono
parents:
diff changeset
1610
kono
parents:
diff changeset
1611 /* Now lower internal loop functions to target-specific code
kono
parents:
diff changeset
1612 sequences. */
kono
parents:
diff changeset
1613 basic_block bb;
kono
parents:
diff changeset
1614 FOR_ALL_BB_FN (bb, cfun)
kono
parents:
diff changeset
1615 for (gimple_stmt_iterator gsi = gsi_start_bb (bb); !gsi_end_p (gsi);)
kono
parents:
diff changeset
1616 {
kono
parents:
diff changeset
1617 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
1618 if (!is_gimple_call (stmt))
kono
parents:
diff changeset
1619 {
kono
parents:
diff changeset
1620 gsi_next (&gsi);
kono
parents:
diff changeset
1621 continue;
kono
parents:
diff changeset
1622 }
kono
parents:
diff changeset
1623
kono
parents:
diff changeset
1624 gcall *call = as_a <gcall *> (stmt);
kono
parents:
diff changeset
1625 if (!gimple_call_internal_p (call))
kono
parents:
diff changeset
1626 {
kono
parents:
diff changeset
1627 gsi_next (&gsi);
kono
parents:
diff changeset
1628 continue;
kono
parents:
diff changeset
1629 }
kono
parents:
diff changeset
1630
kono
parents:
diff changeset
1631 /* Rewind to allow rescan. */
kono
parents:
diff changeset
1632 gsi_prev (&gsi);
kono
parents:
diff changeset
1633 bool rescan = false, remove = false;
kono
parents:
diff changeset
1634 enum internal_fn ifn_code = gimple_call_internal_fn (call);
kono
parents:
diff changeset
1635
kono
parents:
diff changeset
1636 switch (ifn_code)
kono
parents:
diff changeset
1637 {
kono
parents:
diff changeset
1638 default: break;
kono
parents:
diff changeset
1639
kono
parents:
diff changeset
1640 case IFN_GOACC_TILE:
kono
parents:
diff changeset
1641 oacc_xform_tile (call);
kono
parents:
diff changeset
1642 rescan = true;
kono
parents:
diff changeset
1643 break;
kono
parents:
diff changeset
1644
kono
parents:
diff changeset
1645 case IFN_GOACC_LOOP:
kono
parents:
diff changeset
1646 oacc_xform_loop (call);
kono
parents:
diff changeset
1647 rescan = true;
kono
parents:
diff changeset
1648 break;
kono
parents:
diff changeset
1649
kono
parents:
diff changeset
1650 case IFN_GOACC_REDUCTION:
kono
parents:
diff changeset
1651 /* Mark the function for SSA renaming. */
kono
parents:
diff changeset
1652 mark_virtual_operands_for_renaming (cfun);
kono
parents:
diff changeset
1653
kono
parents:
diff changeset
1654 /* If the level is -1, this ended up being an unused
kono
parents:
diff changeset
1655 axis. Handle as a default. */
kono
parents:
diff changeset
1656 if (integer_minus_onep (gimple_call_arg (call, 3)))
kono
parents:
diff changeset
1657 default_goacc_reduction (call);
kono
parents:
diff changeset
1658 else
kono
parents:
diff changeset
1659 targetm.goacc.reduction (call);
kono
parents:
diff changeset
1660 rescan = true;
kono
parents:
diff changeset
1661 break;
kono
parents:
diff changeset
1662
kono
parents:
diff changeset
1663 case IFN_UNIQUE:
kono
parents:
diff changeset
1664 {
kono
parents:
diff changeset
1665 enum ifn_unique_kind kind
kono
parents:
diff changeset
1666 = ((enum ifn_unique_kind)
kono
parents:
diff changeset
1667 TREE_INT_CST_LOW (gimple_call_arg (call, 0)));
kono
parents:
diff changeset
1668
kono
parents:
diff changeset
1669 switch (kind)
kono
parents:
diff changeset
1670 {
kono
parents:
diff changeset
1671 default:
kono
parents:
diff changeset
1672 break;
kono
parents:
diff changeset
1673
kono
parents:
diff changeset
1674 case IFN_UNIQUE_OACC_FORK:
kono
parents:
diff changeset
1675 case IFN_UNIQUE_OACC_JOIN:
kono
parents:
diff changeset
1676 if (integer_minus_onep (gimple_call_arg (call, 2)))
kono
parents:
diff changeset
1677 remove = true;
kono
parents:
diff changeset
1678 else if (!targetm.goacc.fork_join
kono
parents:
diff changeset
1679 (call, dims, kind == IFN_UNIQUE_OACC_FORK))
kono
parents:
diff changeset
1680 remove = true;
kono
parents:
diff changeset
1681 break;
kono
parents:
diff changeset
1682
kono
parents:
diff changeset
1683 case IFN_UNIQUE_OACC_HEAD_MARK:
kono
parents:
diff changeset
1684 case IFN_UNIQUE_OACC_TAIL_MARK:
kono
parents:
diff changeset
1685 remove = true;
kono
parents:
diff changeset
1686 break;
kono
parents:
diff changeset
1687 }
kono
parents:
diff changeset
1688 break;
kono
parents:
diff changeset
1689 }
kono
parents:
diff changeset
1690 }
kono
parents:
diff changeset
1691
kono
parents:
diff changeset
1692 if (gsi_end_p (gsi))
kono
parents:
diff changeset
1693 /* We rewound past the beginning of the BB. */
kono
parents:
diff changeset
1694 gsi = gsi_start_bb (bb);
kono
parents:
diff changeset
1695 else
kono
parents:
diff changeset
1696 /* Undo the rewind. */
kono
parents:
diff changeset
1697 gsi_next (&gsi);
kono
parents:
diff changeset
1698
kono
parents:
diff changeset
1699 if (remove)
kono
parents:
diff changeset
1700 {
kono
parents:
diff changeset
1701 if (gimple_vdef (call))
kono
parents:
diff changeset
1702 replace_uses_by (gimple_vdef (call), gimple_vuse (call));
kono
parents:
diff changeset
1703 if (gimple_call_lhs (call))
kono
parents:
diff changeset
1704 {
kono
parents:
diff changeset
1705 /* Propagate the data dependency var. */
kono
parents:
diff changeset
1706 gimple *ass = gimple_build_assign (gimple_call_lhs (call),
kono
parents:
diff changeset
1707 gimple_call_arg (call, 1));
kono
parents:
diff changeset
1708 gsi_replace (&gsi, ass, false);
kono
parents:
diff changeset
1709 }
kono
parents:
diff changeset
1710 else
kono
parents:
diff changeset
1711 gsi_remove (&gsi, true);
kono
parents:
diff changeset
1712 }
kono
parents:
diff changeset
1713 else if (!rescan)
kono
parents:
diff changeset
1714 /* If not rescanning, advance over the call. */
kono
parents:
diff changeset
1715 gsi_next (&gsi);
kono
parents:
diff changeset
1716 }
kono
parents:
diff changeset
1717
kono
parents:
diff changeset
1718 free_oacc_loop (loops);
kono
parents:
diff changeset
1719
kono
parents:
diff changeset
1720 return 0;
kono
parents:
diff changeset
1721 }
kono
parents:
diff changeset
1722
kono
parents:
diff changeset
1723 /* Default launch dimension validator. Force everything to 1. A
kono
parents:
diff changeset
1724 backend that wants to provide larger dimensions must override this
kono
parents:
diff changeset
1725 hook. */
kono
parents:
diff changeset
1726
kono
parents:
diff changeset
1727 bool
kono
parents:
diff changeset
1728 default_goacc_validate_dims (tree ARG_UNUSED (decl), int *dims,
145
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1729 int ARG_UNUSED (fn_level),
1830386684a0 gcc-9.2.0
anatofuz
parents: 131
diff changeset
1730 unsigned ARG_UNUSED (used))
111
kono
parents:
diff changeset
1731 {
kono
parents:
diff changeset
1732 bool changed = false;
kono
parents:
diff changeset
1733
kono
parents:
diff changeset
1734 for (unsigned ix = 0; ix != GOMP_DIM_MAX; ix++)
kono
parents:
diff changeset
1735 {
kono
parents:
diff changeset
1736 if (dims[ix] != 1)
kono
parents:
diff changeset
1737 {
kono
parents:
diff changeset
1738 dims[ix] = 1;
kono
parents:
diff changeset
1739 changed = true;
kono
parents:
diff changeset
1740 }
kono
parents:
diff changeset
1741 }
kono
parents:
diff changeset
1742
kono
parents:
diff changeset
1743 return changed;
kono
parents:
diff changeset
1744 }
kono
parents:
diff changeset
1745
kono
parents:
diff changeset
1746 /* Default dimension bound is unknown on accelerator and 1 on host. */
kono
parents:
diff changeset
1747
kono
parents:
diff changeset
1748 int
kono
parents:
diff changeset
1749 default_goacc_dim_limit (int ARG_UNUSED (axis))
kono
parents:
diff changeset
1750 {
kono
parents:
diff changeset
1751 #ifdef ACCEL_COMPILER
kono
parents:
diff changeset
1752 return 0;
kono
parents:
diff changeset
1753 #else
kono
parents:
diff changeset
1754 return 1;
kono
parents:
diff changeset
1755 #endif
kono
parents:
diff changeset
1756 }
kono
parents:
diff changeset
1757
kono
parents:
diff changeset
1758 namespace {
kono
parents:
diff changeset
1759
kono
parents:
diff changeset
1760 const pass_data pass_data_oacc_device_lower =
kono
parents:
diff changeset
1761 {
kono
parents:
diff changeset
1762 GIMPLE_PASS, /* type */
kono
parents:
diff changeset
1763 "oaccdevlow", /* name */
kono
parents:
diff changeset
1764 OPTGROUP_OMP, /* optinfo_flags */
kono
parents:
diff changeset
1765 TV_NONE, /* tv_id */
kono
parents:
diff changeset
1766 PROP_cfg, /* properties_required */
kono
parents:
diff changeset
1767 0 /* Possibly PROP_gimple_eomp. */, /* properties_provided */
kono
parents:
diff changeset
1768 0, /* properties_destroyed */
kono
parents:
diff changeset
1769 0, /* todo_flags_start */
kono
parents:
diff changeset
1770 TODO_update_ssa | TODO_cleanup_cfg, /* todo_flags_finish */
kono
parents:
diff changeset
1771 };
kono
parents:
diff changeset
1772
kono
parents:
diff changeset
1773 class pass_oacc_device_lower : public gimple_opt_pass
kono
parents:
diff changeset
1774 {
kono
parents:
diff changeset
1775 public:
kono
parents:
diff changeset
1776 pass_oacc_device_lower (gcc::context *ctxt)
kono
parents:
diff changeset
1777 : gimple_opt_pass (pass_data_oacc_device_lower, ctxt)
kono
parents:
diff changeset
1778 {}
kono
parents:
diff changeset
1779
kono
parents:
diff changeset
1780 /* opt_pass methods: */
kono
parents:
diff changeset
1781 virtual bool gate (function *) { return flag_openacc; };
kono
parents:
diff changeset
1782
kono
parents:
diff changeset
1783 virtual unsigned int execute (function *)
kono
parents:
diff changeset
1784 {
kono
parents:
diff changeset
1785 return execute_oacc_device_lower ();
kono
parents:
diff changeset
1786 }
kono
parents:
diff changeset
1787
kono
parents:
diff changeset
1788 }; // class pass_oacc_device_lower
kono
parents:
diff changeset
1789
kono
parents:
diff changeset
1790 } // anon namespace
kono
parents:
diff changeset
1791
kono
parents:
diff changeset
1792 gimple_opt_pass *
kono
parents:
diff changeset
1793 make_pass_oacc_device_lower (gcc::context *ctxt)
kono
parents:
diff changeset
1794 {
kono
parents:
diff changeset
1795 return new pass_oacc_device_lower (ctxt);
kono
parents:
diff changeset
1796 }
kono
parents:
diff changeset
1797
kono
parents:
diff changeset
1798
kono
parents:
diff changeset
/* Rewrite GOMP_SIMT_ENTER_ALLOC call given by GSI and remove the preceding
   GOMP_SIMT_ENTER call identifying the privatized variables, which are
   turned to structure fields and receive a DECL_VALUE_EXPR accordingly.
   Set *REGIMPLIFY to true, except if no privatized variables were seen.  */

static void
ompdevlow_adjust_simt_enter (gimple_stmt_iterator *gsi, bool *regimplify)
{
  /* SIMTREC is the result of the allocation call; SIMDUID is its first
     argument, which must be defined by a GOMP_SIMT_ENTER call.  */
  gimple *alloc_stmt = gsi_stmt (*gsi);
  tree simtrec = gimple_call_lhs (alloc_stmt);
  tree simduid = gimple_call_arg (alloc_stmt, 0);
  gimple *enter_stmt = SSA_NAME_DEF_STMT (simduid);
  gcc_assert (gimple_call_internal_p (enter_stmt, IFN_GOMP_SIMT_ENTER));

  /* Create an artificial, nameless record type for the privatized
     variables and make SIMTREC a pointer to it.  */
  tree rectype = lang_hooks.types.make_type (RECORD_TYPE);
  TYPE_ARTIFICIAL (rectype) = TYPE_NAMELESS (rectype) = 1;
  TREE_ADDRESSABLE (rectype) = 1;
  TREE_TYPE (simtrec) = build_pointer_type (rectype);

  /* Arguments from index 1 onwards are the addresses of the privatized
     variables; argument 0 is handled separately below.  */
  for (unsigned i = 1; i < gimple_call_num_args (enter_stmt); i++)
    {
      tree *argp = gimple_call_arg_ptr (enter_stmt, i);
      /* Null pointer arguments carry no variable; skip them.  */
      if (*argp == null_pointer_node)
        continue;
      gcc_assert (TREE_CODE (*argp) == ADDR_EXPR
                  && VAR_P (TREE_OPERAND (*argp, 0)));
      tree var = TREE_OPERAND (*argp, 0);

      /* Create a field mirroring VAR's location, name, type, alignment
         and volatility.  */
      tree field = build_decl (DECL_SOURCE_LOCATION (var), FIELD_DECL,
                               DECL_NAME (var), TREE_TYPE (var));
      SET_DECL_ALIGN (field, DECL_ALIGN (var));
      DECL_USER_ALIGN (field) = DECL_USER_ALIGN (var);
      TREE_THIS_VOLATILE (field) = TREE_THIS_VOLATILE (var);

      insert_field_into_struct (rectype, field);

      /* Give VAR the value expression SIMTREC->FIELD.  */
      tree t = build_simple_mem_ref (simtrec);
      t = build3 (COMPONENT_REF, TREE_TYPE (var), t, field, NULL);
      TREE_THIS_VOLATILE (t) = TREE_THIS_VOLATILE (var);
      SET_DECL_VALUE_EXPR (var, t);
      DECL_HAS_VALUE_EXPR_P (var) = 1;
      /* At least one variable was privatized, so the caller has
         statements to regimplify.  */
      *regimplify = true;
    }

  /* With all fields in place, lay out the record and fetch its size and
     alignment in units.  */
  layout_type (rectype);
  tree size = TYPE_SIZE_UNIT (rectype);
  tree align = build_int_cst (TREE_TYPE (size), TYPE_ALIGN_UNIT (rectype));

  /* Replace the allocation call by one that takes the record's size and
     alignment, keeping SIMTREC as its result.  */
  alloc_stmt
    = gimple_build_call_internal (IFN_GOMP_SIMT_ENTER_ALLOC, 2, size, align);
  gimple_call_set_lhs (alloc_stmt, simtrec);
  gsi_replace (gsi, alloc_stmt, false);

  /* Replace the GOMP_SIMT_ENTER call by a plain copy of its first
     argument into SIMDUID.  */
  gimple_stmt_iterator enter_gsi = gsi_for_stmt (enter_stmt);
  enter_stmt = gimple_build_assign (simduid, gimple_call_arg (enter_stmt, 0));
  gsi_replace (&enter_gsi, enter_stmt, false);

  /* If SIMTREC has a single use, it must be the GOMP_SIMT_EXIT call;
     insert a clobber of the whole record right before it.  Otherwise
     SIMTREC is expected to be unused.  */
  use_operand_p use;
  gimple *exit_stmt;
  if (single_imm_use (simtrec, &use, &exit_stmt))
    {
      gcc_assert (gimple_call_internal_p (exit_stmt, IFN_GOMP_SIMT_EXIT));
      gimple_stmt_iterator exit_gsi = gsi_for_stmt (exit_stmt);
      tree clobber = build_clobber (rectype);
      exit_stmt = gimple_build_assign (build_simple_mem_ref (simtrec), clobber);
      gsi_insert_before (&exit_gsi, exit_stmt, GSI_SAME_STMT);
    }
  else
    gcc_checking_assert (has_zero_uses (simtrec));
}
kono
parents:
diff changeset
1865
kono
parents:
diff changeset
1866 /* Callback for walk_gimple_stmt used to scan for SIMT-privatized variables. */
kono
parents:
diff changeset
1867
kono
parents:
diff changeset
1868 static tree
kono
parents:
diff changeset
1869 find_simtpriv_var_op (tree *tp, int *walk_subtrees, void *)
kono
parents:
diff changeset
1870 {
kono
parents:
diff changeset
1871 tree t = *tp;
kono
parents:
diff changeset
1872
kono
parents:
diff changeset
1873 if (VAR_P (t)
kono
parents:
diff changeset
1874 && DECL_HAS_VALUE_EXPR_P (t)
kono
parents:
diff changeset
1875 && lookup_attribute ("omp simt private", DECL_ATTRIBUTES (t)))
kono
parents:
diff changeset
1876 {
kono
parents:
diff changeset
1877 *walk_subtrees = 0;
kono
parents:
diff changeset
1878 return t;
kono
parents:
diff changeset
1879 }
kono
parents:
diff changeset
1880 return NULL_TREE;
kono
parents:
diff changeset
1881 }
kono
parents:
diff changeset
1882
kono
parents:
diff changeset
/* Cleanup uses of SIMT placeholder internal functions: on non-SIMT targets,
   VF is 1 and LANE is 0; on SIMT targets, VF is folded to a constant, and
   LANE is kept to be expanded to RTL later on.  Also cleanup all other SIMT
   internal functions on non-SIMT targets, and likewise some SIMD internal
   functions on SIMT targets.  Always returns 0.  */

static unsigned int
execute_omp_device_lower ()
{
  /* VF comes from the target's simt.vf hook, or is 1 when the target
     does not provide that hook.  */
  int vf = targetm.simt.vf ? targetm.simt.vf () : 1;
  bool regimplify = false;
  basic_block bb;
  gimple_stmt_iterator gsi;
  FOR_EACH_BB_FN (bb, cfun)
    for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
      {
        gimple *stmt = gsi_stmt (gsi);
        /* Only internal function calls are of interest.  */
        if (!is_gimple_call (stmt) || !gimple_call_internal_p (stmt))
          continue;
        /* RHS, when set below, is the value that replaces the call.
           TYPE falls back to integer_type_node for calls without LHS.  */
        tree lhs = gimple_call_lhs (stmt), rhs = NULL_TREE;
        tree type = lhs ? TREE_TYPE (lhs) : integer_type_node;
        switch (gimple_call_internal_fn (stmt))
          {
          case IFN_GOMP_USE_SIMT:
            rhs = vf == 1 ? integer_zero_node : integer_one_node;
            break;
          case IFN_GOMP_SIMT_ENTER:
            rhs = vf == 1 ? gimple_call_arg (stmt, 0) : NULL_TREE;
            goto simtreg_enter_exit;
          case IFN_GOMP_SIMT_ENTER_ALLOC:
            /* With VF != 1 the call is rewritten in place by the helper;
               with VF == 1 it folds to a null pointer.  */
            if (vf != 1)
              ompdevlow_adjust_simt_enter (&gsi, &regimplify);
            rhs = vf == 1 ? null_pointer_node : NULL_TREE;
            goto simtreg_enter_exit;
          case IFN_GOMP_SIMT_EXIT:
          simtreg_enter_exit:
            /* Shared tail for the ENTER, ENTER_ALLOC and EXIT calls:
               they are kept when VF != 1, otherwise the statement's
               virtual definition is unlinked before it is replaced.  */
            if (vf != 1)
              continue;
            unlink_stmt_vdef (stmt);
            break;
          case IFN_GOMP_SIMT_LANE:
          case IFN_GOMP_SIMT_LAST_LANE:
            rhs = vf == 1 ? build_zero_cst (type) : NULL_TREE;
            break;
          case IFN_GOMP_SIMT_VF:
            rhs = build_int_cst (type, vf);
            break;
          case IFN_GOMP_SIMT_ORDERED_PRED:
            rhs = vf == 1 ? integer_zero_node : NULL_TREE;
            /* The statement is about to be replaced if it has a
               replacement value or no LHS.  */
            if (rhs || !lhs)
              unlink_stmt_vdef (stmt);
            break;
          case IFN_GOMP_SIMT_VOTE_ANY:
          case IFN_GOMP_SIMT_XCHG_BFLY:
          case IFN_GOMP_SIMT_XCHG_IDX:
            /* With VF == 1 these fold to their first argument.  */
            rhs = vf == 1 ? gimple_call_arg (stmt, 0) : NULL_TREE;
            break;
          case IFN_GOMP_SIMD_LANE:
          case IFN_GOMP_SIMD_LAST_LANE:
            rhs = vf != 1 ? build_zero_cst (type) : NULL_TREE;
            break;
          case IFN_GOMP_SIMD_VF:
            rhs = vf != 1 ? build_one_cst (type) : NULL_TREE;
            break;
          default:
            continue;
          }
        /* A call whose result is used but that has no replacement value
           is left untouched.  */
        if (lhs && !rhs)
          continue;
        /* Otherwise replace the call by an assignment of RHS, or by a
           nop when the call has no LHS.  */
        stmt = lhs ? gimple_build_assign (lhs, rhs) : gimple_build_nop ();
        gsi_replace (&gsi, stmt, false);
      }
  /* If any variable was privatized, walk all statements backwards:
     clobbers mentioning a privatized variable are removed, any other
     statement mentioning one has its operands regimplified.  */
  if (regimplify)
    FOR_EACH_BB_REVERSE_FN (bb, cfun)
      for (gsi = gsi_last_bb (bb); !gsi_end_p (gsi); gsi_prev (&gsi))
        if (walk_gimple_stmt (&gsi, NULL, find_simtpriv_var_op, NULL))
          {
            if (gimple_clobber_p (gsi_stmt (gsi)))
              gsi_remove (&gsi, true);
            else
              gimple_regimplify_operands (gsi_stmt (gsi), &gsi);
          }
  if (vf != 1)
    cfun->has_force_vectorize_loops = false;
  return 0;
}
kono
parents:
diff changeset
1969
kono
parents:
diff changeset
1970 namespace {
kono
parents:
diff changeset
1971
kono
parents:
diff changeset
1972 const pass_data pass_data_omp_device_lower =
kono
parents:
diff changeset
1973 {
kono
parents:
diff changeset
1974 GIMPLE_PASS, /* type */
kono
parents:
diff changeset
1975 "ompdevlow", /* name */
kono
parents:
diff changeset
1976 OPTGROUP_OMP, /* optinfo_flags */
kono
parents:
diff changeset
1977 TV_NONE, /* tv_id */
kono
parents:
diff changeset
1978 PROP_cfg, /* properties_required */
kono
parents:
diff changeset
1979 PROP_gimple_lomp_dev, /* properties_provided */
kono
parents:
diff changeset
1980 0, /* properties_destroyed */
kono
parents:
diff changeset
1981 0, /* todo_flags_start */
kono
parents:
diff changeset
1982 TODO_update_ssa, /* todo_flags_finish */
kono
parents:
diff changeset
1983 };
kono
parents:
diff changeset
1984
kono
parents:
diff changeset
1985 class pass_omp_device_lower : public gimple_opt_pass
kono
parents:
diff changeset
1986 {
kono
parents:
diff changeset
1987 public:
kono
parents:
diff changeset
1988 pass_omp_device_lower (gcc::context *ctxt)
kono
parents:
diff changeset
1989 : gimple_opt_pass (pass_data_omp_device_lower, ctxt)
kono
parents:
diff changeset
1990 {}
kono
parents:
diff changeset
1991
kono
parents:
diff changeset
1992 /* opt_pass methods: */
kono
parents:
diff changeset
1993 virtual bool gate (function *fun)
kono
parents:
diff changeset
1994 {
kono
parents:
diff changeset
1995 return !(fun->curr_properties & PROP_gimple_lomp_dev);
kono
parents:
diff changeset
1996 }
kono
parents:
diff changeset
1997 virtual unsigned int execute (function *)
kono
parents:
diff changeset
1998 {
kono
parents:
diff changeset
1999 return execute_omp_device_lower ();
kono
parents:
diff changeset
2000 }
kono
parents:
diff changeset
2001
kono
parents:
diff changeset
2002 }; // class pass_expand_omp_ssa
kono
parents:
diff changeset
2003
kono
parents:
diff changeset
2004 } // anon namespace
kono
parents:
diff changeset
2005
kono
parents:
diff changeset
2006 gimple_opt_pass *
kono
parents:
diff changeset
2007 make_pass_omp_device_lower (gcc::context *ctxt)
kono
parents:
diff changeset
2008 {
kono
parents:
diff changeset
2009 return new pass_omp_device_lower (ctxt);
kono
parents:
diff changeset
2010 }
kono
parents:
diff changeset
2011
kono
parents:
diff changeset
2012 /* "omp declare target link" handling pass. */
kono
parents:
diff changeset
2013
kono
parents:
diff changeset
2014 namespace {
kono
parents:
diff changeset
2015
kono
parents:
diff changeset
2016 const pass_data pass_data_omp_target_link =
kono
parents:
diff changeset
2017 {
kono
parents:
diff changeset
2018 GIMPLE_PASS, /* type */
kono
parents:
diff changeset
2019 "omptargetlink", /* name */
kono
parents:
diff changeset
2020 OPTGROUP_OMP, /* optinfo_flags */
kono
parents:
diff changeset
2021 TV_NONE, /* tv_id */
kono
parents:
diff changeset
2022 PROP_ssa, /* properties_required */
kono
parents:
diff changeset
2023 0, /* properties_provided */
kono
parents:
diff changeset
2024 0, /* properties_destroyed */
kono
parents:
diff changeset
2025 0, /* todo_flags_start */
kono
parents:
diff changeset
2026 TODO_update_ssa, /* todo_flags_finish */
kono
parents:
diff changeset
2027 };
kono
parents:
diff changeset
2028
kono
parents:
diff changeset
2029 class pass_omp_target_link : public gimple_opt_pass
kono
parents:
diff changeset
2030 {
kono
parents:
diff changeset
2031 public:
kono
parents:
diff changeset
2032 pass_omp_target_link (gcc::context *ctxt)
kono
parents:
diff changeset
2033 : gimple_opt_pass (pass_data_omp_target_link, ctxt)
kono
parents:
diff changeset
2034 {}
kono
parents:
diff changeset
2035
kono
parents:
diff changeset
2036 /* opt_pass methods: */
kono
parents:
diff changeset
2037 virtual bool gate (function *fun)
kono
parents:
diff changeset
2038 {
kono
parents:
diff changeset
2039 #ifdef ACCEL_COMPILER
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
2040 return offloading_function_p (fun->decl);
111
kono
parents:
diff changeset
2041 #else
kono
parents:
diff changeset
2042 (void) fun;
kono
parents:
diff changeset
2043 return false;
kono
parents:
diff changeset
2044 #endif
kono
parents:
diff changeset
2045 }
kono
parents:
diff changeset
2046
kono
parents:
diff changeset
2047 virtual unsigned execute (function *);
kono
parents:
diff changeset
2048 };
kono
parents:
diff changeset
2049
kono
parents:
diff changeset
2050 /* Callback for walk_gimple_stmt used to scan for link var operands. */
kono
parents:
diff changeset
2051
kono
parents:
diff changeset
2052 static tree
kono
parents:
diff changeset
2053 find_link_var_op (tree *tp, int *walk_subtrees, void *)
kono
parents:
diff changeset
2054 {
kono
parents:
diff changeset
2055 tree t = *tp;
kono
parents:
diff changeset
2056
kono
parents:
diff changeset
2057 if (VAR_P (t)
kono
parents:
diff changeset
2058 && DECL_HAS_VALUE_EXPR_P (t)
kono
parents:
diff changeset
2059 && is_global_var (t)
kono
parents:
diff changeset
2060 && lookup_attribute ("omp declare target link", DECL_ATTRIBUTES (t)))
kono
parents:
diff changeset
2061 {
kono
parents:
diff changeset
2062 *walk_subtrees = 0;
kono
parents:
diff changeset
2063 return t;
kono
parents:
diff changeset
2064 }
kono
parents:
diff changeset
2065
kono
parents:
diff changeset
2066 return NULL_TREE;
kono
parents:
diff changeset
2067 }
kono
parents:
diff changeset
2068
kono
parents:
diff changeset
2069 unsigned
kono
parents:
diff changeset
2070 pass_omp_target_link::execute (function *fun)
kono
parents:
diff changeset
2071 {
kono
parents:
diff changeset
2072 basic_block bb;
kono
parents:
diff changeset
2073 FOR_EACH_BB_FN (bb, fun)
kono
parents:
diff changeset
2074 {
kono
parents:
diff changeset
2075 gimple_stmt_iterator gsi;
kono
parents:
diff changeset
2076 for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
kono
parents:
diff changeset
2077 if (walk_gimple_stmt (&gsi, NULL, find_link_var_op, NULL))
kono
parents:
diff changeset
2078 gimple_regimplify_operands (gsi_stmt (gsi), &gsi);
kono
parents:
diff changeset
2079 }
kono
parents:
diff changeset
2080
kono
parents:
diff changeset
2081 return 0;
kono
parents:
diff changeset
2082 }
kono
parents:
diff changeset
2083
kono
parents:
diff changeset
2084 } // anon namespace
kono
parents:
diff changeset
2085
kono
parents:
diff changeset
2086 gimple_opt_pass *
kono
parents:
diff changeset
2087 make_pass_omp_target_link (gcc::context *ctxt)
kono
parents:
diff changeset
2088 {
kono
parents:
diff changeset
2089 return new pass_omp_target_link (ctxt);
kono
parents:
diff changeset
2090 }