annotate gcc/omp-grid.c @ 144:8f4e72ab4e11

fix segmentation fault caused by nothing next cur_op to end
author Takahiro SHIMIZU <anatofuz@cr.ie.u-ryukyu.ac.jp>
date Sun, 23 Dec 2018 21:23:56 +0900
parents 84e7813d76e9
children 1830386684a0
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
111
kono
parents:
diff changeset
1 /* Lowering and expansion of OpenMP directives for HSA GPU agents.
kono
parents:
diff changeset
2
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
3 Copyright (C) 2013-2018 Free Software Foundation, Inc.
111
kono
parents:
diff changeset
4
kono
parents:
diff changeset
5 This file is part of GCC.
kono
parents:
diff changeset
6
kono
parents:
diff changeset
7 GCC is free software; you can redistribute it and/or modify it under
kono
parents:
diff changeset
8 the terms of the GNU General Public License as published by the Free
kono
parents:
diff changeset
9 Software Foundation; either version 3, or (at your option) any later
kono
parents:
diff changeset
10 version.
kono
parents:
diff changeset
11
kono
parents:
diff changeset
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
kono
parents:
diff changeset
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
kono
parents:
diff changeset
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
kono
parents:
diff changeset
15 for more details.
kono
parents:
diff changeset
16
kono
parents:
diff changeset
17 You should have received a copy of the GNU General Public License
kono
parents:
diff changeset
18 along with GCC; see the file COPYING3. If not see
kono
parents:
diff changeset
19 <http://www.gnu.org/licenses/>. */
kono
parents:
diff changeset
20
kono
parents:
diff changeset
21 #include "config.h"
kono
parents:
diff changeset
22 #include "system.h"
kono
parents:
diff changeset
23 #include "coretypes.h"
kono
parents:
diff changeset
24 #include "backend.h"
kono
parents:
diff changeset
25 #include "tree.h"
kono
parents:
diff changeset
26 #include "gimple.h"
kono
parents:
diff changeset
27 #include "tree-pass.h"
kono
parents:
diff changeset
28 #include "ssa.h"
kono
parents:
diff changeset
29 #include "cgraph.h"
kono
parents:
diff changeset
30 #include "pretty-print.h"
kono
parents:
diff changeset
31 #include "fold-const.h"
kono
parents:
diff changeset
32 #include "gimplify.h"
kono
parents:
diff changeset
33 #include "gimple-iterator.h"
kono
parents:
diff changeset
34 #include "gimple-walk.h"
kono
parents:
diff changeset
35 #include "tree-inline.h"
kono
parents:
diff changeset
36 #include "langhooks.h"
kono
parents:
diff changeset
37 #include "omp-general.h"
kono
parents:
diff changeset
38 #include "omp-low.h"
kono
parents:
diff changeset
39 #include "omp-grid.h"
kono
parents:
diff changeset
40 #include "gimple-pretty-print.h"
kono
parents:
diff changeset
41
kono
parents:
diff changeset
42 /* Return the lastprivate predicate for a given gridified loop described by
kono
parents:
diff changeset
43 FD). */
kono
parents:
diff changeset
44
kono
parents:
diff changeset
45 tree
kono
parents:
diff changeset
46 omp_grid_lastprivate_predicate (struct omp_for_data *fd)
kono
parents:
diff changeset
47 {
kono
parents:
diff changeset
48 /* When dealing with a gridified loop, we need to check up to three collapsed
kono
parents:
diff changeset
49 iteration variables but they are not actually captured in this fd.
kono
parents:
diff changeset
50 Fortunately, we can easily rely on HSA builtins to get this
kono
parents:
diff changeset
51 information. */
kono
parents:
diff changeset
52
kono
parents:
diff changeset
53 tree id, size;
kono
parents:
diff changeset
54 if (gimple_omp_for_kind (fd->for_stmt) == GF_OMP_FOR_KIND_GRID_LOOP
kono
parents:
diff changeset
55 && gimple_omp_for_grid_intra_group (fd->for_stmt))
kono
parents:
diff changeset
56 {
kono
parents:
diff changeset
57 id = builtin_decl_explicit (BUILT_IN_HSA_WORKITEMID);
kono
parents:
diff changeset
58 size = builtin_decl_explicit (BUILT_IN_HSA_CURRENTWORKGROUPSIZE);
kono
parents:
diff changeset
59 }
kono
parents:
diff changeset
60 else
kono
parents:
diff changeset
61 {
kono
parents:
diff changeset
62 id = builtin_decl_explicit (BUILT_IN_HSA_WORKITEMABSID);
kono
parents:
diff changeset
63 size = builtin_decl_explicit (BUILT_IN_HSA_GRIDSIZE);
kono
parents:
diff changeset
64 }
kono
parents:
diff changeset
65 tree cond = NULL;
kono
parents:
diff changeset
66 for (int dim = 0; dim < fd->collapse; dim++)
kono
parents:
diff changeset
67 {
kono
parents:
diff changeset
68 tree dim_tree = build_int_cstu (unsigned_type_node, dim);
kono
parents:
diff changeset
69 tree u1 = build_int_cstu (unsigned_type_node, 1);
kono
parents:
diff changeset
70 tree c2
kono
parents:
diff changeset
71 = build2 (EQ_EXPR, boolean_type_node,
kono
parents:
diff changeset
72 build2 (PLUS_EXPR, unsigned_type_node,
kono
parents:
diff changeset
73 build_call_expr (id, 1, dim_tree), u1),
kono
parents:
diff changeset
74 build_call_expr (size, 1, dim_tree));
kono
parents:
diff changeset
75 if (cond)
kono
parents:
diff changeset
76 cond = build2 (TRUTH_AND_EXPR, boolean_type_node, cond, c2);
kono
parents:
diff changeset
77 else
kono
parents:
diff changeset
78 cond = c2;
kono
parents:
diff changeset
79 }
kono
parents:
diff changeset
80 return cond;
kono
parents:
diff changeset
81 }
kono
parents:
diff changeset
82
kono
parents:
diff changeset
/* Structure describing the basic properties of the loop we are analyzing
   whether it can be gridified and when it is gridified.  */

struct grid_prop
{
  /* True when we are doing tiling gridification, i.e. when there is a distinct
     distribute loop over groups and a loop construct over work-items.  False
     when distribute and parallel for loops form a combined construct.  */
  bool tiling;
  /* Location of the target construct for optimization information
     messages.  */
  dump_user_location_t target_loc;
  /* The collapse clause of the involved loops.  Collapse value of all of them
     must be the same for gridification to take place.  */
  size_t collapse;
  /* Group sizes, if requested by the user or NULL if not requested.  Only
     the first COLLAPSE elements are examined by the code using this
     structure.  */
  tree group_sizes[3];
};
kono
parents:
diff changeset
101
kono
parents:
diff changeset
/* Common prefix of the missed-optimization dump messages emitted when a
   target construct is not gridified.  The prefix already ends with
   "because ", so the text concatenated after it must start directly with
   the reason.  */
#define GRID_MISSED_MSG_PREFIX "Will not turn target construct into a " \
  "gridified HSA kernel because "
kono
parents:
diff changeset
104
kono
parents:
diff changeset
105 /* Return true if STMT is an assignment of a register-type into a local
kono
parents:
diff changeset
106 VAR_DECL. If GRID is non-NULL, the assignment additionally must not be to
kono
parents:
diff changeset
107 any of the trees specifying group sizes there. */
kono
parents:
diff changeset
108
kono
parents:
diff changeset
109 static bool
kono
parents:
diff changeset
110 grid_safe_assignment_p (gimple *stmt, grid_prop *grid)
kono
parents:
diff changeset
111 {
kono
parents:
diff changeset
112 gassign *assign = dyn_cast <gassign *> (stmt);
kono
parents:
diff changeset
113 if (!assign)
kono
parents:
diff changeset
114 return false;
kono
parents:
diff changeset
115 if (gimple_clobber_p (assign))
kono
parents:
diff changeset
116 return true;
kono
parents:
diff changeset
117 tree lhs = gimple_assign_lhs (assign);
kono
parents:
diff changeset
118 if (!VAR_P (lhs)
kono
parents:
diff changeset
119 || !is_gimple_reg_type (TREE_TYPE (lhs))
kono
parents:
diff changeset
120 || is_global_var (lhs))
kono
parents:
diff changeset
121 return false;
kono
parents:
diff changeset
122 if (grid)
kono
parents:
diff changeset
123 for (unsigned i = 0; i < grid->collapse; i++)
kono
parents:
diff changeset
124 if (lhs == grid->group_sizes[i])
kono
parents:
diff changeset
125 return false;
kono
parents:
diff changeset
126 return true;
kono
parents:
diff changeset
127 }
kono
parents:
diff changeset
128
kono
parents:
diff changeset
129 /* Return true if all statements in SEQ are assignments to local register-type
kono
parents:
diff changeset
130 variables that do not hold group size information. */
kono
parents:
diff changeset
131
kono
parents:
diff changeset
132 static bool
kono
parents:
diff changeset
133 grid_seq_only_contains_local_assignments (gimple_seq seq, grid_prop *grid)
kono
parents:
diff changeset
134 {
kono
parents:
diff changeset
135 if (!seq)
kono
parents:
diff changeset
136 return true;
kono
parents:
diff changeset
137
kono
parents:
diff changeset
138 gimple_stmt_iterator gsi;
kono
parents:
diff changeset
139 for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi))
kono
parents:
diff changeset
140 if (!grid_safe_assignment_p (gsi_stmt (gsi), grid))
kono
parents:
diff changeset
141 return false;
kono
parents:
diff changeset
142 return true;
kono
parents:
diff changeset
143 }
kono
parents:
diff changeset
144
kono
parents:
diff changeset
145 /* Scan statements in SEQ and call itself recursively on any bind. GRID
kono
parents:
diff changeset
146 describes hitherto discovered properties of the loop that is evaluated for
kono
parents:
diff changeset
147 possible gridification. If during whole search only assignments to
kono
parents:
diff changeset
148 register-type local variables (that do not overwrite group size information)
kono
parents:
diff changeset
149 and one single OMP statement is encountered, return true, otherwise return
kono
parents:
diff changeset
150 false. RET is where we store any OMP statement encountered. */
kono
parents:
diff changeset
151
kono
parents:
diff changeset
152 static bool
kono
parents:
diff changeset
153 grid_find_single_omp_among_assignments_1 (gimple_seq seq, grid_prop *grid,
kono
parents:
diff changeset
154 const char *name, gimple **ret)
kono
parents:
diff changeset
155 {
kono
parents:
diff changeset
156 gimple_stmt_iterator gsi;
kono
parents:
diff changeset
157 for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi))
kono
parents:
diff changeset
158 {
kono
parents:
diff changeset
159 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
160
kono
parents:
diff changeset
161 if (grid_safe_assignment_p (stmt, grid))
kono
parents:
diff changeset
162 continue;
kono
parents:
diff changeset
163 if (gbind *bind = dyn_cast <gbind *> (stmt))
kono
parents:
diff changeset
164 {
kono
parents:
diff changeset
165 gimple_seq bind_body = gimple_bind_body (bind);
kono
parents:
diff changeset
166 if (!grid_find_single_omp_among_assignments_1 (bind_body, grid, name,
kono
parents:
diff changeset
167 ret))
kono
parents:
diff changeset
168 return false;
kono
parents:
diff changeset
169 }
kono
parents:
diff changeset
170 else if (is_gimple_omp (stmt))
kono
parents:
diff changeset
171 {
kono
parents:
diff changeset
172 if (*ret)
kono
parents:
diff changeset
173 {
kono
parents:
diff changeset
174 if (dump_enabled_p ())
kono
parents:
diff changeset
175 {
kono
parents:
diff changeset
176 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
177 GRID_MISSED_MSG_PREFIX "%s construct "
kono
parents:
diff changeset
178 "contains multiple OpenMP constructs\n",
kono
parents:
diff changeset
179 name);
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
180 dump_printf_loc (MSG_NOTE, *ret,
111
kono
parents:
diff changeset
181 "The first OpenMP construct within "
kono
parents:
diff changeset
182 "a parallel\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
183 dump_printf_loc (MSG_NOTE, stmt,
111
kono
parents:
diff changeset
184 "The second OpenMP construct within "
kono
parents:
diff changeset
185 "a parallel\n");
kono
parents:
diff changeset
186 }
kono
parents:
diff changeset
187 return false;
kono
parents:
diff changeset
188 }
kono
parents:
diff changeset
189 *ret = stmt;
kono
parents:
diff changeset
190 }
kono
parents:
diff changeset
191 else
kono
parents:
diff changeset
192 {
kono
parents:
diff changeset
193 if (dump_enabled_p ())
kono
parents:
diff changeset
194 {
kono
parents:
diff changeset
195 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
196 GRID_MISSED_MSG_PREFIX "%s construct contains "
kono
parents:
diff changeset
197 "a complex statement\n", name);
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
198 dump_printf_loc (MSG_NOTE, stmt,
111
kono
parents:
diff changeset
199 "This statement cannot be analyzed for "
kono
parents:
diff changeset
200 "gridification\n");
kono
parents:
diff changeset
201 }
kono
parents:
diff changeset
202 return false;
kono
parents:
diff changeset
203 }
kono
parents:
diff changeset
204 }
kono
parents:
diff changeset
205 return true;
kono
parents:
diff changeset
206 }
kono
parents:
diff changeset
207
kono
parents:
diff changeset
208 /* Scan statements in SEQ and make sure that it and any binds in it contain
kono
parents:
diff changeset
209 only assignments to local register-type variables (that do not overwrite
kono
parents:
diff changeset
210 group size information) and one OMP construct. If so, return that
kono
parents:
diff changeset
211 construct, otherwise return NULL. GRID describes hitherto discovered
kono
parents:
diff changeset
212 properties of the loop that is evaluated for possible gridification. If
kono
parents:
diff changeset
213 dumping is enabled and function fails, use NAME to dump a note with the
kono
parents:
diff changeset
214 reason for failure. */
kono
parents:
diff changeset
215
kono
parents:
diff changeset
216 static gimple *
kono
parents:
diff changeset
217 grid_find_single_omp_among_assignments (gimple_seq seq, grid_prop *grid,
kono
parents:
diff changeset
218 const char *name)
kono
parents:
diff changeset
219 {
kono
parents:
diff changeset
220 if (!seq)
kono
parents:
diff changeset
221 {
kono
parents:
diff changeset
222 if (dump_enabled_p ())
kono
parents:
diff changeset
223 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
224 GRID_MISSED_MSG_PREFIX "%s construct has empty body\n",
kono
parents:
diff changeset
225 name);
kono
parents:
diff changeset
226 return NULL;
kono
parents:
diff changeset
227 }
kono
parents:
diff changeset
228
kono
parents:
diff changeset
229 gimple *ret = NULL;
kono
parents:
diff changeset
230 if (grid_find_single_omp_among_assignments_1 (seq, grid, name, &ret))
kono
parents:
diff changeset
231 {
kono
parents:
diff changeset
232 if (!ret && dump_enabled_p ())
kono
parents:
diff changeset
233 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
234 GRID_MISSED_MSG_PREFIX "%s construct does not contain"
kono
parents:
diff changeset
235 " any other OpenMP construct\n", name);
kono
parents:
diff changeset
236 return ret;
kono
parents:
diff changeset
237 }
kono
parents:
diff changeset
238 else
kono
parents:
diff changeset
239 return NULL;
kono
parents:
diff changeset
240 }
kono
parents:
diff changeset
241
kono
parents:
diff changeset
242 /* Walker function looking for statements there is no point gridifying (and for
kono
parents:
diff changeset
243 noreturn function calls which we cannot do). Return non-NULL if such a
kono
parents:
diff changeset
244 function is found. */
kono
parents:
diff changeset
245
kono
parents:
diff changeset
246 static tree
kono
parents:
diff changeset
247 grid_find_ungridifiable_statement (gimple_stmt_iterator *gsi,
kono
parents:
diff changeset
248 bool *handled_ops_p,
kono
parents:
diff changeset
249 struct walk_stmt_info *wi)
kono
parents:
diff changeset
250 {
kono
parents:
diff changeset
251 *handled_ops_p = false;
kono
parents:
diff changeset
252 gimple *stmt = gsi_stmt (*gsi);
kono
parents:
diff changeset
253 switch (gimple_code (stmt))
kono
parents:
diff changeset
254 {
kono
parents:
diff changeset
255 case GIMPLE_CALL:
kono
parents:
diff changeset
256 if (gimple_call_noreturn_p (as_a <gcall *> (stmt)))
kono
parents:
diff changeset
257 {
kono
parents:
diff changeset
258 *handled_ops_p = true;
kono
parents:
diff changeset
259 wi->info = stmt;
kono
parents:
diff changeset
260 return error_mark_node;
kono
parents:
diff changeset
261 }
kono
parents:
diff changeset
262 break;
kono
parents:
diff changeset
263
kono
parents:
diff changeset
264 /* We may reduce the following list if we find a way to implement the
kono
parents:
diff changeset
265 clauses, but now there is no point trying further. */
kono
parents:
diff changeset
266 case GIMPLE_OMP_CRITICAL:
kono
parents:
diff changeset
267 case GIMPLE_OMP_TASKGROUP:
kono
parents:
diff changeset
268 case GIMPLE_OMP_TASK:
kono
parents:
diff changeset
269 case GIMPLE_OMP_SECTION:
kono
parents:
diff changeset
270 case GIMPLE_OMP_SECTIONS:
kono
parents:
diff changeset
271 case GIMPLE_OMP_SECTIONS_SWITCH:
kono
parents:
diff changeset
272 case GIMPLE_OMP_TARGET:
kono
parents:
diff changeset
273 case GIMPLE_OMP_ORDERED:
kono
parents:
diff changeset
274 *handled_ops_p = true;
kono
parents:
diff changeset
275 wi->info = stmt;
kono
parents:
diff changeset
276 return error_mark_node;
kono
parents:
diff changeset
277 default:
kono
parents:
diff changeset
278 break;
kono
parents:
diff changeset
279 }
kono
parents:
diff changeset
280 return NULL;
kono
parents:
diff changeset
281 }
kono
parents:
diff changeset
282
kono
parents:
diff changeset
283 /* Examine clauses of omp parallel statement PAR and if any prevents
kono
parents:
diff changeset
284 gridification, issue a missed-optimization diagnostics and return false,
kono
parents:
diff changeset
285 otherwise return true. GRID describes hitherto discovered properties of the
kono
parents:
diff changeset
286 loop that is evaluated for possible gridification. */
kono
parents:
diff changeset
287
kono
parents:
diff changeset
288 static bool
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
289 grid_parallel_clauses_gridifiable (gomp_parallel *par, dump_user_location_t tloc)
111
kono
parents:
diff changeset
290 {
kono
parents:
diff changeset
291 tree clauses = gimple_omp_parallel_clauses (par);
kono
parents:
diff changeset
292 while (clauses)
kono
parents:
diff changeset
293 {
kono
parents:
diff changeset
294 switch (OMP_CLAUSE_CODE (clauses))
kono
parents:
diff changeset
295 {
kono
parents:
diff changeset
296 case OMP_CLAUSE_NUM_THREADS:
kono
parents:
diff changeset
297 if (dump_enabled_p ())
kono
parents:
diff changeset
298 {
kono
parents:
diff changeset
299 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
300 GRID_MISSED_MSG_PREFIX "because there is "
kono
parents:
diff changeset
301 "a num_threads clause of the parallel "
kono
parents:
diff changeset
302 "construct\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
303 dump_printf_loc (MSG_NOTE, par,
111
kono
parents:
diff changeset
304 "Parallel construct has a num_threads clause\n");
kono
parents:
diff changeset
305 }
kono
parents:
diff changeset
306 return false;
kono
parents:
diff changeset
307
kono
parents:
diff changeset
308 case OMP_CLAUSE_REDUCTION:
kono
parents:
diff changeset
309 if (dump_enabled_p ())
kono
parents:
diff changeset
310 {
kono
parents:
diff changeset
311 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
312 GRID_MISSED_MSG_PREFIX "a reduction clause "
kono
parents:
diff changeset
313 "is present\n ");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
314 dump_printf_loc (MSG_NOTE, par,
111
kono
parents:
diff changeset
315 "Parallel construct has a reduction clause\n");
kono
parents:
diff changeset
316 }
kono
parents:
diff changeset
317 return false;
kono
parents:
diff changeset
318
kono
parents:
diff changeset
319 default:
kono
parents:
diff changeset
320 break;
kono
parents:
diff changeset
321 }
kono
parents:
diff changeset
322 clauses = OMP_CLAUSE_CHAIN (clauses);
kono
parents:
diff changeset
323 }
kono
parents:
diff changeset
324 return true;
kono
parents:
diff changeset
325 }
kono
parents:
diff changeset
326
kono
parents:
diff changeset
327 /* Examine clauses and the body of omp loop statement GFOR and if something
kono
parents:
diff changeset
328 prevents gridification, issue a missed-optimization diagnostics and return
kono
parents:
diff changeset
329 false, otherwise return true. GRID describes hitherto discovered properties
kono
parents:
diff changeset
330 of the loop that is evaluated for possible gridification. */
kono
parents:
diff changeset
331
kono
parents:
diff changeset
332 static bool
kono
parents:
diff changeset
333 grid_inner_loop_gridifiable_p (gomp_for *gfor, grid_prop *grid)
kono
parents:
diff changeset
334 {
kono
parents:
diff changeset
335 if (!grid_seq_only_contains_local_assignments (gimple_omp_for_pre_body (gfor),
kono
parents:
diff changeset
336 grid))
kono
parents:
diff changeset
337 {
kono
parents:
diff changeset
338 if (dump_enabled_p ())
kono
parents:
diff changeset
339 {
kono
parents:
diff changeset
340 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
341 GRID_MISSED_MSG_PREFIX "the inner loop "
kono
parents:
diff changeset
342 "loop bounds computation contains a complex "
kono
parents:
diff changeset
343 "statement\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
344 dump_printf_loc (MSG_NOTE, gfor,
111
kono
parents:
diff changeset
345 "Loop construct cannot be analyzed for "
kono
parents:
diff changeset
346 "gridification\n");
kono
parents:
diff changeset
347 }
kono
parents:
diff changeset
348 return false;
kono
parents:
diff changeset
349 }
kono
parents:
diff changeset
350
kono
parents:
diff changeset
351 tree clauses = gimple_omp_for_clauses (gfor);
kono
parents:
diff changeset
352 while (clauses)
kono
parents:
diff changeset
353 {
kono
parents:
diff changeset
354 switch (OMP_CLAUSE_CODE (clauses))
kono
parents:
diff changeset
355 {
kono
parents:
diff changeset
356 case OMP_CLAUSE_SCHEDULE:
kono
parents:
diff changeset
357 if (OMP_CLAUSE_SCHEDULE_KIND (clauses) != OMP_CLAUSE_SCHEDULE_AUTO)
kono
parents:
diff changeset
358 {
kono
parents:
diff changeset
359 if (dump_enabled_p ())
kono
parents:
diff changeset
360 {
kono
parents:
diff changeset
361 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
362 GRID_MISSED_MSG_PREFIX "the inner loop "
kono
parents:
diff changeset
363 "has a non-automatic schedule clause\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
364 dump_printf_loc (MSG_NOTE, gfor,
111
kono
parents:
diff changeset
365 "Loop construct has a non automatic "
kono
parents:
diff changeset
366 "schedule clause\n");
kono
parents:
diff changeset
367 }
kono
parents:
diff changeset
368 return false;
kono
parents:
diff changeset
369 }
kono
parents:
diff changeset
370 break;
kono
parents:
diff changeset
371
kono
parents:
diff changeset
372 case OMP_CLAUSE_REDUCTION:
kono
parents:
diff changeset
373 if (dump_enabled_p ())
kono
parents:
diff changeset
374 {
kono
parents:
diff changeset
375 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
376 GRID_MISSED_MSG_PREFIX "a reduction "
kono
parents:
diff changeset
377 "clause is present\n ");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
378 dump_printf_loc (MSG_NOTE, gfor,
111
kono
parents:
diff changeset
379 "Loop construct has a reduction schedule "
kono
parents:
diff changeset
380 "clause\n");
kono
parents:
diff changeset
381 }
kono
parents:
diff changeset
382 return false;
kono
parents:
diff changeset
383
kono
parents:
diff changeset
384 default:
kono
parents:
diff changeset
385 break;
kono
parents:
diff changeset
386 }
kono
parents:
diff changeset
387 clauses = OMP_CLAUSE_CHAIN (clauses);
kono
parents:
diff changeset
388 }
kono
parents:
diff changeset
389 struct walk_stmt_info wi;
kono
parents:
diff changeset
390 memset (&wi, 0, sizeof (wi));
kono
parents:
diff changeset
391 if (walk_gimple_seq (gimple_omp_body (gfor),
kono
parents:
diff changeset
392 grid_find_ungridifiable_statement,
kono
parents:
diff changeset
393 NULL, &wi))
kono
parents:
diff changeset
394 {
kono
parents:
diff changeset
395 gimple *bad = (gimple *) wi.info;
kono
parents:
diff changeset
396 if (dump_enabled_p ())
kono
parents:
diff changeset
397 {
kono
parents:
diff changeset
398 if (is_gimple_call (bad))
kono
parents:
diff changeset
399 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
400 GRID_MISSED_MSG_PREFIX "the inner loop contains "
kono
parents:
diff changeset
401 "call to a noreturn function\n");
kono
parents:
diff changeset
402 else
kono
parents:
diff changeset
403 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
404 GRID_MISSED_MSG_PREFIX "the inner loop contains "
kono
parents:
diff changeset
405 "statement %s which cannot be transformed\n",
kono
parents:
diff changeset
406 gimple_code_name[(int) gimple_code (bad)]);
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
407 dump_printf_loc (MSG_NOTE, bad,
111
kono
parents:
diff changeset
408 "This statement cannot be analyzed for "
kono
parents:
diff changeset
409 "gridification\n");
kono
parents:
diff changeset
410 }
kono
parents:
diff changeset
411 return false;
kono
parents:
diff changeset
412 }
kono
parents:
diff changeset
413 return true;
kono
parents:
diff changeset
414 }
kono
parents:
diff changeset
415
kono
parents:
diff changeset
416 /* Given distribute omp construct represented by DIST, which in the original
kono
parents:
diff changeset
417 source forms a compound construct with a looping construct, return true if it
kono
parents:
diff changeset
418 can be turned into a gridified HSA kernel. Otherwise return false. GRID
kono
parents:
diff changeset
419 describes hitherto discovered properties of the loop that is evaluated for
kono
parents:
diff changeset
420 possible gridification. */
kono
parents:
diff changeset
421
kono
parents:
diff changeset
422 static bool
kono
parents:
diff changeset
423 grid_dist_follows_simple_pattern (gomp_for *dist, grid_prop *grid)
kono
parents:
diff changeset
424 {
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
425 dump_user_location_t tloc = grid->target_loc;
111
kono
parents:
diff changeset
426 gimple *stmt = grid_find_single_omp_among_assignments (gimple_omp_body (dist),
kono
parents:
diff changeset
427 grid, "distribute");
kono
parents:
diff changeset
428 gomp_parallel *par;
kono
parents:
diff changeset
429 if (!stmt
kono
parents:
diff changeset
430 || !(par = dyn_cast <gomp_parallel *> (stmt))
kono
parents:
diff changeset
431 || !grid_parallel_clauses_gridifiable (par, tloc))
kono
parents:
diff changeset
432 return false;
kono
parents:
diff changeset
433
kono
parents:
diff changeset
434 stmt = grid_find_single_omp_among_assignments (gimple_omp_body (par), grid,
kono
parents:
diff changeset
435 "parallel");
kono
parents:
diff changeset
436 gomp_for *gfor;
kono
parents:
diff changeset
437 if (!stmt || !(gfor = dyn_cast <gomp_for *> (stmt)))
kono
parents:
diff changeset
438 return false;
kono
parents:
diff changeset
439
kono
parents:
diff changeset
440 if (gimple_omp_for_kind (gfor) != GF_OMP_FOR_KIND_FOR)
kono
parents:
diff changeset
441 {
kono
parents:
diff changeset
442 if (dump_enabled_p ())
kono
parents:
diff changeset
443 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
444 GRID_MISSED_MSG_PREFIX "the inner loop is not "
kono
parents:
diff changeset
445 "a simple for loop\n");
kono
parents:
diff changeset
446 return false;
kono
parents:
diff changeset
447 }
kono
parents:
diff changeset
448 gcc_assert (gimple_omp_for_collapse (gfor) == grid->collapse);
kono
parents:
diff changeset
449
kono
parents:
diff changeset
450 if (!grid_inner_loop_gridifiable_p (gfor, grid))
kono
parents:
diff changeset
451 return false;
kono
parents:
diff changeset
452
kono
parents:
diff changeset
453 return true;
kono
parents:
diff changeset
454 }
kono
parents:
diff changeset
455
kono
parents:
diff changeset
456 /* Given an omp loop statement GFOR, return true if it can participate in
kono
parents:
diff changeset
457 tiling gridification, i.e. in one where the distribute and parallel for
kono
parents:
diff changeset
458 loops do not form a compound statement. GRID describes hitherto discovered
kono
parents:
diff changeset
459 properties of the loop that is evaluated for possible gridification. */
kono
parents:
diff changeset
460
kono
parents:
diff changeset
461 static bool
kono
parents:
diff changeset
462 grid_gfor_follows_tiling_pattern (gomp_for *gfor, grid_prop *grid)
kono
parents:
diff changeset
463 {
kono
parents:
diff changeset
464 if (gimple_omp_for_kind (gfor) != GF_OMP_FOR_KIND_FOR)
kono
parents:
diff changeset
465 {
kono
parents:
diff changeset
466 if (dump_enabled_p ())
kono
parents:
diff changeset
467 {
kono
parents:
diff changeset
468 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
469 GRID_MISSED_MSG_PREFIX "an inner loop is not "
kono
parents:
diff changeset
470 "a simple for loop\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
471 dump_printf_loc (MSG_NOTE, gfor,
111
kono
parents:
diff changeset
472 "This statement is not a simple for loop\n");
kono
parents:
diff changeset
473 }
kono
parents:
diff changeset
474 return false;
kono
parents:
diff changeset
475 }
kono
parents:
diff changeset
476
kono
parents:
diff changeset
477 if (!grid_inner_loop_gridifiable_p (gfor, grid))
kono
parents:
diff changeset
478 return false;
kono
parents:
diff changeset
479
kono
parents:
diff changeset
480 if (gimple_omp_for_collapse (gfor) != grid->collapse)
kono
parents:
diff changeset
481 {
kono
parents:
diff changeset
482 if (dump_enabled_p ())
kono
parents:
diff changeset
483 {
kono
parents:
diff changeset
484 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
485 GRID_MISSED_MSG_PREFIX "an inner loop does not "
kono
parents:
diff changeset
486 "have use the same collapse clause\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
487 dump_printf_loc (MSG_NOTE, gfor,
111
kono
parents:
diff changeset
488 "Loop construct uses a different collapse clause\n");
kono
parents:
diff changeset
489 }
kono
parents:
diff changeset
490 return false;
kono
parents:
diff changeset
491 }
kono
parents:
diff changeset
492
kono
parents:
diff changeset
493 struct omp_for_data fd;
kono
parents:
diff changeset
494 struct omp_for_data_loop *loops
kono
parents:
diff changeset
495 = (struct omp_for_data_loop *)alloca (grid->collapse
kono
parents:
diff changeset
496 * sizeof (struct omp_for_data_loop));
kono
parents:
diff changeset
497 omp_extract_for_data (gfor, &fd, loops);
kono
parents:
diff changeset
498 for (unsigned i = 0; i < grid->collapse; i++)
kono
parents:
diff changeset
499 {
kono
parents:
diff changeset
500 tree itype, type = TREE_TYPE (fd.loops[i].v);
kono
parents:
diff changeset
501 if (POINTER_TYPE_P (type))
kono
parents:
diff changeset
502 itype = signed_type_for (type);
kono
parents:
diff changeset
503 else
kono
parents:
diff changeset
504 itype = type;
kono
parents:
diff changeset
505
kono
parents:
diff changeset
506 tree n1 = fold_convert (itype, fd.loops[i].n1);
kono
parents:
diff changeset
507 tree n2 = fold_convert (itype, fd.loops[i].n2);
kono
parents:
diff changeset
508 tree t = build_int_cst (itype,
kono
parents:
diff changeset
509 (fd.loops[i].cond_code == LT_EXPR ? -1 : 1));
kono
parents:
diff changeset
510 t = fold_build2 (PLUS_EXPR, itype, fd.loops[i].step, t);
kono
parents:
diff changeset
511 t = fold_build2 (PLUS_EXPR, itype, t, n2);
kono
parents:
diff changeset
512 t = fold_build2 (MINUS_EXPR, itype, t, n1);
kono
parents:
diff changeset
513 if (TYPE_UNSIGNED (itype) && fd.loops[i].cond_code == GT_EXPR)
kono
parents:
diff changeset
514 t = fold_build2 (TRUNC_DIV_EXPR, itype,
kono
parents:
diff changeset
515 fold_build1 (NEGATE_EXPR, itype, t),
kono
parents:
diff changeset
516 fold_build1 (NEGATE_EXPR, itype, fd.loops[i].step));
kono
parents:
diff changeset
517 else
kono
parents:
diff changeset
518 t = fold_build2 (TRUNC_DIV_EXPR, itype, t, fd.loops[i].step);
kono
parents:
diff changeset
519
kono
parents:
diff changeset
520 if (!operand_equal_p (grid->group_sizes[i], t, 0))
kono
parents:
diff changeset
521 {
kono
parents:
diff changeset
522 if (dump_enabled_p ())
kono
parents:
diff changeset
523 {
kono
parents:
diff changeset
524 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
525 GRID_MISSED_MSG_PREFIX "the distribute and "
kono
parents:
diff changeset
526 "an internal loop do not agree on tile size\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
527 dump_printf_loc (MSG_NOTE, gfor,
111
kono
parents:
diff changeset
528 "Loop construct does not seem to loop over "
kono
parents:
diff changeset
529 "a tile size\n");
kono
parents:
diff changeset
530 }
kono
parents:
diff changeset
531 return false;
kono
parents:
diff changeset
532 }
kono
parents:
diff changeset
533 }
kono
parents:
diff changeset
534 return true;
kono
parents:
diff changeset
535 }
kono
parents:
diff changeset
536
kono
parents:
diff changeset
537 /* Facing a call to FNDECL in the body of a distribute construct, return true
kono
parents:
diff changeset
538 if we can handle it or false if it precludes gridification. */
kono
parents:
diff changeset
539
kono
parents:
diff changeset
540 static bool
kono
parents:
diff changeset
541 grid_call_permissible_in_distribute_p (tree fndecl)
kono
parents:
diff changeset
542 {
kono
parents:
diff changeset
543 if (DECL_PURE_P (fndecl) || TREE_READONLY (fndecl))
kono
parents:
diff changeset
544 return true;
kono
parents:
diff changeset
545
kono
parents:
diff changeset
546 const char *name = IDENTIFIER_POINTER (DECL_NAME (fndecl));
kono
parents:
diff changeset
547 if (strstr (name, "omp_") != name)
kono
parents:
diff changeset
548 return false;
kono
parents:
diff changeset
549
kono
parents:
diff changeset
550 if ((strcmp (name, "omp_get_thread_num") == 0)
kono
parents:
diff changeset
551 || (strcmp (name, "omp_get_num_threads") == 0)
kono
parents:
diff changeset
552 || (strcmp (name, "omp_get_num_teams") == 0)
kono
parents:
diff changeset
553 || (strcmp (name, "omp_get_team_num") == 0)
kono
parents:
diff changeset
554 || (strcmp (name, "omp_get_level") == 0)
kono
parents:
diff changeset
555 || (strcmp (name, "omp_get_active_level") == 0)
kono
parents:
diff changeset
556 || (strcmp (name, "omp_in_parallel") == 0))
kono
parents:
diff changeset
557 return true;
kono
parents:
diff changeset
558
kono
parents:
diff changeset
559 return false;
kono
parents:
diff changeset
560 }
kono
parents:
diff changeset
561
kono
parents:
diff changeset
562 /* Facing a call satisfying grid_call_permissible_in_distribute_p in the body
kono
parents:
diff changeset
563 of a distribute construct that is pointed at by GSI, modify it as necessary
kono
parents:
diff changeset
564 for gridification. If the statement itself got removed, return true. */
kono
parents:
diff changeset
565
kono
parents:
diff changeset
566 static bool
kono
parents:
diff changeset
567 grid_handle_call_in_distribute (gimple_stmt_iterator *gsi)
kono
parents:
diff changeset
568 {
kono
parents:
diff changeset
569 gimple *stmt = gsi_stmt (*gsi);
kono
parents:
diff changeset
570 tree fndecl = gimple_call_fndecl (stmt);
kono
parents:
diff changeset
571 gcc_checking_assert (stmt);
kono
parents:
diff changeset
572 if (DECL_PURE_P (fndecl) || TREE_READONLY (fndecl))
kono
parents:
diff changeset
573 return false;
kono
parents:
diff changeset
574
kono
parents:
diff changeset
575 const char *name = IDENTIFIER_POINTER (DECL_NAME (fndecl));
kono
parents:
diff changeset
576 if ((strcmp (name, "omp_get_thread_num") == 0)
kono
parents:
diff changeset
577 || (strcmp (name, "omp_get_level") == 0)
kono
parents:
diff changeset
578 || (strcmp (name, "omp_get_active_level") == 0)
kono
parents:
diff changeset
579 || (strcmp (name, "omp_in_parallel") == 0))
kono
parents:
diff changeset
580 {
kono
parents:
diff changeset
581 tree lhs = gimple_call_lhs (stmt);
kono
parents:
diff changeset
582 if (lhs)
kono
parents:
diff changeset
583 {
kono
parents:
diff changeset
584 gassign *assign
kono
parents:
diff changeset
585 = gimple_build_assign (lhs, build_zero_cst (TREE_TYPE (lhs)));
kono
parents:
diff changeset
586 gsi_insert_before (gsi, assign, GSI_SAME_STMT);
kono
parents:
diff changeset
587 }
kono
parents:
diff changeset
588 gsi_remove (gsi, true);
kono
parents:
diff changeset
589 return true;
kono
parents:
diff changeset
590 }
kono
parents:
diff changeset
591
kono
parents:
diff changeset
592 /* The rest of the omp functions can stay as they are, HSA back-end will
kono
parents:
diff changeset
593 handle them correctly. */
kono
parents:
diff changeset
594 gcc_checking_assert ((strcmp (name, "omp_get_num_threads") == 0)
kono
parents:
diff changeset
595 || (strcmp (name, "omp_get_num_teams") == 0)
kono
parents:
diff changeset
596 || (strcmp (name, "omp_get_team_num") == 0));
kono
parents:
diff changeset
597 return false;
kono
parents:
diff changeset
598 }
kono
parents:
diff changeset
599
kono
parents:
diff changeset
600 /* Given a sequence of statements within a distribute omp construct or a
kono
parents:
diff changeset
601 parallel construct, which in the original source does not form a compound
kono
parents:
diff changeset
602 construct with a looping construct, return true if it does not prevent us
kono
parents:
diff changeset
603 from turning it into a gridified HSA kernel. Otherwise return false. GRID
kono
parents:
diff changeset
604 describes hitherto discovered properties of the loop that is evaluated for
kono
parents:
diff changeset
605 possible gridification. IN_PARALLEL must be true if seq is within a
kono
parents:
diff changeset
606 parallel construct and flase if it is only within a distribute
kono
parents:
diff changeset
607 construct. */
kono
parents:
diff changeset
608
kono
parents:
diff changeset
609 static bool
kono
parents:
diff changeset
610 grid_dist_follows_tiling_pattern (gimple_seq seq, grid_prop *grid,
kono
parents:
diff changeset
611 bool in_parallel)
kono
parents:
diff changeset
612 {
kono
parents:
diff changeset
613 gimple_stmt_iterator gsi;
kono
parents:
diff changeset
614 for (gsi = gsi_start (seq); !gsi_end_p (gsi); gsi_next (&gsi))
kono
parents:
diff changeset
615 {
kono
parents:
diff changeset
616 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
617
kono
parents:
diff changeset
618 if (grid_safe_assignment_p (stmt, grid)
kono
parents:
diff changeset
619 || gimple_code (stmt) == GIMPLE_GOTO
kono
parents:
diff changeset
620 || gimple_code (stmt) == GIMPLE_LABEL
kono
parents:
diff changeset
621 || gimple_code (stmt) == GIMPLE_COND)
kono
parents:
diff changeset
622 continue;
kono
parents:
diff changeset
623 else if (gbind *bind = dyn_cast <gbind *> (stmt))
kono
parents:
diff changeset
624 {
kono
parents:
diff changeset
625 if (!grid_dist_follows_tiling_pattern (gimple_bind_body (bind),
kono
parents:
diff changeset
626 grid, in_parallel))
kono
parents:
diff changeset
627 return false;
kono
parents:
diff changeset
628 continue;
kono
parents:
diff changeset
629 }
kono
parents:
diff changeset
630 else if (gtry *try_stmt = dyn_cast <gtry *> (stmt))
kono
parents:
diff changeset
631 {
kono
parents:
diff changeset
632 if (gimple_try_kind (try_stmt) == GIMPLE_TRY_CATCH)
kono
parents:
diff changeset
633 {
kono
parents:
diff changeset
634 if (dump_enabled_p ())
kono
parents:
diff changeset
635 {
kono
parents:
diff changeset
636 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
637 GRID_MISSED_MSG_PREFIX "the distribute "
kono
parents:
diff changeset
638 "construct contains a try..catch region\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
639 dump_printf_loc (MSG_NOTE, try_stmt,
111
kono
parents:
diff changeset
640 "This statement cannot be analyzed for "
kono
parents:
diff changeset
641 "tiled gridification\n");
kono
parents:
diff changeset
642 }
kono
parents:
diff changeset
643 return false;
kono
parents:
diff changeset
644 }
kono
parents:
diff changeset
645 if (!grid_dist_follows_tiling_pattern (gimple_try_eval (try_stmt),
kono
parents:
diff changeset
646 grid, in_parallel))
kono
parents:
diff changeset
647 return false;
kono
parents:
diff changeset
648 if (!grid_dist_follows_tiling_pattern (gimple_try_cleanup (try_stmt),
kono
parents:
diff changeset
649 grid, in_parallel))
kono
parents:
diff changeset
650 return false;
kono
parents:
diff changeset
651 continue;
kono
parents:
diff changeset
652 }
kono
parents:
diff changeset
653 else if (is_gimple_call (stmt))
kono
parents:
diff changeset
654 {
kono
parents:
diff changeset
655 tree fndecl = gimple_call_fndecl (stmt);
kono
parents:
diff changeset
656 if (fndecl && grid_call_permissible_in_distribute_p (fndecl))
kono
parents:
diff changeset
657 continue;
kono
parents:
diff changeset
658
kono
parents:
diff changeset
659 if (dump_enabled_p ())
kono
parents:
diff changeset
660 {
kono
parents:
diff changeset
661 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
662 GRID_MISSED_MSG_PREFIX "the distribute "
kono
parents:
diff changeset
663 "construct contains a call\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
664 dump_printf_loc (MSG_NOTE, stmt,
111
kono
parents:
diff changeset
665 "This statement cannot be analyzed for "
kono
parents:
diff changeset
666 "tiled gridification\n");
kono
parents:
diff changeset
667 }
kono
parents:
diff changeset
668 return false;
kono
parents:
diff changeset
669 }
kono
parents:
diff changeset
670 else if (gomp_parallel *par = dyn_cast <gomp_parallel *> (stmt))
kono
parents:
diff changeset
671 {
kono
parents:
diff changeset
672 if (in_parallel)
kono
parents:
diff changeset
673 {
kono
parents:
diff changeset
674 if (dump_enabled_p ())
kono
parents:
diff changeset
675 {
kono
parents:
diff changeset
676 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
677 GRID_MISSED_MSG_PREFIX "a parallel "
kono
parents:
diff changeset
678 "construct contains another parallel "
kono
parents:
diff changeset
679 "construct\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
680 dump_printf_loc (MSG_NOTE, stmt,
111
kono
parents:
diff changeset
681 "This parallel construct is nested in "
kono
parents:
diff changeset
682 "another one\n");
kono
parents:
diff changeset
683 }
kono
parents:
diff changeset
684 return false;
kono
parents:
diff changeset
685 }
kono
parents:
diff changeset
686 if (!grid_parallel_clauses_gridifiable (par, grid->target_loc)
kono
parents:
diff changeset
687 || !grid_dist_follows_tiling_pattern (gimple_omp_body (par),
kono
parents:
diff changeset
688 grid, true))
kono
parents:
diff changeset
689 return false;
kono
parents:
diff changeset
690 }
kono
parents:
diff changeset
691 else if (gomp_for *gfor = dyn_cast <gomp_for *> (stmt))
kono
parents:
diff changeset
692 {
kono
parents:
diff changeset
693 if (!in_parallel)
kono
parents:
diff changeset
694 {
kono
parents:
diff changeset
695 if (dump_enabled_p ())
kono
parents:
diff changeset
696 {
kono
parents:
diff changeset
697 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
698 GRID_MISSED_MSG_PREFIX "a loop "
kono
parents:
diff changeset
699 "construct is not nested within a parallel "
kono
parents:
diff changeset
700 "construct\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
701 dump_printf_loc (MSG_NOTE, stmt,
111
kono
parents:
diff changeset
702 "This loop construct is not nested in "
kono
parents:
diff changeset
703 "a parallel construct\n");
kono
parents:
diff changeset
704 }
kono
parents:
diff changeset
705 return false;
kono
parents:
diff changeset
706 }
kono
parents:
diff changeset
707 if (!grid_gfor_follows_tiling_pattern (gfor, grid))
kono
parents:
diff changeset
708 return false;
kono
parents:
diff changeset
709 }
kono
parents:
diff changeset
710 else
kono
parents:
diff changeset
711 {
kono
parents:
diff changeset
712 if (dump_enabled_p ())
kono
parents:
diff changeset
713 {
kono
parents:
diff changeset
714 dump_printf_loc (MSG_MISSED_OPTIMIZATION, grid->target_loc,
kono
parents:
diff changeset
715 GRID_MISSED_MSG_PREFIX "the distribute "
kono
parents:
diff changeset
716 "construct contains a complex statement\n");
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
717 dump_printf_loc (MSG_NOTE, stmt,
111
kono
parents:
diff changeset
718 "This statement cannot be analyzed for "
kono
parents:
diff changeset
719 "tiled gridification\n");
kono
parents:
diff changeset
720 }
kono
parents:
diff changeset
721 return false;
kono
parents:
diff changeset
722 }
kono
parents:
diff changeset
723 }
kono
parents:
diff changeset
724 return true;
kono
parents:
diff changeset
725 }
kono
parents:
diff changeset
726
kono
parents:
diff changeset
727 /* If TARGET follows a pattern that can be turned into a gridified HSA kernel,
kono
parents:
diff changeset
728 return true, otherwise return false. In the case of success, also fill in
kono
parents:
diff changeset
729 GRID with information describing the kernel grid. */
kono
parents:
diff changeset
730
kono
parents:
diff changeset
731 static bool
kono
parents:
diff changeset
732 grid_target_follows_gridifiable_pattern (gomp_target *target, grid_prop *grid)
kono
parents:
diff changeset
733 {
kono
parents:
diff changeset
734 if (gimple_omp_target_kind (target) != GF_OMP_TARGET_KIND_REGION)
kono
parents:
diff changeset
735 return false;
kono
parents:
diff changeset
736
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
737 dump_user_location_t tloc = target;
111
kono
parents:
diff changeset
738 grid->target_loc = tloc;
kono
parents:
diff changeset
739 gimple *stmt
kono
parents:
diff changeset
740 = grid_find_single_omp_among_assignments (gimple_omp_body (target),
kono
parents:
diff changeset
741 grid, "target");
kono
parents:
diff changeset
742 if (!stmt)
kono
parents:
diff changeset
743 return false;
kono
parents:
diff changeset
744 gomp_teams *teams = dyn_cast <gomp_teams *> (stmt);
kono
parents:
diff changeset
745 tree group_size = NULL;
kono
parents:
diff changeset
746 if (!teams)
kono
parents:
diff changeset
747 {
kono
parents:
diff changeset
748 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
749 GRID_MISSED_MSG_PREFIX "it does not have a sole teams "
kono
parents:
diff changeset
750 "construct in it.\n");
kono
parents:
diff changeset
751 return false;
kono
parents:
diff changeset
752 }
kono
parents:
diff changeset
753
kono
parents:
diff changeset
754 tree clauses = gimple_omp_teams_clauses (teams);
kono
parents:
diff changeset
755 while (clauses)
kono
parents:
diff changeset
756 {
kono
parents:
diff changeset
757 switch (OMP_CLAUSE_CODE (clauses))
kono
parents:
diff changeset
758 {
kono
parents:
diff changeset
759 case OMP_CLAUSE_NUM_TEAMS:
kono
parents:
diff changeset
760 if (dump_enabled_p ())
kono
parents:
diff changeset
761 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
762 GRID_MISSED_MSG_PREFIX "the teams construct "
kono
parents:
diff changeset
763 "contains a num_teams clause\n ");
kono
parents:
diff changeset
764 return false;
kono
parents:
diff changeset
765
kono
parents:
diff changeset
766 case OMP_CLAUSE_REDUCTION:
kono
parents:
diff changeset
767 if (dump_enabled_p ())
kono
parents:
diff changeset
768 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
769 GRID_MISSED_MSG_PREFIX "a reduction "
kono
parents:
diff changeset
770 "clause is present\n ");
kono
parents:
diff changeset
771 return false;
kono
parents:
diff changeset
772
kono
parents:
diff changeset
773 case OMP_CLAUSE_THREAD_LIMIT:
kono
parents:
diff changeset
774 if (!integer_zerop (OMP_CLAUSE_OPERAND (clauses, 0)))
kono
parents:
diff changeset
775 group_size = OMP_CLAUSE_OPERAND (clauses, 0);
kono
parents:
diff changeset
776 break;
kono
parents:
diff changeset
777
kono
parents:
diff changeset
778 default:
kono
parents:
diff changeset
779 break;
kono
parents:
diff changeset
780 }
kono
parents:
diff changeset
781 clauses = OMP_CLAUSE_CHAIN (clauses);
kono
parents:
diff changeset
782 }
kono
parents:
diff changeset
783
kono
parents:
diff changeset
784 stmt = grid_find_single_omp_among_assignments (gimple_omp_body (teams), grid,
kono
parents:
diff changeset
785 "teams");
kono
parents:
diff changeset
786 if (!stmt)
kono
parents:
diff changeset
787 return false;
kono
parents:
diff changeset
788 gomp_for *dist = dyn_cast <gomp_for *> (stmt);
kono
parents:
diff changeset
789 if (!dist)
kono
parents:
diff changeset
790 {
kono
parents:
diff changeset
791 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
792 GRID_MISSED_MSG_PREFIX "the teams construct does not "
kono
parents:
diff changeset
793 "have a single distribute construct in it.\n");
kono
parents:
diff changeset
794 return false;
kono
parents:
diff changeset
795 }
kono
parents:
diff changeset
796
kono
parents:
diff changeset
797 gcc_assert (gimple_omp_for_kind (dist) == GF_OMP_FOR_KIND_DISTRIBUTE);
kono
parents:
diff changeset
798
kono
parents:
diff changeset
799 grid->collapse = gimple_omp_for_collapse (dist);
kono
parents:
diff changeset
800 if (grid->collapse > 3)
kono
parents:
diff changeset
801 {
kono
parents:
diff changeset
802 if (dump_enabled_p ())
kono
parents:
diff changeset
803 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
804 GRID_MISSED_MSG_PREFIX "the distribute construct "
kono
parents:
diff changeset
805 "contains collapse clause with parameter greater "
kono
parents:
diff changeset
806 "than 3\n");
kono
parents:
diff changeset
807 return false;
kono
parents:
diff changeset
808 }
kono
parents:
diff changeset
809
kono
parents:
diff changeset
810 struct omp_for_data fd;
kono
parents:
diff changeset
811 struct omp_for_data_loop *dist_loops
kono
parents:
diff changeset
812 = (struct omp_for_data_loop *)alloca (grid->collapse
kono
parents:
diff changeset
813 * sizeof (struct omp_for_data_loop));
kono
parents:
diff changeset
814 omp_extract_for_data (dist, &fd, dist_loops);
kono
parents:
diff changeset
815 if (fd.chunk_size)
kono
parents:
diff changeset
816 {
kono
parents:
diff changeset
817 if (group_size && !operand_equal_p (group_size, fd.chunk_size, 0))
kono
parents:
diff changeset
818 {
kono
parents:
diff changeset
819 if (dump_enabled_p ())
kono
parents:
diff changeset
820 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
821 GRID_MISSED_MSG_PREFIX "the teams "
kono
parents:
diff changeset
822 "thread limit is different from distribute "
kono
parents:
diff changeset
823 "schedule chunk\n");
kono
parents:
diff changeset
824 return false;
kono
parents:
diff changeset
825 }
kono
parents:
diff changeset
826 group_size = fd.chunk_size;
kono
parents:
diff changeset
827 }
kono
parents:
diff changeset
828 if (group_size && grid->collapse > 1)
kono
parents:
diff changeset
829 {
kono
parents:
diff changeset
830 if (dump_enabled_p ())
kono
parents:
diff changeset
831 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
832 GRID_MISSED_MSG_PREFIX "group size cannot be "
kono
parents:
diff changeset
833 "set using thread_limit or schedule clauses "
kono
parents:
diff changeset
834 "when also using a collapse clause greater than 1\n");
kono
parents:
diff changeset
835 return false;
kono
parents:
diff changeset
836 }
kono
parents:
diff changeset
837
kono
parents:
diff changeset
838 if (gimple_omp_for_combined_p (dist))
kono
parents:
diff changeset
839 {
kono
parents:
diff changeset
840 grid->tiling = false;
kono
parents:
diff changeset
841 grid->group_sizes[0] = group_size;
kono
parents:
diff changeset
842 for (unsigned i = 1; i < grid->collapse; i++)
kono
parents:
diff changeset
843 grid->group_sizes[i] = NULL;
kono
parents:
diff changeset
844 return grid_dist_follows_simple_pattern (dist, grid);
kono
parents:
diff changeset
845 }
kono
parents:
diff changeset
846 else
kono
parents:
diff changeset
847 {
kono
parents:
diff changeset
848 grid->tiling = true;
kono
parents:
diff changeset
849 if (group_size)
kono
parents:
diff changeset
850 {
kono
parents:
diff changeset
851 if (dump_enabled_p ())
kono
parents:
diff changeset
852 dump_printf_loc (MSG_MISSED_OPTIMIZATION, tloc,
kono
parents:
diff changeset
853 GRID_MISSED_MSG_PREFIX "group size cannot be set "
kono
parents:
diff changeset
854 "using thread_limit or schedule clauses when "
kono
parents:
diff changeset
855 "distribute and loop constructs do not form "
kono
parents:
diff changeset
856 "one combined construct\n");
kono
parents:
diff changeset
857 return false;
kono
parents:
diff changeset
858 }
kono
parents:
diff changeset
859 for (unsigned i = 0; i < grid->collapse; i++)
kono
parents:
diff changeset
860 {
kono
parents:
diff changeset
861 if (fd.loops[i].cond_code == GT_EXPR)
kono
parents:
diff changeset
862 grid->group_sizes[i] = fold_build1 (NEGATE_EXPR,
kono
parents:
diff changeset
863 TREE_TYPE (fd.loops[i].step),
kono
parents:
diff changeset
864 fd.loops[i].step);
kono
parents:
diff changeset
865 else
kono
parents:
diff changeset
866 grid->group_sizes[i] = fd.loops[i].step;
kono
parents:
diff changeset
867 }
kono
parents:
diff changeset
868 return grid_dist_follows_tiling_pattern (gimple_omp_body (dist), grid,
kono
parents:
diff changeset
869 false);
kono
parents:
diff changeset
870 }
kono
parents:
diff changeset
871 }
kono
parents:
diff changeset
872
kono
parents:
diff changeset
873 /* Operand walker, used to remap pre-body declarations according to a hash map
kono
parents:
diff changeset
874 provided in DATA. */
kono
parents:
diff changeset
875
kono
parents:
diff changeset
876 static tree
kono
parents:
diff changeset
877 grid_remap_prebody_decls (tree *tp, int *walk_subtrees, void *data)
kono
parents:
diff changeset
878 {
kono
parents:
diff changeset
879 tree t = *tp;
kono
parents:
diff changeset
880
kono
parents:
diff changeset
881 if (DECL_P (t) || TYPE_P (t))
kono
parents:
diff changeset
882 *walk_subtrees = 0;
kono
parents:
diff changeset
883 else
kono
parents:
diff changeset
884 *walk_subtrees = 1;
kono
parents:
diff changeset
885
kono
parents:
diff changeset
886 if (VAR_P (t))
kono
parents:
diff changeset
887 {
kono
parents:
diff changeset
888 struct walk_stmt_info *wi = (struct walk_stmt_info *) data;
kono
parents:
diff changeset
889 hash_map<tree, tree> *declmap = (hash_map<tree, tree> *) wi->info;
kono
parents:
diff changeset
890 tree *repl = declmap->get (t);
kono
parents:
diff changeset
891 if (repl)
kono
parents:
diff changeset
892 *tp = *repl;
kono
parents:
diff changeset
893 }
kono
parents:
diff changeset
894 return NULL_TREE;
kono
parents:
diff changeset
895 }
kono
parents:
diff changeset
896
kono
parents:
diff changeset
/* Identifiers of segments into which a particular variable should be placed
   when gridifying.  */

enum grid_var_segment
{
  GRID_SEGMENT_PRIVATE,
  GRID_SEGMENT_GROUP,
  GRID_SEGMENT_GLOBAL
};
kono
parents:
diff changeset
902
kono
parents:
diff changeset
903 /* Mark VAR so that it is eventually placed into SEGMENT. Place an artificial
kono
parents:
diff changeset
904 builtin call into SEQ that will make sure the variable is always considered
kono
parents:
diff changeset
905 address taken. */
kono
parents:
diff changeset
906
kono
parents:
diff changeset
907 static void
kono
parents:
diff changeset
908 grid_mark_variable_segment (tree var, enum grid_var_segment segment)
kono
parents:
diff changeset
909 {
kono
parents:
diff changeset
910 /* Making a non-addressable variables would require that we re-gimplify all
kono
parents:
diff changeset
911 their uses. Fortunately, we do not have to do this because if they are
kono
parents:
diff changeset
912 not addressable, it means they are not used in atomic or parallel
kono
parents:
diff changeset
913 statements and so relaxed GPU consistency rules mean we can just keep them
kono
parents:
diff changeset
914 private. */
kono
parents:
diff changeset
915 if (!TREE_ADDRESSABLE (var))
kono
parents:
diff changeset
916 return;
kono
parents:
diff changeset
917
kono
parents:
diff changeset
918 switch (segment)
kono
parents:
diff changeset
919 {
kono
parents:
diff changeset
920 case GRID_SEGMENT_GROUP:
kono
parents:
diff changeset
921 DECL_ATTRIBUTES (var) = tree_cons (get_identifier ("hsa_group_segment"),
kono
parents:
diff changeset
922 NULL, DECL_ATTRIBUTES (var));
kono
parents:
diff changeset
923 break;
kono
parents:
diff changeset
924 case GRID_SEGMENT_GLOBAL:
kono
parents:
diff changeset
925 DECL_ATTRIBUTES (var) = tree_cons (get_identifier ("hsa_global_segment"),
kono
parents:
diff changeset
926 NULL, DECL_ATTRIBUTES (var));
kono
parents:
diff changeset
927 break;
kono
parents:
diff changeset
928 default:
kono
parents:
diff changeset
929 gcc_unreachable ();
kono
parents:
diff changeset
930 }
kono
parents:
diff changeset
931
kono
parents:
diff changeset
932 if (!TREE_STATIC (var))
kono
parents:
diff changeset
933 {
kono
parents:
diff changeset
934 TREE_STATIC (var) = 1;
kono
parents:
diff changeset
935 varpool_node::finalize_decl (var);
kono
parents:
diff changeset
936 }
kono
parents:
diff changeset
937
kono
parents:
diff changeset
938 }
kono
parents:
diff changeset
939
kono
parents:
diff changeset
940 /* Copy leading register-type assignments to local variables in SRC to just
kono
parents:
diff changeset
941 before DST, Creating temporaries, adjusting mapping of operands in WI and
kono
parents:
diff changeset
942 remapping operands as necessary. Add any new temporaries to TGT_BIND.
kono
parents:
diff changeset
943 Return the first statement that does not conform to grid_safe_assignment_p
kono
parents:
diff changeset
944 or NULL. If VAR_SEGMENT is not GRID_SEGMENT_PRIVATE, also mark all
kono
parents:
diff changeset
945 variables in traversed bind statements so that they are put into the
kono
parents:
diff changeset
946 appropriate segment. */
kono
parents:
diff changeset
947
kono
parents:
diff changeset
948 static gimple *
kono
parents:
diff changeset
949 grid_copy_leading_local_assignments (gimple_seq src, gimple_stmt_iterator *dst,
kono
parents:
diff changeset
950 gbind *tgt_bind,
kono
parents:
diff changeset
951 enum grid_var_segment var_segment,
kono
parents:
diff changeset
952 struct walk_stmt_info *wi)
kono
parents:
diff changeset
953 {
kono
parents:
diff changeset
954 hash_map<tree, tree> *declmap = (hash_map<tree, tree> *) wi->info;
kono
parents:
diff changeset
955 gimple_stmt_iterator gsi;
kono
parents:
diff changeset
956 for (gsi = gsi_start (src); !gsi_end_p (gsi); gsi_next (&gsi))
kono
parents:
diff changeset
957 {
kono
parents:
diff changeset
958 gimple *stmt = gsi_stmt (gsi);
kono
parents:
diff changeset
959 if (gbind *bind = dyn_cast <gbind *> (stmt))
kono
parents:
diff changeset
960 {
kono
parents:
diff changeset
961 gimple *r = grid_copy_leading_local_assignments
kono
parents:
diff changeset
962 (gimple_bind_body (bind), dst, tgt_bind, var_segment, wi);
kono
parents:
diff changeset
963
kono
parents:
diff changeset
964 if (var_segment != GRID_SEGMENT_PRIVATE)
kono
parents:
diff changeset
965 for (tree var = gimple_bind_vars (bind);
kono
parents:
diff changeset
966 var;
kono
parents:
diff changeset
967 var = DECL_CHAIN (var))
kono
parents:
diff changeset
968 grid_mark_variable_segment (var, var_segment);
kono
parents:
diff changeset
969 if (r)
kono
parents:
diff changeset
970 return r;
kono
parents:
diff changeset
971 else
kono
parents:
diff changeset
972 continue;
kono
parents:
diff changeset
973 }
kono
parents:
diff changeset
974 if (!grid_safe_assignment_p (stmt, NULL))
kono
parents:
diff changeset
975 return stmt;
kono
parents:
diff changeset
976 tree lhs = gimple_assign_lhs (as_a <gassign *> (stmt));
kono
parents:
diff changeset
977 tree repl = copy_var_decl (lhs, create_tmp_var_name (NULL),
kono
parents:
diff changeset
978 TREE_TYPE (lhs));
kono
parents:
diff changeset
979 DECL_CONTEXT (repl) = current_function_decl;
kono
parents:
diff changeset
980 gimple_bind_append_vars (tgt_bind, repl);
kono
parents:
diff changeset
981
kono
parents:
diff changeset
982 declmap->put (lhs, repl);
kono
parents:
diff changeset
983 gassign *copy = as_a <gassign *> (gimple_copy (stmt));
kono
parents:
diff changeset
984 walk_gimple_op (copy, grid_remap_prebody_decls, wi);
kono
parents:
diff changeset
985 gsi_insert_before (dst, copy, GSI_SAME_STMT);
kono
parents:
diff changeset
986 }
kono
parents:
diff changeset
987 return NULL;
kono
parents:
diff changeset
988 }
kono
parents:
diff changeset
989
kono
parents:
diff changeset
990 /* Statement walker function to make adjustments to statements within the
kono
parents:
diff changeset
991 gridifed kernel copy. */
kono
parents:
diff changeset
992
kono
parents:
diff changeset
993 static tree
kono
parents:
diff changeset
994 grid_process_grid_body (gimple_stmt_iterator *gsi, bool *handled_ops_p,
kono
parents:
diff changeset
995 struct walk_stmt_info *)
kono
parents:
diff changeset
996 {
kono
parents:
diff changeset
997 *handled_ops_p = false;
kono
parents:
diff changeset
998 gimple *stmt = gsi_stmt (*gsi);
kono
parents:
diff changeset
999 if (gimple_code (stmt) == GIMPLE_OMP_FOR
kono
parents:
diff changeset
1000 && (gimple_omp_for_kind (stmt) & GF_OMP_FOR_SIMD))
kono
parents:
diff changeset
1001 {
kono
parents:
diff changeset
1002 gomp_for *loop = as_a <gomp_for *> (stmt);
kono
parents:
diff changeset
1003 tree clauses = gimple_omp_for_clauses (loop);
kono
parents:
diff changeset
1004 tree cl = omp_find_clause (clauses, OMP_CLAUSE_SAFELEN);
kono
parents:
diff changeset
1005 if (cl)
kono
parents:
diff changeset
1006 OMP_CLAUSE_SAFELEN_EXPR (cl) = integer_one_node;
kono
parents:
diff changeset
1007 else
kono
parents:
diff changeset
1008 {
kono
parents:
diff changeset
1009 tree c = build_omp_clause (UNKNOWN_LOCATION, OMP_CLAUSE_SAFELEN);
kono
parents:
diff changeset
1010 OMP_CLAUSE_SAFELEN_EXPR (c) = integer_one_node;
kono
parents:
diff changeset
1011 OMP_CLAUSE_CHAIN (c) = clauses;
kono
parents:
diff changeset
1012 gimple_omp_for_set_clauses (loop, c);
kono
parents:
diff changeset
1013 }
kono
parents:
diff changeset
1014 }
kono
parents:
diff changeset
1015 return NULL_TREE;
kono
parents:
diff changeset
1016 }
kono
parents:
diff changeset
1017
kono
parents:
diff changeset
1018 /* Given a PARLOOP that is a normal for looping construct but also a part of a
kono
parents:
diff changeset
1019 combined construct with a simd loop, eliminate the simd loop. */
kono
parents:
diff changeset
1020
kono
parents:
diff changeset
1021 static void
kono
parents:
diff changeset
1022 grid_eliminate_combined_simd_part (gomp_for *parloop)
kono
parents:
diff changeset
1023 {
kono
parents:
diff changeset
1024 struct walk_stmt_info wi;
kono
parents:
diff changeset
1025
kono
parents:
diff changeset
1026 memset (&wi, 0, sizeof (wi));
kono
parents:
diff changeset
1027 wi.val_only = true;
kono
parents:
diff changeset
1028 enum gf_mask msk = GF_OMP_FOR_SIMD;
kono
parents:
diff changeset
1029 wi.info = (void *) &msk;
kono
parents:
diff changeset
1030 walk_gimple_seq (gimple_omp_body (parloop), omp_find_combined_for, NULL, &wi);
kono
parents:
diff changeset
1031 gimple *stmt = (gimple *) wi.info;
kono
parents:
diff changeset
1032 /* We expect that the SIMD id the only statement in the parallel loop. */
kono
parents:
diff changeset
1033 gcc_assert (stmt
kono
parents:
diff changeset
1034 && gimple_code (stmt) == GIMPLE_OMP_FOR
kono
parents:
diff changeset
1035 && (gimple_omp_for_kind (stmt) == GF_OMP_FOR_SIMD)
kono
parents:
diff changeset
1036 && gimple_omp_for_combined_into_p (stmt)
kono
parents:
diff changeset
1037 && !gimple_omp_for_combined_p (stmt));
kono
parents:
diff changeset
1038 gomp_for *simd = as_a <gomp_for *> (stmt);
kono
parents:
diff changeset
1039
kono
parents:
diff changeset
1040 /* Copy over the iteration properties because the body refers to the index in
kono
parents:
diff changeset
1041 the bottmom-most loop. */
kono
parents:
diff changeset
1042 unsigned i, collapse = gimple_omp_for_collapse (parloop);
kono
parents:
diff changeset
1043 gcc_checking_assert (collapse == gimple_omp_for_collapse (simd));
kono
parents:
diff changeset
1044 for (i = 0; i < collapse; i++)
kono
parents:
diff changeset
1045 {
kono
parents:
diff changeset
1046 gimple_omp_for_set_index (parloop, i, gimple_omp_for_index (simd, i));
kono
parents:
diff changeset
1047 gimple_omp_for_set_initial (parloop, i, gimple_omp_for_initial (simd, i));
kono
parents:
diff changeset
1048 gimple_omp_for_set_final (parloop, i, gimple_omp_for_final (simd, i));
kono
parents:
diff changeset
1049 gimple_omp_for_set_incr (parloop, i, gimple_omp_for_incr (simd, i));
kono
parents:
diff changeset
1050 }
kono
parents:
diff changeset
1051
kono
parents:
diff changeset
1052 tree *tgt= gimple_omp_for_clauses_ptr (parloop);
kono
parents:
diff changeset
1053 while (*tgt)
kono
parents:
diff changeset
1054 tgt = &OMP_CLAUSE_CHAIN (*tgt);
kono
parents:
diff changeset
1055
kono
parents:
diff changeset
1056 /* Copy over all clauses, except for linaer clauses, which are turned into
kono
parents:
diff changeset
1057 private clauses, and all other simd-specificl clauses, which are
kono
parents:
diff changeset
1058 ignored. */
kono
parents:
diff changeset
1059 tree *pc = gimple_omp_for_clauses_ptr (simd);
kono
parents:
diff changeset
1060 while (*pc)
kono
parents:
diff changeset
1061 {
kono
parents:
diff changeset
1062 tree c = *pc;
kono
parents:
diff changeset
1063 switch (TREE_CODE (c))
kono
parents:
diff changeset
1064 {
kono
parents:
diff changeset
1065 case OMP_CLAUSE_LINEAR:
kono
parents:
diff changeset
1066 {
kono
parents:
diff changeset
1067 tree priv = build_omp_clause (UNKNOWN_LOCATION, OMP_CLAUSE_PRIVATE);
kono
parents:
diff changeset
1068 OMP_CLAUSE_DECL (priv) = OMP_CLAUSE_DECL (c);
kono
parents:
diff changeset
1069 OMP_CLAUSE_CHAIN (priv) = NULL;
kono
parents:
diff changeset
1070 *tgt = priv;
kono
parents:
diff changeset
1071 tgt = &OMP_CLAUSE_CHAIN (priv);
kono
parents:
diff changeset
1072 pc = &OMP_CLAUSE_CHAIN (c);
kono
parents:
diff changeset
1073 break;
kono
parents:
diff changeset
1074 }
kono
parents:
diff changeset
1075
kono
parents:
diff changeset
1076 case OMP_CLAUSE_SAFELEN:
kono
parents:
diff changeset
1077 case OMP_CLAUSE_SIMDLEN:
kono
parents:
diff changeset
1078 case OMP_CLAUSE_ALIGNED:
kono
parents:
diff changeset
1079 pc = &OMP_CLAUSE_CHAIN (c);
kono
parents:
diff changeset
1080 break;
kono
parents:
diff changeset
1081
kono
parents:
diff changeset
1082 default:
kono
parents:
diff changeset
1083 *pc = OMP_CLAUSE_CHAIN (c);
kono
parents:
diff changeset
1084 OMP_CLAUSE_CHAIN (c) = NULL;
kono
parents:
diff changeset
1085 *tgt = c;
kono
parents:
diff changeset
1086 tgt = &OMP_CLAUSE_CHAIN(c);
kono
parents:
diff changeset
1087 break;
kono
parents:
diff changeset
1088 }
kono
parents:
diff changeset
1089 }
kono
parents:
diff changeset
1090
kono
parents:
diff changeset
1091 /* Finally, throw away the simd and mark the parallel loop as not
kono
parents:
diff changeset
1092 combined. */
kono
parents:
diff changeset
1093 gimple_omp_set_body (parloop, gimple_omp_body (simd));
kono
parents:
diff changeset
1094 gimple_omp_for_set_combined_p (parloop, false);
kono
parents:
diff changeset
1095 }
kono
parents:
diff changeset
1096
kono
parents:
diff changeset
1097 /* Statement walker function marking all parallels as grid_phony and loops as
kono
parents:
diff changeset
1098 grid ones representing threads of a particular thread group. */
kono
parents:
diff changeset
1099
kono
parents:
diff changeset
1100 static tree
kono
parents:
diff changeset
1101 grid_mark_tiling_loops (gimple_stmt_iterator *gsi, bool *handled_ops_p,
kono
parents:
diff changeset
1102 struct walk_stmt_info *wi_in)
kono
parents:
diff changeset
1103 {
kono
parents:
diff changeset
1104 *handled_ops_p = false;
kono
parents:
diff changeset
1105 if (gomp_for *loop = dyn_cast <gomp_for *> (gsi_stmt (*gsi)))
kono
parents:
diff changeset
1106 {
kono
parents:
diff changeset
1107 *handled_ops_p = true;
kono
parents:
diff changeset
1108 gimple_omp_for_set_kind (loop, GF_OMP_FOR_KIND_GRID_LOOP);
kono
parents:
diff changeset
1109 gimple_omp_for_set_grid_intra_group (loop, true);
kono
parents:
diff changeset
1110 if (gimple_omp_for_combined_p (loop))
kono
parents:
diff changeset
1111 grid_eliminate_combined_simd_part (loop);
kono
parents:
diff changeset
1112
kono
parents:
diff changeset
1113 struct walk_stmt_info body_wi;
kono
parents:
diff changeset
1114 memset (&body_wi, 0, sizeof (body_wi));
kono
parents:
diff changeset
1115 walk_gimple_seq_mod (gimple_omp_body_ptr (loop),
kono
parents:
diff changeset
1116 grid_process_grid_body, NULL, &body_wi);
kono
parents:
diff changeset
1117
kono
parents:
diff changeset
1118 gbind *bind = (gbind *) wi_in->info;
kono
parents:
diff changeset
1119 tree c;
kono
parents:
diff changeset
1120 for (c = gimple_omp_for_clauses (loop); c; c = OMP_CLAUSE_CHAIN (c))
kono
parents:
diff changeset
1121 if (OMP_CLAUSE_CODE (c) == OMP_CLAUSE_LASTPRIVATE)
kono
parents:
diff changeset
1122 {
kono
parents:
diff changeset
1123 push_gimplify_context ();
kono
parents:
diff changeset
1124 tree ov = OMP_CLAUSE_DECL (c);
kono
parents:
diff changeset
1125 tree gv = copy_var_decl (ov, create_tmp_var_name (NULL),
kono
parents:
diff changeset
1126 TREE_TYPE (ov));
kono
parents:
diff changeset
1127
kono
parents:
diff changeset
1128 grid_mark_variable_segment (gv, GRID_SEGMENT_GROUP);
kono
parents:
diff changeset
1129 DECL_CONTEXT (gv) = current_function_decl;
kono
parents:
diff changeset
1130 gimple_bind_append_vars (bind, gv);
kono
parents:
diff changeset
1131 tree x = lang_hooks.decls.omp_clause_assign_op (c, gv, ov);
kono
parents:
diff changeset
1132 gimplify_and_add (x, &OMP_CLAUSE_LASTPRIVATE_GIMPLE_SEQ (c));
kono
parents:
diff changeset
1133 x = lang_hooks.decls.omp_clause_copy_ctor (c, ov, gv);
kono
parents:
diff changeset
1134 gimple_seq l = NULL;
kono
parents:
diff changeset
1135 gimplify_and_add (x, &l);
kono
parents:
diff changeset
1136 gsi_insert_seq_after (gsi, l, GSI_SAME_STMT);
kono
parents:
diff changeset
1137 pop_gimplify_context (bind);
kono
parents:
diff changeset
1138 }
kono
parents:
diff changeset
1139 }
kono
parents:
diff changeset
1140 return NULL_TREE;
kono
parents:
diff changeset
1141 }
kono
parents:
diff changeset
1142
kono
parents:
diff changeset
1143 /* Statement walker function marking all parallels as grid_phony and loops as
kono
parents:
diff changeset
1144 grid ones representing threads of a particular thread group. */
kono
parents:
diff changeset
1145
kono
parents:
diff changeset
1146 static tree
kono
parents:
diff changeset
1147 grid_mark_tiling_parallels_and_loops (gimple_stmt_iterator *gsi,
kono
parents:
diff changeset
1148 bool *handled_ops_p,
kono
parents:
diff changeset
1149 struct walk_stmt_info *wi_in)
kono
parents:
diff changeset
1150 {
kono
parents:
diff changeset
1151 *handled_ops_p = false;
kono
parents:
diff changeset
1152 wi_in->removed_stmt = false;
kono
parents:
diff changeset
1153 gimple *stmt = gsi_stmt (*gsi);
kono
parents:
diff changeset
1154 if (gbind *bind = dyn_cast <gbind *> (stmt))
kono
parents:
diff changeset
1155 {
kono
parents:
diff changeset
1156 for (tree var = gimple_bind_vars (bind); var; var = DECL_CHAIN (var))
kono
parents:
diff changeset
1157 grid_mark_variable_segment (var, GRID_SEGMENT_GROUP);
kono
parents:
diff changeset
1158 }
kono
parents:
diff changeset
1159 else if (gomp_parallel *parallel = dyn_cast <gomp_parallel *> (stmt))
kono
parents:
diff changeset
1160 {
kono
parents:
diff changeset
1161 *handled_ops_p = true;
kono
parents:
diff changeset
1162 gimple_omp_parallel_set_grid_phony (parallel, true);
kono
parents:
diff changeset
1163
kono
parents:
diff changeset
1164 gbind *new_bind = gimple_build_bind (NULL, NULL, make_node (BLOCK));
kono
parents:
diff changeset
1165 gimple_bind_set_body (new_bind, gimple_omp_body (parallel));
kono
parents:
diff changeset
1166 gimple_seq s = NULL;
kono
parents:
diff changeset
1167 gimple_seq_add_stmt (&s, new_bind);
kono
parents:
diff changeset
1168 gimple_omp_set_body (parallel, s);
kono
parents:
diff changeset
1169
kono
parents:
diff changeset
1170 struct walk_stmt_info wi_par;
kono
parents:
diff changeset
1171 memset (&wi_par, 0, sizeof (wi_par));
kono
parents:
diff changeset
1172 wi_par.info = new_bind;
kono
parents:
diff changeset
1173 walk_gimple_seq_mod (gimple_bind_body_ptr (new_bind),
kono
parents:
diff changeset
1174 grid_mark_tiling_loops, NULL, &wi_par);
kono
parents:
diff changeset
1175 }
kono
parents:
diff changeset
1176 else if (is_a <gcall *> (stmt))
kono
parents:
diff changeset
1177 wi_in->removed_stmt = grid_handle_call_in_distribute (gsi);
kono
parents:
diff changeset
1178 return NULL_TREE;
kono
parents:
diff changeset
1179 }
kono
parents:
diff changeset
1180
kono
parents:
diff changeset
1181 /* Given freshly copied top level kernel SEQ, identify the individual OMP
kono
parents:
diff changeset
1182 components, mark them as part of kernel, copy assignment leading to them
kono
parents:
diff changeset
1183 just before DST, remapping them using WI and adding new temporaries to
kono
parents:
diff changeset
1184 TGT_BIND, and and return the loop that will be used for kernel dispatch. */
kono
parents:
diff changeset
1185
kono
parents:
diff changeset
1186 static gomp_for *
kono
parents:
diff changeset
1187 grid_process_kernel_body_copy (grid_prop *grid, gimple_seq seq,
kono
parents:
diff changeset
1188 gimple_stmt_iterator *dst,
kono
parents:
diff changeset
1189 gbind *tgt_bind, struct walk_stmt_info *wi)
kono
parents:
diff changeset
1190 {
kono
parents:
diff changeset
1191 gimple *stmt = grid_copy_leading_local_assignments (seq, dst, tgt_bind,
kono
parents:
diff changeset
1192 GRID_SEGMENT_GLOBAL, wi);
kono
parents:
diff changeset
1193 gomp_teams *teams = dyn_cast <gomp_teams *> (stmt);
kono
parents:
diff changeset
1194 gcc_assert (teams);
kono
parents:
diff changeset
1195 gimple_omp_teams_set_grid_phony (teams, true);
kono
parents:
diff changeset
1196 stmt = grid_copy_leading_local_assignments (gimple_omp_body (teams), dst,
kono
parents:
diff changeset
1197 tgt_bind, GRID_SEGMENT_GLOBAL,
kono
parents:
diff changeset
1198 wi);
kono
parents:
diff changeset
1199 gcc_checking_assert (stmt);
kono
parents:
diff changeset
1200 gomp_for *dist = dyn_cast <gomp_for *> (stmt);
kono
parents:
diff changeset
1201 gcc_assert (dist);
kono
parents:
diff changeset
1202 gimple_seq prebody = gimple_omp_for_pre_body (dist);
kono
parents:
diff changeset
1203 if (prebody)
kono
parents:
diff changeset
1204 grid_copy_leading_local_assignments (prebody, dst, tgt_bind,
kono
parents:
diff changeset
1205 GRID_SEGMENT_GROUP, wi);
kono
parents:
diff changeset
1206
kono
parents:
diff changeset
1207 if (grid->tiling)
kono
parents:
diff changeset
1208 {
kono
parents:
diff changeset
1209 gimple_omp_for_set_kind (dist, GF_OMP_FOR_KIND_GRID_LOOP);
kono
parents:
diff changeset
1210 gimple_omp_for_set_grid_group_iter (dist, true);
kono
parents:
diff changeset
1211
kono
parents:
diff changeset
1212 struct walk_stmt_info wi_tiled;
kono
parents:
diff changeset
1213 memset (&wi_tiled, 0, sizeof (wi_tiled));
kono
parents:
diff changeset
1214 walk_gimple_seq_mod (gimple_omp_body_ptr (dist),
kono
parents:
diff changeset
1215 grid_mark_tiling_parallels_and_loops, NULL,
kono
parents:
diff changeset
1216 &wi_tiled);
kono
parents:
diff changeset
1217 return dist;
kono
parents:
diff changeset
1218 }
kono
parents:
diff changeset
1219 else
kono
parents:
diff changeset
1220 {
kono
parents:
diff changeset
1221 gimple_omp_for_set_grid_phony (dist, true);
kono
parents:
diff changeset
1222 stmt = grid_copy_leading_local_assignments (gimple_omp_body (dist), dst,
kono
parents:
diff changeset
1223 tgt_bind,
kono
parents:
diff changeset
1224 GRID_SEGMENT_PRIVATE, wi);
kono
parents:
diff changeset
1225 gcc_checking_assert (stmt);
kono
parents:
diff changeset
1226 gomp_parallel *parallel = as_a <gomp_parallel *> (stmt);
kono
parents:
diff changeset
1227 gimple_omp_parallel_set_grid_phony (parallel, true);
kono
parents:
diff changeset
1228 stmt = grid_copy_leading_local_assignments (gimple_omp_body (parallel),
kono
parents:
diff changeset
1229 dst, tgt_bind,
kono
parents:
diff changeset
1230 GRID_SEGMENT_PRIVATE, wi);
kono
parents:
diff changeset
1231 gomp_for *inner_loop = as_a <gomp_for *> (stmt);
kono
parents:
diff changeset
1232 gimple_omp_for_set_kind (inner_loop, GF_OMP_FOR_KIND_GRID_LOOP);
kono
parents:
diff changeset
1233 prebody = gimple_omp_for_pre_body (inner_loop);
kono
parents:
diff changeset
1234 if (prebody)
kono
parents:
diff changeset
1235 grid_copy_leading_local_assignments (prebody, dst, tgt_bind,
kono
parents:
diff changeset
1236 GRID_SEGMENT_PRIVATE, wi);
kono
parents:
diff changeset
1237
kono
parents:
diff changeset
1238 if (gimple_omp_for_combined_p (inner_loop))
kono
parents:
diff changeset
1239 grid_eliminate_combined_simd_part (inner_loop);
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
1240 struct walk_stmt_info body_wi;
111
kono
parents:
diff changeset
1241 memset (&body_wi, 0, sizeof (body_wi));
kono
parents:
diff changeset
1242 walk_gimple_seq_mod (gimple_omp_body_ptr (inner_loop),
kono
parents:
diff changeset
1243 grid_process_grid_body, NULL, &body_wi);
kono
parents:
diff changeset
1244
kono
parents:
diff changeset
1245 return inner_loop;
kono
parents:
diff changeset
1246 }
kono
parents:
diff changeset
1247 }
kono
parents:
diff changeset
1248
kono
parents:
diff changeset
1249 /* If TARGET points to a GOMP_TARGET which follows a gridifiable pattern,
kono
parents:
diff changeset
1250 create a GPU kernel for it. GSI must point to the same statement, TGT_BIND
kono
parents:
diff changeset
1251 is the bind into which temporaries inserted before TARGET should be
kono
parents:
diff changeset
1252 added. */
kono
parents:
diff changeset
1253
kono
parents:
diff changeset
1254 static void
kono
parents:
diff changeset
1255 grid_attempt_target_gridification (gomp_target *target,
kono
parents:
diff changeset
1256 gimple_stmt_iterator *gsi,
kono
parents:
diff changeset
1257 gbind *tgt_bind)
kono
parents:
diff changeset
1258 {
kono
parents:
diff changeset
1259 /* removed group_size */
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
1260 grid_prop grid = {};
111
kono
parents:
diff changeset
1261 if (!target || !grid_target_follows_gridifiable_pattern (target, &grid))
kono
parents:
diff changeset
1262 return;
kono
parents:
diff changeset
1263
kono
parents:
diff changeset
1264 location_t loc = gimple_location (target);
kono
parents:
diff changeset
1265 if (dump_enabled_p ())
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
1266 dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, target,
111
kono
parents:
diff changeset
1267 "Target construct will be turned into a gridified HSA "
kono
parents:
diff changeset
1268 "kernel\n");
kono
parents:
diff changeset
1269
kono
parents:
diff changeset
1270 /* Copy target body to a GPUKERNEL construct: */
kono
parents:
diff changeset
1271 gimple_seq kernel_seq = copy_gimple_seq_and_replace_locals
kono
parents:
diff changeset
1272 (gimple_omp_body (target));
kono
parents:
diff changeset
1273
kono
parents:
diff changeset
1274 hash_map<tree, tree> *declmap = new hash_map<tree, tree>;
kono
parents:
diff changeset
1275 struct walk_stmt_info wi;
kono
parents:
diff changeset
1276 memset (&wi, 0, sizeof (struct walk_stmt_info));
kono
parents:
diff changeset
1277 wi.info = declmap;
kono
parents:
diff changeset
1278
kono
parents:
diff changeset
1279 /* Copy assignments in between OMP statements before target, mark OMP
kono
parents:
diff changeset
1280 statements within copy appropriately. */
kono
parents:
diff changeset
1281 gomp_for *inner_loop = grid_process_kernel_body_copy (&grid, kernel_seq, gsi,
kono
parents:
diff changeset
1282 tgt_bind, &wi);
kono
parents:
diff changeset
1283
kono
parents:
diff changeset
1284 gbind *old_bind
kono
parents:
diff changeset
1285 = as_a <gbind *> (gimple_seq_first (gimple_omp_body (target)));
kono
parents:
diff changeset
1286 gbind *new_bind = as_a <gbind *> (gimple_seq_first (kernel_seq));
kono
parents:
diff changeset
1287 tree new_block = gimple_bind_block (new_bind);
kono
parents:
diff changeset
1288 tree enc_block = BLOCK_SUPERCONTEXT (gimple_bind_block (old_bind));
kono
parents:
diff changeset
1289 BLOCK_CHAIN (new_block) = BLOCK_SUBBLOCKS (enc_block);
kono
parents:
diff changeset
1290 BLOCK_SUBBLOCKS (enc_block) = new_block;
kono
parents:
diff changeset
1291 BLOCK_SUPERCONTEXT (new_block) = enc_block;
kono
parents:
diff changeset
1292 gimple *gpukernel = gimple_build_omp_grid_body (kernel_seq);
kono
parents:
diff changeset
1293 gimple_seq_add_stmt
kono
parents:
diff changeset
1294 (gimple_bind_body_ptr (as_a <gbind *> (gimple_omp_body (target))),
kono
parents:
diff changeset
1295 gpukernel);
kono
parents:
diff changeset
1296
kono
parents:
diff changeset
1297 for (size_t i = 0; i < grid.collapse; i++)
kono
parents:
diff changeset
1298 walk_tree (&grid.group_sizes[i], grid_remap_prebody_decls, &wi, NULL);
kono
parents:
diff changeset
1299 push_gimplify_context ();
kono
parents:
diff changeset
1300 for (size_t i = 0; i < grid.collapse; i++)
kono
parents:
diff changeset
1301 {
kono
parents:
diff changeset
1302 tree itype, type = TREE_TYPE (gimple_omp_for_index (inner_loop, i));
kono
parents:
diff changeset
1303 if (POINTER_TYPE_P (type))
kono
parents:
diff changeset
1304 itype = signed_type_for (type);
kono
parents:
diff changeset
1305 else
kono
parents:
diff changeset
1306 itype = type;
kono
parents:
diff changeset
1307
kono
parents:
diff changeset
1308 enum tree_code cond_code = gimple_omp_for_cond (inner_loop, i);
kono
parents:
diff changeset
1309 tree n1 = unshare_expr (gimple_omp_for_initial (inner_loop, i));
kono
parents:
diff changeset
1310 walk_tree (&n1, grid_remap_prebody_decls, &wi, NULL);
kono
parents:
diff changeset
1311 tree n2 = unshare_expr (gimple_omp_for_final (inner_loop, i));
kono
parents:
diff changeset
1312 walk_tree (&n2, grid_remap_prebody_decls, &wi, NULL);
kono
parents:
diff changeset
1313 omp_adjust_for_condition (loc, &cond_code, &n2);
kono
parents:
diff changeset
1314 n1 = fold_convert (itype, n1);
kono
parents:
diff changeset
1315 n2 = fold_convert (itype, n2);
kono
parents:
diff changeset
1316
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
1317 tree cond = fold_build2 (cond_code, boolean_type_node, n1, n2);
111
kono
parents:
diff changeset
1318 tree step
kono
parents:
diff changeset
1319 = omp_get_for_step_from_incr (loc, gimple_omp_for_incr (inner_loop, i));
kono
parents:
diff changeset
1320
kono
parents:
diff changeset
1321 tree t = build_int_cst (itype, (cond_code == LT_EXPR ? -1 : 1));
kono
parents:
diff changeset
1322 t = fold_build2 (PLUS_EXPR, itype, step, t);
kono
parents:
diff changeset
1323 t = fold_build2 (PLUS_EXPR, itype, t, n2);
kono
parents:
diff changeset
1324 t = fold_build2 (MINUS_EXPR, itype, t, n1);
kono
parents:
diff changeset
1325 if (TYPE_UNSIGNED (itype) && cond_code == GT_EXPR)
kono
parents:
diff changeset
1326 t = fold_build2 (TRUNC_DIV_EXPR, itype,
kono
parents:
diff changeset
1327 fold_build1 (NEGATE_EXPR, itype, t),
kono
parents:
diff changeset
1328 fold_build1 (NEGATE_EXPR, itype, step));
kono
parents:
diff changeset
1329 else
kono
parents:
diff changeset
1330 t = fold_build2 (TRUNC_DIV_EXPR, itype, t, step);
131
84e7813d76e9 gcc-8.2
mir3636
parents: 111
diff changeset
1331 t = fold_build3 (COND_EXPR, itype, cond, t, build_zero_cst (itype));
111
kono
parents:
diff changeset
1332 if (grid.tiling)
kono
parents:
diff changeset
1333 {
kono
parents:
diff changeset
1334 if (cond_code == GT_EXPR)
kono
parents:
diff changeset
1335 step = fold_build1 (NEGATE_EXPR, itype, step);
kono
parents:
diff changeset
1336 t = fold_build2 (MULT_EXPR, itype, t, step);
kono
parents:
diff changeset
1337 }
kono
parents:
diff changeset
1338
kono
parents:
diff changeset
1339 tree gs = fold_convert (uint32_type_node, t);
kono
parents:
diff changeset
1340 gimple_seq tmpseq = NULL;
kono
parents:
diff changeset
1341 gimplify_expr (&gs, &tmpseq, NULL, is_gimple_val, fb_rvalue);
kono
parents:
diff changeset
1342 if (!gimple_seq_empty_p (tmpseq))
kono
parents:
diff changeset
1343 gsi_insert_seq_before (gsi, tmpseq, GSI_SAME_STMT);
kono
parents:
diff changeset
1344
kono
parents:
diff changeset
1345 tree ws;
kono
parents:
diff changeset
1346 if (grid.group_sizes[i])
kono
parents:
diff changeset
1347 {
kono
parents:
diff changeset
1348 ws = fold_convert (uint32_type_node, grid.group_sizes[i]);
kono
parents:
diff changeset
1349 tmpseq = NULL;
kono
parents:
diff changeset
1350 gimplify_expr (&ws, &tmpseq, NULL, is_gimple_val, fb_rvalue);
kono
parents:
diff changeset
1351 if (!gimple_seq_empty_p (tmpseq))
kono
parents:
diff changeset
1352 gsi_insert_seq_before (gsi, tmpseq, GSI_SAME_STMT);
kono
parents:
diff changeset
1353 }
kono
parents:
diff changeset
1354 else
kono
parents:
diff changeset
1355 ws = build_zero_cst (uint32_type_node);
kono
parents:
diff changeset
1356
kono
parents:
diff changeset
1357 tree c = build_omp_clause (UNKNOWN_LOCATION, OMP_CLAUSE__GRIDDIM_);
kono
parents:
diff changeset
1358 OMP_CLAUSE__GRIDDIM__DIMENSION (c) = i;
kono
parents:
diff changeset
1359 OMP_CLAUSE__GRIDDIM__SIZE (c) = gs;
kono
parents:
diff changeset
1360 OMP_CLAUSE__GRIDDIM__GROUP (c) = ws;
kono
parents:
diff changeset
1361 OMP_CLAUSE_CHAIN (c) = gimple_omp_target_clauses (target);
kono
parents:
diff changeset
1362 gimple_omp_target_set_clauses (target, c);
kono
parents:
diff changeset
1363 }
kono
parents:
diff changeset
1364 pop_gimplify_context (tgt_bind);
kono
parents:
diff changeset
1365 delete declmap;
kono
parents:
diff changeset
1366 return;
kono
parents:
diff changeset
1367 }
kono
parents:
diff changeset
1368
kono
parents:
diff changeset
1369 /* Walker function doing all the work for create_target_kernels. */
kono
parents:
diff changeset
1370
kono
parents:
diff changeset
1371 static tree
kono
parents:
diff changeset
1372 grid_gridify_all_targets_stmt (gimple_stmt_iterator *gsi,
kono
parents:
diff changeset
1373 bool *handled_ops_p,
kono
parents:
diff changeset
1374 struct walk_stmt_info *incoming)
kono
parents:
diff changeset
1375 {
kono
parents:
diff changeset
1376 *handled_ops_p = false;
kono
parents:
diff changeset
1377
kono
parents:
diff changeset
1378 gimple *stmt = gsi_stmt (*gsi);
kono
parents:
diff changeset
1379 gomp_target *target = dyn_cast <gomp_target *> (stmt);
kono
parents:
diff changeset
1380 if (target)
kono
parents:
diff changeset
1381 {
kono
parents:
diff changeset
1382 gbind *tgt_bind = (gbind *) incoming->info;
kono
parents:
diff changeset
1383 gcc_checking_assert (tgt_bind);
kono
parents:
diff changeset
1384 grid_attempt_target_gridification (target, gsi, tgt_bind);
kono
parents:
diff changeset
1385 return NULL_TREE;
kono
parents:
diff changeset
1386 }
kono
parents:
diff changeset
1387 gbind *bind = dyn_cast <gbind *> (stmt);
kono
parents:
diff changeset
1388 if (bind)
kono
parents:
diff changeset
1389 {
kono
parents:
diff changeset
1390 *handled_ops_p = true;
kono
parents:
diff changeset
1391 struct walk_stmt_info wi;
kono
parents:
diff changeset
1392 memset (&wi, 0, sizeof (wi));
kono
parents:
diff changeset
1393 wi.info = bind;
kono
parents:
diff changeset
1394 walk_gimple_seq_mod (gimple_bind_body_ptr (bind),
kono
parents:
diff changeset
1395 grid_gridify_all_targets_stmt, NULL, &wi);
kono
parents:
diff changeset
1396 }
kono
parents:
diff changeset
1397 return NULL_TREE;
kono
parents:
diff changeset
1398 }
kono
parents:
diff changeset
1399
kono
parents:
diff changeset
1400 /* Attempt to gridify all target constructs in BODY_P. All such targets will
kono
parents:
diff changeset
1401 have their bodies duplicated, with the new copy being put into a
kono
parents:
diff changeset
1402 gimple_omp_grid_body statement. All kernel-related construct within the
kono
parents:
diff changeset
1403 grid_body will be marked with phony flags or kernel kinds. Moreover, some
kono
parents:
diff changeset
1404 re-structuring is often needed, such as copying pre-bodies before the target
kono
parents:
diff changeset
1405 construct so that kernel grid sizes can be computed. */
kono
parents:
diff changeset
1406
kono
parents:
diff changeset
1407 void
kono
parents:
diff changeset
1408 omp_grid_gridify_all_targets (gimple_seq *body_p)
kono
parents:
diff changeset
1409 {
kono
parents:
diff changeset
1410 struct walk_stmt_info wi;
kono
parents:
diff changeset
1411 memset (&wi, 0, sizeof (wi));
kono
parents:
diff changeset
1412 walk_gimple_seq_mod (body_p, grid_gridify_all_targets_stmt, NULL, &wi);
kono
parents:
diff changeset
1413 }