1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
|
/* brig-function.h -- declaration of brig_function class.
Copyright (C) 2016-2019 Free Software Foundation, Inc.
Contributed by Pekka Jaaskelainen <pekka.jaaskelainen@parmance.com>
for General Processor Tech.
This file is part of GCC.
GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.
GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
for more details.
You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3. If not see
<http://www.gnu.org/licenses/>. */
#ifndef BRIG_FUNCTION_H
#define BRIG_FUNCTION_H
#include "config.h"
#include "system.h"
#include "ansidecl.h"
#include "coretypes.h"
#include "opts.h"
#include "tree.h"
#include "tree-iterator.h"
#include "hsa-brig-format.h"
#include "brig-util.h"
#include <map>
#include <string>
#include <vector>
#include <set>
#include "phsa.h"
class brig_to_generic;
typedef std::map<std::string, tree> label_index;
typedef std::map<const BrigDirectiveVariable *, tree> variable_index;
typedef std::vector<tree> tree_stl_vec;
/* Holds data for the currently built GENERIC function. */
class brig_function
{
public:
typedef std::map<const BrigDirectiveVariable *, size_t> var_offset_table;
private:
struct reg_decl_index_entry
{
tree m_var_decl;
};
public:
brig_function (const BrigDirectiveExecutable *exec, brig_to_generic *parent);
~brig_function ();
tree arg_variable (const BrigDirectiveVariable *var) const;
void add_arg_variable (const BrigDirectiveVariable *brigVar, tree treeDecl);
void append_kernel_arg (const BrigDirectiveVariable *var, size_t size,
size_t alignment);
size_t kernel_arg_offset (const BrigDirectiveVariable *var) const;
void add_id_variables ();
tree label (const std::string &name);
tree add_local_variable (std::string name, tree type);
size_t group_variable_segment_offset (const std::string &name) const;
bool has_group_variable (const std::string &name) const;
size_t group_segment_size () const;
tree get_m_var_declfor_reg (const BrigOperandRegister *reg);
bool convert_to_wg_function ();
void add_wi_loop (int dim, tree_stmt_iterator *header_entry,
tree_stmt_iterator *branch_after);
tree emit_metadata (tree stmt_list);
tree emit_launcher_and_metadata ();
tree append_statement (tree stmt);
void create_alloca_frame ();
void finish ();
void finish_kernel ();
void append_return_stmt ();
bool has_function_scope_var (const BrigBase* var) const;
void analyze_calls ();
tree expand_builtin (BrigOpcode16_t brig_opcode, tree_stl_vec &operands);
tree expand_or_call_builtin (BrigOpcode16_t brig_opcode,
BrigType16_t brig_type, tree arith_type,
tree_stl_vec &operands);
bool can_expand_builtin (BrigOpcode16_t brig_opcode) const;
tree get_builtin_for_hsa_opcode (tree type, BrigOpcode16_t brig_opcode,
BrigType16_t brig_type) const;
void unpack (tree value, tree_stl_vec &elements);
tree pack (tree_stl_vec &elements);
tree add_temp_var (std::string name, tree expr);
static bool needs_workitem_context_data (BrigOpcode16_t brig_opcode);
static HOST_WIDE_INT int_constant_value (tree node);
static tree_code get_tree_code_for_hsa_opcode (BrigOpcode16_t brig_opcode,
BrigType16_t brig_type);
void start_new_bb ();
void add_reg_var_update (tree reg_var, tree val);
bool is_id_val (tree reg_var);
tree id_val (tree reg_var);
const BrigDirectiveExecutable *m_brig_def;
bool m_is_kernel;
bool m_is_finished;
std::string m_name;
tree m_current_bind_expr;
tree m_func_decl;
tree m_entry_label_stmt;
tree m_exit_label;
/* The __context function argument. */
tree m_context_arg;
/* The __group_base_ptr argument in the current function.
Points to the start of the group segment for the work-group. */
tree m_group_base_arg;
/* The __group_local_offset_ptr argument in the current function. It
contains the offset related to the group_base_ptr where the function's
local area for group variables resides. */
tree m_group_local_offset_arg;
/* The __private_base_ptr argument in the current function.
Points to the start of the private segment. */
tree m_private_base_arg;
/* The return value variable for the current function. */
tree m_ret_value;
/* The offsets of the kernel arguments in the __arg blob
pointing to the kernel argument space. */
size_t m_next_kernarg_offset;
/* The largest kernel argument variable alignment. */
size_t m_kernarg_max_align;
var_offset_table m_kernarg_offsets;
/* Argument variables in the currently handled binding expression
(argument segment). */
variable_index m_arg_variables;
/* The brig variable for the function return value. */
const BrigDirectiveVariable *m_ret_value_brig_var;
/* The function local temporary variable for the return value. */
tree m_ret_temp;
/* Labels in the current function are collected here so we can refer
to them from jumps before they have been placed to the function. */
label_index m_label_index;
/* If the kernel contains at least one barrier, this is set to true. */
bool m_has_barriers;
/* True if the function has at least one alloca instruction. */
bool m_has_allocas;
/* If the kernel contains at least one function call that _may_
contain a barrier call, this is set to true. */
bool m_has_function_calls_with_barriers;
/* Set to true after this function has been analyzed for barrier and
dispatch packet instruction usage in the final call graph analysis. */
bool m_calls_analyzed;
/* True in case the function was successfully converted to a WG function. */
bool m_is_wg_function;
/* Work-item ID related variables are cached in the entry of the kernel
function in order to use them directly in address computations, leading
to more efficient optimizations. The references to the local variables
are stored here. */
tree m_local_id_vars[3];
tree m_cur_wg_size_vars[3];
tree m_wg_id_vars[3];
tree m_wg_size_vars[3];
tree m_grid_size_vars[3];
/* Explicitly computed WG base for the absolute IDs which is used
as the initial value when looping that dimension. We update
the abs id with ++ to make it easy for the vectorizer. */
tree m_abs_id_base_vars[3];
tree m_abs_id_vars[3];
/* Set to true in case the kernel contains at least one dispatch packet
(work-item ID-related) builtin call that could not be expanded to
tree nodes. */
bool m_has_unexpanded_dp_builtins;
/* Points to the instruction after which the real kernel code starts.
Usually points to the last WI ID variable initialization statement. */
tree_stmt_iterator m_kernel_entry;
/* True if we are currently generating the contents of an arg block. */
bool m_generating_arg_block;
/* A collection of function scope variables seen so far for resolving
variable references vs. module scope declarations. */
std::set<const BrigBase*> m_function_scope_vars;
/* The functions called by this function. */
std::vector<tree> m_called_functions;
/* Stores the kernel scope group variable offsets if the function is
a kernel. */
group_variable_offset_index m_local_group_variables;
brig_to_generic *m_parent;
/* The metadata of the function that should be stored with the binary and
passed to the HSA runtime: */
phsa_descriptor m_descriptor;
private:
tree get_tree_type_for_hsa_reg (const BrigOperandRegister *reg) const;
/* Bookkeeping for the different HSA registers and their tree declarations
for the currently generated function. */
reg_decl_index_entry *m_regs[BRIG_2_TREE_HSAIL_TOTAL_REG_COUNT];
/* Map for keeping book reads of ID variables, which can be propagated
to uses in address expressions to produce cleaner indexing functions
with unnecessary casts stripped off, etc. */
typedef std::map<tree, tree> id_val_map;
/* Keeps track of ID values alive in registers in the currently
processed BB. */
id_val_map m_id_val_defs;
/* HSAIL-specific builtin functions not yet integrated to gcc. */
typedef std::map<std::pair<BrigOpcode16_t, BrigType16_t>, tree> builtin_map;
static builtin_map s_custom_builtins;
};
#endif
|