aboutsummaryrefslogtreecommitdiffstats
path: root/src/gallium/drivers/r600/r600_compiler.h
blob: d3c13b519beab74a5724b1c32616ae4b6c8904d3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
/*
 * Copyright 2010 Jerome Glisse <glisse@freedesktop.org>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * on the rights to use, copy, modify, merge, publish, distribute, sub
 * license, and/or sell copies of the Software, and to permit persons to whom
 * the Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 */
#ifndef R600_COMPILER_H
#define R600_COMPILER_H

struct c_vector;

/* operand are the basic source/destination of each operation */
struct c_channel {
	struct c_channel	*next;
	struct c_channel	*prev;
	unsigned		vindex;		/**< index in vector X,Y,Z,W (0,1,2,3) */
	unsigned		value;		/**< immediate value 32bits */
	struct c_vector		*vector;	/**< vector to which it belongs */
};

/* in GPU world most of the time operand are grouped into vector
 * of 4 component this structure is mostly and handler to group
 * operand into a same vector
 */
struct c_vector {
	struct c_vector		*next;
	struct c_vector		*prev;
	unsigned		id;		/**< vector uniq id */
	unsigned		name;		/**< semantic name */
	unsigned		file;		/**< operand file C_FILE_* */
	int			sid;		/**< semantic id */
	struct c_channel	*channel[4];	/**< operands */
};

#define c_list_init(e) do { (e)->next = e; (e)->prev = e; } while(0)
#define c_list_add(e, h) do { (e)->next = (h)->next; (e)->prev = h;  (h)->next = e; (e)->next->prev = e; } while(0)
#define c_list_add_tail(e, h) do { (e)->next = h; (e)->prev = (h)->prev;  (h)->prev = e; (e)->prev->next = e; } while(0)
#define c_list_del(e) do { (e)->next->prev = (e)->prev; (e)->prev->next = (e)->next; c_list_init(e); } while(0)
#define c_list_for_each(p, h) for (p = (h)->next; p != (h); p = p->next)
#define c_list_for_each_from(p, s, h) for (p = s; p != (h); p = p->next)
#define c_list_for_each_safe(p, n, h) for (p = (h)->next, n = p->next; p != (h); p = n, n = p->next)
#define c_list_empty(h) ((h)->next == h)


#define C_PROGRAM_TYPE_VS	0
#define C_PROGRAM_TYPE_FS	1
#define C_PROGRAM_TYPE_COUNT	2

#define C_NODE_FLAG_ALU		1
#define C_NODE_FLAG_FETCH	2

#define C_SWIZZLE_X		0
#define C_SWIZZLE_Y		1
#define C_SWIZZLE_Z		2
#define C_SWIZZLE_W		3
#define C_SWIZZLE_0		4
#define C_SWIZZLE_1		5
#define C_SWIZZLE_D		6	/**< discard */

#define C_FILE_NULL		0
#define C_FILE_CONSTANT		1
#define C_FILE_INPUT		2
#define C_FILE_OUTPUT		3
#define C_FILE_TEMPORARY	4
#define C_FILE_SAMPLER		5
#define C_FILE_ADDRESS		6
#define C_FILE_IMMEDIATE	7
#define C_FILE_LOOP		8
#define C_FILE_PREDICATE	9
#define C_FILE_SYSTEM_VALUE	10
#define C_FILE_RESOURCE		11
#define C_FILE_COUNT		12

#define C_SEMANTIC_POSITION	0
#define C_SEMANTIC_COLOR	1
#define C_SEMANTIC_BCOLOR	2  /**< back-face color */
#define C_SEMANTIC_FOG		3
#define C_SEMANTIC_PSIZE	4
#define C_SEMANTIC_GENERIC	5
#define C_SEMANTIC_NORMAL	6
#define C_SEMANTIC_FACE		7
#define C_SEMANTIC_EDGEFLAG	8
#define C_SEMANTIC_PRIMID	9
#define C_SEMANTIC_INSTANCEID	10
#define C_SEMANTIC_VERTEXID	11
#define C_SEMANTIC_COUNT	12 /**< number of semantic values */

#define C_OPCODE_ARL		0
#define C_OPCODE_MOV		1
#define C_OPCODE_LIT		2
#define C_OPCODE_RCP		3
#define C_OPCODE_RSQ		4
#define C_OPCODE_EXP		5
#define C_OPCODE_LOG		6
#define C_OPCODE_MUL		7
#define C_OPCODE_ADD		8
#define C_OPCODE_DP3		9
#define C_OPCODE_DP4		10
#define C_OPCODE_DST		11
#define C_OPCODE_MIN		12
#define C_OPCODE_MAX		13
#define C_OPCODE_SLT		14
#define C_OPCODE_SGE		15
#define C_OPCODE_MAD		16
#define C_OPCODE_SUB		17
#define C_OPCODE_LRP		18
#define C_OPCODE_CND		19
/* gap */
#define C_OPCODE_DP2A		21
/* gap */
#define C_OPCODE_FRC		24
#define C_OPCODE_CLAMP		25
#define C_OPCODE_FLR		26
#define C_OPCODE_ROUND		27
#define C_OPCODE_EX2		28
#define C_OPCODE_LG2		29
#define C_OPCODE_POW		30
#define C_OPCODE_XPD		31
/* gap */
#define C_OPCODE_ABS		33
#define C_OPCODE_RCC		34
#define C_OPCODE_DPH		35
#define C_OPCODE_COS		36
#define C_OPCODE_DDX		37
#define C_OPCODE_DDY		38
#define C_OPCODE_KILP		39		/* predicated kill */
#define C_OPCODE_PK2H		40
#define C_OPCODE_PK2US		41
#define C_OPCODE_PK4B		42
#define C_OPCODE_PK4UB		43
#define C_OPCODE_RFL		44
#define C_OPCODE_SEQ		45
#define C_OPCODE_SFL		46
#define C_OPCODE_SGT		47
#define C_OPCODE_SIN		48
#define C_OPCODE_SLE		49
#define C_OPCODE_SNE		50
#define C_OPCODE_STR		51
#define C_OPCODE_TEX		52
#define C_OPCODE_TXD		53
#define C_OPCODE_TXP		54
#define C_OPCODE_UP2H		55
#define C_OPCODE_UP2US		56
#define C_OPCODE_UP4B		57
#define C_OPCODE_UP4UB		58
#define C_OPCODE_X2D		59
#define C_OPCODE_ARA		60
#define C_OPCODE_ARR		61
#define C_OPCODE_BRA		62
#define C_OPCODE_CAL		63
#define C_OPCODE_RET		64
#define C_OPCODE_SSG		65		/* SGN */
#define C_OPCODE_CMP		66
#define C_OPCODE_SCS		67
#define C_OPCODE_TXB		68
#define C_OPCODE_NRM		69
#define C_OPCODE_DIV		70
#define C_OPCODE_DP2		71
#define C_OPCODE_TXL		72
#define C_OPCODE_BRK		73
#define C_OPCODE_IF		74
#define C_OPCODE_BGNFOR		75
#define C_OPCODE_REP		76
#define C_OPCODE_ELSE		77
#define C_OPCODE_ENDIF		78
#define C_OPCODE_ENDFOR		79
#define C_OPCODE_ENDREP		80
#define C_OPCODE_PUSHA		81
#define C_OPCODE_POPA		82
#define C_OPCODE_CEIL		83
#define C_OPCODE_I2F		84
#define C_OPCODE_NOT		85
#define C_OPCODE_TRUNC		86
#define C_OPCODE_SHL		87
/* gap */
#define C_OPCODE_AND		89
#define C_OPCODE_OR		90
#define C_OPCODE_MOD		91
#define C_OPCODE_XOR		92
#define C_OPCODE_SAD		93
#define C_OPCODE_TXF		94
#define C_OPCODE_TXQ		95
#define C_OPCODE_CONT		96
#define C_OPCODE_EMIT		97
#define C_OPCODE_ENDPRIM	98
#define C_OPCODE_BGNLOOP	99
#define C_OPCODE_BGNSUB		100
#define C_OPCODE_ENDLOOP	101
#define C_OPCODE_ENDSUB		102
/* gap */
#define C_OPCODE_NOP		107
/* gap */
#define C_OPCODE_NRM4		112
#define C_OPCODE_CALLNZ		113
#define C_OPCODE_IFC		114
#define C_OPCODE_BREAKC		115
#define C_OPCODE_KIL		116	/* conditional kill */
#define C_OPCODE_END		117	/* aka HALT */
/* gap */
#define C_OPCODE_F2I		119
#define C_OPCODE_IDIV		120
#define C_OPCODE_IMAX		121
#define C_OPCODE_IMIN		122
#define C_OPCODE_INEG		123
#define C_OPCODE_ISGE		124
#define C_OPCODE_ISHR		125
#define C_OPCODE_ISLT		126
#define C_OPCODE_F2U		127
#define C_OPCODE_U2F		128
#define C_OPCODE_UADD		129
#define C_OPCODE_UDIV		130
#define C_OPCODE_UMAD		131
#define C_OPCODE_UMAX		132
#define C_OPCODE_UMIN		133
#define C_OPCODE_UMOD		134
#define C_OPCODE_UMUL		135
#define C_OPCODE_USEQ		136
#define C_OPCODE_USGE		137
#define C_OPCODE_USHR		138
#define C_OPCODE_USLT		139
#define C_OPCODE_USNE		140
#define C_OPCODE_SWITCH		141
#define C_OPCODE_CASE		142
#define C_OPCODE_DEFAULT	143
#define C_OPCODE_ENDSWITCH	144
#define C_OPCODE_VFETCH		145
#define C_OPCODE_ENTRY		146
#define C_OPCODE_LAST		147

#define C_OPERAND_FLAG_ABS		(1 << 0)
#define C_OPERAND_FLAG_NEG		(1 << 1)

struct c_operand {
	struct c_vector		*vector;
	unsigned		swizzle[4];
	unsigned		flag[4];
};

struct c_instruction {
	struct c_instruction	*next, *prev;
	unsigned		opcode;
	unsigned		ninput;
	struct c_operand	input[3];
	struct c_operand	output;
	unsigned		write_mask;
	void			*backend;
};

struct c_node;

struct c_node_link {
	struct c_node_link	*next;
	struct c_node_link	*prev;
	struct c_node		*node;
};

/**
 * struct c_node
 *
 * @next:		all node are in a double linked list, this point to
 * 			next node
 * @next:		all node are in a double linked list, this point to
 * 			previous node
 * @predecessors:	list of all predecessor nodes in the flow graph
 * @successors:		list of all sucessor nodes in the flow graph
 * @parent:		parent node in the depth first walk tree
 * @childs:		child nodes in the depth first walk tree
 */
struct c_node {
	struct c_node		*next, *prev;
	struct c_node_link	predecessors;
	struct c_node_link	successors;
	struct c_node		*parent;
	struct c_node_link	childs;
	struct c_instruction	insts;
	unsigned		opcode;
	unsigned		visited;
	unsigned		done;
	void			*backend;
};

struct c_file {
	unsigned		nvectors;
	struct c_vector		vectors;
};

struct c_shader {
	unsigned			nvectors;
	struct c_file			files[C_FILE_COUNT];
	struct c_node			nodes;
	struct c_node			entry;
	struct c_node			end;
	unsigned			type;
};

int c_shader_init(struct c_shader *shader, unsigned type);
void c_shader_destroy(struct c_shader *shader);
struct c_vector *c_shader_vector_new(struct c_shader *shader, unsigned file, unsigned name, int sid);
int c_shader_build_dominator_tree(struct c_shader *shader);
void c_shader_dump(struct c_shader *shader);

void c_node_init(struct c_node *node);
int c_node_add_new_instruction(struct c_node *node, struct c_instruction *instruction);
int c_node_add_new_instruction_head(struct c_node *node, struct c_instruction *instruction);

/* control flow graph functions */
int c_node_cfg_link(struct c_node *predecessor, struct c_node *successor);
struct c_node *c_node_cfg_new_after(struct c_node *predecessor);
struct c_node *c_shader_cfg_new_node_after(struct c_shader *shader, struct c_node *predecessor);

struct c_vector *c_vector_new(void);

#endif