Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
PojavLauncherTeam
GitHub Repository: PojavLauncherTeam/mesa
Path: blob/21.2-virgl/src/gallium/drivers/r300/compiler/radeon_code.h
4574 views
1
/*
2
* Copyright 2009 Nicolai Hähnle <[email protected]>
3
*
4
* Permission is hereby granted, free of charge, to any person obtaining a
5
* copy of this software and associated documentation files (the "Software"),
6
* to deal in the Software without restriction, including without limitation
7
* on the rights to use, copy, modify, merge, publish, distribute, sub
8
* license, and/or sell copies of the Software, and to permit persons to whom
9
* the Software is furnished to do so, subject to the following conditions:
10
*
11
* The above copyright notice and this permission notice (including the next
12
* paragraph) shall be included in all copies or substantial portions of the
13
* Software.
14
*
15
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18
* THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19
* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20
* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21
* USE OR OTHER DEALINGS IN THE SOFTWARE. */
22
23
#ifndef RADEON_CODE_H
24
#define RADEON_CODE_H
25
26
#include <stdint.h>
27
28
#define R300_PFS_MAX_ALU_INST 64
29
#define R300_PFS_MAX_TEX_INST 32
30
#define R300_PFS_MAX_TEX_INDIRECT 4
31
#define R300_PFS_NUM_TEMP_REGS 32
32
#define R300_PFS_NUM_CONST_REGS 32
33
34
#define R400_PFS_MAX_ALU_INST 512
35
#define R400_PFS_MAX_TEX_INST 512
36
37
#define R500_PFS_MAX_INST 512
38
#define R500_PFS_NUM_TEMP_REGS 128
39
#define R500_PFS_NUM_CONST_REGS 256
40
#define R500_PFS_MAX_BRANCH_DEPTH_FULL 32
41
#define R500_PFS_MAX_BRANCH_DEPTH_PARTIAL 4
42
43
/* The r500 maximum depth is not just for loops, but any combination of loops
44
* and subroutine jumps. */
45
#define R500_PVS_MAX_LOOP_DEPTH 8
46
47
#define STATE_R300_WINDOW_DIMENSION (STATE_INTERNAL_DRIVER+0)
48
49
enum {
50
/**
51
* External constants are constants whose meaning is unknown to this
52
* compiler. For example, a Mesa gl_program's constants are turned
53
* into external constants.
54
*/
55
RC_CONSTANT_EXTERNAL = 0,
56
57
RC_CONSTANT_IMMEDIATE,
58
59
/**
60
* Constant referring to state that is known by this compiler,
61
* see RC_STATE_xxx, i.e. *not* arbitrary Mesa (or other) state.
62
*/
63
RC_CONSTANT_STATE
64
};
65
66
enum {
67
RC_STATE_SHADOW_AMBIENT = 0,
68
69
RC_STATE_R300_WINDOW_DIMENSION,
70
RC_STATE_R300_TEXRECT_FACTOR,
71
RC_STATE_R300_TEXSCALE_FACTOR,
72
RC_STATE_R300_VIEWPORT_SCALE,
73
RC_STATE_R300_VIEWPORT_OFFSET
74
};
75
76
struct rc_constant {
77
unsigned Type:2; /**< RC_CONSTANT_xxx */
78
unsigned Size:3;
79
80
union {
81
unsigned External;
82
float Immediate[4];
83
unsigned State[2];
84
} u;
85
};
86
87
struct rc_constant_list {
88
struct rc_constant * Constants;
89
unsigned Count;
90
91
unsigned _Reserved;
92
};
93
94
void rc_constants_init(struct rc_constant_list * c);
95
void rc_constants_copy(struct rc_constant_list * dst, struct rc_constant_list * src);
96
void rc_constants_destroy(struct rc_constant_list * c);
97
unsigned rc_constants_add(struct rc_constant_list * c, struct rc_constant * constant);
98
unsigned rc_constants_add_state(struct rc_constant_list * c, unsigned state1, unsigned state2);
99
unsigned rc_constants_add_immediate_vec4(struct rc_constant_list * c, const float * data);
100
unsigned rc_constants_add_immediate_scalar(struct rc_constant_list * c, float data, unsigned * swizzle);
101
void rc_constants_print(struct rc_constant_list * c);
102
103
/**
104
* Compare functions.
105
*
106
* \note By design, RC_COMPARE_FUNC_xxx + GL_NEVER gives you
107
* the correct GL compare function.
108
*/
109
typedef enum {
110
RC_COMPARE_FUNC_NEVER = 0,
111
RC_COMPARE_FUNC_LESS,
112
RC_COMPARE_FUNC_EQUAL,
113
RC_COMPARE_FUNC_LEQUAL,
114
RC_COMPARE_FUNC_GREATER,
115
RC_COMPARE_FUNC_NOTEQUAL,
116
RC_COMPARE_FUNC_GEQUAL,
117
RC_COMPARE_FUNC_ALWAYS
118
} rc_compare_func;
119
120
/**
121
* Coordinate wrapping modes.
122
*
123
* These are not quite the same as their GL counterparts yet.
124
*/
125
typedef enum {
126
RC_WRAP_NONE = 0,
127
RC_WRAP_REPEAT,
128
RC_WRAP_MIRRORED_REPEAT,
129
RC_WRAP_MIRRORED_CLAMP
130
} rc_wrap_mode;
131
132
/**
133
* Stores state that influences the compilation of a fragment program.
134
*/
135
struct r300_fragment_program_external_state {
136
struct {
137
/**
138
* This field contains swizzle for some lowering passes
139
* (shadow comparison, unorm->snorm conversion)
140
*/
141
unsigned texture_swizzle:12;
142
143
/**
144
* If the sampler is used as a shadow sampler,
145
* this field specifies the compare function.
146
*
147
* Otherwise, this field is \ref RC_COMPARE_FUNC_NEVER (aka 0).
148
* \sa rc_compare_func
149
*/
150
unsigned texture_compare_func : 3;
151
152
/**
153
* No matter what the sampler type is,
154
* this field turns it into a shadow sampler.
155
*/
156
unsigned compare_mode_enabled : 1;
157
158
/**
159
* If the sampler will receive non-normalized coords,
160
* this field is set. The scaling factor is given by
161
* RC_STATE_R300_TEXRECT_FACTOR.
162
*/
163
unsigned non_normalized_coords : 1;
164
165
/**
166
* This field specifies wrapping modes for the sampler.
167
*
168
* If this field is \ref RC_WRAP_NONE (aka 0), no wrapping maths
169
* will be performed on the coordinates.
170
*/
171
unsigned wrap_mode : 3;
172
173
/**
174
* The coords are scaled after applying the wrap mode emulation
175
* and right before texture fetch. The scaling factor is given by
176
* RC_STATE_R300_TEXSCALE_FACTOR. */
177
unsigned clamp_and_scale_before_fetch : 1;
178
} unit[16];
179
180
unsigned alpha_to_one:1;
181
};
182
183
184
185
struct r300_fragment_program_node {
186
int tex_offset; /**< first tex instruction */
187
int tex_end; /**< last tex instruction, relative to tex_offset */
188
int alu_offset; /**< first ALU instruction */
189
int alu_end; /**< last ALU instruction, relative to alu_offset */
190
int flags;
191
};
192
193
/**
194
* Stores an R300 fragment program in its compiled-to-hardware form.
195
*/
196
struct r300_fragment_program_code {
197
struct {
198
unsigned int length; /**< total # of texture instructions used */
199
uint32_t inst[R400_PFS_MAX_TEX_INST];
200
} tex;
201
202
struct {
203
unsigned int length; /**< total # of ALU instructions used */
204
struct {
205
uint32_t rgb_inst;
206
uint32_t rgb_addr;
207
uint32_t alpha_inst;
208
uint32_t alpha_addr;
209
uint32_t r400_ext_addr;
210
} inst[R400_PFS_MAX_ALU_INST];
211
} alu;
212
213
uint32_t config; /* US_CONFIG */
214
uint32_t pixsize; /* US_PIXSIZE */
215
uint32_t code_offset; /* US_CODE_OFFSET */
216
uint32_t r400_code_offset_ext; /* US_CODE_EXT */
217
uint32_t code_addr[4]; /* US_CODE_ADDR */
218
/*US_CODE_BANK.R390_MODE: Enables 512 instructions and 64 temporaries
219
* for r400 cards */
220
unsigned int r390_mode:1;
221
};
222
223
224
struct r500_fragment_program_code {
225
struct {
226
uint32_t inst0;
227
uint32_t inst1;
228
uint32_t inst2;
229
uint32_t inst3;
230
uint32_t inst4;
231
uint32_t inst5;
232
} inst[R500_PFS_MAX_INST];
233
234
int inst_end; /* Number of instructions - 1; also, last instruction to be executed */
235
236
int max_temp_idx;
237
238
uint32_t us_fc_ctrl;
239
240
uint32_t int_constants[32];
241
uint32_t int_constant_count;
242
};
243
244
struct rX00_fragment_program_code {
245
union {
246
struct r300_fragment_program_code r300;
247
struct r500_fragment_program_code r500;
248
} code;
249
250
unsigned writes_depth:1;
251
252
struct rc_constant_list constants;
253
unsigned *constants_remap_table;
254
};
255
256
257
#define R300_VS_MAX_ALU 256
258
#define R300_VS_MAX_ALU_DWORDS (R300_VS_MAX_ALU * 4)
259
#define R500_VS_MAX_ALU 1024
260
#define R500_VS_MAX_ALU_DWORDS (R500_VS_MAX_ALU * 4)
261
#define R300_VS_MAX_TEMPS 32
262
/* This is the max for all chipsets (r300-r500) */
263
#define R300_VS_MAX_FC_OPS 16
264
#define R300_VS_MAX_LOOP_DEPTH 1
265
266
#define VSF_MAX_INPUTS 32
267
#define VSF_MAX_OUTPUTS 32
268
269
struct r300_vertex_program_code {
270
int length;
271
union {
272
uint32_t d[R500_VS_MAX_ALU_DWORDS];
273
float f[R500_VS_MAX_ALU_DWORDS];
274
} body;
275
276
int pos_end;
277
int num_temporaries; /* Number of temp vars used by program */
278
int inputs[VSF_MAX_INPUTS];
279
int outputs[VSF_MAX_OUTPUTS];
280
281
struct rc_constant_list constants;
282
unsigned *constants_remap_table;
283
284
uint32_t InputsRead;
285
uint32_t OutputsWritten;
286
287
unsigned int num_fc_ops;
288
uint32_t fc_ops;
289
union {
290
uint32_t r300[R300_VS_MAX_FC_OPS];
291
struct {
292
uint32_t lw;
293
uint32_t uw;
294
} r500[R300_VS_MAX_FC_OPS];
295
} fc_op_addrs;
296
int32_t fc_loop_index[R300_VS_MAX_FC_OPS];
297
};
298
299
#endif /* RADEON_CODE_H */
300
301
302