Details | Last modification | View Log | RSS feed
Rev | Author | Line No. | Line |
---|---|---|---|
5563 | serge | 1 | /* |
2 | Copyright (C) Intel Corp. 2006. All Rights Reserved. |
||
3 | Intel funded Tungsten Graphics (http://www.tungstengraphics.com) to |
||
4 | develop this 3D driver. |
||
5 | |||
6 | Permission is hereby granted, free of charge, to any person obtaining |
||
7 | a copy of this software and associated documentation files (the |
||
8 | "Software"), to deal in the Software without restriction, including |
||
9 | without limitation the rights to use, copy, modify, merge, publish, |
||
10 | distribute, sublicense, and/or sell copies of the Software, and to |
||
11 | permit persons to whom the Software is furnished to do so, subject to |
||
12 | the following conditions: |
||
13 | |||
14 | The above copyright notice and this permission notice (including the |
||
15 | next paragraph) shall be included in all copies or substantial |
||
16 | portions of the Software. |
||
17 | |||
18 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, |
||
19 | EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF |
||
20 | MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. |
||
21 | IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE |
||
22 | LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION |
||
23 | OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION |
||
24 | WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
||
25 | |||
26 | **********************************************************************/ |
||
27 | /* |
||
28 | * Authors: |
||
29 | * Keith Whitwell |
||
30 | */ |
||
31 | |||
32 | |||
33 | #include "main/glheader.h" |
||
34 | #include "main/macros.h" |
||
35 | #include "main/enums.h" |
||
36 | |||
37 | #include "intel_batchbuffer.h" |
||
38 | |||
39 | #include "brw_defines.h" |
||
40 | #include "brw_context.h" |
||
41 | #include "brw_eu.h" |
||
42 | #include "brw_util.h" |
||
43 | #include "brw_sf.h" |
||
44 | |||
45 | |||
46 | /** |
||
47 | * Determine the varying corresponding to the given half of the given |
||
48 | * register. half=0 means the first half of a register, half=1 means the |
||
49 | * second half. |
||
50 | */ |
||
51 | static inline int vert_reg_to_varying(struct brw_sf_compile *c, GLuint reg, |
||
52 | int half) |
||
53 | { |
||
54 | int vue_slot = (reg + c->urb_entry_read_offset) * 2 + half; |
||
55 | return c->vue_map.slot_to_varying[vue_slot]; |
||
56 | } |
||
57 | |||
58 | /** |
||
59 | * Determine the register corresponding to the given varying. |
||
60 | */ |
||
61 | static struct brw_reg get_varying(struct brw_sf_compile *c, |
||
62 | struct brw_reg vert, |
||
63 | GLuint varying) |
||
64 | { |
||
65 | int vue_slot = c->vue_map.varying_to_slot[varying]; |
||
66 | assert (vue_slot >= c->urb_entry_read_offset); |
||
67 | GLuint off = vue_slot / 2 - c->urb_entry_read_offset; |
||
68 | GLuint sub = vue_slot % 2; |
||
69 | |||
70 | return brw_vec4_grf(vert.nr + off, sub * 4); |
||
71 | } |
||
72 | |||
73 | static bool |
||
74 | have_attr(struct brw_sf_compile *c, GLuint attr) |
||
75 | { |
||
76 | return (c->key.attrs & BITFIELD64_BIT(attr)) ? 1 : 0; |
||
77 | } |
||
78 | |||
79 | /*********************************************************************** |
||
80 | * Twoside lighting |
||
81 | */ |
||
82 | static void copy_bfc( struct brw_sf_compile *c, |
||
83 | struct brw_reg vert ) |
||
84 | { |
||
85 | struct brw_compile *p = &c->func; |
||
86 | GLuint i; |
||
87 | |||
88 | for (i = 0; i < 2; i++) { |
||
89 | if (have_attr(c, VARYING_SLOT_COL0+i) && |
||
90 | have_attr(c, VARYING_SLOT_BFC0+i)) |
||
91 | brw_MOV(p, |
||
92 | get_varying(c, vert, VARYING_SLOT_COL0+i), |
||
93 | get_varying(c, vert, VARYING_SLOT_BFC0+i)); |
||
94 | } |
||
95 | } |
||
96 | |||
97 | |||
98 | static void do_twoside_color( struct brw_sf_compile *c ) |
||
99 | { |
||
100 | struct brw_compile *p = &c->func; |
||
101 | GLuint backface_conditional = c->key.frontface_ccw ? BRW_CONDITIONAL_G : BRW_CONDITIONAL_L; |
||
102 | |||
103 | /* Already done in clip program: |
||
104 | */ |
||
105 | if (c->key.primitive == SF_UNFILLED_TRIS) |
||
106 | return; |
||
107 | |||
108 | /* XXX: What happens if BFC isn't present? This could only happen |
||
109 | * for user-supplied vertex programs, as t_vp_build.c always does |
||
110 | * the right thing. |
||
111 | */ |
||
112 | if (!(have_attr(c, VARYING_SLOT_COL0) && have_attr(c, VARYING_SLOT_BFC0)) && |
||
113 | !(have_attr(c, VARYING_SLOT_COL1) && have_attr(c, VARYING_SLOT_BFC1))) |
||
114 | return; |
||
115 | |||
116 | /* Need to use BRW_EXECUTE_4 and also do an 4-wide compare in order |
||
117 | * to get all channels active inside the IF. In the clipping code |
||
118 | * we run with NoMask, so it's not an option and we can use |
||
119 | * BRW_EXECUTE_1 for all comparisions. |
||
120 | */ |
||
121 | brw_push_insn_state(p); |
||
122 | brw_CMP(p, vec4(brw_null_reg()), backface_conditional, c->det, brw_imm_f(0)); |
||
123 | brw_IF(p, BRW_EXECUTE_4); |
||
124 | { |
||
125 | switch (c->nr_verts) { |
||
126 | case 3: copy_bfc(c, c->vert[2]); |
||
127 | case 2: copy_bfc(c, c->vert[1]); |
||
128 | case 1: copy_bfc(c, c->vert[0]); |
||
129 | } |
||
130 | } |
||
131 | brw_ENDIF(p); |
||
132 | brw_pop_insn_state(p); |
||
133 | } |
||
134 | |||
135 | |||
136 | |||
137 | /*********************************************************************** |
||
138 | * Flat shading |
||
139 | */ |
||
140 | |||
141 | #define VARYING_SLOT_COLOR_BITS (BITFIELD64_BIT(VARYING_SLOT_COL0) | \ |
||
142 | BITFIELD64_BIT(VARYING_SLOT_COL1)) |
||
143 | |||
144 | static void copy_colors( struct brw_sf_compile *c, |
||
145 | struct brw_reg dst, |
||
146 | struct brw_reg src) |
||
147 | { |
||
148 | struct brw_compile *p = &c->func; |
||
149 | GLuint i; |
||
150 | |||
151 | for (i = VARYING_SLOT_COL0; i <= VARYING_SLOT_COL1; i++) { |
||
152 | if (have_attr(c,i)) |
||
153 | brw_MOV(p, |
||
154 | get_varying(c, dst, i), |
||
155 | get_varying(c, src, i)); |
||
156 | } |
||
157 | } |
||
158 | |||
159 | |||
160 | |||
161 | /* Need to use a computed jump to copy flatshaded attributes as the |
||
162 | * vertices are ordered according to y-coordinate before reaching this |
||
163 | * point, so the PV could be anywhere. |
||
164 | */ |
||
165 | static void do_flatshade_triangle( struct brw_sf_compile *c ) |
||
166 | { |
||
167 | struct brw_compile *p = &c->func; |
||
168 | struct brw_context *brw = p->brw; |
||
169 | struct brw_reg ip = brw_ip_reg(); |
||
170 | GLuint nr = _mesa_bitcount_64(c->key.attrs & VARYING_SLOT_COLOR_BITS); |
||
171 | GLuint jmpi = 1; |
||
172 | |||
173 | if (!nr) |
||
174 | return; |
||
175 | |||
176 | /* Already done in clip program: |
||
177 | */ |
||
178 | if (c->key.primitive == SF_UNFILLED_TRIS) |
||
179 | return; |
||
180 | |||
181 | if (brw->gen == 5) |
||
182 | jmpi = 2; |
||
183 | |||
184 | brw_push_insn_state(p); |
||
185 | |||
186 | brw_MUL(p, c->pv, c->pv, brw_imm_d(jmpi*(nr*2+1))); |
||
187 | brw_JMPI(p, ip, ip, c->pv); |
||
188 | |||
189 | copy_colors(c, c->vert[1], c->vert[0]); |
||
190 | copy_colors(c, c->vert[2], c->vert[0]); |
||
191 | brw_JMPI(p, ip, ip, brw_imm_d(jmpi*(nr*4+1))); |
||
192 | |||
193 | copy_colors(c, c->vert[0], c->vert[1]); |
||
194 | copy_colors(c, c->vert[2], c->vert[1]); |
||
195 | brw_JMPI(p, ip, ip, brw_imm_d(jmpi*nr*2)); |
||
196 | |||
197 | copy_colors(c, c->vert[0], c->vert[2]); |
||
198 | copy_colors(c, c->vert[1], c->vert[2]); |
||
199 | |||
200 | brw_pop_insn_state(p); |
||
201 | } |
||
202 | |||
203 | |||
204 | static void do_flatshade_line( struct brw_sf_compile *c ) |
||
205 | { |
||
206 | struct brw_compile *p = &c->func; |
||
207 | struct brw_context *brw = p->brw; |
||
208 | struct brw_reg ip = brw_ip_reg(); |
||
209 | GLuint nr = _mesa_bitcount_64(c->key.attrs & VARYING_SLOT_COLOR_BITS); |
||
210 | GLuint jmpi = 1; |
||
211 | |||
212 | if (!nr) |
||
213 | return; |
||
214 | |||
215 | /* Already done in clip program: |
||
216 | */ |
||
217 | if (c->key.primitive == SF_UNFILLED_TRIS) |
||
218 | return; |
||
219 | |||
220 | if (brw->gen == 5) |
||
221 | jmpi = 2; |
||
222 | |||
223 | brw_push_insn_state(p); |
||
224 | |||
225 | brw_MUL(p, c->pv, c->pv, brw_imm_d(jmpi*(nr+1))); |
||
226 | brw_JMPI(p, ip, ip, c->pv); |
||
227 | copy_colors(c, c->vert[1], c->vert[0]); |
||
228 | |||
229 | brw_JMPI(p, ip, ip, brw_imm_ud(jmpi*nr)); |
||
230 | copy_colors(c, c->vert[0], c->vert[1]); |
||
231 | |||
232 | brw_pop_insn_state(p); |
||
233 | } |
||
234 | |||
235 | |||
236 | |||
237 | /*********************************************************************** |
||
238 | * Triangle setup. |
||
239 | */ |
||
240 | |||
241 | |||
242 | static void alloc_regs( struct brw_sf_compile *c ) |
||
243 | { |
||
244 | GLuint reg, i; |
||
245 | |||
246 | /* Values computed by fixed function unit: |
||
247 | */ |
||
248 | c->pv = retype(brw_vec1_grf(1, 1), BRW_REGISTER_TYPE_D); |
||
249 | c->det = brw_vec1_grf(1, 2); |
||
250 | c->dx0 = brw_vec1_grf(1, 3); |
||
251 | c->dx2 = brw_vec1_grf(1, 4); |
||
252 | c->dy0 = brw_vec1_grf(1, 5); |
||
253 | c->dy2 = brw_vec1_grf(1, 6); |
||
254 | |||
255 | /* z and 1/w passed in seperately: |
||
256 | */ |
||
257 | c->z[0] = brw_vec1_grf(2, 0); |
||
258 | c->inv_w[0] = brw_vec1_grf(2, 1); |
||
259 | c->z[1] = brw_vec1_grf(2, 2); |
||
260 | c->inv_w[1] = brw_vec1_grf(2, 3); |
||
261 | c->z[2] = brw_vec1_grf(2, 4); |
||
262 | c->inv_w[2] = brw_vec1_grf(2, 5); |
||
263 | |||
264 | /* The vertices: |
||
265 | */ |
||
266 | reg = 3; |
||
267 | for (i = 0; i < c->nr_verts; i++) { |
||
268 | c->vert[i] = brw_vec8_grf(reg, 0); |
||
269 | reg += c->nr_attr_regs; |
||
270 | } |
||
271 | |||
272 | /* Temporaries, allocated after last vertex reg. |
||
273 | */ |
||
274 | c->inv_det = brw_vec1_grf(reg, 0); reg++; |
||
275 | c->a1_sub_a0 = brw_vec8_grf(reg, 0); reg++; |
||
276 | c->a2_sub_a0 = brw_vec8_grf(reg, 0); reg++; |
||
277 | c->tmp = brw_vec8_grf(reg, 0); reg++; |
||
278 | |||
279 | /* Note grf allocation: |
||
280 | */ |
||
281 | c->prog_data.total_grf = reg; |
||
282 | |||
283 | |||
284 | /* Outputs of this program - interpolation coefficients for |
||
285 | * rasterization: |
||
286 | */ |
||
287 | c->m1Cx = brw_vec8_reg(BRW_MESSAGE_REGISTER_FILE, 1, 0); |
||
288 | c->m2Cy = brw_vec8_reg(BRW_MESSAGE_REGISTER_FILE, 2, 0); |
||
289 | c->m3C0 = brw_vec8_reg(BRW_MESSAGE_REGISTER_FILE, 3, 0); |
||
290 | } |
||
291 | |||
292 | |||
293 | static void copy_z_inv_w( struct brw_sf_compile *c ) |
||
294 | { |
||
295 | struct brw_compile *p = &c->func; |
||
296 | GLuint i; |
||
297 | |||
298 | brw_push_insn_state(p); |
||
299 | |||
300 | /* Copy both scalars with a single MOV: |
||
301 | */ |
||
302 | for (i = 0; i < c->nr_verts; i++) |
||
303 | brw_MOV(p, vec2(suboffset(c->vert[i], 2)), vec2(c->z[i])); |
||
304 | |||
305 | brw_pop_insn_state(p); |
||
306 | } |
||
307 | |||
308 | |||
309 | static void invert_det( struct brw_sf_compile *c) |
||
310 | { |
||
311 | /* Looks like we invert all 8 elements just to get 1/det in |
||
312 | * position 2 !?! |
||
313 | */ |
||
314 | brw_math(&c->func, |
||
315 | c->inv_det, |
||
316 | BRW_MATH_FUNCTION_INV, |
||
317 | 0, |
||
318 | c->det, |
||
319 | BRW_MATH_DATA_SCALAR, |
||
320 | BRW_MATH_PRECISION_FULL); |
||
321 | |||
322 | } |
||
323 | |||
324 | |||
325 | static bool |
||
326 | calculate_masks(struct brw_sf_compile *c, |
||
327 | GLuint reg, |
||
328 | GLushort *pc, |
||
329 | GLushort *pc_persp, |
||
330 | GLushort *pc_linear) |
||
331 | { |
||
332 | bool is_last_attr = (reg == c->nr_setup_regs - 1); |
||
333 | GLbitfield64 persp_mask; |
||
334 | GLbitfield64 linear_mask; |
||
335 | |||
336 | if (c->key.do_flat_shading) |
||
337 | persp_mask = c->key.attrs & ~(BITFIELD64_BIT(VARYING_SLOT_POS) | |
||
338 | BITFIELD64_BIT(VARYING_SLOT_COL0) | |
||
339 | BITFIELD64_BIT(VARYING_SLOT_COL1)); |
||
340 | else |
||
341 | persp_mask = c->key.attrs & ~(BITFIELD64_BIT(VARYING_SLOT_POS)); |
||
342 | |||
343 | if (c->key.do_flat_shading) |
||
344 | linear_mask = c->key.attrs & ~(BITFIELD64_BIT(VARYING_SLOT_COL0) | |
||
345 | BITFIELD64_BIT(VARYING_SLOT_COL1)); |
||
346 | else |
||
347 | linear_mask = c->key.attrs; |
||
348 | |||
349 | *pc_persp = 0; |
||
350 | *pc_linear = 0; |
||
351 | *pc = 0xf; |
||
352 | |||
353 | if (persp_mask & BITFIELD64_BIT(vert_reg_to_varying(c, reg, 0))) |
||
354 | *pc_persp = 0xf; |
||
355 | |||
356 | if (linear_mask & BITFIELD64_BIT(vert_reg_to_varying(c, reg, 0))) |
||
357 | *pc_linear = 0xf; |
||
358 | |||
359 | /* Maybe only processs one attribute on the final round: |
||
360 | */ |
||
361 | if (vert_reg_to_varying(c, reg, 1) != BRW_VARYING_SLOT_COUNT) { |
||
362 | *pc |= 0xf0; |
||
363 | |||
364 | if (persp_mask & BITFIELD64_BIT(vert_reg_to_varying(c, reg, 1))) |
||
365 | *pc_persp |= 0xf0; |
||
366 | |||
367 | if (linear_mask & BITFIELD64_BIT(vert_reg_to_varying(c, reg, 1))) |
||
368 | *pc_linear |= 0xf0; |
||
369 | } |
||
370 | |||
371 | return is_last_attr; |
||
372 | } |
||
373 | |||
374 | /* Calculates the predicate control for which channels of a reg |
||
375 | * (containing 2 attrs) to do point sprite coordinate replacement on. |
||
376 | */ |
||
377 | static uint16_t |
||
378 | calculate_point_sprite_mask(struct brw_sf_compile *c, GLuint reg) |
||
379 | { |
||
380 | int varying1, varying2; |
||
381 | uint16_t pc = 0; |
||
382 | |||
383 | varying1 = vert_reg_to_varying(c, reg, 0); |
||
384 | if (varying1 >= VARYING_SLOT_TEX0 && varying1 <= VARYING_SLOT_TEX7) { |
||
385 | if (c->key.point_sprite_coord_replace & (1 << (varying1 - VARYING_SLOT_TEX0))) |
||
386 | pc |= 0x0f; |
||
387 | } |
||
388 | if (varying1 == BRW_VARYING_SLOT_PNTC) |
||
389 | pc |= 0x0f; |
||
390 | |||
391 | varying2 = vert_reg_to_varying(c, reg, 1); |
||
392 | if (varying2 >= VARYING_SLOT_TEX0 && varying2 <= VARYING_SLOT_TEX7) { |
||
393 | if (c->key.point_sprite_coord_replace & (1 << (varying2 - |
||
394 | VARYING_SLOT_TEX0))) |
||
395 | pc |= 0xf0; |
||
396 | } |
||
397 | if (varying2 == BRW_VARYING_SLOT_PNTC) |
||
398 | pc |= 0xf0; |
||
399 | |||
400 | return pc; |
||
401 | } |
||
402 | |||
403 | |||
404 | |||
405 | void brw_emit_tri_setup(struct brw_sf_compile *c, bool allocate) |
||
406 | { |
||
407 | struct brw_compile *p = &c->func; |
||
408 | GLuint i; |
||
409 | |||
410 | c->nr_verts = 3; |
||
411 | |||
412 | if (allocate) |
||
413 | alloc_regs(c); |
||
414 | |||
415 | invert_det(c); |
||
416 | copy_z_inv_w(c); |
||
417 | |||
418 | if (c->key.do_twoside_color) |
||
419 | do_twoside_color(c); |
||
420 | |||
421 | if (c->key.do_flat_shading) |
||
422 | do_flatshade_triangle(c); |
||
423 | |||
424 | |||
425 | for (i = 0; i < c->nr_setup_regs; i++) |
||
426 | { |
||
427 | /* Pair of incoming attributes: |
||
428 | */ |
||
429 | struct brw_reg a0 = offset(c->vert[0], i); |
||
430 | struct brw_reg a1 = offset(c->vert[1], i); |
||
431 | struct brw_reg a2 = offset(c->vert[2], i); |
||
432 | GLushort pc, pc_persp, pc_linear; |
||
433 | bool last = calculate_masks(c, i, &pc, &pc_persp, &pc_linear); |
||
434 | |||
435 | if (pc_persp) |
||
436 | { |
||
437 | brw_set_predicate_control_flag_value(p, pc_persp); |
||
438 | brw_MUL(p, a0, a0, c->inv_w[0]); |
||
439 | brw_MUL(p, a1, a1, c->inv_w[1]); |
||
440 | brw_MUL(p, a2, a2, c->inv_w[2]); |
||
441 | } |
||
442 | |||
443 | |||
444 | /* Calculate coefficients for interpolated values: |
||
445 | */ |
||
446 | if (pc_linear) |
||
447 | { |
||
448 | brw_set_predicate_control_flag_value(p, pc_linear); |
||
449 | |||
450 | brw_ADD(p, c->a1_sub_a0, a1, negate(a0)); |
||
451 | brw_ADD(p, c->a2_sub_a0, a2, negate(a0)); |
||
452 | |||
453 | /* calculate dA/dx |
||
454 | */ |
||
455 | brw_MUL(p, brw_null_reg(), c->a1_sub_a0, c->dy2); |
||
456 | brw_MAC(p, c->tmp, c->a2_sub_a0, negate(c->dy0)); |
||
457 | brw_MUL(p, c->m1Cx, c->tmp, c->inv_det); |
||
458 | |||
459 | /* calculate dA/dy |
||
460 | */ |
||
461 | brw_MUL(p, brw_null_reg(), c->a2_sub_a0, c->dx0); |
||
462 | brw_MAC(p, c->tmp, c->a1_sub_a0, negate(c->dx2)); |
||
463 | brw_MUL(p, c->m2Cy, c->tmp, c->inv_det); |
||
464 | } |
||
465 | |||
466 | { |
||
467 | brw_set_predicate_control_flag_value(p, pc); |
||
468 | /* start point for interpolation |
||
469 | */ |
||
470 | brw_MOV(p, c->m3C0, a0); |
||
471 | |||
472 | /* Copy m0..m3 to URB. m0 is implicitly copied from r0 in |
||
473 | * the send instruction: |
||
474 | */ |
||
475 | brw_urb_WRITE(p, |
||
476 | brw_null_reg(), |
||
477 | 0, |
||
478 | brw_vec8_grf(0, 0), /* r0, will be copied to m0 */ |
||
479 | 0, /* allocate */ |
||
480 | 1, /* used */ |
||
481 | 4, /* msg len */ |
||
482 | 0, /* response len */ |
||
483 | last, /* eot */ |
||
484 | last, /* writes complete */ |
||
485 | i*4, /* offset */ |
||
486 | BRW_URB_SWIZZLE_TRANSPOSE); /* XXX: Swizzle control "SF to windower" */ |
||
487 | } |
||
488 | } |
||
489 | } |
||
490 | |||
491 | |||
492 | |||
493 | void brw_emit_line_setup(struct brw_sf_compile *c, bool allocate) |
||
494 | { |
||
495 | struct brw_compile *p = &c->func; |
||
496 | GLuint i; |
||
497 | |||
498 | |||
499 | c->nr_verts = 2; |
||
500 | |||
501 | if (allocate) |
||
502 | alloc_regs(c); |
||
503 | |||
504 | invert_det(c); |
||
505 | copy_z_inv_w(c); |
||
506 | |||
507 | if (c->key.do_flat_shading) |
||
508 | do_flatshade_line(c); |
||
509 | |||
510 | for (i = 0; i < c->nr_setup_regs; i++) |
||
511 | { |
||
512 | /* Pair of incoming attributes: |
||
513 | */ |
||
514 | struct brw_reg a0 = offset(c->vert[0], i); |
||
515 | struct brw_reg a1 = offset(c->vert[1], i); |
||
516 | GLushort pc, pc_persp, pc_linear; |
||
517 | bool last = calculate_masks(c, i, &pc, &pc_persp, &pc_linear); |
||
518 | |||
519 | if (pc_persp) |
||
520 | { |
||
521 | brw_set_predicate_control_flag_value(p, pc_persp); |
||
522 | brw_MUL(p, a0, a0, c->inv_w[0]); |
||
523 | brw_MUL(p, a1, a1, c->inv_w[1]); |
||
524 | } |
||
525 | |||
526 | /* Calculate coefficients for position, color: |
||
527 | */ |
||
528 | if (pc_linear) { |
||
529 | brw_set_predicate_control_flag_value(p, pc_linear); |
||
530 | |||
531 | brw_ADD(p, c->a1_sub_a0, a1, negate(a0)); |
||
532 | |||
533 | brw_MUL(p, c->tmp, c->a1_sub_a0, c->dx0); |
||
534 | brw_MUL(p, c->m1Cx, c->tmp, c->inv_det); |
||
535 | |||
536 | brw_MUL(p, c->tmp, c->a1_sub_a0, c->dy0); |
||
537 | brw_MUL(p, c->m2Cy, c->tmp, c->inv_det); |
||
538 | } |
||
539 | |||
540 | { |
||
541 | brw_set_predicate_control_flag_value(p, pc); |
||
542 | |||
543 | /* start point for interpolation |
||
544 | */ |
||
545 | brw_MOV(p, c->m3C0, a0); |
||
546 | |||
547 | /* Copy m0..m3 to URB. |
||
548 | */ |
||
549 | brw_urb_WRITE(p, |
||
550 | brw_null_reg(), |
||
551 | 0, |
||
552 | brw_vec8_grf(0, 0), |
||
553 | 0, /* allocate */ |
||
554 | 1, /* used */ |
||
555 | 4, /* msg len */ |
||
556 | 0, /* response len */ |
||
557 | last, /* eot */ |
||
558 | last, /* writes complete */ |
||
559 | i*4, /* urb destination offset */ |
||
560 | BRW_URB_SWIZZLE_TRANSPOSE); |
||
561 | } |
||
562 | } |
||
563 | } |
||
564 | |||
565 | void brw_emit_point_sprite_setup(struct brw_sf_compile *c, bool allocate) |
||
566 | { |
||
567 | struct brw_compile *p = &c->func; |
||
568 | GLuint i; |
||
569 | |||
570 | c->nr_verts = 1; |
||
571 | |||
572 | if (allocate) |
||
573 | alloc_regs(c); |
||
574 | |||
575 | copy_z_inv_w(c); |
||
576 | for (i = 0; i < c->nr_setup_regs; i++) |
||
577 | { |
||
578 | struct brw_reg a0 = offset(c->vert[0], i); |
||
579 | GLushort pc, pc_persp, pc_linear, pc_coord_replace; |
||
580 | bool last = calculate_masks(c, i, &pc, &pc_persp, &pc_linear); |
||
581 | |||
582 | pc_coord_replace = calculate_point_sprite_mask(c, i); |
||
583 | pc_persp &= ~pc_coord_replace; |
||
584 | |||
585 | if (pc_persp) { |
||
586 | brw_set_predicate_control_flag_value(p, pc_persp); |
||
587 | brw_MUL(p, a0, a0, c->inv_w[0]); |
||
588 | } |
||
589 | |||
590 | /* Point sprite coordinate replacement: A texcoord with this |
||
591 | * enabled gets replaced with the value (x, y, 0, 1) where x and |
||
592 | * y vary from 0 to 1 across the horizontal and vertical of the |
||
593 | * point. |
||
594 | */ |
||
595 | if (pc_coord_replace) { |
||
596 | brw_set_predicate_control_flag_value(p, pc_coord_replace); |
||
597 | /* Caculate 1.0/PointWidth */ |
||
598 | brw_math(&c->func, |
||
599 | c->tmp, |
||
600 | BRW_MATH_FUNCTION_INV, |
||
601 | 0, |
||
602 | c->dx0, |
||
603 | BRW_MATH_DATA_SCALAR, |
||
604 | BRW_MATH_PRECISION_FULL); |
||
605 | |||
606 | brw_set_access_mode(p, BRW_ALIGN_16); |
||
607 | |||
608 | /* dA/dx, dA/dy */ |
||
609 | brw_MOV(p, c->m1Cx, brw_imm_f(0.0)); |
||
610 | brw_MOV(p, c->m2Cy, brw_imm_f(0.0)); |
||
611 | brw_MOV(p, brw_writemask(c->m1Cx, WRITEMASK_X), c->tmp); |
||
612 | if (c->key.sprite_origin_lower_left) { |
||
613 | brw_MOV(p, brw_writemask(c->m2Cy, WRITEMASK_Y), negate(c->tmp)); |
||
614 | } else { |
||
615 | brw_MOV(p, brw_writemask(c->m2Cy, WRITEMASK_Y), c->tmp); |
||
616 | } |
||
617 | |||
618 | /* attribute constant offset */ |
||
619 | brw_MOV(p, c->m3C0, brw_imm_f(0.0)); |
||
620 | if (c->key.sprite_origin_lower_left) { |
||
621 | brw_MOV(p, brw_writemask(c->m3C0, WRITEMASK_YW), brw_imm_f(1.0)); |
||
622 | } else { |
||
623 | brw_MOV(p, brw_writemask(c->m3C0, WRITEMASK_W), brw_imm_f(1.0)); |
||
624 | } |
||
625 | |||
626 | brw_set_access_mode(p, BRW_ALIGN_1); |
||
627 | } |
||
628 | |||
629 | if (pc & ~pc_coord_replace) { |
||
630 | brw_set_predicate_control_flag_value(p, pc & ~pc_coord_replace); |
||
631 | brw_MOV(p, c->m1Cx, brw_imm_ud(0)); |
||
632 | brw_MOV(p, c->m2Cy, brw_imm_ud(0)); |
||
633 | brw_MOV(p, c->m3C0, a0); /* constant value */ |
||
634 | } |
||
635 | |||
636 | |||
637 | brw_set_predicate_control_flag_value(p, pc); |
||
638 | /* Copy m0..m3 to URB. */ |
||
639 | brw_urb_WRITE(p, |
||
640 | brw_null_reg(), |
||
641 | 0, |
||
642 | brw_vec8_grf(0, 0), |
||
643 | 0, /* allocate */ |
||
644 | 1, /* used */ |
||
645 | 4, /* msg len */ |
||
646 | 0, /* response len */ |
||
647 | last, /* eot */ |
||
648 | last, /* writes complete */ |
||
649 | i*4, /* urb destination offset */ |
||
650 | BRW_URB_SWIZZLE_TRANSPOSE); |
||
651 | } |
||
652 | } |
||
653 | |||
654 | /* Points setup - several simplifications as all attributes are |
||
655 | * constant across the face of the point (point sprites excluded!) |
||
656 | */ |
||
657 | void brw_emit_point_setup(struct brw_sf_compile *c, bool allocate) |
||
658 | { |
||
659 | struct brw_compile *p = &c->func; |
||
660 | GLuint i; |
||
661 | |||
662 | c->nr_verts = 1; |
||
663 | |||
664 | if (allocate) |
||
665 | alloc_regs(c); |
||
666 | |||
667 | copy_z_inv_w(c); |
||
668 | |||
669 | brw_MOV(p, c->m1Cx, brw_imm_ud(0)); /* zero - move out of loop */ |
||
670 | brw_MOV(p, c->m2Cy, brw_imm_ud(0)); /* zero - move out of loop */ |
||
671 | |||
672 | for (i = 0; i < c->nr_setup_regs; i++) |
||
673 | { |
||
674 | struct brw_reg a0 = offset(c->vert[0], i); |
||
675 | GLushort pc, pc_persp, pc_linear; |
||
676 | bool last = calculate_masks(c, i, &pc, &pc_persp, &pc_linear); |
||
677 | |||
678 | if (pc_persp) |
||
679 | { |
||
680 | /* This seems odd as the values are all constant, but the |
||
681 | * fragment shader will be expecting it: |
||
682 | */ |
||
683 | brw_set_predicate_control_flag_value(p, pc_persp); |
||
684 | brw_MUL(p, a0, a0, c->inv_w[0]); |
||
685 | } |
||
686 | |||
687 | |||
688 | /* The delta values are always zero, just send the starting |
||
689 | * coordinate. Again, this is to fit in with the interpolation |
||
690 | * code in the fragment shader. |
||
691 | */ |
||
692 | { |
||
693 | brw_set_predicate_control_flag_value(p, pc); |
||
694 | |||
695 | brw_MOV(p, c->m3C0, a0); /* constant value */ |
||
696 | |||
697 | /* Copy m0..m3 to URB. |
||
698 | */ |
||
699 | brw_urb_WRITE(p, |
||
700 | brw_null_reg(), |
||
701 | 0, |
||
702 | brw_vec8_grf(0, 0), |
||
703 | 0, /* allocate */ |
||
704 | 1, /* used */ |
||
705 | 4, /* msg len */ |
||
706 | 0, /* response len */ |
||
707 | last, /* eot */ |
||
708 | last, /* writes complete */ |
||
709 | i*4, /* urb destination offset */ |
||
710 | BRW_URB_SWIZZLE_TRANSPOSE); |
||
711 | } |
||
712 | } |
||
713 | } |
||
714 | |||
715 | void brw_emit_anyprim_setup( struct brw_sf_compile *c ) |
||
716 | { |
||
717 | struct brw_compile *p = &c->func; |
||
718 | struct brw_reg ip = brw_ip_reg(); |
||
719 | struct brw_reg payload_prim = brw_uw1_reg(BRW_GENERAL_REGISTER_FILE, 1, 0); |
||
720 | struct brw_reg payload_attr = get_element_ud(brw_vec1_reg(BRW_GENERAL_REGISTER_FILE, 1, 0), 0); |
||
721 | struct brw_reg primmask; |
||
722 | int jmp; |
||
723 | struct brw_reg v1_null_ud = vec1(retype(brw_null_reg(), BRW_REGISTER_TYPE_UD)); |
||
724 | |||
725 | GLuint saveflag; |
||
726 | |||
727 | c->nr_verts = 3; |
||
728 | alloc_regs(c); |
||
729 | |||
730 | primmask = retype(get_element(c->tmp, 0), BRW_REGISTER_TYPE_UD); |
||
731 | |||
732 | brw_MOV(p, primmask, brw_imm_ud(1)); |
||
733 | brw_SHL(p, primmask, primmask, payload_prim); |
||
734 | |||
735 | brw_set_conditionalmod(p, BRW_CONDITIONAL_Z); |
||
736 | brw_AND(p, v1_null_ud, primmask, brw_imm_ud((1<<_3DPRIM_TRILIST) | |
||
737 | (1<<_3DPRIM_TRISTRIP) | |
||
738 | (1<<_3DPRIM_TRIFAN) | |
||
739 | (1<<_3DPRIM_TRISTRIP_REVERSE) | |
||
740 | (1<<_3DPRIM_POLYGON) | |
||
741 | (1<<_3DPRIM_RECTLIST) | |
||
742 | (1<<_3DPRIM_TRIFAN_NOSTIPPLE))); |
||
743 | jmp = brw_JMPI(p, ip, ip, brw_imm_d(0)) - p->store; |
||
744 | { |
||
745 | saveflag = p->flag_value; |
||
746 | brw_push_insn_state(p); |
||
747 | brw_emit_tri_setup( c, false ); |
||
748 | brw_pop_insn_state(p); |
||
749 | p->flag_value = saveflag; |
||
750 | /* note - thread killed in subroutine, so must |
||
751 | * restore the flag which is changed when building |
||
752 | * the subroutine. fix #13240 |
||
753 | */ |
||
754 | } |
||
755 | brw_land_fwd_jump(p, jmp); |
||
756 | |||
757 | brw_set_conditionalmod(p, BRW_CONDITIONAL_Z); |
||
758 | brw_AND(p, v1_null_ud, primmask, brw_imm_ud((1<<_3DPRIM_LINELIST) | |
||
759 | (1<<_3DPRIM_LINESTRIP) | |
||
760 | (1<<_3DPRIM_LINELOOP) | |
||
761 | (1<<_3DPRIM_LINESTRIP_CONT) | |
||
762 | (1<<_3DPRIM_LINESTRIP_BF) | |
||
763 | (1<<_3DPRIM_LINESTRIP_CONT_BF))); |
||
764 | jmp = brw_JMPI(p, ip, ip, brw_imm_d(0)) - p->store; |
||
765 | { |
||
766 | saveflag = p->flag_value; |
||
767 | brw_push_insn_state(p); |
||
768 | brw_emit_line_setup( c, false ); |
||
769 | brw_pop_insn_state(p); |
||
770 | p->flag_value = saveflag; |
||
771 | /* note - thread killed in subroutine */ |
||
772 | } |
||
773 | brw_land_fwd_jump(p, jmp); |
||
774 | |||
775 | brw_set_conditionalmod(p, BRW_CONDITIONAL_Z); |
||
776 | brw_AND(p, v1_null_ud, payload_attr, brw_imm_ud(1< |
||
777 | jmp = brw_JMPI(p, ip, ip, brw_imm_d(0)) - p->store; |
||
778 | { |
||
779 | saveflag = p->flag_value; |
||
780 | brw_push_insn_state(p); |
||
781 | brw_emit_point_sprite_setup( c, false ); |
||
782 | brw_pop_insn_state(p); |
||
783 | p->flag_value = saveflag; |
||
784 | } |
||
785 | brw_land_fwd_jump(p, jmp); |
||
786 | |||
787 | brw_emit_point_setup( c, false ); |
||
788 | } |
||
789 | |||
790 | |||
791 | |||
792 |