2 * Mesa 3-D graphics library
4 * Copyright (C) 2013 LunarG, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included
14 * in all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22 * DEALINGS IN THE SOFTWARE.
25 * Chia-I Wu <olv@lunarg.com>
28 #include "util/u_dual_blend.h"
29 #include "intel_reg.h"
31 #include "ilo_common.h"
32 #include "ilo_context.h"
34 #include "ilo_gpe_gen7.h"
35 #include "ilo_shader.h"
36 #include "ilo_state.h"
37 #include "ilo_3d_pipeline.h"
38 #include "ilo_3d_pipeline_gen6.h"
39 #include "ilo_3d_pipeline_gen7.h"
42 gen7_wa_pipe_control_cs_stall(struct ilo_3d_pipeline *p,
43 bool change_multisample_state,
44 bool change_depth_state)
46 struct intel_bo *bo = NULL;
47 uint32_t dw1 = PIPE_CONTROL_CS_STALL;
49 assert(p->dev->gen == ILO_GEN(7));
52 if (p->state.has_gen6_wa_pipe_control)
54 p->state.has_gen6_wa_pipe_control = true;
57 * From the Ivy Bridge PRM, volume 2 part 1, page 258:
59 * "Due to an HW issue driver needs to send a pipe control with stall
60 * when ever there is state change in depth bias related state"
62 * From the Ivy Bridge PRM, volume 2 part 1, page 292:
64 * "A PIPE_CONTOL command with the CS Stall bit set must be programmed
65 * in the ring after this instruction
66 * (3DSTATE_PUSH_CONSTANT_ALLOC_PS)."
68 * From the Ivy Bridge PRM, volume 2 part 1, page 304:
70 * "Driver must ierarchi that all the caches in the depth pipe are
71 * flushed before this command (3DSTATE_MULTISAMPLE) is parsed. This
72 * requires driver to send a PIPE_CONTROL with a CS stall along with a
73 * Depth Flush prior to this command.
75 * From the Ivy Bridge PRM, volume 2 part 1, page 315:
77 * "Driver must send a least one PIPE_CONTROL command with CS Stall and
78 * a post sync operation prior to the group of depth
79 * commands(3DSTATE_DEPTH_BUFFER, 3DSTATE_CLEAR_PARAMS,
80 * 3DSTATE_STENCIL_BUFFER, and 3DSTATE_HIER_DEPTH_BUFFER)."
83 if (change_multisample_state)
84 dw1 |= PIPE_CONTROL_DEPTH_CACHE_FLUSH;
86 if (change_depth_state) {
87 dw1 |= PIPE_CONTROL_WRITE_IMMEDIATE;
88 bo = p->workaround_bo;
91 p->gen6_PIPE_CONTROL(p->dev, dw1, bo, 0, false, p->cp);
95 gen7_wa_pipe_control_vs_depth_stall(struct ilo_3d_pipeline *p)
97 assert(p->dev->gen == ILO_GEN(7));
100 * From the Ivy Bridge PRM, volume 2 part 1, page 106:
102 * "A PIPE_CONTROL with Post-Sync Operation set to 1h and a depth stall
103 * needs to be sent just prior to any 3DSTATE_VS, 3DSTATE_URB_VS,
104 * 3DSTATE_CONSTANT_VS, 3DSTATE_BINDING_TABLE_POINTER_VS,
105 * 3DSTATE_SAMPLER_STATE_POINTER_VS command. Only one PIPE_CONTROL
106 * needs to be sent before any combination of VS associated 3DSTATE."
108 p->gen6_PIPE_CONTROL(p->dev,
109 PIPE_CONTROL_DEPTH_STALL |
110 PIPE_CONTROL_WRITE_IMMEDIATE,
111 p->workaround_bo, 0, false, p->cp);
115 gen7_wa_pipe_control_wm_depth_stall(struct ilo_3d_pipeline *p,
116 bool change_depth_buffer)
118 assert(p->dev->gen == ILO_GEN(7));
121 * From the Ivy Bridge PRM, volume 2 part 1, page 276:
123 * "The driver must make sure a PIPE_CONTROL with the Depth Stall
124 * Enable bit set after all the following states are programmed:
127 * * 3DSTATE_VIEWPORT_STATE_POINTERS_CC
128 * * 3DSTATE_CONSTANT_PS
129 * * 3DSTATE_BINDING_TABLE_POINTERS_PS
130 * * 3DSTATE_SAMPLER_STATE_POINTERS_PS
131 * * 3DSTATE_CC_STATE_POINTERS
132 * * 3DSTATE_BLEND_STATE_POINTERS
133 * * 3DSTATE_DEPTH_STENCIL_STATE_POINTERS"
135 * From the Ivy Bridge PRM, volume 2 part 1, page 315:
137 * "Restriction: Prior to changing Depth/Stencil Buffer state (i.e.,
138 * any combination of 3DSTATE_DEPTH_BUFFER, 3DSTATE_CLEAR_PARAMS,
139 * 3DSTATE_STENCIL_BUFFER, 3DSTATE_HIER_DEPTH_BUFFER) SW must first
140 * issue a pipelined depth stall (PIPE_CONTROL with Depth Stall bit
141 * set), followed by a pipelined depth cache flush (PIPE_CONTROL with
142 * Depth Flush Bit set, followed by another pipelined depth stall
143 * (PIPE_CONTROL with Depth Stall Bit set), unless SW can otherwise
144 * guarantee that the pipeline from WM onwards is already flushed
145 * (e.g., via a preceding MI_FLUSH)."
147 p->gen6_PIPE_CONTROL(p->dev,
148 PIPE_CONTROL_DEPTH_STALL,
149 NULL, 0, false, p->cp);
151 if (!change_depth_buffer)
154 p->gen6_PIPE_CONTROL(p->dev,
155 PIPE_CONTROL_DEPTH_CACHE_FLUSH,
156 NULL, 0, false, p->cp);
158 p->gen6_PIPE_CONTROL(p->dev,
159 PIPE_CONTROL_DEPTH_STALL,
160 NULL, 0, false, p->cp);
164 gen7_wa_pipe_control_wm_max_threads_stall(struct ilo_3d_pipeline *p)
166 assert(p->dev->gen == ILO_GEN(7));
169 * From the Ivy Bridge PRM, volume 2 part 1, page 286:
171 * "If this field (Maximum Number of Threads in 3DSTATE_WM) is changed
172 * between 3DPRIMITIVE commands, a PIPE_CONTROL command with Stall at
173 * Pixel Scoreboard set is required to be issued."
175 p->gen6_PIPE_CONTROL(p->dev,
176 PIPE_CONTROL_STALL_AT_SCOREBOARD,
177 NULL, 0, false, p->cp);
181 #define DIRTY(state) (session->pipe_dirty & ILO_DIRTY_ ## state)
184 gen7_pipeline_common_urb(struct ilo_3d_pipeline *p,
185 const struct ilo_context *ilo,
186 struct gen6_pipeline_session *session)
188 /* 3DSTATE_URB_{VS,GS,HS,DS} */
189 if (DIRTY(VERTEX_ELEMENTS) || DIRTY(VS)) {
190 const struct ilo_shader *vs = (ilo->vs) ? ilo->vs->shader : NULL;
191 /* the first 16KB are reserved for VS and PS PCBs */
192 const int offset = 16 * 1024;
193 int vs_entry_size, vs_total_size;
195 vs_entry_size = (vs) ? vs->out.count : 0;
198 * From the Ivy Bridge PRM, volume 2 part 1, page 35:
200 * "Programming Restriction: As the VS URB entry serves as both the
201 * per-vertex input and output of the VS shader, the VS URB
202 * Allocation Size must be sized to the maximum of the vertex input
203 * and output structures."
205 if (vs_entry_size < ilo->ve->count)
206 vs_entry_size = ilo->ve->count;
208 vs_entry_size *= sizeof(float) * 4;
209 vs_total_size = ilo->dev->urb_size - offset;
211 gen7_wa_pipe_control_vs_depth_stall(p);
213 p->gen7_3DSTATE_URB_VS(p->dev,
214 offset, vs_total_size, vs_entry_size, p->cp);
216 p->gen7_3DSTATE_URB_GS(p->dev, offset, 0, 0, p->cp);
217 p->gen7_3DSTATE_URB_HS(p->dev, offset, 0, 0, p->cp);
218 p->gen7_3DSTATE_URB_DS(p->dev, offset, 0, 0, p->cp);
223 gen7_pipeline_common_pcb_alloc(struct ilo_3d_pipeline *p,
224 const struct ilo_context *ilo,
225 struct gen6_pipeline_session *session)
227 /* 3DSTATE_PUSH_CONSTANT_ALLOC_{VS,PS} */
228 if (session->hw_ctx_changed) {
230 * push constant buffers are only allowed to take up at most the first
233 p->gen7_3DSTATE_PUSH_CONSTANT_ALLOC_VS(p->dev,
236 p->gen7_3DSTATE_PUSH_CONSTANT_ALLOC_PS(p->dev,
239 gen7_wa_pipe_control_cs_stall(p, true, true);
244 gen7_pipeline_common_pointers_1(struct ilo_3d_pipeline *p,
245 const struct ilo_context *ilo,
246 struct gen6_pipeline_session *session)
248 /* 3DSTATE_VIEWPORT_STATE_POINTERS_{CC,SF_CLIP} */
249 if (session->viewport_state_changed) {
250 p->gen7_3DSTATE_VIEWPORT_STATE_POINTERS_CC(p->dev,
251 p->state.CC_VIEWPORT, p->cp);
253 p->gen7_3DSTATE_VIEWPORT_STATE_POINTERS_SF_CLIP(p->dev,
254 p->state.SF_CLIP_VIEWPORT, p->cp);
259 gen7_pipeline_common_pointers_2(struct ilo_3d_pipeline *p,
260 const struct ilo_context *ilo,
261 struct gen6_pipeline_session *session)
263 /* 3DSTATE_BLEND_STATE_POINTERS */
264 if (session->cc_state_blend_changed) {
265 p->gen7_3DSTATE_BLEND_STATE_POINTERS(p->dev,
266 p->state.BLEND_STATE, p->cp);
269 /* 3DSTATE_CC_STATE_POINTERS */
270 if (session->cc_state_cc_changed) {
271 p->gen7_3DSTATE_CC_STATE_POINTERS(p->dev,
272 p->state.COLOR_CALC_STATE, p->cp);
275 /* 3DSTATE_DEPTH_STENCIL_STATE_POINTERS */
276 if (session->cc_state_dsa_changed) {
277 p->gen7_3DSTATE_DEPTH_STENCIL_STATE_POINTERS(p->dev,
278 p->state.DEPTH_STENCIL_STATE, p->cp);
283 gen7_pipeline_vs(struct ilo_3d_pipeline *p,
284 const struct ilo_context *ilo,
285 struct gen6_pipeline_session *session)
287 const bool emit_3dstate_binding_table = session->binding_table_vs_changed;
288 const bool emit_3dstate_sampler_state = session->sampler_state_vs_changed;
289 /* see gen6_pipeline_vs() */
290 const bool emit_3dstate_constant_vs = session->pcb_state_vs_changed;
291 const bool emit_3dstate_vs = (DIRTY(VS) || DIRTY(VERTEX_SAMPLERS));
293 /* emit depth stall before any of the VS commands */
294 if (emit_3dstate_binding_table || emit_3dstate_sampler_state ||
295 emit_3dstate_constant_vs || emit_3dstate_vs)
296 gen7_wa_pipe_control_vs_depth_stall(p);
298 /* 3DSTATE_BINDING_TABLE_POINTERS_VS */
299 if (emit_3dstate_binding_table) {
300 p->gen7_3DSTATE_BINDING_TABLE_POINTERS_VS(p->dev,
301 p->state.vs.BINDING_TABLE_STATE, p->cp);
304 /* 3DSTATE_SAMPLER_STATE_POINTERS_VS */
305 if (emit_3dstate_sampler_state) {
306 p->gen7_3DSTATE_SAMPLER_STATE_POINTERS_VS(p->dev,
307 p->state.vs.SAMPLER_STATE, p->cp);
310 gen6_pipeline_vs(p, ilo, session);
314 gen7_pipeline_hs(struct ilo_3d_pipeline *p,
315 const struct ilo_context *ilo,
316 struct gen6_pipeline_session *session)
318 /* 3DSTATE_CONSTANT_HS and 3DSTATE_HS */
319 if (session->hw_ctx_changed) {
320 p->gen7_3DSTATE_CONSTANT_HS(p->dev, 0, 0, 0, p->cp);
321 p->gen7_3DSTATE_HS(p->dev, NULL, 0, 0, p->cp);
324 /* 3DSTATE_BINDING_TABLE_POINTERS_HS */
325 if (session->hw_ctx_changed)
326 p->gen7_3DSTATE_BINDING_TABLE_POINTERS_HS(p->dev, 0, p->cp);
330 gen7_pipeline_te(struct ilo_3d_pipeline *p,
331 const struct ilo_context *ilo,
332 struct gen6_pipeline_session *session)
335 if (session->hw_ctx_changed)
336 p->gen7_3DSTATE_TE(p->dev, p->cp);
340 gen7_pipeline_ds(struct ilo_3d_pipeline *p,
341 const struct ilo_context *ilo,
342 struct gen6_pipeline_session *session)
344 /* 3DSTATE_CONSTANT_DS and 3DSTATE_DS */
345 if (session->hw_ctx_changed) {
346 p->gen7_3DSTATE_CONSTANT_DS(p->dev, 0, 0, 0, p->cp);
347 p->gen7_3DSTATE_DS(p->dev, NULL, 0, 0, p->cp);
350 /* 3DSTATE_BINDING_TABLE_POINTERS_DS */
351 if (session->hw_ctx_changed)
352 p->gen7_3DSTATE_BINDING_TABLE_POINTERS_DS(p->dev, 0, p->cp);
357 gen7_pipeline_gs(struct ilo_3d_pipeline *p,
358 const struct ilo_context *ilo,
359 struct gen6_pipeline_session *session)
361 /* 3DSTATE_CONSTANT_GS and 3DSTATE_GS */
362 if (session->hw_ctx_changed) {
363 p->gen6_3DSTATE_CONSTANT_GS(p->dev, 0, 0, 0, p->cp);
364 p->gen7_3DSTATE_GS(p->dev, NULL, 0, p->cp);
367 /* 3DSTATE_BINDING_TABLE_POINTERS_GS */
368 if (session->binding_table_gs_changed) {
369 p->gen7_3DSTATE_BINDING_TABLE_POINTERS_GS(p->dev,
370 p->state.gs.BINDING_TABLE_STATE, p->cp);
375 gen7_pipeline_sol(struct ilo_3d_pipeline *p,
376 const struct ilo_context *ilo,
377 struct gen6_pipeline_session *session)
379 const struct pipe_stream_output_info *so_info;
380 const struct ilo_shader *sh;
381 bool dirty_sh = false;
384 so_info = &ilo->gs->info.stream_output;
385 sh = ilo->gs->shader;
386 dirty_sh = DIRTY(GS);
389 so_info = &ilo->vs->info.stream_output;
390 sh = ilo->vs->shader;
391 dirty_sh = DIRTY(VS);
394 gen6_pipeline_update_max_svbi(p, ilo, session);
396 /* 3DSTATE_SO_BUFFER */
397 if ((DIRTY(STREAM_OUTPUT_TARGETS) || dirty_sh) && ilo->so.enabled) {
400 for (i = 0; i < ilo->so.count; i++) {
401 const int stride = so_info->stride[i] * 4; /* in bytes */
404 /* reset HW write offsets and offset buffer base */
405 if (!p->cp->render_ctx) {
406 ilo_cp_set_one_off_flags(p->cp, INTEL_EXEC_GEN7_SOL_RESET);
407 base += p->state.so_num_vertices * stride;
410 p->gen7_3DSTATE_SO_BUFFER(p->dev, i, base, stride,
411 ilo->so.states[i], p->cp);
415 p->gen7_3DSTATE_SO_BUFFER(p->dev, i, 0, 0, NULL, p->cp);
418 /* 3DSTATE_SO_DECL_LIST */
419 if (dirty_sh && ilo->so.enabled)
420 p->gen7_3DSTATE_SO_DECL_LIST(p->dev, so_info, sh, p->cp);
422 /* 3DSTATE_STREAMOUT */
423 if (DIRTY(STREAM_OUTPUT_TARGETS) || DIRTY(RASTERIZER) || dirty_sh) {
424 const unsigned buffer_mask = (1 << ilo->so.count) - 1;
426 p->gen7_3DSTATE_STREAMOUT(p->dev, buffer_mask, sh->out.count,
427 ilo->rasterizer->state.rasterizer_discard, p->cp);
432 gen7_pipeline_sf(struct ilo_3d_pipeline *p,
433 const struct ilo_context *ilo,
434 struct gen6_pipeline_session *session)
437 if (DIRTY(RASTERIZER) || DIRTY(VS) || DIRTY(GS) || DIRTY(FS)) {
438 const struct ilo_shader *fs = (ilo->fs)? ilo->fs->shader : NULL;
439 const struct ilo_shader *last_sh =
440 (ilo->gs)? ilo->gs->shader :
441 (ilo->vs)? ilo->vs->shader : NULL;
443 p->gen7_3DSTATE_SBE(p->dev,
444 &ilo->rasterizer->state, fs, last_sh, p->cp);
448 if (DIRTY(RASTERIZER) || DIRTY(FRAMEBUFFER)) {
449 gen7_wa_pipe_control_cs_stall(p, true, true);
451 p->gen7_3DSTATE_SF(p->dev,
452 &ilo->rasterizer->state, ilo->fb.state.zsbuf, p->cp);
457 gen7_pipeline_wm(struct ilo_3d_pipeline *p,
458 const struct ilo_context *ilo,
459 struct gen6_pipeline_session *session)
462 if (DIRTY(FS) || DIRTY(BLEND) || DIRTY(DEPTH_STENCIL_ALPHA) ||
464 const struct ilo_shader *fs = (ilo->fs)? ilo->fs->shader : NULL;
465 const bool cc_may_kill = (ilo->dsa->alpha.enabled ||
466 ilo->blend->alpha_to_coverage);
469 assert(!fs->pcb.clip_state_size);
471 if (p->dev->gen == ILO_GEN(7) && session->hw_ctx_changed)
472 gen7_wa_pipe_control_wm_max_threads_stall(p);
474 p->gen7_3DSTATE_WM(p->dev,
475 fs, &ilo->rasterizer->state, cc_may_kill, p->cp);
478 /* 3DSTATE_BINDING_TABLE_POINTERS_PS */
479 if (session->binding_table_fs_changed) {
480 p->gen7_3DSTATE_BINDING_TABLE_POINTERS_PS(p->dev,
481 p->state.wm.BINDING_TABLE_STATE, p->cp);
484 /* 3DSTATE_SAMPLER_STATE_POINTERS_PS */
485 if (session->sampler_state_fs_changed) {
486 p->gen7_3DSTATE_SAMPLER_STATE_POINTERS_PS(p->dev,
487 p->state.wm.SAMPLER_STATE, p->cp);
490 /* 3DSTATE_CONSTANT_PS */
491 if (session->pcb_state_fs_changed)
492 p->gen6_3DSTATE_CONSTANT_PS(p->dev, NULL, NULL, 0, p->cp);
495 if (DIRTY(FS) || DIRTY(FRAGMENT_SAMPLERS) ||
497 const struct ilo_shader *fs = (ilo->fs)? ilo->fs->shader : NULL;
498 const int num_samplers = ilo->sampler[PIPE_SHADER_FRAGMENT].count;
499 const bool dual_blend = ilo->blend->dual_blend;
502 assert(!fs->pcb.clip_state_size);
504 p->gen7_3DSTATE_PS(p->dev, fs, num_samplers, dual_blend, p->cp);
507 /* 3DSTATE_SCISSOR_STATE_POINTERS */
508 if (session->scissor_state_changed) {
509 p->gen6_3DSTATE_SCISSOR_STATE_POINTERS(p->dev,
510 p->state.SCISSOR_RECT, p->cp);
513 /* XXX what is the best way to know if this workaround is needed? */
515 const bool emit_3dstate_ps = (DIRTY(FS) ||
516 DIRTY(FRAGMENT_SAMPLERS) ||
518 const bool emit_3dstate_depth_buffer =
519 (DIRTY(FRAMEBUFFER) || DIRTY(DEPTH_STENCIL_ALPHA) ||
520 session->state_bo_changed);
522 if (emit_3dstate_ps ||
523 emit_3dstate_depth_buffer ||
524 session->pcb_state_fs_changed ||
525 session->viewport_state_changed ||
526 session->binding_table_fs_changed ||
527 session->sampler_state_fs_changed ||
528 session->cc_state_cc_changed ||
529 session->cc_state_blend_changed ||
530 session->cc_state_dsa_changed)
531 gen7_wa_pipe_control_wm_depth_stall(p, emit_3dstate_depth_buffer);
535 * glCopyPixels() with GL_DEPTH, which flushes the context before copying
536 * the depth buffer to a temporary texture, could not update the depth
537 * buffer _sometimes_. Reissuing 3DSTATE_DEPTH_BUFFER in the new batch
538 * makes the problem gone.
541 /* 3DSTATE_DEPTH_BUFFER and 3DSTATE_CLEAR_PARAMS */
542 if (DIRTY(FRAMEBUFFER) || session->state_bo_changed) {
543 p->gen7_3DSTATE_DEPTH_BUFFER(p->dev, ilo->fb.state.zsbuf, p->cp);
544 p->gen6_3DSTATE_HIER_DEPTH_BUFFER(p->dev, ilo->fb.state.zsbuf, p->cp);
545 p->gen6_3DSTATE_STENCIL_BUFFER(p->dev, ilo->fb.state.zsbuf, p->cp);
548 p->gen6_3DSTATE_CLEAR_PARAMS(p->dev, 0, p->cp);
553 gen7_pipeline_wm_multisample(struct ilo_3d_pipeline *p,
554 const struct ilo_context *ilo,
555 struct gen6_pipeline_session *session)
557 /* 3DSTATE_MULTISAMPLE and 3DSTATE_SAMPLE_MASK */
558 if (DIRTY(SAMPLE_MASK) || DIRTY(FRAMEBUFFER)) {
559 const uint32_t *packed_sample_pos;
561 gen7_wa_pipe_control_cs_stall(p, true, true);
564 (ilo->fb.num_samples > 4) ? p->packed_sample_position_8x :
565 (ilo->fb.num_samples > 1) ? &p->packed_sample_position_4x :
566 &p->packed_sample_position_1x;
568 p->gen6_3DSTATE_MULTISAMPLE(p->dev,
569 ilo->fb.num_samples, packed_sample_pos,
570 ilo->rasterizer->state.half_pixel_center, p->cp);
572 p->gen7_3DSTATE_SAMPLE_MASK(p->dev,
573 (ilo->fb.num_samples > 1) ? ilo->sample_mask : 0x1,
574 ilo->fb.num_samples, p->cp);
579 gen7_pipeline_commands(struct ilo_3d_pipeline *p,
580 const struct ilo_context *ilo,
581 struct gen6_pipeline_session *session)
584 * We try to keep the order of the commands match, as closely as possible,
585 * that of the classic i965 driver. It allows us to compare the command
588 gen6_pipeline_common_select(p, ilo, session);
589 gen6_pipeline_common_sip(p, ilo, session);
590 gen6_pipeline_vf_statistics(p, ilo, session);
591 gen7_pipeline_common_pcb_alloc(p, ilo, session);
592 gen6_pipeline_common_base_address(p, ilo, session);
593 gen7_pipeline_common_pointers_1(p, ilo, session);
594 gen7_pipeline_common_urb(p, ilo, session);
595 gen7_pipeline_common_pointers_2(p, ilo, session);
596 gen7_pipeline_wm_multisample(p, ilo, session);
597 gen7_pipeline_gs(p, ilo, session);
598 gen7_pipeline_hs(p, ilo, session);
599 gen7_pipeline_te(p, ilo, session);
600 gen7_pipeline_ds(p, ilo, session);
601 gen7_pipeline_vs(p, ilo, session);
602 gen7_pipeline_sol(p, ilo, session);
603 gen6_pipeline_clip(p, ilo, session);
604 gen7_pipeline_sf(p, ilo, session);
605 gen7_pipeline_wm(p, ilo, session);
606 gen6_pipeline_wm_raster(p, ilo, session);
607 gen6_pipeline_sf_rect(p, ilo, session);
608 gen6_pipeline_vf(p, ilo, session);
609 gen6_pipeline_vf_draw(p, ilo, session);
613 ilo_3d_pipeline_emit_draw_gen7(struct ilo_3d_pipeline *p,
614 const struct ilo_context *ilo,
615 const struct pipe_draw_info *info)
617 struct gen6_pipeline_session session;
619 gen6_pipeline_prepare(p, ilo, info, &session);
621 session.emit_draw_states = gen6_pipeline_states;
622 session.emit_draw_commands = gen7_pipeline_commands;
624 gen6_pipeline_draw(p, ilo, &session);
625 gen6_pipeline_end(p, ilo, &session);
629 gen7_pipeline_estimate_commands(const struct ilo_3d_pipeline *p,
630 const struct ilo_gpe_gen7 *gen7,
631 const struct ilo_context *ilo)
634 enum ilo_gpe_gen7_command cmd;
639 for (cmd = 0; cmd < ILO_GPE_GEN7_COMMAND_COUNT; cmd++) {
643 case ILO_GPE_GEN7_PIPE_CONTROL:
644 /* for the workaround */
646 /* another one after 3DSTATE_URB */
648 /* and another one after 3DSTATE_CONSTANT_VS */
651 case ILO_GPE_GEN7_3DSTATE_VERTEX_BUFFERS:
654 case ILO_GPE_GEN7_3DSTATE_VERTEX_ELEMENTS:
657 case ILO_GPE_GEN7_MEDIA_VFE_STATE:
658 case ILO_GPE_GEN7_MEDIA_CURBE_LOAD:
659 case ILO_GPE_GEN7_MEDIA_INTERFACE_DESCRIPTOR_LOAD:
660 case ILO_GPE_GEN7_MEDIA_STATE_FLUSH:
661 case ILO_GPE_GEN7_GPGPU_WALKER:
671 size += gen7->estimate_command_size(p->dev,
680 gen7_pipeline_estimate_states(const struct ilo_3d_pipeline *p,
681 const struct ilo_gpe_gen7 *gen7,
682 const struct ilo_context *ilo)
684 static int static_size;
685 int shader_type, count, size;
689 enum ilo_gpe_gen7_state state;
691 } static_states[] = {
693 { ILO_GPE_GEN7_SF_CLIP_VIEWPORT, 1 },
694 { ILO_GPE_GEN7_CC_VIEWPORT, 1 },
696 { ILO_GPE_GEN7_COLOR_CALC_STATE, 1 },
697 { ILO_GPE_GEN7_BLEND_STATE, ILO_MAX_DRAW_BUFFERS },
698 { ILO_GPE_GEN7_DEPTH_STENCIL_STATE, 1 },
700 { ILO_GPE_GEN7_SCISSOR_RECT, 1 },
701 /* binding table (vs, gs, fs) */
702 { ILO_GPE_GEN7_BINDING_TABLE_STATE, ILO_MAX_VS_SURFACES },
703 { ILO_GPE_GEN7_BINDING_TABLE_STATE, ILO_MAX_GS_SURFACES },
704 { ILO_GPE_GEN7_BINDING_TABLE_STATE, ILO_MAX_WM_SURFACES },
708 for (i = 0; i < Elements(static_states); i++) {
709 static_size += gen7->estimate_state_size(p->dev,
710 static_states[i].state,
711 static_states[i].count);
718 * render targets (fs)
719 * sampler views (vs, fs)
720 * constant buffers (vs, fs)
722 count = ilo->fb.state.nr_cbufs;
723 for (shader_type = 0; shader_type < PIPE_SHADER_TYPES; shader_type++) {
724 count += ilo->view[shader_type].count;
725 count += ilo->cbuf[shader_type].count;
729 size += gen7->estimate_state_size(p->dev,
730 ILO_GPE_GEN7_SURFACE_STATE, count);
733 /* samplers (vs, fs) */
734 for (shader_type = 0; shader_type < PIPE_SHADER_TYPES; shader_type++) {
735 count = ilo->sampler[shader_type].count;
737 size += gen7->estimate_state_size(p->dev,
738 ILO_GPE_GEN7_SAMPLER_BORDER_COLOR_STATE, count);
739 size += gen7->estimate_state_size(p->dev,
740 ILO_GPE_GEN7_SAMPLER_STATE, count);
745 if (ilo->vs && ilo->vs->shader->pcb.clip_state_size) {
746 const int pcb_size = ilo->vs->shader->pcb.clip_state_size;
748 size += gen7->estimate_state_size(p->dev,
749 ILO_GPE_GEN7_PUSH_CONSTANT_BUFFER, pcb_size);
756 ilo_3d_pipeline_estimate_size_gen7(struct ilo_3d_pipeline *p,
757 enum ilo_3d_pipeline_action action,
760 const struct ilo_gpe_gen7 *gen7 = ilo_gpe_gen7_get();
764 case ILO_3D_PIPELINE_DRAW:
766 const struct ilo_context *ilo = arg;
768 size = gen7_pipeline_estimate_commands(p, gen7, ilo) +
769 gen7_pipeline_estimate_states(p, gen7, ilo);
772 case ILO_3D_PIPELINE_FLUSH:
773 case ILO_3D_PIPELINE_WRITE_TIMESTAMP:
774 case ILO_3D_PIPELINE_WRITE_DEPTH_COUNT:
775 size = gen7->estimate_command_size(p->dev,
776 ILO_GPE_GEN7_PIPE_CONTROL, 1);
779 assert(!"unknown 3D pipeline action");
788 ilo_3d_pipeline_init_gen7(struct ilo_3d_pipeline *p)
790 const struct ilo_gpe_gen7 *gen7 = ilo_gpe_gen7_get();
792 p->estimate_size = ilo_3d_pipeline_estimate_size_gen7;
793 p->emit_draw = ilo_3d_pipeline_emit_draw_gen7;
794 p->emit_flush = ilo_3d_pipeline_emit_flush_gen6;
795 p->emit_write_timestamp = ilo_3d_pipeline_emit_write_timestamp_gen6;
796 p->emit_write_depth_count = ilo_3d_pipeline_emit_write_depth_count_gen6;
798 #define GEN6_USE(p, name, from) \
799 p->gen6_ ## name = from->emit_ ## name
800 GEN6_USE(p, STATE_BASE_ADDRESS, gen7);
801 GEN6_USE(p, STATE_SIP, gen7);
802 GEN6_USE(p, PIPELINE_SELECT, gen7);
803 GEN6_USE(p, 3DSTATE_VERTEX_BUFFERS, gen7);
804 GEN6_USE(p, 3DSTATE_VERTEX_ELEMENTS, gen7);
805 GEN6_USE(p, 3DSTATE_INDEX_BUFFER, gen7);
806 GEN6_USE(p, 3DSTATE_VF_STATISTICS, gen7);
807 GEN6_USE(p, 3DSTATE_SCISSOR_STATE_POINTERS, gen7);
808 GEN6_USE(p, 3DSTATE_VS, gen7);
809 GEN6_USE(p, 3DSTATE_CLIP, gen7);
810 GEN6_USE(p, 3DSTATE_CONSTANT_VS, gen7);
811 GEN6_USE(p, 3DSTATE_CONSTANT_GS, gen7);
812 GEN6_USE(p, 3DSTATE_CONSTANT_PS, gen7);
813 GEN6_USE(p, 3DSTATE_DRAWING_RECTANGLE, gen7);
814 GEN6_USE(p, 3DSTATE_POLY_STIPPLE_OFFSET, gen7);
815 GEN6_USE(p, 3DSTATE_POLY_STIPPLE_PATTERN, gen7);
816 GEN6_USE(p, 3DSTATE_LINE_STIPPLE, gen7);
817 GEN6_USE(p, 3DSTATE_AA_LINE_PARAMETERS, gen7);
818 GEN6_USE(p, 3DSTATE_MULTISAMPLE, gen7);
819 GEN6_USE(p, 3DSTATE_STENCIL_BUFFER, gen7);
820 GEN6_USE(p, 3DSTATE_HIER_DEPTH_BUFFER, gen7);
821 GEN6_USE(p, 3DSTATE_CLEAR_PARAMS, gen7);
822 GEN6_USE(p, PIPE_CONTROL, gen7);
823 GEN6_USE(p, 3DPRIMITIVE, gen7);
824 GEN6_USE(p, INTERFACE_DESCRIPTOR_DATA, gen7);
825 GEN6_USE(p, CC_VIEWPORT, gen7);
826 GEN6_USE(p, COLOR_CALC_STATE, gen7);
827 GEN6_USE(p, BLEND_STATE, gen7);
828 GEN6_USE(p, DEPTH_STENCIL_STATE, gen7);
829 GEN6_USE(p, SCISSOR_RECT, gen7);
830 GEN6_USE(p, BINDING_TABLE_STATE, gen7);
831 GEN6_USE(p, SURFACE_STATE, gen7);
832 GEN6_USE(p, SAMPLER_STATE, gen7);
833 GEN6_USE(p, SAMPLER_BORDER_COLOR_STATE, gen7);
834 GEN6_USE(p, push_constant_buffer, gen7);
837 #define GEN7_USE(p, name, from) \
838 p->gen7_ ## name = from->emit_ ## name
839 GEN7_USE(p, 3DSTATE_DEPTH_BUFFER, gen7);
840 GEN7_USE(p, 3DSTATE_CC_STATE_POINTERS, gen7);
841 GEN7_USE(p, 3DSTATE_GS, gen7);
842 GEN7_USE(p, 3DSTATE_SF, gen7);
843 GEN7_USE(p, 3DSTATE_WM, gen7);
844 GEN7_USE(p, 3DSTATE_SAMPLE_MASK, gen7);
845 GEN7_USE(p, 3DSTATE_CONSTANT_HS, gen7);
846 GEN7_USE(p, 3DSTATE_CONSTANT_DS, gen7);
847 GEN7_USE(p, 3DSTATE_HS, gen7);
848 GEN7_USE(p, 3DSTATE_TE, gen7);
849 GEN7_USE(p, 3DSTATE_DS, gen7);
850 GEN7_USE(p, 3DSTATE_STREAMOUT, gen7);
851 GEN7_USE(p, 3DSTATE_SBE, gen7);
852 GEN7_USE(p, 3DSTATE_PS, gen7);
853 GEN7_USE(p, 3DSTATE_VIEWPORT_STATE_POINTERS_SF_CLIP, gen7);
854 GEN7_USE(p, 3DSTATE_VIEWPORT_STATE_POINTERS_CC, gen7);
855 GEN7_USE(p, 3DSTATE_BLEND_STATE_POINTERS, gen7);
856 GEN7_USE(p, 3DSTATE_DEPTH_STENCIL_STATE_POINTERS, gen7);
857 GEN7_USE(p, 3DSTATE_BINDING_TABLE_POINTERS_VS, gen7);
858 GEN7_USE(p, 3DSTATE_BINDING_TABLE_POINTERS_HS, gen7);
859 GEN7_USE(p, 3DSTATE_BINDING_TABLE_POINTERS_DS, gen7);
860 GEN7_USE(p, 3DSTATE_BINDING_TABLE_POINTERS_GS, gen7);
861 GEN7_USE(p, 3DSTATE_BINDING_TABLE_POINTERS_PS, gen7);
862 GEN7_USE(p, 3DSTATE_SAMPLER_STATE_POINTERS_VS, gen7);
863 GEN7_USE(p, 3DSTATE_SAMPLER_STATE_POINTERS_HS, gen7);
864 GEN7_USE(p, 3DSTATE_SAMPLER_STATE_POINTERS_DS, gen7);
865 GEN7_USE(p, 3DSTATE_SAMPLER_STATE_POINTERS_GS, gen7);
866 GEN7_USE(p, 3DSTATE_SAMPLER_STATE_POINTERS_PS, gen7);
867 GEN7_USE(p, 3DSTATE_URB_VS, gen7);
868 GEN7_USE(p, 3DSTATE_URB_HS, gen7);
869 GEN7_USE(p, 3DSTATE_URB_DS, gen7);
870 GEN7_USE(p, 3DSTATE_URB_GS, gen7);
871 GEN7_USE(p, 3DSTATE_PUSH_CONSTANT_ALLOC_VS, gen7);
872 GEN7_USE(p, 3DSTATE_PUSH_CONSTANT_ALLOC_HS, gen7);
873 GEN7_USE(p, 3DSTATE_PUSH_CONSTANT_ALLOC_DS, gen7);
874 GEN7_USE(p, 3DSTATE_PUSH_CONSTANT_ALLOC_GS, gen7);
875 GEN7_USE(p, 3DSTATE_PUSH_CONSTANT_ALLOC_PS, gen7);
876 GEN7_USE(p, 3DSTATE_SO_DECL_LIST, gen7);
877 GEN7_USE(p, 3DSTATE_SO_BUFFER, gen7);
878 GEN7_USE(p, SF_CLIP_VIEWPORT, gen7);