Lines Matching +full:cs +full:- +full:1

1 // SPDX-License-Identifier: MIT
18 * Emits a PIPE_CONTROL with a non-zero post-sync operation, for
20 * "PIPE_CONTROL" of the Sandy Bridge PRM volume 2 part 1:
22 * [DevSNB-C+{W/A}] Before any depth stall flush (including those
23 * produced by non-pipelined state commands), software needs to first
24 * send a PIPE_CONTROL with no bits set except Post-Sync Operation !=
27 * [Dev-SNB{W/A}]: Before a PIPE_CONTROL with Write Cache Flush Enable
28 * =1, a PIPE_CONTROL with any non-zero post-sync-op is required.
32 * [Dev-SNB{W/A}]: Pipe-control with CS-stall bit set must be sent
33 * BEFORE the pipe-control with a post-sync op and no write-cache
38 * volume 2 part 1:
40 * "1 of the following must also be set:
41 * - Render Target Cache Flush Enable ([12] of DW1)
42 * - Depth Cache Flush Enable ([0] of DW1)
43 * - Stall at Pixel Scoreboard ([1] of DW1)
44 * - Depth Stall ([13] of DW1)
45 * - Post-Sync Operation ([15:14] of DW1)
46 * - Notify Enable ([8] of DW1)"
50 * Post-sync nonzero is what triggered this second workaround, so we
58 intel_gt_scratch_offset(rq->engine->gt, in gen6_emit_post_sync_nonzero_flush()
60 u32 *cs; in gen6_emit_post_sync_nonzero_flush() local
62 cs = intel_ring_begin(rq, 6); in gen6_emit_post_sync_nonzero_flush()
63 if (IS_ERR(cs)) in gen6_emit_post_sync_nonzero_flush()
64 return PTR_ERR(cs); in gen6_emit_post_sync_nonzero_flush()
66 *cs++ = GFX_OP_PIPE_CONTROL(5); in gen6_emit_post_sync_nonzero_flush()
67 *cs++ = PIPE_CONTROL_CS_STALL | PIPE_CONTROL_STALL_AT_SCOREBOARD; in gen6_emit_post_sync_nonzero_flush()
68 *cs++ = scratch_addr | PIPE_CONTROL_GLOBAL_GTT; in gen6_emit_post_sync_nonzero_flush()
69 *cs++ = 0; /* low dword */ in gen6_emit_post_sync_nonzero_flush()
70 *cs++ = 0; /* high dword */ in gen6_emit_post_sync_nonzero_flush()
71 *cs++ = MI_NOOP; in gen6_emit_post_sync_nonzero_flush()
72 intel_ring_advance(rq, cs); in gen6_emit_post_sync_nonzero_flush()
74 cs = intel_ring_begin(rq, 6); in gen6_emit_post_sync_nonzero_flush()
75 if (IS_ERR(cs)) in gen6_emit_post_sync_nonzero_flush()
76 return PTR_ERR(cs); in gen6_emit_post_sync_nonzero_flush()
78 *cs++ = GFX_OP_PIPE_CONTROL(5); in gen6_emit_post_sync_nonzero_flush()
79 *cs++ = PIPE_CONTROL_QW_WRITE; in gen6_emit_post_sync_nonzero_flush()
80 *cs++ = scratch_addr | PIPE_CONTROL_GLOBAL_GTT; in gen6_emit_post_sync_nonzero_flush()
81 *cs++ = 0; in gen6_emit_post_sync_nonzero_flush()
82 *cs++ = 0; in gen6_emit_post_sync_nonzero_flush()
83 *cs++ = MI_NOOP; in gen6_emit_post_sync_nonzero_flush()
84 intel_ring_advance(rq, cs); in gen6_emit_post_sync_nonzero_flush()
92 intel_gt_scratch_offset(rq->engine->gt, in gen6_emit_flush_rcs()
94 u32 *cs, flags = 0; in gen6_emit_flush_rcs() local
125 * TLB invalidate requires a post-sync write. in gen6_emit_flush_rcs()
130 cs = intel_ring_begin(rq, 4); in gen6_emit_flush_rcs()
131 if (IS_ERR(cs)) in gen6_emit_flush_rcs()
132 return PTR_ERR(cs); in gen6_emit_flush_rcs()
134 *cs++ = GFX_OP_PIPE_CONTROL(4); in gen6_emit_flush_rcs()
135 *cs++ = flags; in gen6_emit_flush_rcs()
136 *cs++ = scratch_addr | PIPE_CONTROL_GLOBAL_GTT; in gen6_emit_flush_rcs()
137 *cs++ = 0; in gen6_emit_flush_rcs()
138 intel_ring_advance(rq, cs); in gen6_emit_flush_rcs()
143 u32 *gen6_emit_breadcrumb_rcs(struct i915_request *rq, u32 *cs) in gen6_emit_breadcrumb_rcs() argument
146 *cs++ = GFX_OP_PIPE_CONTROL(4); in gen6_emit_breadcrumb_rcs()
147 *cs++ = PIPE_CONTROL_CS_STALL | PIPE_CONTROL_STALL_AT_SCOREBOARD; in gen6_emit_breadcrumb_rcs()
148 *cs++ = 0; in gen6_emit_breadcrumb_rcs()
149 *cs++ = 0; in gen6_emit_breadcrumb_rcs()
151 *cs++ = GFX_OP_PIPE_CONTROL(4); in gen6_emit_breadcrumb_rcs()
152 *cs++ = PIPE_CONTROL_QW_WRITE; in gen6_emit_breadcrumb_rcs()
153 *cs++ = intel_gt_scratch_offset(rq->engine->gt, in gen6_emit_breadcrumb_rcs()
156 *cs++ = 0; in gen6_emit_breadcrumb_rcs()
159 *cs++ = GFX_OP_PIPE_CONTROL(4); in gen6_emit_breadcrumb_rcs()
160 *cs++ = (PIPE_CONTROL_RENDER_TARGET_CACHE_FLUSH | in gen6_emit_breadcrumb_rcs()
165 *cs++ = i915_request_active_seqno(rq) | in gen6_emit_breadcrumb_rcs()
167 *cs++ = rq->fence.seqno; in gen6_emit_breadcrumb_rcs()
169 *cs++ = MI_USER_INTERRUPT; in gen6_emit_breadcrumb_rcs()
170 *cs++ = MI_NOOP; in gen6_emit_breadcrumb_rcs()
172 rq->tail = intel_ring_offset(rq, cs); in gen6_emit_breadcrumb_rcs()
173 assert_ring_tail_valid(rq->ring, rq->tail); in gen6_emit_breadcrumb_rcs()
175 return cs; in gen6_emit_breadcrumb_rcs()
180 u32 cmd, *cs; in mi_flush_dw() local
182 cs = intel_ring_begin(rq, 4); in mi_flush_dw()
183 if (IS_ERR(cs)) in mi_flush_dw()
184 return PTR_ERR(cs); in mi_flush_dw()
197 * Bspec vol 1c.3 - blitter engine command streamer: in mi_flush_dw()
200 * Post-Sync Operation field is a value of 1h or 3h." in mi_flush_dw()
204 *cs++ = cmd; in mi_flush_dw()
205 *cs++ = HWS_SCRATCH_ADDR | MI_FLUSH_DW_USE_GTT; in mi_flush_dw()
206 *cs++ = 0; in mi_flush_dw()
207 *cs++ = MI_NOOP; in mi_flush_dw()
209 intel_ring_advance(rq, cs); in mi_flush_dw()
234 u32 *cs; in gen6_emit_bb_start() local
240 cs = intel_ring_begin(rq, 2); in gen6_emit_bb_start()
241 if (IS_ERR(cs)) in gen6_emit_bb_start()
242 return PTR_ERR(cs); in gen6_emit_bb_start()
244 cs = __gen6_emit_bb_start(cs, offset, security); in gen6_emit_bb_start()
245 intel_ring_advance(rq, cs); in gen6_emit_bb_start()
256 u32 *cs; in hsw_emit_bb_start() local
262 cs = intel_ring_begin(rq, 2); in hsw_emit_bb_start()
263 if (IS_ERR(cs)) in hsw_emit_bb_start()
264 return PTR_ERR(cs); in hsw_emit_bb_start()
266 cs = __gen6_emit_bb_start(cs, offset, security); in hsw_emit_bb_start()
267 intel_ring_advance(rq, cs); in hsw_emit_bb_start()
274 u32 *cs; in gen7_stall_cs() local
276 cs = intel_ring_begin(rq, 4); in gen7_stall_cs()
277 if (IS_ERR(cs)) in gen7_stall_cs()
278 return PTR_ERR(cs); in gen7_stall_cs()
280 *cs++ = GFX_OP_PIPE_CONTROL(4); in gen7_stall_cs()
281 *cs++ = PIPE_CONTROL_CS_STALL | PIPE_CONTROL_STALL_AT_SCOREBOARD; in gen7_stall_cs()
282 *cs++ = 0; in gen7_stall_cs()
283 *cs++ = 0; in gen7_stall_cs()
284 intel_ring_advance(rq, cs); in gen7_stall_cs()
292 intel_gt_scratch_offset(rq->engine->gt, in gen7_emit_flush_rcs()
294 u32 *cs, flags = 0; in gen7_emit_flush_rcs() local
301 * read-cache invalidate bits set) must have the CS_STALL bit set. We in gen7_emit_flush_rcs()
307 * CS_STALL suggests at least a post-sync write. in gen7_emit_flush_rcs()
333 * Workaround: we must issue a pipe_control with CS-stall bit in gen7_emit_flush_rcs()
340 cs = intel_ring_begin(rq, 4); in gen7_emit_flush_rcs()
341 if (IS_ERR(cs)) in gen7_emit_flush_rcs()
342 return PTR_ERR(cs); in gen7_emit_flush_rcs()
344 *cs++ = GFX_OP_PIPE_CONTROL(4); in gen7_emit_flush_rcs()
345 *cs++ = flags; in gen7_emit_flush_rcs()
346 *cs++ = scratch_addr; in gen7_emit_flush_rcs()
347 *cs++ = 0; in gen7_emit_flush_rcs()
348 intel_ring_advance(rq, cs); in gen7_emit_flush_rcs()
353 u32 *gen7_emit_breadcrumb_rcs(struct i915_request *rq, u32 *cs) in gen7_emit_breadcrumb_rcs() argument
355 *cs++ = GFX_OP_PIPE_CONTROL(4); in gen7_emit_breadcrumb_rcs()
356 *cs++ = (PIPE_CONTROL_RENDER_TARGET_CACHE_FLUSH | in gen7_emit_breadcrumb_rcs()
363 *cs++ = i915_request_active_seqno(rq); in gen7_emit_breadcrumb_rcs()
364 *cs++ = rq->fence.seqno; in gen7_emit_breadcrumb_rcs()
366 *cs++ = MI_USER_INTERRUPT; in gen7_emit_breadcrumb_rcs()
367 *cs++ = MI_NOOP; in gen7_emit_breadcrumb_rcs()
369 rq->tail = intel_ring_offset(rq, cs); in gen7_emit_breadcrumb_rcs()
370 assert_ring_tail_valid(rq->ring, rq->tail); in gen7_emit_breadcrumb_rcs()
372 return cs; in gen7_emit_breadcrumb_rcs()
375 u32 *gen6_emit_breadcrumb_xcs(struct i915_request *rq, u32 *cs) in gen6_emit_breadcrumb_xcs() argument
377 GEM_BUG_ON(i915_request_active_timeline(rq)->hwsp_ggtt != rq->engine->status_page.vma); in gen6_emit_breadcrumb_xcs()
378 GEM_BUG_ON(offset_in_page(rq->hwsp_seqno) != I915_GEM_HWS_SEQNO_ADDR); in gen6_emit_breadcrumb_xcs()
380 *cs++ = MI_FLUSH_DW | MI_FLUSH_DW_OP_STOREDW | MI_FLUSH_DW_STORE_INDEX; in gen6_emit_breadcrumb_xcs()
381 *cs++ = I915_GEM_HWS_SEQNO_ADDR | MI_FLUSH_DW_USE_GTT; in gen6_emit_breadcrumb_xcs()
382 *cs++ = rq->fence.seqno; in gen6_emit_breadcrumb_xcs()
384 *cs++ = MI_USER_INTERRUPT; in gen6_emit_breadcrumb_xcs()
386 rq->tail = intel_ring_offset(rq, cs); in gen6_emit_breadcrumb_xcs()
387 assert_ring_tail_valid(rq->ring, rq->tail); in gen6_emit_breadcrumb_xcs()
389 return cs; in gen6_emit_breadcrumb_xcs()
393 u32 *gen7_emit_breadcrumb_xcs(struct i915_request *rq, u32 *cs) in gen7_emit_breadcrumb_xcs() argument
397 GEM_BUG_ON(i915_request_active_timeline(rq)->hwsp_ggtt != rq->engine->status_page.vma); in gen7_emit_breadcrumb_xcs()
398 GEM_BUG_ON(offset_in_page(rq->hwsp_seqno) != I915_GEM_HWS_SEQNO_ADDR); in gen7_emit_breadcrumb_xcs()
400 *cs++ = MI_FLUSH_DW | MI_INVALIDATE_TLB | in gen7_emit_breadcrumb_xcs()
402 *cs++ = I915_GEM_HWS_SEQNO_ADDR | MI_FLUSH_DW_USE_GTT; in gen7_emit_breadcrumb_xcs()
403 *cs++ = rq->fence.seqno; in gen7_emit_breadcrumb_xcs()
406 *cs++ = MI_STORE_DWORD_INDEX; in gen7_emit_breadcrumb_xcs()
407 *cs++ = I915_GEM_HWS_SEQNO_ADDR; in gen7_emit_breadcrumb_xcs()
408 *cs++ = rq->fence.seqno; in gen7_emit_breadcrumb_xcs()
411 *cs++ = MI_FLUSH_DW; in gen7_emit_breadcrumb_xcs()
412 *cs++ = 0; in gen7_emit_breadcrumb_xcs()
413 *cs++ = 0; in gen7_emit_breadcrumb_xcs()
415 *cs++ = MI_USER_INTERRUPT; in gen7_emit_breadcrumb_xcs()
416 *cs++ = MI_NOOP; in gen7_emit_breadcrumb_xcs()
418 rq->tail = intel_ring_offset(rq, cs); in gen7_emit_breadcrumb_xcs()
419 assert_ring_tail_valid(rq->ring, rq->tail); in gen7_emit_breadcrumb_xcs()
421 return cs; in gen7_emit_breadcrumb_xcs()
428 ~(engine->irq_enable_mask | engine->irq_keep_mask)); in gen6_irq_enable()
433 gen5_gt_enable_irq(engine->gt, engine->irq_enable_mask); in gen6_irq_enable()
438 ENGINE_WRITE(engine, RING_IMR, ~engine->irq_keep_mask); in gen6_irq_disable()
439 gen5_gt_disable_irq(engine->gt, engine->irq_enable_mask); in gen6_irq_disable()
444 ENGINE_WRITE(engine, RING_IMR, ~engine->irq_enable_mask); in hsw_irq_enable_vecs()
449 gen6_gt_pm_unmask_irq(engine->gt, engine->irq_enable_mask); in hsw_irq_enable_vecs()
455 gen6_gt_pm_mask_irq(engine->gt, engine->irq_enable_mask); in hsw_irq_disable_vecs()