drm/i915/ringbuffer: Use the HEAD auto-reporting mechanism
[deliverable/linux.git] / drivers / gpu / drm / i915 / intel_ringbuffer.c
CommitLineData
62fdfeaf
EA
1/*
2 * Copyright © 2008-2010 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 * Authors:
24 * Eric Anholt <eric@anholt.net>
25 * Zou Nan hai <nanhai.zou@intel.com>
26 * Xiang Hai hao<haihao.xiang@intel.com>
27 *
28 */
29
30#include "drmP.h"
31#include "drm.h"
62fdfeaf 32#include "i915_drv.h"
8187a2b7 33#include "i915_drm.h"
62fdfeaf 34#include "i915_trace.h"
881f47b6 35#include "intel_drv.h"
62fdfeaf 36
6f392d54
CW
37static u32 i915_gem_get_seqno(struct drm_device *dev)
38{
39 drm_i915_private_t *dev_priv = dev->dev_private;
40 u32 seqno;
41
42 seqno = dev_priv->next_seqno;
43
44 /* reserve 0 for non-seqno */
45 if (++dev_priv->next_seqno == 0)
46 dev_priv->next_seqno = 1;
47
48 return seqno;
49}
50
8187a2b7
ZN
51static void
52render_ring_flush(struct drm_device *dev,
ab6f8e32
CW
53 struct intel_ring_buffer *ring,
54 u32 invalidate_domains,
55 u32 flush_domains)
62fdfeaf 56{
6f392d54
CW
57 drm_i915_private_t *dev_priv = dev->dev_private;
58 u32 cmd;
59
62fdfeaf
EA
60#if WATCH_EXEC
61 DRM_INFO("%s: invalidate %08x flush %08x\n", __func__,
62 invalidate_domains, flush_domains);
63#endif
6f392d54
CW
64
65 trace_i915_gem_request_flush(dev, dev_priv->next_seqno,
62fdfeaf
EA
66 invalidate_domains, flush_domains);
67
62fdfeaf
EA
68 if ((invalidate_domains | flush_domains) & I915_GEM_GPU_DOMAINS) {
69 /*
70 * read/write caches:
71 *
72 * I915_GEM_DOMAIN_RENDER is always invalidated, but is
73 * only flushed if MI_NO_WRITE_FLUSH is unset. On 965, it is
74 * also flushed at 2d versus 3d pipeline switches.
75 *
76 * read-only caches:
77 *
78 * I915_GEM_DOMAIN_SAMPLER is flushed on pre-965 if
79 * MI_READ_FLUSH is set, and is always flushed on 965.
80 *
81 * I915_GEM_DOMAIN_COMMAND may not exist?
82 *
83 * I915_GEM_DOMAIN_INSTRUCTION, which exists on 965, is
84 * invalidated when MI_EXE_FLUSH is set.
85 *
86 * I915_GEM_DOMAIN_VERTEX, which exists on 965, is
87 * invalidated with every MI_FLUSH.
88 *
89 * TLBs:
90 *
91 * On 965, TLBs associated with I915_GEM_DOMAIN_COMMAND
92 * and I915_GEM_DOMAIN_CPU in are invalidated at PTE write and
93 * I915_GEM_DOMAIN_RENDER and I915_GEM_DOMAIN_SAMPLER
94 * are flushed at any MI_FLUSH.
95 */
96
97 cmd = MI_FLUSH | MI_NO_WRITE_FLUSH;
98 if ((invalidate_domains|flush_domains) &
99 I915_GEM_DOMAIN_RENDER)
100 cmd &= ~MI_NO_WRITE_FLUSH;
a6c45cf0 101 if (INTEL_INFO(dev)->gen < 4) {
62fdfeaf
EA
102 /*
103 * On the 965, the sampler cache always gets flushed
104 * and this bit is reserved.
105 */
106 if (invalidate_domains & I915_GEM_DOMAIN_SAMPLER)
107 cmd |= MI_READ_FLUSH;
108 }
109 if (invalidate_domains & I915_GEM_DOMAIN_INSTRUCTION)
110 cmd |= MI_EXE_FLUSH;
111
112#if WATCH_EXEC
113 DRM_INFO("%s: queue flush %08x to ring\n", __func__, cmd);
114#endif
be26a10b 115 intel_ring_begin(dev, ring, 2);
8187a2b7
ZN
116 intel_ring_emit(dev, ring, cmd);
117 intel_ring_emit(dev, ring, MI_NOOP);
118 intel_ring_advance(dev, ring);
62fdfeaf 119 }
8187a2b7
ZN
120}
121
297b0c5b
CW
122static void ring_write_tail(struct drm_device *dev,
123 struct intel_ring_buffer *ring,
124 u32 value)
d46eefa2
XH
125{
126 drm_i915_private_t *dev_priv = dev->dev_private;
297b0c5b 127 I915_WRITE_TAIL(ring, value);
d46eefa2
XH
128}
129
79f321b7
DV
130u32 intel_ring_get_active_head(struct drm_device *dev,
131 struct intel_ring_buffer *ring)
8187a2b7
ZN
132{
133 drm_i915_private_t *dev_priv = dev->dev_private;
3d281d8c
DV
134 u32 acthd_reg = INTEL_INFO(dev)->gen >= 4 ?
135 RING_ACTHD(ring->mmio_base) : ACTHD;
8187a2b7
ZN
136
137 return I915_READ(acthd_reg);
138}
139
8187a2b7 140static int init_ring_common(struct drm_device *dev,
ab6f8e32 141 struct intel_ring_buffer *ring)
8187a2b7
ZN
142{
143 u32 head;
144 drm_i915_private_t *dev_priv = dev->dev_private;
145 struct drm_i915_gem_object *obj_priv;
146 obj_priv = to_intel_bo(ring->gem_object);
147
148 /* Stop the ring if it's running. */
7f2ab699 149 I915_WRITE_CTL(ring, 0);
570ef608 150 I915_WRITE_HEAD(ring, 0);
297b0c5b 151 ring->write_tail(dev, ring, 0);
8187a2b7
ZN
152
153 /* Initialize the ring. */
6c0e1c55 154 I915_WRITE_START(ring, obj_priv->gtt_offset);
570ef608 155 head = I915_READ_HEAD(ring) & HEAD_ADDR;
8187a2b7
ZN
156
157 /* G45 ring initialization fails to reset head to zero */
158 if (head != 0) {
159 DRM_ERROR("%s head not reset to zero "
160 "ctl %08x head %08x tail %08x start %08x\n",
161 ring->name,
7f2ab699 162 I915_READ_CTL(ring),
570ef608 163 I915_READ_HEAD(ring),
870e86dd 164 I915_READ_TAIL(ring),
6c0e1c55 165 I915_READ_START(ring));
8187a2b7 166
570ef608 167 I915_WRITE_HEAD(ring, 0);
8187a2b7
ZN
168
169 DRM_ERROR("%s head forced to zero "
170 "ctl %08x head %08x tail %08x start %08x\n",
171 ring->name,
7f2ab699 172 I915_READ_CTL(ring),
570ef608 173 I915_READ_HEAD(ring),
870e86dd 174 I915_READ_TAIL(ring),
6c0e1c55 175 I915_READ_START(ring));
8187a2b7
ZN
176 }
177
7f2ab699 178 I915_WRITE_CTL(ring,
8187a2b7 179 ((ring->gem_object->size - PAGE_SIZE) & RING_NR_PAGES)
08deebf9 180 | RING_REPORT_64K | RING_VALID);
8187a2b7 181
570ef608 182 head = I915_READ_HEAD(ring) & HEAD_ADDR;
8187a2b7
ZN
183 /* If the head is still not zero, the ring is dead */
184 if (head != 0) {
185 DRM_ERROR("%s initialization failed "
186 "ctl %08x head %08x tail %08x start %08x\n",
187 ring->name,
7f2ab699 188 I915_READ_CTL(ring),
570ef608 189 I915_READ_HEAD(ring),
870e86dd 190 I915_READ_TAIL(ring),
6c0e1c55 191 I915_READ_START(ring));
8187a2b7
ZN
192 return -EIO;
193 }
194
195 if (!drm_core_check_feature(dev, DRIVER_MODESET))
196 i915_kernel_lost_context(dev);
197 else {
570ef608 198 ring->head = I915_READ_HEAD(ring) & HEAD_ADDR;
870e86dd 199 ring->tail = I915_READ_TAIL(ring) & TAIL_ADDR;
8187a2b7
ZN
200 ring->space = ring->head - (ring->tail + 8);
201 if (ring->space < 0)
202 ring->space += ring->size;
203 }
204 return 0;
205}
206
207static int init_render_ring(struct drm_device *dev,
ab6f8e32 208 struct intel_ring_buffer *ring)
8187a2b7
ZN
209{
210 drm_i915_private_t *dev_priv = dev->dev_private;
211 int ret = init_ring_common(dev, ring);
a69ffdbf
ZW
212 int mode;
213
a6c45cf0 214 if (INTEL_INFO(dev)->gen > 3) {
a69ffdbf
ZW
215 mode = VS_TIMER_DISPATCH << 16 | VS_TIMER_DISPATCH;
216 if (IS_GEN6(dev))
217 mode |= MI_FLUSH_ENABLE << 16 | MI_FLUSH_ENABLE;
218 I915_WRITE(MI_MODE, mode);
8187a2b7
ZN
219 }
220 return ret;
221}
222
/*
 * Emit a four-dword PIPE_CONTROL (qword write with depth stall) targeting
 * @addr in the global GTT.  Must be used between BEGIN_LP_RING() and
 * ADVANCE_LP_RING(), with four dwords accounted for per invocation.
 *
 * @addr is parenthesized so that an expression argument combines
 * correctly with the '|' below.
 */
#define PIPE_CONTROL_FLUSH(addr)					\
do {									\
	OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |		\
		 PIPE_CONTROL_DEPTH_STALL | 2);				\
	OUT_RING((addr) | PIPE_CONTROL_GLOBAL_GTT);			\
	OUT_RING(0);							\
	OUT_RING(0);							\
} while (0)
62fdfeaf
EA
231
232/**
233 * Creates a new sequence number, emitting a write of it to the status page
234 * plus an interrupt, which will trigger i915_user_interrupt_handler.
235 *
236 * Must be called with struct_lock held.
237 *
238 * Returned sequence numbers are nonzero on success.
239 */
8187a2b7
ZN
240static u32
241render_ring_add_request(struct drm_device *dev,
ab6f8e32 242 struct intel_ring_buffer *ring,
ab6f8e32 243 u32 flush_domains)
62fdfeaf
EA
244{
245 drm_i915_private_t *dev_priv = dev->dev_private;
6f392d54
CW
246 u32 seqno;
247
248 seqno = i915_gem_get_seqno(dev);
ca76482e
ZW
249
250 if (IS_GEN6(dev)) {
251 BEGIN_LP_RING(6);
252 OUT_RING(GFX_OP_PIPE_CONTROL | 3);
253 OUT_RING(PIPE_CONTROL_QW_WRITE |
254 PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_IS_FLUSH |
255 PIPE_CONTROL_NOTIFY);
256 OUT_RING(dev_priv->seqno_gfx_addr | PIPE_CONTROL_GLOBAL_GTT);
257 OUT_RING(seqno);
258 OUT_RING(0);
259 OUT_RING(0);
260 ADVANCE_LP_RING();
261 } else if (HAS_PIPE_CONTROL(dev)) {
62fdfeaf
EA
262 u32 scratch_addr = dev_priv->seqno_gfx_addr + 128;
263
264 /*
265 * Workaround qword write incoherence by flushing the
266 * PIPE_NOTIFY buffers out to memory before requesting
267 * an interrupt.
268 */
269 BEGIN_LP_RING(32);
270 OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |
271 PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_TC_FLUSH);
272 OUT_RING(dev_priv->seqno_gfx_addr | PIPE_CONTROL_GLOBAL_GTT);
273 OUT_RING(seqno);
274 OUT_RING(0);
275 PIPE_CONTROL_FLUSH(scratch_addr);
276 scratch_addr += 128; /* write to separate cachelines */
277 PIPE_CONTROL_FLUSH(scratch_addr);
278 scratch_addr += 128;
279 PIPE_CONTROL_FLUSH(scratch_addr);
280 scratch_addr += 128;
281 PIPE_CONTROL_FLUSH(scratch_addr);
282 scratch_addr += 128;
283 PIPE_CONTROL_FLUSH(scratch_addr);
284 scratch_addr += 128;
285 PIPE_CONTROL_FLUSH(scratch_addr);
286 OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |
287 PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_TC_FLUSH |
288 PIPE_CONTROL_NOTIFY);
289 OUT_RING(dev_priv->seqno_gfx_addr | PIPE_CONTROL_GLOBAL_GTT);
290 OUT_RING(seqno);
291 OUT_RING(0);
292 ADVANCE_LP_RING();
293 } else {
294 BEGIN_LP_RING(4);
295 OUT_RING(MI_STORE_DWORD_INDEX);
296 OUT_RING(I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
297 OUT_RING(seqno);
298
299 OUT_RING(MI_USER_INTERRUPT);
300 ADVANCE_LP_RING();
301 }
302 return seqno;
303}
304
8187a2b7 305static u32
f787a5f5
CW
306render_ring_get_seqno(struct drm_device *dev,
307 struct intel_ring_buffer *ring)
8187a2b7
ZN
308{
309 drm_i915_private_t *dev_priv = (drm_i915_private_t *) dev->dev_private;
310 if (HAS_PIPE_CONTROL(dev))
311 return ((volatile u32 *)(dev_priv->seqno_page))[0];
312 else
313 return intel_read_status_page(ring, I915_GEM_HWS_INDEX);
314}
315
316static void
317render_ring_get_user_irq(struct drm_device *dev,
ab6f8e32 318 struct intel_ring_buffer *ring)
62fdfeaf
EA
319{
320 drm_i915_private_t *dev_priv = (drm_i915_private_t *) dev->dev_private;
321 unsigned long irqflags;
322
323 spin_lock_irqsave(&dev_priv->user_irq_lock, irqflags);
8187a2b7 324 if (dev->irq_enabled && (++ring->user_irq_refcount == 1)) {
62fdfeaf
EA
325 if (HAS_PCH_SPLIT(dev))
326 ironlake_enable_graphics_irq(dev_priv, GT_PIPE_NOTIFY);
327 else
328 i915_enable_irq(dev_priv, I915_USER_INTERRUPT);
329 }
330 spin_unlock_irqrestore(&dev_priv->user_irq_lock, irqflags);
331}
332
8187a2b7
ZN
333static void
334render_ring_put_user_irq(struct drm_device *dev,
ab6f8e32 335 struct intel_ring_buffer *ring)
62fdfeaf
EA
336{
337 drm_i915_private_t *dev_priv = (drm_i915_private_t *) dev->dev_private;
338 unsigned long irqflags;
339
340 spin_lock_irqsave(&dev_priv->user_irq_lock, irqflags);
8187a2b7
ZN
341 BUG_ON(dev->irq_enabled && ring->user_irq_refcount <= 0);
342 if (dev->irq_enabled && (--ring->user_irq_refcount == 0)) {
62fdfeaf
EA
343 if (HAS_PCH_SPLIT(dev))
344 ironlake_disable_graphics_irq(dev_priv, GT_PIPE_NOTIFY);
345 else
346 i915_disable_irq(dev_priv, I915_USER_INTERRUPT);
347 }
348 spin_unlock_irqrestore(&dev_priv->user_irq_lock, irqflags);
349}
350
447da187
DV
351void intel_ring_setup_status_page(struct drm_device *dev,
352 struct intel_ring_buffer *ring)
8187a2b7
ZN
353{
354 drm_i915_private_t *dev_priv = dev->dev_private;
355 if (IS_GEN6(dev)) {
3d281d8c
DV
356 I915_WRITE(RING_HWS_PGA_GEN6(ring->mmio_base),
357 ring->status_page.gfx_addr);
358 I915_READ(RING_HWS_PGA_GEN6(ring->mmio_base)); /* posting read */
8187a2b7 359 } else {
3d281d8c
DV
360 I915_WRITE(RING_HWS_PGA(ring->mmio_base),
361 ring->status_page.gfx_addr);
362 I915_READ(RING_HWS_PGA(ring->mmio_base)); /* posting read */
8187a2b7
ZN
363 }
364
365}
366
ab6f8e32 367static void
d1b851fc
ZN
368bsd_ring_flush(struct drm_device *dev,
369 struct intel_ring_buffer *ring,
370 u32 invalidate_domains,
371 u32 flush_domains)
372{
be26a10b 373 intel_ring_begin(dev, ring, 2);
d1b851fc
ZN
374 intel_ring_emit(dev, ring, MI_FLUSH);
375 intel_ring_emit(dev, ring, MI_NOOP);
376 intel_ring_advance(dev, ring);
377}
378
/*
 * .init hook for the BSD rings: nothing beyond the common ring bring-up.
 */
static int init_bsd_ring(struct drm_device *dev,
			 struct intel_ring_buffer *ring)
{
	int ret = init_ring_common(dev, ring);

	return ret;
}
384
385static u32
549f7365
CW
386ring_add_request(struct drm_device *dev,
387 struct intel_ring_buffer *ring,
388 u32 flush_domains)
d1b851fc
ZN
389{
390 u32 seqno;
6f392d54
CW
391
392 seqno = i915_gem_get_seqno(dev);
393
d1b851fc
ZN
394 intel_ring_begin(dev, ring, 4);
395 intel_ring_emit(dev, ring, MI_STORE_DWORD_INDEX);
396 intel_ring_emit(dev, ring,
397 I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
398 intel_ring_emit(dev, ring, seqno);
399 intel_ring_emit(dev, ring, MI_USER_INTERRUPT);
400 intel_ring_advance(dev, ring);
401
402 DRM_DEBUG_DRIVER("%s %d\n", ring->name, seqno);
403
404 return seqno;
405}
406
d1b851fc
ZN
/* .user_irq_get hook for the BSD rings: intentionally a no-op. */
static void
bsd_ring_get_user_irq(struct drm_device *dev,
		      struct intel_ring_buffer *ring)
{
	/* do nothing */
}
/* .user_irq_put hook for the BSD rings: intentionally a no-op. */
static void
bsd_ring_put_user_irq(struct drm_device *dev,
		      struct intel_ring_buffer *ring)
{
	/* do nothing */
}
419
420static u32
549f7365
CW
421ring_status_page_get_seqno(struct drm_device *dev,
422 struct intel_ring_buffer *ring)
d1b851fc
ZN
423{
424 return intel_read_status_page(ring, I915_GEM_HWS_INDEX);
425}
426
427static int
549f7365
CW
428ring_dispatch_gem_execbuffer(struct drm_device *dev,
429 struct intel_ring_buffer *ring,
430 struct drm_i915_gem_execbuffer2 *exec,
431 struct drm_clip_rect *cliprects,
432 uint64_t exec_offset)
d1b851fc
ZN
433{
434 uint32_t exec_start;
435 exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
436 intel_ring_begin(dev, ring, 2);
437 intel_ring_emit(dev, ring, MI_BATCH_BUFFER_START |
438 (2 << 6) | MI_BATCH_NON_SECURE_I965);
439 intel_ring_emit(dev, ring, exec_start);
440 intel_ring_advance(dev, ring);
441 return 0;
442}
443
8187a2b7
ZN
444static int
445render_ring_dispatch_gem_execbuffer(struct drm_device *dev,
ab6f8e32
CW
446 struct intel_ring_buffer *ring,
447 struct drm_i915_gem_execbuffer2 *exec,
448 struct drm_clip_rect *cliprects,
449 uint64_t exec_offset)
62fdfeaf
EA
450{
451 drm_i915_private_t *dev_priv = dev->dev_private;
452 int nbox = exec->num_cliprects;
453 int i = 0, count;
454 uint32_t exec_start, exec_len;
62fdfeaf
EA
455 exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
456 exec_len = (uint32_t) exec->batch_len;
457
6f392d54 458 trace_i915_gem_request_submit(dev, dev_priv->next_seqno + 1);
62fdfeaf
EA
459
460 count = nbox ? nbox : 1;
461
462 for (i = 0; i < count; i++) {
463 if (i < nbox) {
464 int ret = i915_emit_box(dev, cliprects, i,
465 exec->DR1, exec->DR4);
466 if (ret)
467 return ret;
468 }
469
470 if (IS_I830(dev) || IS_845G(dev)) {
8187a2b7
ZN
471 intel_ring_begin(dev, ring, 4);
472 intel_ring_emit(dev, ring, MI_BATCH_BUFFER);
473 intel_ring_emit(dev, ring,
474 exec_start | MI_BATCH_NON_SECURE);
475 intel_ring_emit(dev, ring, exec_start + exec_len - 4);
476 intel_ring_emit(dev, ring, 0);
62fdfeaf 477 } else {
c7179667 478 intel_ring_begin(dev, ring, 2);
a6c45cf0 479 if (INTEL_INFO(dev)->gen >= 4) {
8187a2b7
ZN
480 intel_ring_emit(dev, ring,
481 MI_BATCH_BUFFER_START | (2 << 6)
482 | MI_BATCH_NON_SECURE_I965);
483 intel_ring_emit(dev, ring, exec_start);
62fdfeaf 484 } else {
8187a2b7
ZN
485 intel_ring_emit(dev, ring, MI_BATCH_BUFFER_START
486 | (2 << 6));
487 intel_ring_emit(dev, ring, exec_start |
488 MI_BATCH_NON_SECURE);
62fdfeaf 489 }
62fdfeaf 490 }
8187a2b7 491 intel_ring_advance(dev, ring);
62fdfeaf
EA
492 }
493
f00a3ddf 494 if (IS_G4X(dev) || IS_GEN5(dev)) {
1cafd347
ZN
495 intel_ring_begin(dev, ring, 2);
496 intel_ring_emit(dev, ring, MI_FLUSH |
497 MI_NO_WRITE_FLUSH |
498 MI_INVALIDATE_ISP );
499 intel_ring_emit(dev, ring, MI_NOOP);
500 intel_ring_advance(dev, ring);
501 }
62fdfeaf 502 /* XXX breadcrumb */
1cafd347 503
62fdfeaf
EA
504 return 0;
505}
506
8187a2b7 507static void cleanup_status_page(struct drm_device *dev,
ab6f8e32 508 struct intel_ring_buffer *ring)
62fdfeaf
EA
509{
510 drm_i915_private_t *dev_priv = dev->dev_private;
511 struct drm_gem_object *obj;
512 struct drm_i915_gem_object *obj_priv;
513
8187a2b7
ZN
514 obj = ring->status_page.obj;
515 if (obj == NULL)
62fdfeaf 516 return;
62fdfeaf
EA
517 obj_priv = to_intel_bo(obj);
518
519 kunmap(obj_priv->pages[0]);
520 i915_gem_object_unpin(obj);
521 drm_gem_object_unreference(obj);
8187a2b7 522 ring->status_page.obj = NULL;
62fdfeaf
EA
523
524 memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
62fdfeaf
EA
525}
526
8187a2b7 527static int init_status_page(struct drm_device *dev,
ab6f8e32 528 struct intel_ring_buffer *ring)
62fdfeaf
EA
529{
530 drm_i915_private_t *dev_priv = dev->dev_private;
531 struct drm_gem_object *obj;
532 struct drm_i915_gem_object *obj_priv;
533 int ret;
534
62fdfeaf
EA
535 obj = i915_gem_alloc_object(dev, 4096);
536 if (obj == NULL) {
537 DRM_ERROR("Failed to allocate status page\n");
538 ret = -ENOMEM;
539 goto err;
540 }
541 obj_priv = to_intel_bo(obj);
542 obj_priv->agp_type = AGP_USER_CACHED_MEMORY;
543
544 ret = i915_gem_object_pin(obj, 4096);
545 if (ret != 0) {
62fdfeaf
EA
546 goto err_unref;
547 }
548
8187a2b7
ZN
549 ring->status_page.gfx_addr = obj_priv->gtt_offset;
550 ring->status_page.page_addr = kmap(obj_priv->pages[0]);
551 if (ring->status_page.page_addr == NULL) {
62fdfeaf 552 memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
62fdfeaf
EA
553 goto err_unpin;
554 }
8187a2b7
ZN
555 ring->status_page.obj = obj;
556 memset(ring->status_page.page_addr, 0, PAGE_SIZE);
62fdfeaf 557
447da187 558 intel_ring_setup_status_page(dev, ring);
8187a2b7
ZN
559 DRM_DEBUG_DRIVER("%s hws offset: 0x%08x\n",
560 ring->name, ring->status_page.gfx_addr);
62fdfeaf
EA
561
562 return 0;
563
564err_unpin:
565 i915_gem_object_unpin(obj);
566err_unref:
567 drm_gem_object_unreference(obj);
568err:
8187a2b7 569 return ret;
62fdfeaf
EA
570}
571
8187a2b7 572int intel_init_ring_buffer(struct drm_device *dev,
ab6f8e32 573 struct intel_ring_buffer *ring)
62fdfeaf 574{
870e86dd 575 struct drm_i915_private *dev_priv = dev->dev_private;
8187a2b7
ZN
576 struct drm_i915_gem_object *obj_priv;
577 struct drm_gem_object *obj;
dd785e35
CW
578 int ret;
579
8187a2b7 580 ring->dev = dev;
23bc5982
CW
581 INIT_LIST_HEAD(&ring->active_list);
582 INIT_LIST_HEAD(&ring->request_list);
64193406 583 INIT_LIST_HEAD(&ring->gpu_write_list);
62fdfeaf 584
8187a2b7
ZN
585 if (I915_NEED_GFX_HWS(dev)) {
586 ret = init_status_page(dev, ring);
587 if (ret)
588 return ret;
589 }
62fdfeaf 590
8187a2b7 591 obj = i915_gem_alloc_object(dev, ring->size);
62fdfeaf
EA
592 if (obj == NULL) {
593 DRM_ERROR("Failed to allocate ringbuffer\n");
8187a2b7 594 ret = -ENOMEM;
dd785e35 595 goto err_hws;
62fdfeaf 596 }
62fdfeaf 597
8187a2b7
ZN
598 ring->gem_object = obj;
599
a9db5c8f 600 ret = i915_gem_object_pin(obj, PAGE_SIZE);
dd785e35
CW
601 if (ret)
602 goto err_unref;
62fdfeaf 603
8187a2b7
ZN
604 obj_priv = to_intel_bo(obj);
605 ring->map.size = ring->size;
62fdfeaf 606 ring->map.offset = dev->agp->base + obj_priv->gtt_offset;
62fdfeaf
EA
607 ring->map.type = 0;
608 ring->map.flags = 0;
609 ring->map.mtrr = 0;
610
611 drm_core_ioremap_wc(&ring->map, dev);
612 if (ring->map.handle == NULL) {
613 DRM_ERROR("Failed to map ringbuffer.\n");
8187a2b7 614 ret = -EINVAL;
dd785e35 615 goto err_unpin;
62fdfeaf
EA
616 }
617
8187a2b7
ZN
618 ring->virtual_start = ring->map.handle;
619 ret = ring->init(dev, ring);
dd785e35
CW
620 if (ret)
621 goto err_unmap;
62fdfeaf 622
62fdfeaf
EA
623 if (!drm_core_check_feature(dev, DRIVER_MODESET))
624 i915_kernel_lost_context(dev);
625 else {
570ef608 626 ring->head = I915_READ_HEAD(ring) & HEAD_ADDR;
870e86dd 627 ring->tail = I915_READ_TAIL(ring) & TAIL_ADDR;
62fdfeaf
EA
628 ring->space = ring->head - (ring->tail + 8);
629 if (ring->space < 0)
8187a2b7 630 ring->space += ring->size;
62fdfeaf 631 }
8187a2b7 632 return ret;
dd785e35
CW
633
634err_unmap:
635 drm_core_ioremapfree(&ring->map, dev);
636err_unpin:
637 i915_gem_object_unpin(obj);
638err_unref:
639 drm_gem_object_unreference(obj);
640 ring->gem_object = NULL;
641err_hws:
8187a2b7
ZN
642 cleanup_status_page(dev, ring);
643 return ret;
62fdfeaf
EA
644}
645
8187a2b7 646void intel_cleanup_ring_buffer(struct drm_device *dev,
ab6f8e32 647 struct intel_ring_buffer *ring)
62fdfeaf 648{
8187a2b7 649 if (ring->gem_object == NULL)
62fdfeaf
EA
650 return;
651
8187a2b7 652 drm_core_ioremapfree(&ring->map, dev);
62fdfeaf 653
8187a2b7
ZN
654 i915_gem_object_unpin(ring->gem_object);
655 drm_gem_object_unreference(ring->gem_object);
656 ring->gem_object = NULL;
55889788
CW
657
658 if (ring->cleanup)
659 ring->cleanup(ring);
660
8187a2b7 661 cleanup_status_page(dev, ring);
62fdfeaf
EA
662}
663
ab6f8e32
CW
664static int intel_wrap_ring_buffer(struct drm_device *dev,
665 struct intel_ring_buffer *ring)
62fdfeaf 666{
8187a2b7 667 unsigned int *virt;
62fdfeaf 668 int rem;
8187a2b7 669 rem = ring->size - ring->tail;
62fdfeaf 670
8187a2b7
ZN
671 if (ring->space < rem) {
672 int ret = intel_wait_ring_buffer(dev, ring, rem);
62fdfeaf
EA
673 if (ret)
674 return ret;
675 }
62fdfeaf 676
8187a2b7 677 virt = (unsigned int *)(ring->virtual_start + ring->tail);
1741dd4a
CW
678 rem /= 8;
679 while (rem--) {
62fdfeaf 680 *virt++ = MI_NOOP;
1741dd4a
CW
681 *virt++ = MI_NOOP;
682 }
62fdfeaf 683
8187a2b7 684 ring->tail = 0;
43ed340a 685 ring->space = ring->head - 8;
62fdfeaf
EA
686
687 return 0;
688}
689
8187a2b7 690int intel_wait_ring_buffer(struct drm_device *dev,
ab6f8e32 691 struct intel_ring_buffer *ring, int n)
62fdfeaf 692{
8187a2b7 693 unsigned long end;
570ef608 694 drm_i915_private_t *dev_priv = dev->dev_private;
08deebf9
CW
695 u32 head;
696
697 head = intel_read_status_page(ring, 4);
698 if (head) {
699 ring->head = head & HEAD_ADDR;
700 ring->space = ring->head - (ring->tail + 8);
701 if (ring->space < 0)
702 ring->space += ring->size;
703 if (ring->space >= n)
704 return 0;
705 }
62fdfeaf
EA
706
707 trace_i915_ring_wait_begin (dev);
8187a2b7
ZN
708 end = jiffies + 3 * HZ;
709 do {
570ef608 710 ring->head = I915_READ_HEAD(ring) & HEAD_ADDR;
62fdfeaf
EA
711 ring->space = ring->head - (ring->tail + 8);
712 if (ring->space < 0)
8187a2b7 713 ring->space += ring->size;
62fdfeaf
EA
714 if (ring->space >= n) {
715 trace_i915_ring_wait_end (dev);
716 return 0;
717 }
718
719 if (dev->primary->master) {
720 struct drm_i915_master_private *master_priv = dev->primary->master->driver_priv;
721 if (master_priv->sarea_priv)
722 master_priv->sarea_priv->perf_boxes |= I915_BOX_WAIT;
723 }
d1b851fc 724
e60a0b10 725 msleep(1);
8187a2b7
ZN
726 } while (!time_after(jiffies, end));
727 trace_i915_ring_wait_end (dev);
728 return -EBUSY;
729}
62fdfeaf 730
8187a2b7 731void intel_ring_begin(struct drm_device *dev,
ab6f8e32
CW
732 struct intel_ring_buffer *ring,
733 int num_dwords)
8187a2b7 734{
be26a10b 735 int n = 4*num_dwords;
8187a2b7
ZN
736 if (unlikely(ring->tail + n > ring->size))
737 intel_wrap_ring_buffer(dev, ring);
738 if (unlikely(ring->space < n))
739 intel_wait_ring_buffer(dev, ring, n);
d97ed339
CW
740
741 ring->space -= n;
8187a2b7 742}
62fdfeaf 743
8187a2b7 744void intel_ring_advance(struct drm_device *dev,
ab6f8e32 745 struct intel_ring_buffer *ring)
8187a2b7 746{
d97ed339 747 ring->tail &= ring->size - 1;
297b0c5b 748 ring->write_tail(dev, ring, ring->tail);
8187a2b7 749}
62fdfeaf 750
e070868e 751static const struct intel_ring_buffer render_ring = {
8187a2b7 752 .name = "render ring",
9220434a 753 .id = RING_RENDER,
333e9fe9 754 .mmio_base = RENDER_RING_BASE,
8187a2b7 755 .size = 32 * PAGE_SIZE,
8187a2b7 756 .init = init_render_ring,
297b0c5b 757 .write_tail = ring_write_tail,
8187a2b7
ZN
758 .flush = render_ring_flush,
759 .add_request = render_ring_add_request,
f787a5f5 760 .get_seqno = render_ring_get_seqno,
8187a2b7
ZN
761 .user_irq_get = render_ring_get_user_irq,
762 .user_irq_put = render_ring_put_user_irq,
763 .dispatch_gem_execbuffer = render_ring_dispatch_gem_execbuffer,
8187a2b7 764};
d1b851fc
ZN
765
766/* ring buffer for bit-stream decoder */
767
e070868e 768static const struct intel_ring_buffer bsd_ring = {
d1b851fc 769 .name = "bsd ring",
9220434a 770 .id = RING_BSD,
333e9fe9 771 .mmio_base = BSD_RING_BASE,
d1b851fc 772 .size = 32 * PAGE_SIZE,
d1b851fc 773 .init = init_bsd_ring,
297b0c5b 774 .write_tail = ring_write_tail,
d1b851fc 775 .flush = bsd_ring_flush,
549f7365
CW
776 .add_request = ring_add_request,
777 .get_seqno = ring_status_page_get_seqno,
d1b851fc
ZN
778 .user_irq_get = bsd_ring_get_user_irq,
779 .user_irq_put = bsd_ring_put_user_irq,
549f7365 780 .dispatch_gem_execbuffer = ring_dispatch_gem_execbuffer,
d1b851fc 781};
5c1143bb 782
881f47b6 783
297b0c5b
CW
784static void gen6_bsd_ring_write_tail(struct drm_device *dev,
785 struct intel_ring_buffer *ring,
786 u32 value)
881f47b6
XH
787{
788 drm_i915_private_t *dev_priv = dev->dev_private;
789
790 /* Every tail move must follow the sequence below */
791 I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL,
792 GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_MODIFY_MASK |
793 GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_DISABLE);
794 I915_WRITE(GEN6_BSD_RNCID, 0x0);
795
796 if (wait_for((I915_READ(GEN6_BSD_SLEEP_PSMI_CONTROL) &
797 GEN6_BSD_SLEEP_PSMI_CONTROL_IDLE_INDICATOR) == 0,
798 50))
799 DRM_ERROR("timed out waiting for IDLE Indicator\n");
800
870e86dd 801 I915_WRITE_TAIL(ring, value);
881f47b6
XH
802 I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL,
803 GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_MODIFY_MASK |
804 GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_ENABLE);
805}
806
549f7365
CW
807static void gen6_ring_flush(struct drm_device *dev,
808 struct intel_ring_buffer *ring,
809 u32 invalidate_domains,
810 u32 flush_domains)
881f47b6
XH
811{
812 intel_ring_begin(dev, ring, 4);
813 intel_ring_emit(dev, ring, MI_FLUSH_DW);
814 intel_ring_emit(dev, ring, 0);
815 intel_ring_emit(dev, ring, 0);
816 intel_ring_emit(dev, ring, 0);
817 intel_ring_advance(dev, ring);
818}
819
820static int
549f7365
CW
821gen6_ring_dispatch_gem_execbuffer(struct drm_device *dev,
822 struct intel_ring_buffer *ring,
823 struct drm_i915_gem_execbuffer2 *exec,
824 struct drm_clip_rect *cliprects,
825 uint64_t exec_offset)
881f47b6
XH
826{
827 uint32_t exec_start;
ab6f8e32 828
881f47b6 829 exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
ab6f8e32 830
881f47b6 831 intel_ring_begin(dev, ring, 2);
ab6f8e32
CW
832 intel_ring_emit(dev, ring,
833 MI_BATCH_BUFFER_START | MI_BATCH_NON_SECURE_I965);
834 /* bit0-7 is the length on GEN6+ */
881f47b6
XH
835 intel_ring_emit(dev, ring, exec_start);
836 intel_ring_advance(dev, ring);
ab6f8e32 837
881f47b6
XH
838 return 0;
839}
840
841/* ring buffer for Video Codec for Gen6+ */
e070868e 842static const struct intel_ring_buffer gen6_bsd_ring = {
881f47b6
XH
843 .name = "gen6 bsd ring",
844 .id = RING_BSD,
333e9fe9 845 .mmio_base = GEN6_BSD_RING_BASE,
881f47b6 846 .size = 32 * PAGE_SIZE,
881f47b6 847 .init = init_bsd_ring,
297b0c5b 848 .write_tail = gen6_bsd_ring_write_tail,
549f7365
CW
849 .flush = gen6_ring_flush,
850 .add_request = ring_add_request,
851 .get_seqno = ring_status_page_get_seqno,
881f47b6
XH
852 .user_irq_get = bsd_ring_get_user_irq,
853 .user_irq_put = bsd_ring_put_user_irq,
549f7365
CW
854 .dispatch_gem_execbuffer = gen6_ring_dispatch_gem_execbuffer,
855};
856
857/* Blitter support (SandyBridge+) */
858
/* .user_irq_get hook for the blitter ring: intentionally a no-op. */
static void
blt_ring_get_user_irq(struct drm_device *dev,
		      struct intel_ring_buffer *ring)
{
	/* do nothing */
}
/* .user_irq_put hook for the blitter ring: intentionally a no-op. */
static void
blt_ring_put_user_irq(struct drm_device *dev,
		      struct intel_ring_buffer *ring)
{
	/* do nothing */
}
871
55889788
CW
872
/*
 * Workaround for some steppings of SNB: each time the BLT engine ring
 * tail is moved, the first command parsed from the ring must be
 * MI_BATCH_BUFFER_START.
 *
 * Evaluates to true on gen6 devices whose PCI revision is below 8.
 * @dev is parenthesized so that any pointer expression can be passed.
 */
#define NEED_BLT_WORKAROUND(dev) \
	(IS_GEN6(dev) && ((dev)->pdev->revision < 8))
880
881static inline struct drm_i915_gem_object *
882to_blt_workaround(struct intel_ring_buffer *ring)
883{
884 return ring->private;
885}
886
887static int blt_ring_init(struct drm_device *dev,
888 struct intel_ring_buffer *ring)
889{
890 if (NEED_BLT_WORKAROUND(dev)) {
891 struct drm_i915_gem_object *obj;
892 u32 __iomem *ptr;
893 int ret;
894
895 obj = to_intel_bo(i915_gem_alloc_object(dev, 4096));
896 if (obj == NULL)
897 return -ENOMEM;
898
899 ret = i915_gem_object_pin(&obj->base, 4096);
900 if (ret) {
901 drm_gem_object_unreference(&obj->base);
902 return ret;
903 }
904
905 ptr = kmap(obj->pages[0]);
906 iowrite32(MI_BATCH_BUFFER_END, ptr);
907 iowrite32(MI_NOOP, ptr+1);
908 kunmap(obj->pages[0]);
909
910 ret = i915_gem_object_set_to_gtt_domain(&obj->base, false);
911 if (ret) {
912 i915_gem_object_unpin(&obj->base);
913 drm_gem_object_unreference(&obj->base);
914 return ret;
915 }
916
917 ring->private = obj;
918 }
919
920 return init_ring_common(dev, ring);
921}
922
923static void blt_ring_begin(struct drm_device *dev,
924 struct intel_ring_buffer *ring,
925 int num_dwords)
926{
927 if (ring->private) {
928 intel_ring_begin(dev, ring, num_dwords+2);
929 intel_ring_emit(dev, ring, MI_BATCH_BUFFER_START);
930 intel_ring_emit(dev, ring, to_blt_workaround(ring)->gtt_offset);
931 } else
932 intel_ring_begin(dev, ring, 4);
933}
934
935static void blt_ring_flush(struct drm_device *dev,
936 struct intel_ring_buffer *ring,
937 u32 invalidate_domains,
938 u32 flush_domains)
939{
940 blt_ring_begin(dev, ring, 4);
941 intel_ring_emit(dev, ring, MI_FLUSH_DW);
942 intel_ring_emit(dev, ring, 0);
943 intel_ring_emit(dev, ring, 0);
944 intel_ring_emit(dev, ring, 0);
945 intel_ring_advance(dev, ring);
946}
947
948static u32
949blt_ring_add_request(struct drm_device *dev,
950 struct intel_ring_buffer *ring,
951 u32 flush_domains)
952{
953 u32 seqno = i915_gem_get_seqno(dev);
954
955 blt_ring_begin(dev, ring, 4);
956 intel_ring_emit(dev, ring, MI_STORE_DWORD_INDEX);
957 intel_ring_emit(dev, ring,
958 I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
959 intel_ring_emit(dev, ring, seqno);
960 intel_ring_emit(dev, ring, MI_USER_INTERRUPT);
961 intel_ring_advance(dev, ring);
962
963 DRM_DEBUG_DRIVER("%s %d\n", ring->name, seqno);
964 return seqno;
965}
966
967static void blt_ring_cleanup(struct intel_ring_buffer *ring)
968{
969 if (!ring->private)
970 return;
971
972 i915_gem_object_unpin(ring->private);
973 drm_gem_object_unreference(ring->private);
974 ring->private = NULL;
975}
976
549f7365
CW
977static const struct intel_ring_buffer gen6_blt_ring = {
978 .name = "blt ring",
979 .id = RING_BLT,
980 .mmio_base = BLT_RING_BASE,
981 .size = 32 * PAGE_SIZE,
55889788 982 .init = blt_ring_init,
297b0c5b 983 .write_tail = ring_write_tail,
55889788
CW
984 .flush = blt_ring_flush,
985 .add_request = blt_ring_add_request,
549f7365
CW
986 .get_seqno = ring_status_page_get_seqno,
987 .user_irq_get = blt_ring_get_user_irq,
988 .user_irq_put = blt_ring_put_user_irq,
989 .dispatch_gem_execbuffer = gen6_ring_dispatch_gem_execbuffer,
55889788 990 .cleanup = blt_ring_cleanup,
881f47b6
XH
991};
992
5c1143bb
XH
993int intel_init_render_ring_buffer(struct drm_device *dev)
994{
995 drm_i915_private_t *dev_priv = dev->dev_private;
996
997 dev_priv->render_ring = render_ring;
998
999 if (!I915_NEED_GFX_HWS(dev)) {
1000 dev_priv->render_ring.status_page.page_addr
1001 = dev_priv->status_page_dmah->vaddr;
1002 memset(dev_priv->render_ring.status_page.page_addr,
1003 0, PAGE_SIZE);
1004 }
1005
1006 return intel_init_ring_buffer(dev, &dev_priv->render_ring);
1007}
1008
1009int intel_init_bsd_ring_buffer(struct drm_device *dev)
1010{
1011 drm_i915_private_t *dev_priv = dev->dev_private;
1012
881f47b6
XH
1013 if (IS_GEN6(dev))
1014 dev_priv->bsd_ring = gen6_bsd_ring;
1015 else
1016 dev_priv->bsd_ring = bsd_ring;
5c1143bb
XH
1017
1018 return intel_init_ring_buffer(dev, &dev_priv->bsd_ring);
1019}
549f7365
CW
1020
1021int intel_init_blt_ring_buffer(struct drm_device *dev)
1022{
1023 drm_i915_private_t *dev_priv = dev->dev_private;
1024
1025 dev_priv->blt_ring = gen6_blt_ring;
1026
1027 return intel_init_ring_buffer(dev, &dev_priv->blt_ring);
1028}
This page took 0.189741 seconds and 5 git commands to generate.