1 /* via_dma.c -- DMA support for the VIA Unichrome/Pro
3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
6 * Copyright 2004 Digeo, Inc., Palo Alto, CA, U.S.A.
9 * Copyright 2004 The Unichrome project.
10 * All Rights Reserved.
12 * Permission is hereby granted, free of charge, to any person obtaining a
13 * copy of this software and associated documentation files (the "Software"),
14 * to deal in the Software without restriction, including without limitation
15 * the rights to use, copy, modify, merge, publish, distribute, sub license,
16 * and/or sell copies of the Software, and to permit persons to whom the
17 * Software is furnished to do so, subject to the following conditions:
19 * The above copyright notice and this permission notice (including the
20 * next paragraph) shall be included in all copies or substantial portions
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
24 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
25 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
26 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
27 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
28 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
29 * USE OR OTHER DEALINGS IN THE SOFTWARE.
41 #include "via_3d_reg.h"
43 #define SetReg2DAGP(nReg, nData) { \
44 *((uint32_t *)(vb)) = ((nReg) >> 2) | HALCYON_HEADER1; \
45 *((uint32_t *)(vb) + 1) = (nData); \
46 vb = ((uint32_t *)vb) + 2; \
47 dev_priv->dma_low +=8; \
50 #define via_flush_write_combine() DRM_MEMORYBARRIER()
52 #define VIA_OUT_RING_QW(w1,w2) \
55 dev_priv->dma_low += 8;
57 static void via_cmdbuf_start(drm_via_private_t *dev_priv);
58 static void via_cmdbuf_pause(drm_via_private_t *dev_priv);
59 static void via_cmdbuf_reset(drm_via_private_t *dev_priv);
60 static void via_cmdbuf_rewind(drm_via_private_t *dev_priv);
61 static int via_wait_idle(drm_via_private_t *dev_priv);
62 static void via_pad_cache(drm_via_private_t *dev_priv, int qwords);
66 * Free space in command buffer.
69 static uint32_t via_cmdbuf_space(drm_via_private_t *dev_priv)
71 uint32_t agp_base = dev_priv->dma_offset + (uint32_t) dev_priv->agpAddr;
72 uint32_t hw_addr = *(dev_priv->hw_addr_ptr) - agp_base;
74 return ((hw_addr <= dev_priv->dma_low) ?
75 (dev_priv->dma_high + hw_addr - dev_priv->dma_low) :
76 (hw_addr - dev_priv->dma_low));
80 * How much does the command regulator lag behind?
83 static uint32_t via_cmdbuf_lag(drm_via_private_t *dev_priv)
85 uint32_t agp_base = dev_priv->dma_offset + (uint32_t) dev_priv->agpAddr;
86 uint32_t hw_addr = *(dev_priv->hw_addr_ptr) - agp_base;
88 return ((hw_addr <= dev_priv->dma_low) ?
89 (dev_priv->dma_low - hw_addr) :
90 (dev_priv->dma_wrap + dev_priv->dma_low - hw_addr));
94 * Check that the given size fits in the buffer, otherwise wait.
98 via_cmdbuf_wait(drm_via_private_t * dev_priv, unsigned int size)
100 uint32_t agp_base = dev_priv->dma_offset + (uint32_t) dev_priv->agpAddr;
101 uint32_t cur_addr, hw_addr, next_addr;
102 volatile uint32_t *hw_addr_ptr;
104 hw_addr_ptr = dev_priv->hw_addr_ptr;
105 cur_addr = dev_priv->dma_low;
106 next_addr = cur_addr + size + 512 * 1024;
109 hw_addr = *hw_addr_ptr - agp_base;
112 ("via_cmdbuf_wait timed out hw %x cur_addr %x next_addr %x\n",
113 hw_addr, cur_addr, next_addr);
116 } while ((cur_addr < hw_addr) && (next_addr >= hw_addr));
122 * Checks whether buffer head has reach the end. Rewind the ring buffer
125 * Returns virtual pointer to ring buffer.
128 static inline uint32_t *via_check_dma(drm_via_private_t * dev_priv,
131 if ((dev_priv->dma_low + size + 4 * CMDBUF_ALIGNMENT_SIZE) >
132 dev_priv->dma_high) {
133 via_cmdbuf_rewind(dev_priv);
135 if (via_cmdbuf_wait(dev_priv, size) != 0) {
139 return (uint32_t *) (dev_priv->dma_ptr + dev_priv->dma_low);
142 int via_dma_cleanup(struct drm_device * dev)
144 if (dev->dev_private) {
145 drm_via_private_t *dev_priv =
146 (drm_via_private_t *) dev->dev_private;
148 if (dev_priv->ring.virtual_start) {
149 via_cmdbuf_reset(dev_priv);
151 drm_core_ioremapfree(&dev_priv->ring.map, dev);
152 dev_priv->ring.virtual_start = NULL;
160 static int via_initialize(struct drm_device * dev,
161 drm_via_private_t * dev_priv,
162 drm_via_dma_init_t * init)
164 if (!dev_priv || !dev_priv->mmio) {
165 DRM_ERROR("via_dma_init called before via_map_init\n");
169 if (dev_priv->ring.virtual_start != NULL) {
170 DRM_ERROR("called again without calling cleanup\n");
174 if (!dev->agp || !dev->agp->base) {
175 DRM_ERROR("called with no agp memory available\n");
179 if (dev_priv->chipset == VIA_DX9_0) {
180 DRM_ERROR("AGP DMA is not supported on this chip\n");
184 dev_priv->ring.map.offset = dev->agp->base + init->offset;
185 dev_priv->ring.map.size = init->size;
186 dev_priv->ring.map.type = 0;
187 dev_priv->ring.map.flags = 0;
188 dev_priv->ring.map.mtrr = 0;
190 drm_core_ioremap(&dev_priv->ring.map, dev);
192 if (dev_priv->ring.map.handle == NULL) {
193 via_dma_cleanup(dev);
194 DRM_ERROR("can not ioremap virtual address for"
199 dev_priv->ring.virtual_start = dev_priv->ring.map.handle;
201 dev_priv->dma_ptr = dev_priv->ring.virtual_start;
202 dev_priv->dma_low = 0;
203 dev_priv->dma_high = init->size;
204 dev_priv->dma_wrap = init->size;
205 dev_priv->dma_offset = init->offset;
206 dev_priv->last_pause_ptr = NULL;
207 dev_priv->hw_addr_ptr =
208 (volatile uint32_t *)((char *)dev_priv->mmio->handle +
209 init->reg_pause_addr);
211 via_cmdbuf_start(dev_priv);
216 static int via_dma_init(struct drm_device *dev, void *data, struct drm_file *file_priv)
218 drm_via_private_t *dev_priv = (drm_via_private_t *) dev->dev_private;
219 drm_via_dma_init_t *init = data;
222 switch (init->func) {
224 if (!DRM_SUSER(DRM_CURPROC))
227 retcode = via_initialize(dev, dev_priv, init);
229 case VIA_CLEANUP_DMA:
230 if (!DRM_SUSER(DRM_CURPROC))
233 retcode = via_dma_cleanup(dev);
235 case VIA_DMA_INITIALIZED:
236 retcode = (dev_priv->ring.virtual_start != NULL) ?
249 static int via_dispatch_cmdbuffer(struct drm_device * dev, drm_via_cmdbuffer_t * cmd)
251 drm_via_private_t *dev_priv;
255 dev_priv = (drm_via_private_t *) dev->dev_private;
257 if (dev_priv->ring.virtual_start == NULL) {
258 DRM_ERROR("called without initializing AGP ring buffer.\n");
262 if (cmd->size > VIA_PCI_BUF_SIZE) {
266 if (DRM_COPY_FROM_USER(dev_priv->pci_buf, cmd->buf, cmd->size))
270 * Running this function on AGP memory is dead slow. Therefore
271 * we run it on a temporary cacheable system memory buffer and
272 * copy it to AGP memory when ready.
276 via_verify_command_stream((uint32_t *)dev_priv->pci_buf,
277 cmd->size, dev, 1))) {
281 vb = via_check_dma(dev_priv, (cmd->size < 0x100) ? 0x102 : cmd->size);
286 memcpy(vb, dev_priv->pci_buf, cmd->size);
288 dev_priv->dma_low += cmd->size;
291 * Small submissions somehow stalls the CPU. (AGP cache effects?)
292 * pad to greater size.
295 if (cmd->size < 0x100)
296 via_pad_cache(dev_priv, (0x100 - cmd->size) >> 3);
297 via_cmdbuf_pause(dev_priv);
302 int via_driver_dma_quiescent(struct drm_device * dev)
304 drm_via_private_t *dev_priv = dev->dev_private;
306 if (!via_wait_idle(dev_priv)) {
312 static int via_flush_ioctl(struct drm_device *dev, void *data, struct drm_file *file_priv)
315 LOCK_TEST_WITH_RETURN(dev, file_priv);
317 return via_driver_dma_quiescent(dev);
320 static int via_cmdbuffer(struct drm_device *dev, void *data, struct drm_file *file_priv)
322 drm_via_cmdbuffer_t *cmdbuf = data;
325 LOCK_TEST_WITH_RETURN(dev, file_priv);
327 DRM_DEBUG("buf %p size %lu\n", cmdbuf->buf, cmdbuf->size);
329 ret = via_dispatch_cmdbuffer(dev, cmdbuf);
337 static int via_dispatch_pci_cmdbuffer(struct drm_device * dev,
338 drm_via_cmdbuffer_t * cmd)
340 drm_via_private_t *dev_priv = dev->dev_private;
343 if (cmd->size > VIA_PCI_BUF_SIZE) {
346 if (DRM_COPY_FROM_USER(dev_priv->pci_buf, cmd->buf, cmd->size))
350 via_verify_command_stream((uint32_t *) dev_priv->pci_buf,
351 cmd->size, dev, 0))) {
356 via_parse_command_stream(dev, (const uint32_t *)dev_priv->pci_buf,
361 static int via_pci_cmdbuffer(struct drm_device *dev, void *data, struct drm_file *file_priv)
363 drm_via_cmdbuffer_t *cmdbuf = data;
366 LOCK_TEST_WITH_RETURN(dev, file_priv);
368 DRM_DEBUG("buf %p size %lu\n", cmdbuf->buf, cmdbuf->size);
370 ret = via_dispatch_pci_cmdbuffer(dev, cmdbuf);
378 static inline uint32_t *via_align_buffer(drm_via_private_t * dev_priv,
379 uint32_t * vb, int qw_count)
381 for (; qw_count > 0; --qw_count) {
382 VIA_OUT_RING_QW(HC_DUMMY, HC_DUMMY);
388 * This function is used internally by ring buffer mangement code.
390 * Returns virtual pointer to ring buffer.
392 static inline uint32_t *via_get_dma(drm_via_private_t * dev_priv)
394 return (uint32_t *) (dev_priv->dma_ptr + dev_priv->dma_low);
398 * Hooks a segment of data into the tail of the ring-buffer by
399 * modifying the pause address stored in the buffer itself. If
400 * the regulator has already paused, restart it.
402 static int via_hook_segment(drm_via_private_t * dev_priv,
403 uint32_t pause_addr_hi, uint32_t pause_addr_lo,
407 volatile uint32_t *paused_at = dev_priv->last_pause_ptr;
411 via_flush_write_combine();
412 (void) *(volatile uint32_t *)(via_get_dma(dev_priv) -1);
413 *paused_at = pause_addr_lo;
414 via_flush_write_combine();
416 reader = *(dev_priv->hw_addr_ptr);
417 ptr = ((volatile char *)paused_at - dev_priv->dma_ptr) +
418 dev_priv->dma_offset + (uint32_t) dev_priv->agpAddr + 4;
419 dev_priv->last_pause_ptr = via_get_dma(dev_priv) - 1;
421 if ((ptr - reader) <= dev_priv->dma_diff ) {
423 while (!(paused = (VIA_READ(0x41c) & 0x80000000)) && count--);
426 if (paused && !no_pci_fire) {
427 reader = *(dev_priv->hw_addr_ptr);
428 if ((ptr - reader) == dev_priv->dma_diff) {
431 * There is a concern that these writes may stall the PCI bus
432 * if the GPU is not idle. However, idling the GPU first
433 * doesn't make a difference.
436 VIA_WRITE(VIA_REG_TRANSET, (HC_ParaType_PreCR << 16));
437 VIA_WRITE(VIA_REG_TRANSPACE, pause_addr_hi);
438 VIA_WRITE(VIA_REG_TRANSPACE, pause_addr_lo);
439 VIA_READ(VIA_REG_TRANSPACE);
448 static int via_wait_idle(drm_via_private_t *dev_priv)
450 int count = 10000000;
452 while (!(VIA_READ(VIA_REG_STATUS) & VIA_VR_QUEUE_BUSY) && count--);
454 while (count-- && (VIA_READ(VIA_REG_STATUS) &
455 (VIA_CMD_RGTR_BUSY | VIA_2D_ENG_BUSY |
460 static uint32_t *via_align_cmd(drm_via_private_t *dev_priv, uint32_t cmd_type,
461 uint32_t addr, uint32_t *cmd_addr_hi,
462 uint32_t *cmd_addr_lo, int skip_wait)
465 uint32_t cmd_addr, addr_lo, addr_hi;
467 uint32_t qw_pad_count;
470 via_cmdbuf_wait(dev_priv, 2 * CMDBUF_ALIGNMENT_SIZE);
472 vb = via_get_dma(dev_priv);
473 VIA_OUT_RING_QW(HC_HEADER2 | ((VIA_REG_TRANSET >> 2) << 12) |
474 (VIA_REG_TRANSPACE >> 2), HC_ParaType_PreCR << 16);
476 agp_base = dev_priv->dma_offset + (uint32_t) dev_priv->agpAddr;
477 qw_pad_count = (CMDBUF_ALIGNMENT_SIZE >> 3) -
478 ((dev_priv->dma_low & CMDBUF_ALIGNMENT_MASK) >> 3);
480 cmd_addr = (addr) ? addr :
481 agp_base + dev_priv->dma_low - 8 + (qw_pad_count << 3);
482 addr_lo = ((HC_SubA_HAGPBpL << 24) | (cmd_type & HC_HAGPBpID_MASK) |
483 (cmd_addr & HC_HAGPBpL_MASK));
484 addr_hi = ((HC_SubA_HAGPBpH << 24) | (cmd_addr >> 24));
486 vb = via_align_buffer(dev_priv, vb, qw_pad_count - 1);
487 VIA_OUT_RING_QW(*cmd_addr_hi = addr_hi, *cmd_addr_lo = addr_lo);
491 static void via_cmdbuf_start(drm_via_private_t * dev_priv)
493 uint32_t pause_addr_lo, pause_addr_hi;
494 uint32_t start_addr, start_addr_lo;
495 uint32_t end_addr, end_addr_lo;
502 dev_priv->dma_low = 0;
504 agp_base = dev_priv->dma_offset + (uint32_t) dev_priv->agpAddr;
505 start_addr = agp_base;
506 end_addr = agp_base + dev_priv->dma_high;
508 start_addr_lo = ((HC_SubA_HAGPBstL << 24) | (start_addr & 0xFFFFFF));
509 end_addr_lo = ((HC_SubA_HAGPBendL << 24) | (end_addr & 0xFFFFFF));
510 command = ((HC_SubA_HAGPCMNT << 24) | (start_addr >> 24) |
511 ((end_addr & 0xff000000) >> 16));
513 dev_priv->last_pause_ptr =
514 via_align_cmd(dev_priv, HC_HAGPBpID_PAUSE, 0,
515 &pause_addr_hi, & pause_addr_lo, 1) - 1;
517 via_flush_write_combine();
518 (void) *(volatile uint32_t *)dev_priv->last_pause_ptr;
520 VIA_WRITE(VIA_REG_TRANSET, (HC_ParaType_PreCR << 16));
521 VIA_WRITE(VIA_REG_TRANSPACE, command);
522 VIA_WRITE(VIA_REG_TRANSPACE, start_addr_lo);
523 VIA_WRITE(VIA_REG_TRANSPACE, end_addr_lo);
525 VIA_WRITE(VIA_REG_TRANSPACE, pause_addr_hi);
526 VIA_WRITE(VIA_REG_TRANSPACE, pause_addr_lo);
527 DRM_WRITEMEMORYBARRIER();
528 VIA_WRITE(VIA_REG_TRANSPACE, command | HC_HAGPCMNT_MASK);
529 VIA_READ(VIA_REG_TRANSPACE);
531 dev_priv->dma_diff = 0;
534 while (!(VIA_READ(0x41c) & 0x80000000) && count--);
536 reader = *(dev_priv->hw_addr_ptr);
537 ptr = ((volatile char *)dev_priv->last_pause_ptr - dev_priv->dma_ptr) +
538 dev_priv->dma_offset + (uint32_t) dev_priv->agpAddr + 4;
541 * This is the difference between where we tell the
542 * command reader to pause and where it actually pauses.
543 * This differs between hw implementation so we need to
547 dev_priv->dma_diff = ptr - reader;
550 static void via_pad_cache(drm_via_private_t *dev_priv, int qwords)
554 via_cmdbuf_wait(dev_priv, qwords + 2);
555 vb = via_get_dma(dev_priv);
556 VIA_OUT_RING_QW(HC_HEADER2, HC_ParaType_NotTex << 16);
557 via_align_buffer(dev_priv, vb, qwords);
560 static inline void via_dummy_bitblt(drm_via_private_t * dev_priv)
562 uint32_t *vb = via_get_dma(dev_priv);
563 SetReg2DAGP(0x0C, (0 | (0 << 16)));
564 SetReg2DAGP(0x10, 0 | (0 << 16));
565 SetReg2DAGP(0x0, 0x1 | 0x2000 | 0xAA000000);
568 static void via_cmdbuf_jump(drm_via_private_t * dev_priv)
571 uint32_t pause_addr_lo, pause_addr_hi;
572 uint32_t jump_addr_lo, jump_addr_hi;
573 volatile uint32_t *last_pause_ptr;
575 agp_base = dev_priv->dma_offset + (uint32_t) dev_priv->agpAddr;
576 via_align_cmd(dev_priv, HC_HAGPBpID_JUMP, 0, &jump_addr_hi,
579 dev_priv->dma_wrap = dev_priv->dma_low;
583 * Wrap command buffer to the beginning.
586 dev_priv->dma_low = 0;
587 if (via_cmdbuf_wait(dev_priv, CMDBUF_ALIGNMENT_SIZE) != 0) {
588 DRM_ERROR("via_cmdbuf_jump failed\n");
591 via_dummy_bitblt(dev_priv);
592 via_dummy_bitblt(dev_priv);
593 last_pause_ptr = via_align_cmd(dev_priv, HC_HAGPBpID_PAUSE, 0, &pause_addr_hi,
594 &pause_addr_lo, 0) -1;
595 via_align_cmd(dev_priv, HC_HAGPBpID_PAUSE, 0, &pause_addr_hi,
597 *last_pause_ptr = pause_addr_lo;
599 via_hook_segment(dev_priv, jump_addr_hi, jump_addr_lo, 0);
602 static void via_cmdbuf_rewind(drm_via_private_t * dev_priv)
604 via_cmdbuf_jump(dev_priv);
607 static void via_cmdbuf_flush(drm_via_private_t * dev_priv, uint32_t cmd_type)
609 uint32_t pause_addr_lo, pause_addr_hi;
611 via_align_cmd(dev_priv, cmd_type, 0, &pause_addr_hi, &pause_addr_lo, 0);
612 via_hook_segment(dev_priv, pause_addr_hi, pause_addr_lo, 0);
616 static void via_cmdbuf_pause(drm_via_private_t * dev_priv)
618 via_cmdbuf_flush(dev_priv, HC_HAGPBpID_PAUSE);
621 static void via_cmdbuf_reset(drm_via_private_t * dev_priv)
623 via_cmdbuf_flush(dev_priv, HC_HAGPBpID_STOP);
624 via_wait_idle(dev_priv);
628 * User interface to the space and lag functions.
631 static int via_cmdbuf_size(struct drm_device *dev, void *data, struct drm_file *file_priv)
633 drm_via_cmdbuf_size_t *d_siz = data;
635 uint32_t tmp_size, count;
636 drm_via_private_t *dev_priv;
639 LOCK_TEST_WITH_RETURN(dev, file_priv);
641 dev_priv = (drm_via_private_t *) dev->dev_private;
643 if (dev_priv->ring.virtual_start == NULL) {
644 DRM_ERROR("called without initializing AGP ring buffer.\n");
649 tmp_size = d_siz->size;
650 switch (d_siz->func) {
651 case VIA_CMDBUF_SPACE:
652 while (((tmp_size = via_cmdbuf_space(dev_priv)) < d_siz->size)
659 DRM_ERROR("VIA_CMDBUF_SPACE timed out.\n");
664 while (((tmp_size = via_cmdbuf_lag(dev_priv)) > d_siz->size)
671 DRM_ERROR("VIA_CMDBUF_LAG timed out.\n");
678 d_siz->size = tmp_size;
683 #ifndef VIA_HAVE_DMABLIT
685 via_dma_blit_sync( struct drm_device *dev, void *data, struct drm_file *file_priv ) {
686 DRM_ERROR("PCI DMA BitBlt is not implemented for this system.\n");
690 via_dma_blit( struct drm_device *dev, void *data, struct drm_file *file_priv ) {
691 DRM_ERROR("PCI DMA BitBlt is not implemented for this system.\n");
696 struct drm_ioctl_desc via_ioctls[] = {
697 DRM_IOCTL_DEF(DRM_VIA_ALLOCMEM, via_mem_alloc, DRM_AUTH),
698 DRM_IOCTL_DEF(DRM_VIA_FREEMEM, via_mem_free, DRM_AUTH),
699 DRM_IOCTL_DEF(DRM_VIA_AGP_INIT, via_agp_init, DRM_AUTH|DRM_MASTER),
700 DRM_IOCTL_DEF(DRM_VIA_FB_INIT, via_fb_init, DRM_AUTH|DRM_MASTER),
701 DRM_IOCTL_DEF(DRM_VIA_MAP_INIT, via_map_init, DRM_AUTH|DRM_MASTER),
702 DRM_IOCTL_DEF(DRM_VIA_DEC_FUTEX, via_decoder_futex, DRM_AUTH),
703 DRM_IOCTL_DEF(DRM_VIA_DMA_INIT, via_dma_init, DRM_AUTH),
704 DRM_IOCTL_DEF(DRM_VIA_CMDBUFFER, via_cmdbuffer, DRM_AUTH),
705 DRM_IOCTL_DEF(DRM_VIA_FLUSH, via_flush_ioctl, DRM_AUTH),
706 DRM_IOCTL_DEF(DRM_VIA_PCICMD, via_pci_cmdbuffer, DRM_AUTH),
707 DRM_IOCTL_DEF(DRM_VIA_CMDBUF_SIZE, via_cmdbuf_size, DRM_AUTH),
708 DRM_IOCTL_DEF(DRM_VIA_WAIT_IRQ, via_wait_irq, DRM_AUTH),
709 DRM_IOCTL_DEF(DRM_VIA_DMA_BLIT, via_dma_blit, DRM_AUTH),
710 DRM_IOCTL_DEF(DRM_VIA_BLIT_SYNC, via_dma_blit_sync, DRM_AUTH)
713 int via_max_ioctl = DRM_ARRAY_SIZE(via_ioctls);