 drivers/gpu/drm/via/via_dma.h    |   29 -
 drivers/gpu/drm/via/via_drv.c    |    4
 drivers/gpu/drm/via/via_drv.h    |    3
 drivers/gpu/drm/via/via_h1_dma.c |  690 ++++-----------------------------------
 drivers/gpu/drm/via/via_ioc32.c  |   10
 drivers/gpu/drm/via/via_irq.c    |    9
 drivers/gpu/drm/via/via_ttm.c    |   74 +++-
 drivers/gpu/drm/via/via_video.c  |    4
 8 files changed, 174 insertions(+), 649 deletions(-)
New commits: commit d3a112941fecf610711d67e9d2d412ce258f546e Author: James Simmons <jsimm...@infradead.org> Date: Wed Feb 27 17:48:02 2013 -0500 Accelerate buffer object domain changes (DMA blitting) diff --git a/drivers/gpu/drm/via/via_dma.h b/drivers/gpu/drm/via/via_dma.h index cdfff36..b002475 100644 --- a/drivers/gpu/drm/via/via_dma.h +++ b/drivers/gpu/drm/via/via_dma.h @@ -57,15 +57,13 @@ struct via_h1_header { }; struct drm_via_sg_info { - struct page **pages; - unsigned long num_pages; - struct via_h1_header **desc_pages; + struct ttm_tt *ttm; + unsigned long **desc_pages; int num_desc_pages; int num_desc; enum dma_data_direction direction; - unsigned char *bounce_buffer; + unsigned long dev_start; dma_addr_t chain_start; - uint32_t free_on_sequence; unsigned int descriptors_per_page; int aborted; enum { @@ -77,27 +75,6 @@ struct drm_via_sg_info { } state; }; -typedef struct _drm_via_blitq { - struct drm_device *dev; - uint32_t cur_blit_handle; - uint32_t done_blit_handle; - unsigned serviced; - unsigned head; - unsigned cur; - unsigned num_free; - unsigned num_outstanding; - unsigned long end; - int aborting; - int is_active; - struct drm_via_sg_info *blits[VIA_NUM_BLIT_SLOTS]; - spinlock_t blit_lock; - wait_queue_head_t blit_queue[VIA_NUM_BLIT_SLOTS]; - wait_queue_head_t busy_queue; - struct work_struct wq; - struct timer_list poll_timer; -} drm_via_blitq_t; - - /* * PCI DMA Registers * Channels 2 & 3 don't seem to be implemented in hardware. diff --git a/drivers/gpu/drm/via/via_drv.c b/drivers/gpu/drm/via/via_drv.c index d5e95e0..e6d1e28 100644 --- a/drivers/gpu/drm/via/via_drv.c +++ b/drivers/gpu/drm/via/via_drv.c @@ -372,6 +372,10 @@ via_driver_load(struct drm_device *dev, unsigned long chipset) if (ret) goto out_err; + ret = via_dmablit_init(dev); + if (ret) + goto out_err; + if (drm_core_check_feature(dev, DRIVER_MODESET)) ret = via_modeset_init(dev); out_err: diff --git a/drivers/gpu/drm/via/via_drv.h b/drivers/gpu/drm/via/via_drv.h index f700ac0..8b21218 100644 --- a/drivers/gpu/drm/via/via_drv.h +++ b/drivers/gpu/drm/via/via_drv.h @@ -138,7 +138,6 @@ struct drm_via_private { struct via_fence_pool dma_fences; int desc_size; - drm_via_blitq_t blit_queues[VIA_NUM_BLIT_ENGINES]; wait_queue_head_t decoder_queue[VIA_NR_XVMC_LOCKS]; struct via_crtc iga[2]; @@ -191,8 +190,6 @@ extern int via_cmdbuf_size(struct drm_device *dev, void *data, struct drm_file * extern int via_pci_cmdbuffer(struct drm_device *dev, void *data, struct drm_file *file_priv); extern int via_decoder_futex(struct drm_device *dev, void *data, struct drm_file *file_priv); extern int via_wait_irq(struct drm_device *dev, void *data, struct drm_file *file_priv); -extern int via_dma_blit_sync(struct drm_device *dev, void *data, struct drm_file *file_priv); -extern int via_dma_blit(struct drm_device *dev, void *data, struct drm_file *file_priv); extern int via_wait_idle(struct drm_via_private *dev_priv); extern int via_detect_vram(struct drm_device *dev); diff --git a/drivers/gpu/drm/via/via_h1_dma.c b/drivers/gpu/drm/via/via_h1_dma.c index 9befd8a..d2e8521 100644 --- a/drivers/gpu/drm/via/via_h1_dma.c +++ b/drivers/gpu/drm/via/via_h1_dma.c @@ -29,10 +29,6 @@ #include "via_drv.h" #include "via_dma.h" -#define VIA_PGDN(x) (((unsigned long)(x)) & PAGE_MASK) -#define VIA_PGOFF(x) (((unsigned long)(x)) & ~PAGE_MASK) -#define VIA_PFN(x) ((unsigned long)(x) >> PAGE_SHIFT) - /* * Fire a blit engine. 
*/ @@ -69,148 +65,92 @@ via_dmablit_engine_off(struct drm_device *dev, int engine) VIA_WRITE(VIA_PCI_DMA_CSR0 + engine * 0x04, VIA_DMA_CSR_TD | VIA_DMA_CSR_DD); } +static void +via_dmablit_done(struct drm_device *dev, int engine) +{ + struct drm_via_private *dev_priv = dev->dev_private; + + /* Clear transfer done flag. */ + VIA_WRITE(VIA_PCI_DMA_CSR0 + engine * 0x04, VIA_DMA_CSR_TD); +} + /* * Unmap a DMA mapping. */ static void -via_unmap_from_device(struct device *dev, struct drm_via_sg_info *vsg) +via_unmap_from_device(struct drm_device *dev, struct drm_via_sg_info *vsg) { + struct drm_via_private *dev_priv = dev->dev_private; int num_desc = vsg->num_desc; unsigned cur_descriptor_page = num_desc / vsg->descriptors_per_page; unsigned descriptor_this_page = num_desc % vsg->descriptors_per_page; - struct via_h1_header *desc_ptr = vsg->desc_pages[cur_descriptor_page] + - descriptor_this_page; dma_addr_t next = vsg->chain_start; + struct via_h1_header *desc_ptr; + desc_ptr = (struct via_h1_header *) vsg->desc_pages[cur_descriptor_page] + + descriptor_this_page; while (num_desc--) { if (descriptor_this_page-- == 0) { cur_descriptor_page--; descriptor_this_page = vsg->descriptors_per_page - 1; - desc_ptr = vsg->desc_pages[cur_descriptor_page] + - descriptor_this_page; + desc_ptr = (struct via_h1_header *) vsg->desc_pages[cur_descriptor_page] + + descriptor_this_page; } - dma_unmap_single(dev, next, sizeof(*desc_ptr), DMA_TO_DEVICE); - dma_unmap_page(dev, desc_ptr->mem_addr, desc_ptr->size, vsg->direction); + dma_unmap_single(dev->dev, next, dev_priv->desc_size, DMA_TO_DEVICE); + dma_unmap_page(dev->dev, desc_ptr->mem_addr, desc_ptr->size, vsg->direction); next = (dma_addr_t) desc_ptr->next; desc_ptr--; } } /* - * Count how many descriptors are needed. - */ -static void -via_count_descriptors(const drm_via_dmablit_t *xfer, struct drm_via_sg_info *vsg) -{ - unsigned char *mem_addr = xfer->mem_addr, *cur_mem; - uint32_t fb_addr = xfer->fb_addr, cur_fb; - int num_desc = 0, cur_line; - unsigned long line_len; - unsigned remaining_len; - - for (cur_line = 0; cur_line < xfer->num_lines; ++cur_line) { - line_len = xfer->line_length; - cur_fb = fb_addr; - cur_mem = mem_addr; - - while (line_len > 0) { - remaining_len = min(PAGE_SIZE-VIA_PGOFF(cur_mem), line_len); - line_len -= remaining_len; - - num_desc++; - cur_mem += remaining_len; - cur_fb += remaining_len; - } - - mem_addr += xfer->mem_stride; - fb_addr += xfer->fb_stride; - } - vsg->num_desc = num_desc; -} - -/* * Map the DMA pages for the device, put together and map also the descriptors. Descriptors * are run in reverse order by the hardware because we are not allowed to update the * 'next' field without syncing calls when the descriptor is already mapped. 
*/ -static void -via_map_for_device(struct device *dev, const drm_via_dmablit_t *xfer, - struct drm_via_sg_info *vsg) -{ - unsigned num_descriptors_this_page = 0, cur_descriptor_page = 0; - unsigned char *mem_addr = xfer->mem_addr, *cur_mem; - unsigned char *first_addr = (unsigned char *)VIA_PGDN(mem_addr); - uint32_t fb_addr = xfer->fb_addr, cur_fb; - unsigned long line_len; - unsigned remaining_len; - int num_desc = 0; - int cur_line; - dma_addr_t next = 0 | VIA_DMA_DPR_EC; - struct via_h1_header *desc_ptr = vsg->desc_pages[cur_descriptor_page]; - - for (cur_line = 0; cur_line < xfer->num_lines; ++cur_line) { - line_len = xfer->line_length; - cur_fb = fb_addr; - cur_mem = mem_addr; - - while (line_len > 0) { - remaining_len = min(PAGE_SIZE-VIA_PGOFF(cur_mem), line_len); - line_len -= remaining_len; - - desc_ptr->mem_addr = dma_map_page(dev, - vsg->pages[VIA_PFN(cur_mem) - VIA_PFN(first_addr)], - VIA_PGOFF(cur_mem), remaining_len, - vsg->direction); - desc_ptr->dev_addr = cur_fb; - desc_ptr->size = remaining_len; - desc_ptr->next = (uint32_t) next; - next = dma_map_single(dev, desc_ptr, sizeof(*desc_ptr), DMA_TO_DEVICE); - desc_ptr++; - if (++num_descriptors_this_page >= vsg->descriptors_per_page) { - num_descriptors_this_page = 0; - desc_ptr = vsg->desc_pages[++cur_descriptor_page]; - } - - cur_mem += remaining_len; - cur_fb += remaining_len; - num_desc++; +static int +via_map_for_device(struct via_fence_engine *eng, struct drm_via_sg_info *vsg, + unsigned long offset) +{ + unsigned int num_descriptors_this_page = 0, cur_descriptor_page = 0; + unsigned long dev_start = eng->pool->fence_sync.bo->offset; + struct device *dev = eng->pool->dev->dev; + dma_addr_t next = VIA_DMA_DPR_EC; + struct via_h1_header *desc_ptr; + struct ttm_tt *ttm = vsg->ttm; + int num_desc = 0, ret = 0; + + desc_ptr = (struct via_h1_header *) vsg->desc_pages[cur_descriptor_page]; + dev_start = vsg->dev_start; + + for (num_desc = 0; num_desc < ttm->num_pages; num_desc++) { + /* Map system pages */ + if (!ttm->pages[num_desc]) { + ret = -ENOMEM; + goto out; } - - mem_addr += xfer->mem_stride; - fb_addr += xfer->fb_stride; + desc_ptr->mem_addr = dma_map_page(dev, ttm->pages[num_desc], 0, + PAGE_SIZE, vsg->direction); + desc_ptr->dev_addr = dev_start; + /* size is counted in 16-byte units */ + desc_ptr->size = PAGE_SIZE / 16; + desc_ptr->next = (uint32_t) next; + + /* Map descriptors for chaining mode */ + next = dma_map_single(dev, desc_ptr, sizeof(*desc_ptr), DMA_TO_DEVICE); + desc_ptr++; + if (++num_descriptors_this_page >= vsg->descriptors_per_page) { + num_descriptors_this_page = 0; + desc_ptr = (struct via_h1_header *) vsg->desc_pages[++cur_descriptor_page]; + } + dev_start += PAGE_SIZE; } vsg->chain_start = next; vsg->state = dr_via_device_mapped; - vsg->num_desc = num_desc; -} - -/* - * Allocate DMA capable memory for the blit descriptor chain, and an array that keeps track of the - * pages we allocate. We don't want to use kmalloc for the descriptor chain because it may be - * quite large for some blits, and pages don't need to be contingous. 
- */ -static int -via_alloc_desc_pages(struct drm_via_sg_info *vsg) -{ - int i; - - vsg->descriptors_per_page = PAGE_SIZE / sizeof(struct via_h1_header); - vsg->num_desc_pages = (vsg->num_desc + vsg->descriptors_per_page - 1) / - vsg->descriptors_per_page; - - if (NULL == (vsg->desc_pages = kcalloc(vsg->num_desc_pages, sizeof(void *), GFP_KERNEL))) - return -ENOMEM; - - vsg->state = dr_via_desc_pages_alloc; - for (i = 0; i < vsg->num_desc_pages; ++i) { - if (NULL == (vsg->desc_pages[i] = (struct via_h1_header *) __get_free_page(GFP_KERNEL))) - return -ENOMEM; - } - DRM_DEBUG("Allocated %d pages for %d descriptors.\n", vsg->num_desc_pages, - vsg->num_desc); - return 0; +out: + return ret; } /* @@ -219,9 +159,10 @@ via_alloc_desc_pages(struct drm_via_sg_info *vsg) * with the actual status of the used resources. */ static void -via_free_sg_info(struct device *dev, struct drm_via_sg_info *vsg) +via_free_sg_info(struct via_fence *fence) { - struct page *page; + struct drm_device *dev = fence->pool->dev; + struct drm_via_sg_info *vsg = fence->priv; int i; switch (vsg->state) { @@ -229,525 +170,58 @@ via_free_sg_info(struct device *dev, struct drm_via_sg_info *vsg) via_unmap_from_device(dev, vsg); case dr_via_desc_pages_alloc: for (i = 0; i < vsg->num_desc_pages; ++i) { - if (vsg->desc_pages[i] != NULL) + if (vsg->desc_pages[i]) free_page((unsigned long)vsg->desc_pages[i]); } kfree(vsg->desc_pages); - case dr_via_pages_locked: - for (i = 0; i < vsg->num_pages; ++i) { - if (NULL != (page = vsg->pages[i])) { - if (!PageReserved(page) && (DMA_FROM_DEVICE == vsg->direction)) - SetPageDirty(page); - page_cache_release(page); - } - } - case dr_via_pages_alloc: - vfree(vsg->pages); default: vsg->state = dr_via_sg_init; } - vfree(vsg->bounce_buffer); - vsg->bounce_buffer = NULL; - vsg->free_on_sequence = 0; } -/* - * Obtain a page pointer array and lock all pages into system memory. A segmentation violation will - * occur here if the calling user does not have access to the submitted address. - */ -static int -via_lock_all_dma_pages(struct drm_device *dev, struct drm_via_sg_info *ttm, drm_via_dmablit_t *xfer) -{ - unsigned long first_pfn = VIA_PFN(xfer->mem_addr); - int write = xfer->to_fb, ret; - unsigned long start; - - ttm->direction = (write) ? DMA_TO_DEVICE : DMA_FROM_DEVICE; - ttm->bounce_buffer = NULL; - ttm->state = dr_via_sg_init; - ttm->num_pages = VIA_PFN(xfer->mem_addr + (xfer->num_lines * xfer->mem_stride - 1)) - - first_pfn + 1; - ttm->pages = vzalloc(sizeof(struct page *) * ttm->num_pages); - if (NULL == ttm->pages) - return -ENOMEM; - - start = (unsigned long)xfer->mem_addr; - - down_read(¤t->mm->mmap_sem); - ret = get_user_pages(current, current->mm, start, ttm->num_pages, - (ttm->direction == DMA_FROM_DEVICE), - 0, ttm->pages, NULL); - - up_read(¤t->mm->mmap_sem); - if (ret != ttm->num_pages) { - if (ret < 0) - return ret; - ttm->state = dr_via_pages_locked; - return -EINVAL; - } - ttm->state = dr_via_pages_locked; - DRM_DEBUG("DMA pages locked\n"); - return 0; -} - -/* - * The dmablit part of the IRQ handler. Trying to do only reasonably fast things here. - * The rest, like unmapping and freeing memory for done blits is done in a separate workqueue - * task. Basically the task of the interrupt handler is to submit a new blit to the engine, while - * the workqueue task takes care of processing associated with the old blit. 
- */ -void -via_dmablit_handler(struct drm_device *dev, int engine, int from_irq) -{ - struct drm_via_private *dev_priv = dev->dev_private; - drm_via_blitq_t *blitq = dev_priv->blit_queues + engine; - int done_transfer, cur; - unsigned long irqsave = 0; - uint32_t status = 0; - - DRM_DEBUG("DMA blit handler called. engine = %d, from_irq = %d, blitq = 0x%lx\n", - engine, from_irq, (unsigned long) blitq); - - if (from_irq) - spin_lock(&blitq->blit_lock); - else - spin_lock_irqsave(&blitq->blit_lock, irqsave); - - done_transfer = blitq->is_active && - ((status = VIA_READ(VIA_PCI_DMA_CSR0 + engine * 0x04)) & VIA_DMA_CSR_TD); - done_transfer = done_transfer || (blitq->aborting && !(status & VIA_DMA_CSR_DE)); - - cur = blitq->cur; - if (done_transfer) { - - blitq->blits[cur]->aborted = blitq->aborting; - blitq->done_blit_handle++; - DRM_WAKEUP(blitq->blit_queue + cur); - - cur++; - if (cur >= VIA_NUM_BLIT_SLOTS) - cur = 0; - blitq->cur = cur; - - /* - * Clear transfer done flag. - */ - - VIA_WRITE(VIA_PCI_DMA_CSR0 + engine * 0x04, VIA_DMA_CSR_TD); - - blitq->is_active = 0; - blitq->aborting = 0; - schedule_work(&blitq->wq); - - } else if (blitq->is_active && time_after_eq(jiffies, blitq->end)) { - /* - * Abort transfer after one second. - */ - via_abort_dmablit(dev, engine); - blitq->aborting = 1; - blitq->end = jiffies + DRM_HZ; - } - - if (!blitq->is_active) { - if (blitq->num_outstanding) { - via_h1_fire_dmablit(dev, blitq->blits[cur], engine); - blitq->is_active = 1; - blitq->cur = cur; - blitq->num_outstanding--; - blitq->end = jiffies + DRM_HZ; - if (!timer_pending(&blitq->poll_timer)) - mod_timer(&blitq->poll_timer, jiffies + 1); - } else { - if (timer_pending(&blitq->poll_timer)) - del_timer(&blitq->poll_timer); - via_dmablit_engine_off(dev, engine); - } - } - - if (from_irq) - spin_unlock(&blitq->blit_lock); - else - spin_unlock_irqrestore(&blitq->blit_lock, irqsave); -} - -/* - * Check whether this blit is still active, performing necessary locking. - */ -static int -via_dmablit_active(drm_via_blitq_t *blitq, int engine, uint32_t handle, wait_queue_head_t **queue) +static void +via_h1_dma_fence_signaled(struct via_fence_engine *eng) { - unsigned long irqsave; - uint32_t slot; - int active; - - spin_lock_irqsave(&blitq->blit_lock, irqsave); - - /* - * Allow for handle wraparounds. - */ - active = ((blitq->done_blit_handle - handle) > (1 << 23)) && - ((blitq->cur_blit_handle - handle) <= (1 << 23)); - - if (queue && active) { - slot = handle - blitq->done_blit_handle + blitq->cur - 1; - if (slot >= VIA_NUM_BLIT_SLOTS) - slot -= VIA_NUM_BLIT_SLOTS; - *queue = blitq->blit_queue + slot; - } - - spin_unlock_irqrestore(&blitq->blit_lock, irqsave); - - return active; + via_dmablit_done(eng->pool->dev, eng->index); } /* - * Sync. Wait for at least three seconds for the blit to be performed. + * Build all info and do all mappings required for a blit. 
*/ static int -via_dmablit_sync(struct drm_device *dev, uint32_t handle, int engine) +via_h1_dma_emit(struct via_fence *fence) { - struct drm_via_private *dev_priv = dev->dev_private; - drm_via_blitq_t *blitq = dev_priv->blit_queues + engine; - wait_queue_head_t *queue; + struct via_fence_engine *eng = fence->pool->engines[fence->engine]; + unsigned long offset = VIA_FENCE_SIZE * eng->index; + struct drm_via_sg_info *vsg = fence->priv; int ret = 0; - if (via_dmablit_active(blitq, engine, handle, &queue)) { - DRM_WAIT_ON(ret, *queue, 3 * DRM_HZ, - !via_dmablit_active(blitq, engine, handle, NULL)); + ret = via_map_for_device(eng, vsg, offset); + if (!ret) { + writel(fence->seq.key, eng->read_seq); + via_h1_fire_dmablit(fence->pool->dev, vsg, fence->engine); } - DRM_DEBUG("DMA blit sync handle 0x%x engine %d returned %d\n", - handle, engine, ret); - return ret; } /* - * A timer that regularly polls the blit engine in cases where we don't have interrupts: - * a) Broken hardware (typically those that don't have any video capture facility). - * b) Blit abort. The hardware doesn't send an interrupt when a blit is aborted. - * The timer and hardware IRQ's can and do work in parallel. If the hardware has - * irqs, it will shorten the latency somewhat. - */ -static void -via_dmablit_timer(unsigned long data) -{ - drm_via_blitq_t *blitq = (drm_via_blitq_t *) data; - struct drm_device *dev = blitq->dev; - int engine = (int) - (blitq - ((struct drm_via_private *)dev->dev_private)->blit_queues); - - DRM_DEBUG("Polling timer called for engine %d, jiffies %lu\n", engine, - (unsigned long) jiffies); - - via_dmablit_handler(dev, engine, 0); - - if (!timer_pending(&blitq->poll_timer)) { - mod_timer(&blitq->poll_timer, jiffies + 1); - - /* - * Rerun handler to delete timer if engines are off, and - * to shorten abort latency. This is a little nasty. - */ - via_dmablit_handler(dev, engine, 0); - } -} - -/* - * Workqueue task that frees data and mappings associated with a blit. - * Also wakes up waiting processes. Each of these tasks handles one - * blit engine only and may not be called on each interrupt. - */ -static void -via_dmablit_workqueue(struct work_struct *work) -{ - drm_via_blitq_t *blitq = container_of(work, drm_via_blitq_t, wq); - struct drm_device *dev = blitq->dev; - struct drm_via_sg_info *cur_sg; - unsigned long irqsave; - int cur_released; - - DRM_DEBUG("Workqueue task called for blit engine %ld\n", (unsigned long) - (blitq - ((struct drm_via_private *)dev->dev_private)->blit_queues)); - - spin_lock_irqsave(&blitq->blit_lock, irqsave); - - while (blitq->serviced != blitq->cur) { - - cur_released = blitq->serviced++; - - DRM_DEBUG("Releasing blit slot %d\n", cur_released); - - if (blitq->serviced >= VIA_NUM_BLIT_SLOTS) - blitq->serviced = 0; - - cur_sg = blitq->blits[cur_released]; - blitq->num_free++; - - spin_unlock_irqrestore(&blitq->blit_lock, irqsave); - - DRM_WAKEUP(&blitq->busy_queue); - - via_free_sg_info(dev->dev, cur_sg); - kfree(cur_sg); - - spin_lock_irqsave(&blitq->blit_lock, irqsave); - } - - spin_unlock_irqrestore(&blitq->blit_lock, irqsave); -} - -/* * Init all blit engines. Currently we use two, but some hardware have 4. 
*/ -void -via_init_dmablit(struct drm_device *dev) +int +via_dmablit_init(struct drm_device *dev) { struct drm_via_private *dev_priv = dev->dev_private; - drm_via_blitq_t *blitq; - int i, j; + struct via_fence_pool *pool = &dev_priv->dma_fences; + int ret; pci_set_master(dev->pdev); - for (i = 0; i < VIA_NUM_BLIT_ENGINES; ++i) { - blitq = dev_priv->blit_queues + i; - blitq->dev = dev; - blitq->cur_blit_handle = 0; - blitq->done_blit_handle = 0; - blitq->head = 0; - blitq->cur = 0; - blitq->serviced = 0; - blitq->num_free = VIA_NUM_BLIT_SLOTS - 1; - blitq->num_outstanding = 0; - blitq->is_active = 0; - blitq->aborting = 0; - spin_lock_init(&blitq->blit_lock); - for (j = 0; j < VIA_NUM_BLIT_SLOTS; ++j) - DRM_INIT_WAITQUEUE(blitq->blit_queue + j); - DRM_INIT_WAITQUEUE(&blitq->busy_queue); - INIT_WORK(&blitq->wq, via_dmablit_workqueue); - setup_timer(&blitq->poll_timer, via_dmablit_timer, - (unsigned long)blitq); - } -} - -/* - * Build all info and do all mappings required for a blit. - */ -static int -via_build_sg_info(struct drm_device *dev, struct drm_via_sg_info *vsg, drm_via_dmablit_t *xfer) -{ - int ret = 0; - - if (xfer->num_lines <= 0 || xfer->line_length <= 0) { - DRM_ERROR("Zero size bitblt.\n"); - return -EINVAL; - } - - /* - * Below check is a driver limitation, not a hardware one. We - * don't want to lock unused pages, and don't want to incoporate the - * extra logic of avoiding them. Make sure there are no. - * (Not a big limitation anyway.) - */ - - if ((xfer->mem_stride - xfer->line_length) > 2*PAGE_SIZE) { - DRM_ERROR("Too large system memory stride. Stride: %d, " - "Length: %d\n", xfer->mem_stride, xfer->line_length); - return -EINVAL; - } - - if ((xfer->mem_stride == xfer->line_length) && - (xfer->fb_stride == xfer->line_length)) { - xfer->mem_stride *= xfer->num_lines; - xfer->line_length = xfer->mem_stride; - xfer->fb_stride = xfer->mem_stride; - xfer->num_lines = 1; - } - - /* - * Don't lock an arbitrary large number of pages, since that causes a - * DOS security hole. - */ - - if (xfer->num_lines > 2048 || (xfer->num_lines*xfer->mem_stride > (2048*2048*4))) { - DRM_ERROR("Too large PCI DMA bitblt.\n"); - return -EINVAL; - } - - /* - * we allow a negative fb stride to allow flipping of images in - * transfer. - */ - - if (xfer->mem_stride < xfer->line_length || - abs(xfer->fb_stride) < xfer->line_length) { - DRM_ERROR("Invalid frame-buffer / memory stride.\n"); - return -EINVAL; - } - - /* - * A hardware bug seems to be worked around if system memory addresses start on - * 16 byte boundaries. This seems a bit restrictive however. VIA is contacted - * about this. 
Meanwhile, impose the following restrictions: - */ - -#ifdef VIA_BUGFREE - if ((((unsigned long)xfer->mem_addr & 3) != ((unsigned long)xfer->fb_addr & 3)) || - ((xfer->num_lines > 1) && ((xfer->mem_stride & 3) != (xfer->fb_stride & 3)))) { - DRM_ERROR("Invalid DRM bitblt alignment.\n"); - return -EINVAL; - } -#else - if ((((unsigned long)xfer->mem_addr & 15) || - ((unsigned long)xfer->fb_addr & 3)) || - ((xfer->num_lines > 1) && - ((xfer->mem_stride & 15) || (xfer->fb_stride & 3)))) { - DRM_ERROR("Invalid DRM bitblt alignment.\n"); - return -EINVAL; - } -#endif - - if (0 != (ret = via_lock_all_dma_pages(dev, vsg, xfer))) { - DRM_ERROR("Could not lock DMA pages.\n"); - via_free_sg_info(dev->dev, vsg); - return ret; - } - - via_count_descriptors(xfer, vsg); - if (0 != (ret = via_alloc_desc_pages(vsg))) { - DRM_ERROR("Could not allocate DMA descriptor pages.\n"); - via_free_sg_info(dev->dev, vsg); - return ret; + ret = via_fence_pool_init(pool, "viadrm_dma", 4, TTM_PL_FLAG_VRAM, dev); + if (!ret) { + pool->fence_signaled = via_h1_dma_fence_signaled; + pool->fence_cleanup = via_free_sg_info; + pool->fence_emit = via_h1_dma_emit; } - - via_map_for_device(dev->dev, xfer, vsg); - return 0; -} - -/* - * Reserve one free slot in the blit queue. Will wait for one second for one - * to become available. Otherwise -EBUSY is returned. - */ -static int -via_dmablit_grab_slot(drm_via_blitq_t *blitq, int engine) -{ - int ret = 0; - unsigned long irqsave; - - DRM_DEBUG("Num free is %d\n", blitq->num_free); - spin_lock_irqsave(&blitq->blit_lock, irqsave); - while (blitq->num_free == 0) { - spin_unlock_irqrestore(&blitq->blit_lock, irqsave); - - DRM_WAIT_ON(ret, blitq->busy_queue, DRM_HZ, blitq->num_free > 0); - if (ret) - return (-EINTR == ret) ? -EAGAIN : ret; - - spin_lock_irqsave(&blitq->blit_lock, irqsave); - } - - blitq->num_free--; - spin_unlock_irqrestore(&blitq->blit_lock, irqsave); - - return 0; -} - -/* - * Hand back a free slot if we changed our mind. - */ -static void -via_dmablit_release_slot(drm_via_blitq_t *blitq) -{ - unsigned long irqsave; - - spin_lock_irqsave(&blitq->blit_lock, irqsave); - blitq->num_free++; - spin_unlock_irqrestore(&blitq->blit_lock, irqsave); - DRM_WAKEUP(&blitq->busy_queue); -} - -/* - * Grab a free slot. Build blit info and queue a blit. - */ -static int -via_dmablit(struct drm_device *dev, drm_via_dmablit_t *xfer) -{ - struct drm_via_private *dev_priv = dev->dev_private; - struct drm_via_sg_info *vsg; - drm_via_blitq_t *blitq; - unsigned long irqsave; - int engine, ret; - - if (dev_priv == NULL) { - DRM_ERROR("Called without initialization.\n"); - return -EINVAL; - } - - engine = (xfer->to_fb) ? 0 : 1; - blitq = dev_priv->blit_queues + engine; - if (0 != (ret = via_dmablit_grab_slot(blitq, engine))) - return ret; - - if (NULL == (vsg = kmalloc(sizeof(*vsg), GFP_KERNEL))) { - via_dmablit_release_slot(blitq); - return -ENOMEM; - } - if (0 != (ret = via_build_sg_info(dev, vsg, xfer))) { - via_dmablit_release_slot(blitq); - kfree(vsg); - return ret; - } - - spin_lock_irqsave(&blitq->blit_lock, irqsave); - blitq->blits[blitq->head++] = vsg; - if (blitq->head >= VIA_NUM_BLIT_SLOTS) - blitq->head = 0; - blitq->num_outstanding++; - xfer->sync.sync_handle = ++blitq->cur_blit_handle; - spin_unlock_irqrestore(&blitq->blit_lock, irqsave); - - xfer->sync.engine = engine; - - via_dmablit_handler(dev, engine, 0); - - return 0; -} - -/* - * Sync on a previously submitted blit. 
Note that the X server use signals extensively, and - * that there is a very big probability that this IOCTL will be interrupted by a signal. In that - * case it returns with -EAGAIN for the signal to be delivered. - * The caller should then reissue the IOCTL. This is similar to what is being done for drmGetLock(). - */ -int -via_dma_blit_sync(struct drm_device *dev, void *data, struct drm_file *file_priv) -{ - drm_via_blitsync_t *sync = data; - int err; - - if (sync->engine >= VIA_NUM_BLIT_ENGINES) - return -EINVAL; - - err = via_dmablit_sync(dev, sync->sync_handle, sync->engine); - - if (-EINTR == err) - err = -EAGAIN; - - return err; -} - -/* - * Queue a blit and hand back a handle to be used for sync. This IOCTL may be interrupted by a signal - * while waiting for a free slot in the blit queue. In that case it returns with -EAGAIN and should - * be reissued. See the above IOCTL code. - */ -int -via_dma_blit(struct drm_device *dev, void *data, struct drm_file *file_priv) -{ - drm_via_dmablit_t *xfer = data; - int err; - - err = via_dmablit(dev, xfer); - - return err; + dev_priv->desc_size = sizeof(struct via_h1_header); + return ret; } diff --git a/drivers/gpu/drm/via/via_ioc32.c b/drivers/gpu/drm/via/via_ioc32.c index 9b933fb..8dc0fa6 100644 --- a/drivers/gpu/drm/via/via_ioc32.c +++ b/drivers/gpu/drm/via/via_ioc32.c @@ -110,6 +110,16 @@ static int via_map_init(struct drm_device *dev, void *data, struct drm_file *fil return ret; } +static int via_dma_blit_sync(struct drm_device *dev, void *data, struct drm_file *file_priv) +{ + return -EINVAL; +} + +static int via_dma_blit(struct drm_device *dev, void *data, struct drm_file *file_priv) +{ + return -EINVAL; +} + static int via_mem_alloc(struct drm_device *dev, void *data, struct drm_file *filp) { diff --git a/drivers/gpu/drm/via/via_irq.c b/drivers/gpu/drm/via/via_irq.c index 089f89d..b0f8ea1 100644 --- a/drivers/gpu/drm/via/via_irq.c +++ b/drivers/gpu/drm/via/via_irq.c @@ -129,14 +129,19 @@ irqreturn_t via_driver_irq_handler(DRM_IRQ_ARGS) for (i = 0; i < dev_priv->num_irqs; ++i) { if (status & cur_irq->pending_mask) { + struct via_fence_engine *eng = NULL; + atomic_inc(&cur_irq->irq_received); DRM_WAKEUP(&cur_irq->irq_queue); ret = IRQ_HANDLED; if (dev_priv->irq_map[drm_via_irq_dma0_td] == i) - via_dmablit_handler(dev, 0, 1); + eng = dev_priv->dma_fences.engines[0]; else if (dev_priv->irq_map[drm_via_irq_dma1_td] == i) - via_dmablit_handler(dev, 1, 1); + eng = dev_priv->dma_fences.engines[1]; + + if (eng) + queue_work(eng->pool->fence_wq, &eng->fence_work); } cur_irq++; } diff --git a/drivers/gpu/drm/via/via_ttm.c b/drivers/gpu/drm/via/via_ttm.c index 0c19bfc..17a4610 100644 --- a/drivers/gpu/drm/via/via_ttm.c +++ b/drivers/gpu/drm/via/via_ttm.c @@ -212,21 +212,81 @@ via_evict_flags(struct ttm_buffer_object *bo, struct ttm_placement *placement) } } +/* + * Allocate DMA capable memory for the blit descriptor chain, and an array that keeps + * track of the pages we allocate. We don't want to use kmalloc for the descriptor + * chain because it may be quite large for some blits, and pages don't need to be + * contiguous. 
*/ +struct drm_via_sg_info * +via_alloc_desc_pages(struct ttm_tt *ttm, struct drm_device *dev, + unsigned long dev_start, enum dma_data_direction direction) +{ + struct drm_via_sg_info *vsg = kzalloc(sizeof(*vsg), GFP_KERNEL); + struct drm_via_private *dev_priv = dev->dev_private; + int desc_size = dev_priv->desc_size, i; + + vsg->ttm = ttm; + vsg->dev_start = dev_start; + vsg->direction = direction; + vsg->num_desc = ttm->num_pages; // + 1; + vsg->descriptors_per_page = PAGE_SIZE / desc_size; + vsg->num_desc_pages = (vsg->num_desc + vsg->descriptors_per_page - 1) / + vsg->descriptors_per_page; + + vsg->desc_pages = kzalloc(vsg->num_desc_pages * sizeof(void *), GFP_KERNEL); + if (!vsg->desc_pages) + return ERR_PTR(-ENOMEM); + + vsg->state = dr_via_desc_pages_alloc; + + /* Alloc pages for descriptor chain */ + for (i = 0; i < vsg->num_desc_pages; ++i) { + vsg->desc_pages[i] = (unsigned long *) __get_free_page(GFP_KERNEL); + + if (!vsg->desc_pages[i]) + return ERR_PTR(-ENOMEM); + } + return vsg; +} + /* Move between GART and VRAM */ static int via_move_blit(struct ttm_buffer_object *bo, bool evict, bool no_wait_gpu, struct ttm_mem_reg *new_mem, struct ttm_mem_reg *old_mem) { - unsigned long old_start, new_start; - void *fence = NULL; + struct drm_via_private *dev_priv = + container_of(bo->bdev, struct drm_via_private, bdev); + enum dma_data_direction direction = DMA_TO_DEVICE; + unsigned long old_start, new_start, dev_addr = 0; + struct drm_via_sg_info *vsg; + int ret = -ENXIO; + struct via_fence *fence; /* Real CPU physical address */ old_start = (old_mem->start << PAGE_SHIFT) + old_mem->bus.base; new_start = (new_mem->start << PAGE_SHIFT) + new_mem->bus.base; - //ret = via_copy(rdev, old_start, new_start, new_mem->num_pages, fence); + if (old_mem->mem_type == TTM_PL_VRAM) { + direction = DMA_FROM_DEVICE; + dev_addr = old_start; + } else if (new_mem->mem_type == TTM_PL_VRAM) { + /* direction is DMA_TO_DEVICE */ + dev_addr = new_start; + } + + /* device address must be 16-byte aligned */ + if (dev_addr & 0x0F) + return ret; + + vsg = via_alloc_desc_pages(bo->ttm, dev_priv->dev, dev_addr, direction); + if (unlikely(IS_ERR(vsg))) + return PTR_ERR(vsg); - return ttm_bo_move_accel_cleanup(bo, fence, evict, no_wait_gpu, new_mem); + fence = via_fence_create_and_emit(&dev_priv->dma_fences, vsg, 0); + if (unlikely(IS_ERR(fence))) + return PTR_ERR(fence); + return ttm_bo_move_accel_cleanup(bo, (void *)fence, evict, no_wait_gpu, new_mem); } static int @@ -331,9 +391,11 @@ via_bo_move(struct ttm_buffer_object *bo, bool evict, bool interruptible, } /* Accelerated copy involving the VRAM. 
*/ - if (new_mem->mem_type == TTM_PL_SYSTEM) { + if (old_mem->mem_type == TTM_PL_VRAM && + new_mem->mem_type == TTM_PL_SYSTEM) { ret = via_move_from_vram(bo, interruptible, no_wait_gpu, new_mem); - } else if (old_mem->mem_type == TTM_PL_SYSTEM) { + } else if (old_mem->mem_type == TTM_PL_SYSTEM && + new_mem->mem_type == TTM_PL_VRAM) { ret = via_move_to_vram(bo, interruptible, no_wait_gpu, new_mem); } else { ret = via_move_blit(bo, evict, no_wait_gpu, new_mem, old_mem); } diff --git a/drivers/gpu/drm/via/via_video.c b/drivers/gpu/drm/via/via_video.c index 997f1dd..8071ec9 100644 --- a/drivers/gpu/drm/via/via_video.c +++ b/drivers/gpu/drm/via/via_video.c @@ -30,8 +30,6 @@ void via_init_futex(struct drm_via_private *dev_priv) { unsigned int i; - DRM_DEBUG("\n"); - for (i = 0; i < VIA_NR_XVMC_LOCKS; ++i) { DRM_INIT_WAITQUEUE(&(dev_priv->decoder_queue[i])); XVMCLOCKPTR(dev_priv->sarea_priv, i)->lock = 0; @@ -70,8 +68,6 @@ int via_decoder_futex(struct drm_device *dev, void *data, struct drm_file *file_ drm_via_sarea_t *sAPriv = dev_priv->sarea_priv; int ret = 0; - DRM_DEBUG("\n"); - if (fx->lock >= VIA_NR_XVMC_LOCKS) return -EFAULT;
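
For reference, the descriptor handling introduced above is easier to follow outside the driver. Below is a minimal userspace sketch of the same chaining scheme, for illustration only: struct h1_desc, MODEL_PAGE_SIZE, and the fake bus addresses are stand-ins invented here, since the real code packs 16-byte struct via_h1_header entries and obtains bus addresses from dma_map_page()/dma_map_single(), which have no userspace equivalent. It builds one descriptor per system page, packs descriptors into whole pages the way via_alloc_desc_pages() does, links each new descriptor back to the previous one, and then walks the finished chain from chain_start the way the engine and via_unmap_from_device() do, newest descriptor first.

#include <stdio.h>
#include <stdlib.h>

#define MODEL_PAGE_SIZE 4096UL

struct h1_desc {
	unsigned long mem_addr;   /* would be the bus address of a system page */
	unsigned long dev_addr;   /* VRAM offset this page is blitted to/from */
	unsigned long size;       /* counted in 16-byte units, as in the patch */
	struct h1_desc *next;     /* a 32-bit bus address in the real hardware */
};

int main(void)
{
	unsigned long num_pages = 10;	/* stands in for ttm->num_pages */
	unsigned long per_page = MODEL_PAGE_SIZE / sizeof(struct h1_desc);
	unsigned long num_desc_pages = (num_pages + per_page - 1) / per_page;
	struct h1_desc **desc_pages, *desc, *chain_start = NULL;
	unsigned long i, used = 0, page = 0;

	/* Like via_alloc_desc_pages(): whole pages, packed with descriptors. */
	desc_pages = calloc(num_desc_pages, sizeof(*desc_pages));
	for (i = 0; i < num_desc_pages; i++)
		desc_pages[i] = calloc(per_page, sizeof(struct h1_desc));

	/*
	 * Like via_map_for_device(): one descriptor per system page, each
	 * pointing at the descriptor built before it. The head handed to
	 * the engine (chain_start) is therefore the newest descriptor, and
	 * the hardware traverses the chain in reverse build order.
	 */
	desc = desc_pages[0];
	for (i = 0; i < num_pages; i++) {
		desc->mem_addr = 0x100000UL + i * MODEL_PAGE_SIZE; /* fake bus addr */
		desc->dev_addr = i * MODEL_PAGE_SIZE;   /* dev_start + offset */
		desc->size = MODEL_PAGE_SIZE / 16;
		desc->next = chain_start;  /* NULL on the first pass; the real
					      chain ends with VIA_DMA_DPR_EC */
		chain_start = desc++;
		if (++used >= per_page && i + 1 < num_pages) {
			used = 0;               /* hop to the next descriptor page */
			desc = desc_pages[++page];
		}
	}

	/* Like via_unmap_from_device(): walk the chain newest to oldest. */
	for (desc = chain_start; desc; desc = desc->next)
		printf("desc: mem 0x%lx -> dev 0x%lx, %lu x 16 bytes\n",
		       desc->mem_addr, desc->dev_addr, desc->size);

	for (i = 0; i < num_desc_pages; i++)
		free(desc_pages[i]);
	free(desc_pages);
	return 0;
}

Building the chain backwards like this is what lets via_map_for_device() hand each descriptor to dma_map_single() immediately after filling it in: the 'next' field is already final at map time, so no descriptor needs to be touched (and re-synced) once the device can see it, which is exactly the constraint the comment at the top of via_h1_dma.c describes.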