18c2ecf20Sopenharmony_ci/* via_dmablit.c -- PCI DMA BitBlt support for the VIA Unichrome/Pro
28c2ecf20Sopenharmony_ci *
38c2ecf20Sopenharmony_ci * Copyright (C) 2005 Thomas Hellstrom, All Rights Reserved.
48c2ecf20Sopenharmony_ci *
58c2ecf20Sopenharmony_ci * Permission is hereby granted, free of charge, to any person obtaining a
68c2ecf20Sopenharmony_ci * copy of this software and associated documentation files (the "Software"),
78c2ecf20Sopenharmony_ci * to deal in the Software without restriction, including without limitation
88c2ecf20Sopenharmony_ci * the rights to use, copy, modify, merge, publish, distribute, sub license,
98c2ecf20Sopenharmony_ci * and/or sell copies of the Software, and to permit persons to whom the
108c2ecf20Sopenharmony_ci * Software is furnished to do so, subject to the following conditions:
118c2ecf20Sopenharmony_ci *
128c2ecf20Sopenharmony_ci * The above copyright notice and this permission notice (including the
138c2ecf20Sopenharmony_ci * next paragraph) shall be included in all copies or substantial portions
148c2ecf20Sopenharmony_ci * of the Software.
158c2ecf20Sopenharmony_ci *
168c2ecf20Sopenharmony_ci * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
178c2ecf20Sopenharmony_ci * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
188c2ecf20Sopenharmony_ci * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
198c2ecf20Sopenharmony_ci * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
208c2ecf20Sopenharmony_ci * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
218c2ecf20Sopenharmony_ci * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
228c2ecf20Sopenharmony_ci * USE OR OTHER DEALINGS IN THE SOFTWARE.
238c2ecf20Sopenharmony_ci *
248c2ecf20Sopenharmony_ci * Authors:
258c2ecf20Sopenharmony_ci *    Thomas Hellstrom.
268c2ecf20Sopenharmony_ci *    Partially based on code obtained from Digeo Inc.
278c2ecf20Sopenharmony_ci */
288c2ecf20Sopenharmony_ci
298c2ecf20Sopenharmony_ci
308c2ecf20Sopenharmony_ci/*
318c2ecf20Sopenharmony_ci * Unmaps the DMA mappings.
328c2ecf20Sopenharmony_ci * FIXME: Is this a NoOp on x86? Also
338c2ecf20Sopenharmony_ci * FIXME: What happens if this one is called and a pending blit has previously done
348c2ecf20Sopenharmony_ci * the same DMA mappings?
358c2ecf20Sopenharmony_ci */
368c2ecf20Sopenharmony_ci
378c2ecf20Sopenharmony_ci#include <linux/pagemap.h>
388c2ecf20Sopenharmony_ci#include <linux/pci.h>
398c2ecf20Sopenharmony_ci#include <linux/slab.h>
408c2ecf20Sopenharmony_ci#include <linux/vmalloc.h>
418c2ecf20Sopenharmony_ci
428c2ecf20Sopenharmony_ci#include <drm/drm_device.h>
438c2ecf20Sopenharmony_ci#include <drm/via_drm.h>
448c2ecf20Sopenharmony_ci
458c2ecf20Sopenharmony_ci#include "via_dmablit.h"
468c2ecf20Sopenharmony_ci#include "via_drv.h"
478c2ecf20Sopenharmony_ci
488c2ecf20Sopenharmony_ci#define VIA_PGDN(x)	     (((unsigned long)(x)) & PAGE_MASK)
498c2ecf20Sopenharmony_ci#define VIA_PGOFF(x)	    (((unsigned long)(x)) & ~PAGE_MASK)
508c2ecf20Sopenharmony_ci#define VIA_PFN(x)	      ((unsigned long)(x) >> PAGE_SHIFT)
518c2ecf20Sopenharmony_ci
528c2ecf20Sopenharmony_citypedef struct _drm_via_descriptor {
538c2ecf20Sopenharmony_ci	uint32_t mem_addr;
548c2ecf20Sopenharmony_ci	uint32_t dev_addr;
558c2ecf20Sopenharmony_ci	uint32_t size;
568c2ecf20Sopenharmony_ci	uint32_t next;
578c2ecf20Sopenharmony_ci} drm_via_descriptor_t;
588c2ecf20Sopenharmony_ci
598c2ecf20Sopenharmony_ci
608c2ecf20Sopenharmony_ci/*
618c2ecf20Sopenharmony_ci * Unmap a DMA mapping.
628c2ecf20Sopenharmony_ci */
638c2ecf20Sopenharmony_ci
648c2ecf20Sopenharmony_ci
658c2ecf20Sopenharmony_ci
668c2ecf20Sopenharmony_cistatic void
678c2ecf20Sopenharmony_civia_unmap_blit_from_device(struct pci_dev *pdev, drm_via_sg_info_t *vsg)
688c2ecf20Sopenharmony_ci{
698c2ecf20Sopenharmony_ci	int num_desc = vsg->num_desc;
708c2ecf20Sopenharmony_ci	unsigned cur_descriptor_page = num_desc / vsg->descriptors_per_page;
718c2ecf20Sopenharmony_ci	unsigned descriptor_this_page = num_desc % vsg->descriptors_per_page;
728c2ecf20Sopenharmony_ci	drm_via_descriptor_t *desc_ptr = vsg->desc_pages[cur_descriptor_page] +
738c2ecf20Sopenharmony_ci		descriptor_this_page;
748c2ecf20Sopenharmony_ci	dma_addr_t next = vsg->chain_start;
758c2ecf20Sopenharmony_ci
768c2ecf20Sopenharmony_ci	while (num_desc--) {
778c2ecf20Sopenharmony_ci		if (descriptor_this_page-- == 0) {
788c2ecf20Sopenharmony_ci			cur_descriptor_page--;
798c2ecf20Sopenharmony_ci			descriptor_this_page = vsg->descriptors_per_page - 1;
808c2ecf20Sopenharmony_ci			desc_ptr = vsg->desc_pages[cur_descriptor_page] +
818c2ecf20Sopenharmony_ci				descriptor_this_page;
828c2ecf20Sopenharmony_ci		}
838c2ecf20Sopenharmony_ci		dma_unmap_single(&pdev->dev, next, sizeof(*desc_ptr), DMA_TO_DEVICE);
848c2ecf20Sopenharmony_ci		dma_unmap_page(&pdev->dev, desc_ptr->mem_addr, desc_ptr->size, vsg->direction);
858c2ecf20Sopenharmony_ci		next = (dma_addr_t) desc_ptr->next;
868c2ecf20Sopenharmony_ci		desc_ptr--;
878c2ecf20Sopenharmony_ci	}
888c2ecf20Sopenharmony_ci}
898c2ecf20Sopenharmony_ci
908c2ecf20Sopenharmony_ci/*
918c2ecf20Sopenharmony_ci * If mode = 0, count how many descriptors are needed.
928c2ecf20Sopenharmony_ci * If mode = 1, Map the DMA pages for the device, put together and map also the descriptors.
938c2ecf20Sopenharmony_ci * Descriptors are run in reverse order by the hardware because we are not allowed to update the
948c2ecf20Sopenharmony_ci * 'next' field without syncing calls when the descriptor is already mapped.
958c2ecf20Sopenharmony_ci */
968c2ecf20Sopenharmony_ci
978c2ecf20Sopenharmony_cistatic void
988c2ecf20Sopenharmony_civia_map_blit_for_device(struct pci_dev *pdev,
998c2ecf20Sopenharmony_ci		   const drm_via_dmablit_t *xfer,
1008c2ecf20Sopenharmony_ci		   drm_via_sg_info_t *vsg,
1018c2ecf20Sopenharmony_ci		   int mode)
1028c2ecf20Sopenharmony_ci{
1038c2ecf20Sopenharmony_ci	unsigned cur_descriptor_page = 0;
1048c2ecf20Sopenharmony_ci	unsigned num_descriptors_this_page = 0;
1058c2ecf20Sopenharmony_ci	unsigned char *mem_addr = xfer->mem_addr;
1068c2ecf20Sopenharmony_ci	unsigned char *cur_mem;
1078c2ecf20Sopenharmony_ci	unsigned char *first_addr = (unsigned char *)VIA_PGDN(mem_addr);
1088c2ecf20Sopenharmony_ci	uint32_t fb_addr = xfer->fb_addr;
1098c2ecf20Sopenharmony_ci	uint32_t cur_fb;
1108c2ecf20Sopenharmony_ci	unsigned long line_len;
1118c2ecf20Sopenharmony_ci	unsigned remaining_len;
1128c2ecf20Sopenharmony_ci	int num_desc = 0;
1138c2ecf20Sopenharmony_ci	int cur_line;
1148c2ecf20Sopenharmony_ci	dma_addr_t next = 0 | VIA_DMA_DPR_EC;
1158c2ecf20Sopenharmony_ci	drm_via_descriptor_t *desc_ptr = NULL;
1168c2ecf20Sopenharmony_ci
1178c2ecf20Sopenharmony_ci	if (mode == 1)
1188c2ecf20Sopenharmony_ci		desc_ptr = vsg->desc_pages[cur_descriptor_page];
1198c2ecf20Sopenharmony_ci
1208c2ecf20Sopenharmony_ci	for (cur_line = 0; cur_line < xfer->num_lines; ++cur_line) {
1218c2ecf20Sopenharmony_ci
1228c2ecf20Sopenharmony_ci		line_len = xfer->line_length;
1238c2ecf20Sopenharmony_ci		cur_fb = fb_addr;
1248c2ecf20Sopenharmony_ci		cur_mem = mem_addr;
1258c2ecf20Sopenharmony_ci
1268c2ecf20Sopenharmony_ci		while (line_len > 0) {
1278c2ecf20Sopenharmony_ci
1288c2ecf20Sopenharmony_ci			remaining_len = min(PAGE_SIZE-VIA_PGOFF(cur_mem), line_len);
1298c2ecf20Sopenharmony_ci			line_len -= remaining_len;
1308c2ecf20Sopenharmony_ci
1318c2ecf20Sopenharmony_ci			if (mode == 1) {
1328c2ecf20Sopenharmony_ci				desc_ptr->mem_addr =
1338c2ecf20Sopenharmony_ci					dma_map_page(&pdev->dev,
1348c2ecf20Sopenharmony_ci						     vsg->pages[VIA_PFN(cur_mem) -
1358c2ecf20Sopenharmony_ci								VIA_PFN(first_addr)],
1368c2ecf20Sopenharmony_ci						     VIA_PGOFF(cur_mem), remaining_len,
1378c2ecf20Sopenharmony_ci						     vsg->direction);
1388c2ecf20Sopenharmony_ci				desc_ptr->dev_addr = cur_fb;
1398c2ecf20Sopenharmony_ci
1408c2ecf20Sopenharmony_ci				desc_ptr->size = remaining_len;
1418c2ecf20Sopenharmony_ci				desc_ptr->next = (uint32_t) next;
1428c2ecf20Sopenharmony_ci				next = dma_map_single(&pdev->dev, desc_ptr, sizeof(*desc_ptr),
1438c2ecf20Sopenharmony_ci						      DMA_TO_DEVICE);
1448c2ecf20Sopenharmony_ci				desc_ptr++;
1458c2ecf20Sopenharmony_ci				if (++num_descriptors_this_page >= vsg->descriptors_per_page) {
1468c2ecf20Sopenharmony_ci					num_descriptors_this_page = 0;
1478c2ecf20Sopenharmony_ci					desc_ptr = vsg->desc_pages[++cur_descriptor_page];
1488c2ecf20Sopenharmony_ci				}
1498c2ecf20Sopenharmony_ci			}
1508c2ecf20Sopenharmony_ci
1518c2ecf20Sopenharmony_ci			num_desc++;
1528c2ecf20Sopenharmony_ci			cur_mem += remaining_len;
1538c2ecf20Sopenharmony_ci			cur_fb += remaining_len;
1548c2ecf20Sopenharmony_ci		}
1558c2ecf20Sopenharmony_ci
1568c2ecf20Sopenharmony_ci		mem_addr += xfer->mem_stride;
1578c2ecf20Sopenharmony_ci		fb_addr += xfer->fb_stride;
1588c2ecf20Sopenharmony_ci	}
1598c2ecf20Sopenharmony_ci
1608c2ecf20Sopenharmony_ci	if (mode == 1) {
1618c2ecf20Sopenharmony_ci		vsg->chain_start = next;
1628c2ecf20Sopenharmony_ci		vsg->state = dr_via_device_mapped;
1638c2ecf20Sopenharmony_ci	}
1648c2ecf20Sopenharmony_ci	vsg->num_desc = num_desc;
1658c2ecf20Sopenharmony_ci}
1668c2ecf20Sopenharmony_ci
1678c2ecf20Sopenharmony_ci/*
1688c2ecf20Sopenharmony_ci * Function that frees up all resources for a blit. It is usable even if the
1698c2ecf20Sopenharmony_ci * blit info has only been partially built as long as the status enum is consistent
1708c2ecf20Sopenharmony_ci * with the actual status of the used resources.
1718c2ecf20Sopenharmony_ci */
1728c2ecf20Sopenharmony_ci
1738c2ecf20Sopenharmony_ci
1748c2ecf20Sopenharmony_cistatic void
1758c2ecf20Sopenharmony_civia_free_sg_info(struct pci_dev *pdev, drm_via_sg_info_t *vsg)
1768c2ecf20Sopenharmony_ci{
1778c2ecf20Sopenharmony_ci	int i;
1788c2ecf20Sopenharmony_ci
1798c2ecf20Sopenharmony_ci	switch (vsg->state) {
1808c2ecf20Sopenharmony_ci	case dr_via_device_mapped:
1818c2ecf20Sopenharmony_ci		via_unmap_blit_from_device(pdev, vsg);
1828c2ecf20Sopenharmony_ci		fallthrough;
1838c2ecf20Sopenharmony_ci	case dr_via_desc_pages_alloc:
1848c2ecf20Sopenharmony_ci		for (i = 0; i < vsg->num_desc_pages; ++i) {
1858c2ecf20Sopenharmony_ci			if (vsg->desc_pages[i] != NULL)
1868c2ecf20Sopenharmony_ci				free_page((unsigned long)vsg->desc_pages[i]);
1878c2ecf20Sopenharmony_ci		}
1888c2ecf20Sopenharmony_ci		kfree(vsg->desc_pages);
1898c2ecf20Sopenharmony_ci		fallthrough;
1908c2ecf20Sopenharmony_ci	case dr_via_pages_locked:
1918c2ecf20Sopenharmony_ci		unpin_user_pages_dirty_lock(vsg->pages, vsg->num_pages,
1928c2ecf20Sopenharmony_ci					   (vsg->direction == DMA_FROM_DEVICE));
1938c2ecf20Sopenharmony_ci		fallthrough;
1948c2ecf20Sopenharmony_ci	case dr_via_pages_alloc:
1958c2ecf20Sopenharmony_ci		vfree(vsg->pages);
1968c2ecf20Sopenharmony_ci		fallthrough;
1978c2ecf20Sopenharmony_ci	default:
1988c2ecf20Sopenharmony_ci		vsg->state = dr_via_sg_init;
1998c2ecf20Sopenharmony_ci	}
2008c2ecf20Sopenharmony_ci	vfree(vsg->bounce_buffer);
2018c2ecf20Sopenharmony_ci	vsg->bounce_buffer = NULL;
2028c2ecf20Sopenharmony_ci	vsg->free_on_sequence = 0;
2038c2ecf20Sopenharmony_ci}
2048c2ecf20Sopenharmony_ci
2058c2ecf20Sopenharmony_ci/*
2068c2ecf20Sopenharmony_ci * Fire a blit engine.
2078c2ecf20Sopenharmony_ci */
2088c2ecf20Sopenharmony_ci
2098c2ecf20Sopenharmony_cistatic void
2108c2ecf20Sopenharmony_civia_fire_dmablit(struct drm_device *dev, drm_via_sg_info_t *vsg, int engine)
2118c2ecf20Sopenharmony_ci{
2128c2ecf20Sopenharmony_ci	drm_via_private_t *dev_priv = (drm_via_private_t *)dev->dev_private;
2138c2ecf20Sopenharmony_ci
2148c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_MAR0 + engine*0x10, 0);
2158c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_DAR0 + engine*0x10, 0);
2168c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_CSR0 + engine*0x04, VIA_DMA_CSR_DD | VIA_DMA_CSR_TD |
2178c2ecf20Sopenharmony_ci		  VIA_DMA_CSR_DE);
2188c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_MR0  + engine*0x04, VIA_DMA_MR_CM | VIA_DMA_MR_TDIE);
2198c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_BCR0 + engine*0x10, 0);
2208c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_DPR0 + engine*0x10, vsg->chain_start);
2218c2ecf20Sopenharmony_ci	wmb();
2228c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_CSR0 + engine*0x04, VIA_DMA_CSR_DE | VIA_DMA_CSR_TS);
2238c2ecf20Sopenharmony_ci	via_read(dev_priv, VIA_PCI_DMA_CSR0 + engine*0x04);
2248c2ecf20Sopenharmony_ci}
2258c2ecf20Sopenharmony_ci
2268c2ecf20Sopenharmony_ci/*
2278c2ecf20Sopenharmony_ci * Obtain a page pointer array and lock all pages into system memory. A segmentation violation will
2288c2ecf20Sopenharmony_ci * occur here if the calling user does not have access to the submitted address.
2298c2ecf20Sopenharmony_ci */
2308c2ecf20Sopenharmony_ci
2318c2ecf20Sopenharmony_cistatic int
2328c2ecf20Sopenharmony_civia_lock_all_dma_pages(drm_via_sg_info_t *vsg,  drm_via_dmablit_t *xfer)
2338c2ecf20Sopenharmony_ci{
2348c2ecf20Sopenharmony_ci	int ret;
2358c2ecf20Sopenharmony_ci	unsigned long first_pfn = VIA_PFN(xfer->mem_addr);
2368c2ecf20Sopenharmony_ci	vsg->num_pages = VIA_PFN(xfer->mem_addr + (xfer->num_lines * xfer->mem_stride - 1)) -
2378c2ecf20Sopenharmony_ci		first_pfn + 1;
2388c2ecf20Sopenharmony_ci
2398c2ecf20Sopenharmony_ci	vsg->pages = vzalloc(array_size(sizeof(struct page *), vsg->num_pages));
2408c2ecf20Sopenharmony_ci	if (NULL == vsg->pages)
2418c2ecf20Sopenharmony_ci		return -ENOMEM;
2428c2ecf20Sopenharmony_ci	ret = pin_user_pages_fast((unsigned long)xfer->mem_addr,
2438c2ecf20Sopenharmony_ci			vsg->num_pages,
2448c2ecf20Sopenharmony_ci			vsg->direction == DMA_FROM_DEVICE ? FOLL_WRITE : 0,
2458c2ecf20Sopenharmony_ci			vsg->pages);
2468c2ecf20Sopenharmony_ci	if (ret != vsg->num_pages) {
2478c2ecf20Sopenharmony_ci		if (ret < 0)
2488c2ecf20Sopenharmony_ci			return ret;
2498c2ecf20Sopenharmony_ci		vsg->state = dr_via_pages_locked;
2508c2ecf20Sopenharmony_ci		return -EINVAL;
2518c2ecf20Sopenharmony_ci	}
2528c2ecf20Sopenharmony_ci	vsg->state = dr_via_pages_locked;
2538c2ecf20Sopenharmony_ci	DRM_DEBUG("DMA pages locked\n");
2548c2ecf20Sopenharmony_ci	return 0;
2558c2ecf20Sopenharmony_ci}
2568c2ecf20Sopenharmony_ci
2578c2ecf20Sopenharmony_ci/*
2588c2ecf20Sopenharmony_ci * Allocate DMA capable memory for the blit descriptor chain, and an array that keeps track of the
2598c2ecf20Sopenharmony_ci * pages we allocate. We don't want to use kmalloc for the descriptor chain because it may be
2608c2ecf20Sopenharmony_ci * quite large for some blits, and pages don't need to be contiguous.
2618c2ecf20Sopenharmony_ci */
2628c2ecf20Sopenharmony_ci
2638c2ecf20Sopenharmony_cistatic int
2648c2ecf20Sopenharmony_civia_alloc_desc_pages(drm_via_sg_info_t *vsg)
2658c2ecf20Sopenharmony_ci{
2668c2ecf20Sopenharmony_ci	int i;
2678c2ecf20Sopenharmony_ci
2688c2ecf20Sopenharmony_ci	vsg->descriptors_per_page = PAGE_SIZE / sizeof(drm_via_descriptor_t);
2698c2ecf20Sopenharmony_ci	vsg->num_desc_pages = (vsg->num_desc + vsg->descriptors_per_page - 1) /
2708c2ecf20Sopenharmony_ci		vsg->descriptors_per_page;
2718c2ecf20Sopenharmony_ci
2728c2ecf20Sopenharmony_ci	if (NULL ==  (vsg->desc_pages = kcalloc(vsg->num_desc_pages, sizeof(void *), GFP_KERNEL)))
2738c2ecf20Sopenharmony_ci		return -ENOMEM;
2748c2ecf20Sopenharmony_ci
2758c2ecf20Sopenharmony_ci	vsg->state = dr_via_desc_pages_alloc;
2768c2ecf20Sopenharmony_ci	for (i = 0; i < vsg->num_desc_pages; ++i) {
2778c2ecf20Sopenharmony_ci		if (NULL == (vsg->desc_pages[i] =
2788c2ecf20Sopenharmony_ci			     (drm_via_descriptor_t *) __get_free_page(GFP_KERNEL)))
2798c2ecf20Sopenharmony_ci			return -ENOMEM;
2808c2ecf20Sopenharmony_ci	}
2818c2ecf20Sopenharmony_ci	DRM_DEBUG("Allocated %d pages for %d descriptors.\n", vsg->num_desc_pages,
2828c2ecf20Sopenharmony_ci		  vsg->num_desc);
2838c2ecf20Sopenharmony_ci	return 0;
2848c2ecf20Sopenharmony_ci}
2858c2ecf20Sopenharmony_ci
2868c2ecf20Sopenharmony_cistatic void
2878c2ecf20Sopenharmony_civia_abort_dmablit(struct drm_device *dev, int engine)
2888c2ecf20Sopenharmony_ci{
2898c2ecf20Sopenharmony_ci	drm_via_private_t *dev_priv = (drm_via_private_t *)dev->dev_private;
2908c2ecf20Sopenharmony_ci
2918c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_CSR0 + engine*0x04, VIA_DMA_CSR_TA);
2928c2ecf20Sopenharmony_ci}
2938c2ecf20Sopenharmony_ci
2948c2ecf20Sopenharmony_cistatic void
2958c2ecf20Sopenharmony_civia_dmablit_engine_off(struct drm_device *dev, int engine)
2968c2ecf20Sopenharmony_ci{
2978c2ecf20Sopenharmony_ci	drm_via_private_t *dev_priv = (drm_via_private_t *)dev->dev_private;
2988c2ecf20Sopenharmony_ci
2998c2ecf20Sopenharmony_ci	via_write(dev_priv, VIA_PCI_DMA_CSR0 + engine*0x04, VIA_DMA_CSR_TD | VIA_DMA_CSR_DD);
3008c2ecf20Sopenharmony_ci}
3018c2ecf20Sopenharmony_ci
3028c2ecf20Sopenharmony_ci
3038c2ecf20Sopenharmony_ci
3048c2ecf20Sopenharmony_ci/*
3058c2ecf20Sopenharmony_ci * The dmablit part of the IRQ handler. Trying to do only reasonably fast things here.
3068c2ecf20Sopenharmony_ci * The rest, like unmapping and freeing memory for done blits is done in a separate workqueue
3078c2ecf20Sopenharmony_ci * task. Basically the task of the interrupt handler is to submit a new blit to the engine, while
3088c2ecf20Sopenharmony_ci * the workqueue task takes care of processing associated with the old blit.
3098c2ecf20Sopenharmony_ci */
3108c2ecf20Sopenharmony_ci
3118c2ecf20Sopenharmony_civoid
3128c2ecf20Sopenharmony_civia_dmablit_handler(struct drm_device *dev, int engine, int from_irq)
3138c2ecf20Sopenharmony_ci{
3148c2ecf20Sopenharmony_ci	drm_via_private_t *dev_priv = (drm_via_private_t *)dev->dev_private;
3158c2ecf20Sopenharmony_ci	drm_via_blitq_t *blitq = dev_priv->blit_queues + engine;
3168c2ecf20Sopenharmony_ci	int cur;
3178c2ecf20Sopenharmony_ci	int done_transfer;
3188c2ecf20Sopenharmony_ci	unsigned long irqsave = 0;
3198c2ecf20Sopenharmony_ci	uint32_t status = 0;
3208c2ecf20Sopenharmony_ci
3218c2ecf20Sopenharmony_ci	DRM_DEBUG("DMA blit handler called. engine = %d, from_irq = %d, blitq = 0x%lx\n",
3228c2ecf20Sopenharmony_ci		  engine, from_irq, (unsigned long) blitq);
3238c2ecf20Sopenharmony_ci
3248c2ecf20Sopenharmony_ci	if (from_irq)
3258c2ecf20Sopenharmony_ci		spin_lock(&blitq->blit_lock);
3268c2ecf20Sopenharmony_ci	else
3278c2ecf20Sopenharmony_ci		spin_lock_irqsave(&blitq->blit_lock, irqsave);
3288c2ecf20Sopenharmony_ci
3298c2ecf20Sopenharmony_ci	done_transfer = blitq->is_active &&
3308c2ecf20Sopenharmony_ci	  ((status = via_read(dev_priv, VIA_PCI_DMA_CSR0 + engine*0x04)) & VIA_DMA_CSR_TD);
3318c2ecf20Sopenharmony_ci	done_transfer = done_transfer || (blitq->aborting && !(status & VIA_DMA_CSR_DE));
3328c2ecf20Sopenharmony_ci
3338c2ecf20Sopenharmony_ci	cur = blitq->cur;
3348c2ecf20Sopenharmony_ci	if (done_transfer) {
3358c2ecf20Sopenharmony_ci
3368c2ecf20Sopenharmony_ci		blitq->blits[cur]->aborted = blitq->aborting;
3378c2ecf20Sopenharmony_ci		blitq->done_blit_handle++;
3388c2ecf20Sopenharmony_ci		wake_up(blitq->blit_queue + cur);
3398c2ecf20Sopenharmony_ci
3408c2ecf20Sopenharmony_ci		cur++;
3418c2ecf20Sopenharmony_ci		if (cur >= VIA_NUM_BLIT_SLOTS)
3428c2ecf20Sopenharmony_ci			cur = 0;
3438c2ecf20Sopenharmony_ci		blitq->cur = cur;
3448c2ecf20Sopenharmony_ci
3458c2ecf20Sopenharmony_ci		/*
3468c2ecf20Sopenharmony_ci		 * Clear transfer done flag.
3478c2ecf20Sopenharmony_ci		 */
3488c2ecf20Sopenharmony_ci
3498c2ecf20Sopenharmony_ci		via_write(dev_priv, VIA_PCI_DMA_CSR0 + engine*0x04,  VIA_DMA_CSR_TD);
3508c2ecf20Sopenharmony_ci
3518c2ecf20Sopenharmony_ci		blitq->is_active = 0;
3528c2ecf20Sopenharmony_ci		blitq->aborting = 0;
3538c2ecf20Sopenharmony_ci		schedule_work(&blitq->wq);
3548c2ecf20Sopenharmony_ci
3558c2ecf20Sopenharmony_ci	} else if (blitq->is_active && time_after_eq(jiffies, blitq->end)) {
3568c2ecf20Sopenharmony_ci
3578c2ecf20Sopenharmony_ci		/*
3588c2ecf20Sopenharmony_ci		 * Abort transfer after one second.
3598c2ecf20Sopenharmony_ci		 */
3608c2ecf20Sopenharmony_ci
3618c2ecf20Sopenharmony_ci		via_abort_dmablit(dev, engine);
3628c2ecf20Sopenharmony_ci		blitq->aborting = 1;
3638c2ecf20Sopenharmony_ci		blitq->end = jiffies + HZ;
3648c2ecf20Sopenharmony_ci	}
3658c2ecf20Sopenharmony_ci
3668c2ecf20Sopenharmony_ci	if (!blitq->is_active) {
3678c2ecf20Sopenharmony_ci		if (blitq->num_outstanding) {
3688c2ecf20Sopenharmony_ci			via_fire_dmablit(dev, blitq->blits[cur], engine);
3698c2ecf20Sopenharmony_ci			blitq->is_active = 1;
3708c2ecf20Sopenharmony_ci			blitq->cur = cur;
3718c2ecf20Sopenharmony_ci			blitq->num_outstanding--;
3728c2ecf20Sopenharmony_ci			blitq->end = jiffies + HZ;
3738c2ecf20Sopenharmony_ci			if (!timer_pending(&blitq->poll_timer))
3748c2ecf20Sopenharmony_ci				mod_timer(&blitq->poll_timer, jiffies + 1);
3758c2ecf20Sopenharmony_ci		} else {
3768c2ecf20Sopenharmony_ci			if (timer_pending(&blitq->poll_timer))
3778c2ecf20Sopenharmony_ci				del_timer(&blitq->poll_timer);
3788c2ecf20Sopenharmony_ci			via_dmablit_engine_off(dev, engine);
3798c2ecf20Sopenharmony_ci		}
3808c2ecf20Sopenharmony_ci	}
3818c2ecf20Sopenharmony_ci
3828c2ecf20Sopenharmony_ci	if (from_irq)
3838c2ecf20Sopenharmony_ci		spin_unlock(&blitq->blit_lock);
3848c2ecf20Sopenharmony_ci	else
3858c2ecf20Sopenharmony_ci		spin_unlock_irqrestore(&blitq->blit_lock, irqsave);
3868c2ecf20Sopenharmony_ci}
3878c2ecf20Sopenharmony_ci
3888c2ecf20Sopenharmony_ci
3898c2ecf20Sopenharmony_ci
3908c2ecf20Sopenharmony_ci/*
3918c2ecf20Sopenharmony_ci * Check whether this blit is still active, performing necessary locking.
3928c2ecf20Sopenharmony_ci */
3938c2ecf20Sopenharmony_ci
3948c2ecf20Sopenharmony_cistatic int
3958c2ecf20Sopenharmony_civia_dmablit_active(drm_via_blitq_t *blitq, int engine, uint32_t handle, wait_queue_head_t **queue)
3968c2ecf20Sopenharmony_ci{
3978c2ecf20Sopenharmony_ci	unsigned long irqsave;
3988c2ecf20Sopenharmony_ci	uint32_t slot;
3998c2ecf20Sopenharmony_ci	int active;
4008c2ecf20Sopenharmony_ci
4018c2ecf20Sopenharmony_ci	spin_lock_irqsave(&blitq->blit_lock, irqsave);
4028c2ecf20Sopenharmony_ci
4038c2ecf20Sopenharmony_ci	/*
4048c2ecf20Sopenharmony_ci	 * Allow for handle wraparounds.
4058c2ecf20Sopenharmony_ci	 */
4068c2ecf20Sopenharmony_ci
4078c2ecf20Sopenharmony_ci	active = ((blitq->done_blit_handle - handle) > (1 << 23)) &&
4088c2ecf20Sopenharmony_ci		((blitq->cur_blit_handle - handle) <= (1 << 23));
4098c2ecf20Sopenharmony_ci
4108c2ecf20Sopenharmony_ci	if (queue && active) {
4118c2ecf20Sopenharmony_ci		slot = handle - blitq->done_blit_handle + blitq->cur - 1;
4128c2ecf20Sopenharmony_ci		if (slot >= VIA_NUM_BLIT_SLOTS)
4138c2ecf20Sopenharmony_ci			slot -= VIA_NUM_BLIT_SLOTS;
4148c2ecf20Sopenharmony_ci		*queue = blitq->blit_queue + slot;
4158c2ecf20Sopenharmony_ci	}
4168c2ecf20Sopenharmony_ci
4178c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&blitq->blit_lock, irqsave);
4188c2ecf20Sopenharmony_ci
4198c2ecf20Sopenharmony_ci	return active;
4208c2ecf20Sopenharmony_ci}
4218c2ecf20Sopenharmony_ci
4228c2ecf20Sopenharmony_ci/*
4238c2ecf20Sopenharmony_ci * Sync. Wait for at least three seconds for the blit to be performed.
4248c2ecf20Sopenharmony_ci */
4258c2ecf20Sopenharmony_ci
4268c2ecf20Sopenharmony_cistatic int
4278c2ecf20Sopenharmony_civia_dmablit_sync(struct drm_device *dev, uint32_t handle, int engine)
4288c2ecf20Sopenharmony_ci{
4298c2ecf20Sopenharmony_ci
4308c2ecf20Sopenharmony_ci	drm_via_private_t *dev_priv = (drm_via_private_t *)dev->dev_private;
4318c2ecf20Sopenharmony_ci	drm_via_blitq_t *blitq = dev_priv->blit_queues + engine;
4328c2ecf20Sopenharmony_ci	wait_queue_head_t *queue;
4338c2ecf20Sopenharmony_ci	int ret = 0;
4348c2ecf20Sopenharmony_ci
4358c2ecf20Sopenharmony_ci	if (via_dmablit_active(blitq, engine, handle, &queue)) {
4368c2ecf20Sopenharmony_ci		VIA_WAIT_ON(ret, *queue, 3 * HZ,
4378c2ecf20Sopenharmony_ci			    !via_dmablit_active(blitq, engine, handle, NULL));
4388c2ecf20Sopenharmony_ci	}
4398c2ecf20Sopenharmony_ci	DRM_DEBUG("DMA blit sync handle 0x%x engine %d returned %d\n",
4408c2ecf20Sopenharmony_ci		  handle, engine, ret);
4418c2ecf20Sopenharmony_ci
4428c2ecf20Sopenharmony_ci	return ret;
4438c2ecf20Sopenharmony_ci}
4448c2ecf20Sopenharmony_ci
4458c2ecf20Sopenharmony_ci
4468c2ecf20Sopenharmony_ci/*
4478c2ecf20Sopenharmony_ci * A timer that regularly polls the blit engine in cases where we don't have interrupts:
4488c2ecf20Sopenharmony_ci * a) Broken hardware (typically those that don't have any video capture facility).
4498c2ecf20Sopenharmony_ci * b) Blit abort. The hardware doesn't send an interrupt when a blit is aborted.
4508c2ecf20Sopenharmony_ci * The timer and hardware IRQ's can and do work in parallel. If the hardware has
4518c2ecf20Sopenharmony_ci * irqs, it will shorten the latency somewhat.
4528c2ecf20Sopenharmony_ci */
4538c2ecf20Sopenharmony_ci
4548c2ecf20Sopenharmony_ci
4558c2ecf20Sopenharmony_ci
4568c2ecf20Sopenharmony_cistatic void
4578c2ecf20Sopenharmony_civia_dmablit_timer(struct timer_list *t)
4588c2ecf20Sopenharmony_ci{
4598c2ecf20Sopenharmony_ci	drm_via_blitq_t *blitq = from_timer(blitq, t, poll_timer);
4608c2ecf20Sopenharmony_ci	struct drm_device *dev = blitq->dev;
4618c2ecf20Sopenharmony_ci	int engine = (int)
4628c2ecf20Sopenharmony_ci		(blitq - ((drm_via_private_t *)dev->dev_private)->blit_queues);
4638c2ecf20Sopenharmony_ci
4648c2ecf20Sopenharmony_ci	DRM_DEBUG("Polling timer called for engine %d, jiffies %lu\n", engine,
4658c2ecf20Sopenharmony_ci		  (unsigned long) jiffies);
4668c2ecf20Sopenharmony_ci
4678c2ecf20Sopenharmony_ci	via_dmablit_handler(dev, engine, 0);
4688c2ecf20Sopenharmony_ci
4698c2ecf20Sopenharmony_ci	if (!timer_pending(&blitq->poll_timer)) {
4708c2ecf20Sopenharmony_ci		mod_timer(&blitq->poll_timer, jiffies + 1);
4718c2ecf20Sopenharmony_ci
4728c2ecf20Sopenharmony_ci	       /*
4738c2ecf20Sopenharmony_ci		* Rerun handler to delete timer if engines are off, and
4748c2ecf20Sopenharmony_ci		* to shorten abort latency. This is a little nasty.
4758c2ecf20Sopenharmony_ci		*/
4768c2ecf20Sopenharmony_ci
4778c2ecf20Sopenharmony_ci	       via_dmablit_handler(dev, engine, 0);
4788c2ecf20Sopenharmony_ci
4798c2ecf20Sopenharmony_ci	}
4808c2ecf20Sopenharmony_ci}
4818c2ecf20Sopenharmony_ci
4828c2ecf20Sopenharmony_ci
4838c2ecf20Sopenharmony_ci
4848c2ecf20Sopenharmony_ci
4858c2ecf20Sopenharmony_ci/*
4868c2ecf20Sopenharmony_ci * Workqueue task that frees data and mappings associated with a blit.
4878c2ecf20Sopenharmony_ci * Also wakes up waiting processes. Each of these tasks handles one
4888c2ecf20Sopenharmony_ci * blit engine only and may not be called on each interrupt.
4898c2ecf20Sopenharmony_ci */
4908c2ecf20Sopenharmony_ci
4918c2ecf20Sopenharmony_ci
4928c2ecf20Sopenharmony_cistatic void
4938c2ecf20Sopenharmony_civia_dmablit_workqueue(struct work_struct *work)
4948c2ecf20Sopenharmony_ci{
4958c2ecf20Sopenharmony_ci	drm_via_blitq_t *blitq = container_of(work, drm_via_blitq_t, wq);
4968c2ecf20Sopenharmony_ci	struct drm_device *dev = blitq->dev;
4978c2ecf20Sopenharmony_ci	unsigned long irqsave;
4988c2ecf20Sopenharmony_ci	drm_via_sg_info_t *cur_sg;
4998c2ecf20Sopenharmony_ci	int cur_released;
5008c2ecf20Sopenharmony_ci
5018c2ecf20Sopenharmony_ci
5028c2ecf20Sopenharmony_ci	DRM_DEBUG("Workqueue task called for blit engine %ld\n", (unsigned long)
5038c2ecf20Sopenharmony_ci		  (blitq - ((drm_via_private_t *)dev->dev_private)->blit_queues));
5048c2ecf20Sopenharmony_ci
5058c2ecf20Sopenharmony_ci	spin_lock_irqsave(&blitq->blit_lock, irqsave);
5068c2ecf20Sopenharmony_ci
5078c2ecf20Sopenharmony_ci	while (blitq->serviced != blitq->cur) {
5088c2ecf20Sopenharmony_ci
5098c2ecf20Sopenharmony_ci		cur_released = blitq->serviced++;
5108c2ecf20Sopenharmony_ci
5118c2ecf20Sopenharmony_ci		DRM_DEBUG("Releasing blit slot %d\n", cur_released);
5128c2ecf20Sopenharmony_ci
5138c2ecf20Sopenharmony_ci		if (blitq->serviced >= VIA_NUM_BLIT_SLOTS)
5148c2ecf20Sopenharmony_ci			blitq->serviced = 0;
5158c2ecf20Sopenharmony_ci
5168c2ecf20Sopenharmony_ci		cur_sg = blitq->blits[cur_released];
5178c2ecf20Sopenharmony_ci		blitq->num_free++;
5188c2ecf20Sopenharmony_ci
5198c2ecf20Sopenharmony_ci		spin_unlock_irqrestore(&blitq->blit_lock, irqsave);
5208c2ecf20Sopenharmony_ci
5218c2ecf20Sopenharmony_ci		wake_up(&blitq->busy_queue);
5228c2ecf20Sopenharmony_ci
5238c2ecf20Sopenharmony_ci		via_free_sg_info(dev->pdev, cur_sg);
5248c2ecf20Sopenharmony_ci		kfree(cur_sg);
5258c2ecf20Sopenharmony_ci
5268c2ecf20Sopenharmony_ci		spin_lock_irqsave(&blitq->blit_lock, irqsave);
5278c2ecf20Sopenharmony_ci	}
5288c2ecf20Sopenharmony_ci
5298c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&blitq->blit_lock, irqsave);
5308c2ecf20Sopenharmony_ci}
5318c2ecf20Sopenharmony_ci
5328c2ecf20Sopenharmony_ci
5338c2ecf20Sopenharmony_ci/*
5348c2ecf20Sopenharmony_ci * Init all blit engines. Currently we use two, but some hardware have 4.
5358c2ecf20Sopenharmony_ci */
5368c2ecf20Sopenharmony_ci
5378c2ecf20Sopenharmony_ci
5388c2ecf20Sopenharmony_civoid
5398c2ecf20Sopenharmony_civia_init_dmablit(struct drm_device *dev)
5408c2ecf20Sopenharmony_ci{
5418c2ecf20Sopenharmony_ci	int i, j;
5428c2ecf20Sopenharmony_ci	drm_via_private_t *dev_priv = (drm_via_private_t *)dev->dev_private;
5438c2ecf20Sopenharmony_ci	drm_via_blitq_t *blitq;
5448c2ecf20Sopenharmony_ci
5458c2ecf20Sopenharmony_ci	pci_set_master(dev->pdev);
5468c2ecf20Sopenharmony_ci
5478c2ecf20Sopenharmony_ci	for (i = 0; i < VIA_NUM_BLIT_ENGINES; ++i) {
5488c2ecf20Sopenharmony_ci		blitq = dev_priv->blit_queues + i;
5498c2ecf20Sopenharmony_ci		blitq->dev = dev;
5508c2ecf20Sopenharmony_ci		blitq->cur_blit_handle = 0;
5518c2ecf20Sopenharmony_ci		blitq->done_blit_handle = 0;
5528c2ecf20Sopenharmony_ci		blitq->head = 0;
5538c2ecf20Sopenharmony_ci		blitq->cur = 0;
5548c2ecf20Sopenharmony_ci		blitq->serviced = 0;
5558c2ecf20Sopenharmony_ci		blitq->num_free = VIA_NUM_BLIT_SLOTS - 1;
5568c2ecf20Sopenharmony_ci		blitq->num_outstanding = 0;
5578c2ecf20Sopenharmony_ci		blitq->is_active = 0;
5588c2ecf20Sopenharmony_ci		blitq->aborting = 0;
5598c2ecf20Sopenharmony_ci		spin_lock_init(&blitq->blit_lock);
5608c2ecf20Sopenharmony_ci		for (j = 0; j < VIA_NUM_BLIT_SLOTS; ++j)
5618c2ecf20Sopenharmony_ci			init_waitqueue_head(blitq->blit_queue + j);
5628c2ecf20Sopenharmony_ci		init_waitqueue_head(&blitq->busy_queue);
5638c2ecf20Sopenharmony_ci		INIT_WORK(&blitq->wq, via_dmablit_workqueue);
5648c2ecf20Sopenharmony_ci		timer_setup(&blitq->poll_timer, via_dmablit_timer, 0);
5658c2ecf20Sopenharmony_ci	}
5668c2ecf20Sopenharmony_ci}
5678c2ecf20Sopenharmony_ci
5688c2ecf20Sopenharmony_ci/*
5698c2ecf20Sopenharmony_ci * Build all info and do all mappings required for a blit.
5708c2ecf20Sopenharmony_ci */
5718c2ecf20Sopenharmony_ci
5728c2ecf20Sopenharmony_ci
5738c2ecf20Sopenharmony_cistatic int
5748c2ecf20Sopenharmony_civia_build_sg_info(struct drm_device *dev, drm_via_sg_info_t *vsg, drm_via_dmablit_t *xfer)
5758c2ecf20Sopenharmony_ci{
5768c2ecf20Sopenharmony_ci	int draw = xfer->to_fb;
5778c2ecf20Sopenharmony_ci	int ret = 0;
5788c2ecf20Sopenharmony_ci
5798c2ecf20Sopenharmony_ci	vsg->direction = (draw) ? DMA_TO_DEVICE : DMA_FROM_DEVICE;
5808c2ecf20Sopenharmony_ci	vsg->bounce_buffer = NULL;
5818c2ecf20Sopenharmony_ci
5828c2ecf20Sopenharmony_ci	vsg->state = dr_via_sg_init;
5838c2ecf20Sopenharmony_ci
5848c2ecf20Sopenharmony_ci	if (xfer->num_lines <= 0 || xfer->line_length <= 0) {
5858c2ecf20Sopenharmony_ci		DRM_ERROR("Zero size bitblt.\n");
5868c2ecf20Sopenharmony_ci		return -EINVAL;
5878c2ecf20Sopenharmony_ci	}
5888c2ecf20Sopenharmony_ci
5898c2ecf20Sopenharmony_ci	/*
5908c2ecf20Sopenharmony_ci	 * Below check is a driver limitation, not a hardware one. We
5918c2ecf20Sopenharmony_ci	 * don't want to lock unused pages, and don't want to incoporate the
5928c2ecf20Sopenharmony_ci	 * extra logic of avoiding them. Make sure there are no.
5938c2ecf20Sopenharmony_ci	 * (Not a big limitation anyway.)
5948c2ecf20Sopenharmony_ci	 */
5958c2ecf20Sopenharmony_ci
5968c2ecf20Sopenharmony_ci	if ((xfer->mem_stride - xfer->line_length) > 2*PAGE_SIZE) {
5978c2ecf20Sopenharmony_ci		DRM_ERROR("Too large system memory stride. Stride: %d, "
5988c2ecf20Sopenharmony_ci			  "Length: %d\n", xfer->mem_stride, xfer->line_length);
5998c2ecf20Sopenharmony_ci		return -EINVAL;
6008c2ecf20Sopenharmony_ci	}
6018c2ecf20Sopenharmony_ci
6028c2ecf20Sopenharmony_ci	if ((xfer->mem_stride == xfer->line_length) &&
6038c2ecf20Sopenharmony_ci	   (xfer->fb_stride == xfer->line_length)) {
6048c2ecf20Sopenharmony_ci		xfer->mem_stride *= xfer->num_lines;
6058c2ecf20Sopenharmony_ci		xfer->line_length = xfer->mem_stride;
6068c2ecf20Sopenharmony_ci		xfer->fb_stride = xfer->mem_stride;
6078c2ecf20Sopenharmony_ci		xfer->num_lines = 1;
6088c2ecf20Sopenharmony_ci	}
6098c2ecf20Sopenharmony_ci
6108c2ecf20Sopenharmony_ci	/*
6118c2ecf20Sopenharmony_ci	 * Don't lock an arbitrary large number of pages, since that causes a
6128c2ecf20Sopenharmony_ci	 * DOS security hole.
6138c2ecf20Sopenharmony_ci	 */
6148c2ecf20Sopenharmony_ci
6158c2ecf20Sopenharmony_ci	if (xfer->num_lines > 2048 || (xfer->num_lines*xfer->mem_stride > (2048*2048*4))) {
6168c2ecf20Sopenharmony_ci		DRM_ERROR("Too large PCI DMA bitblt.\n");
6178c2ecf20Sopenharmony_ci		return -EINVAL;
6188c2ecf20Sopenharmony_ci	}
6198c2ecf20Sopenharmony_ci
6208c2ecf20Sopenharmony_ci	/*
6218c2ecf20Sopenharmony_ci	 * we allow a negative fb stride to allow flipping of images in
6228c2ecf20Sopenharmony_ci	 * transfer.
6238c2ecf20Sopenharmony_ci	 */
6248c2ecf20Sopenharmony_ci
6258c2ecf20Sopenharmony_ci	if (xfer->mem_stride < xfer->line_length ||
6268c2ecf20Sopenharmony_ci		abs(xfer->fb_stride) < xfer->line_length) {
6278c2ecf20Sopenharmony_ci		DRM_ERROR("Invalid frame-buffer / memory stride.\n");
6288c2ecf20Sopenharmony_ci		return -EINVAL;
6298c2ecf20Sopenharmony_ci	}
6308c2ecf20Sopenharmony_ci
6318c2ecf20Sopenharmony_ci	/*
6328c2ecf20Sopenharmony_ci	 * A hardware bug seems to be worked around if system memory addresses start on
6338c2ecf20Sopenharmony_ci	 * 16 byte boundaries. This seems a bit restrictive however. VIA is contacted
6348c2ecf20Sopenharmony_ci	 * about this. Meanwhile, impose the following restrictions:
6358c2ecf20Sopenharmony_ci	 */
6368c2ecf20Sopenharmony_ci
6378c2ecf20Sopenharmony_ci#ifdef VIA_BUGFREE
6388c2ecf20Sopenharmony_ci	if ((((unsigned long)xfer->mem_addr & 3) != ((unsigned long)xfer->fb_addr & 3)) ||
6398c2ecf20Sopenharmony_ci	    ((xfer->num_lines > 1) && ((xfer->mem_stride & 3) != (xfer->fb_stride & 3)))) {
6408c2ecf20Sopenharmony_ci		DRM_ERROR("Invalid DRM bitblt alignment.\n");
6418c2ecf20Sopenharmony_ci		return -EINVAL;
6428c2ecf20Sopenharmony_ci	}
6438c2ecf20Sopenharmony_ci#else
6448c2ecf20Sopenharmony_ci	if ((((unsigned long)xfer->mem_addr & 15) ||
6458c2ecf20Sopenharmony_ci	      ((unsigned long)xfer->fb_addr & 3)) ||
6468c2ecf20Sopenharmony_ci	   ((xfer->num_lines > 1) &&
6478c2ecf20Sopenharmony_ci	   ((xfer->mem_stride & 15) || (xfer->fb_stride & 3)))) {
6488c2ecf20Sopenharmony_ci		DRM_ERROR("Invalid DRM bitblt alignment.\n");
6498c2ecf20Sopenharmony_ci		return -EINVAL;
6508c2ecf20Sopenharmony_ci	}
6518c2ecf20Sopenharmony_ci#endif
6528c2ecf20Sopenharmony_ci
6538c2ecf20Sopenharmony_ci	if (0 != (ret = via_lock_all_dma_pages(vsg, xfer))) {
6548c2ecf20Sopenharmony_ci		DRM_ERROR("Could not lock DMA pages.\n");
6558c2ecf20Sopenharmony_ci		via_free_sg_info(dev->pdev, vsg);
6568c2ecf20Sopenharmony_ci		return ret;
6578c2ecf20Sopenharmony_ci	}
6588c2ecf20Sopenharmony_ci
6598c2ecf20Sopenharmony_ci	via_map_blit_for_device(dev->pdev, xfer, vsg, 0);
6608c2ecf20Sopenharmony_ci	if (0 != (ret = via_alloc_desc_pages(vsg))) {
6618c2ecf20Sopenharmony_ci		DRM_ERROR("Could not allocate DMA descriptor pages.\n");
6628c2ecf20Sopenharmony_ci		via_free_sg_info(dev->pdev, vsg);
6638c2ecf20Sopenharmony_ci		return ret;
6648c2ecf20Sopenharmony_ci	}
6658c2ecf20Sopenharmony_ci	via_map_blit_for_device(dev->pdev, xfer, vsg, 1);
6668c2ecf20Sopenharmony_ci
6678c2ecf20Sopenharmony_ci	return 0;
6688c2ecf20Sopenharmony_ci}
6698c2ecf20Sopenharmony_ci
6708c2ecf20Sopenharmony_ci
6718c2ecf20Sopenharmony_ci/*
6728c2ecf20Sopenharmony_ci * Reserve one free slot in the blit queue. Will wait for one second for one
6738c2ecf20Sopenharmony_ci * to become available. Otherwise -EBUSY is returned.
6748c2ecf20Sopenharmony_ci */
6758c2ecf20Sopenharmony_ci
6768c2ecf20Sopenharmony_cistatic int
6778c2ecf20Sopenharmony_civia_dmablit_grab_slot(drm_via_blitq_t *blitq, int engine)
6788c2ecf20Sopenharmony_ci{
6798c2ecf20Sopenharmony_ci	int ret = 0;
6808c2ecf20Sopenharmony_ci	unsigned long irqsave;
6818c2ecf20Sopenharmony_ci
6828c2ecf20Sopenharmony_ci	DRM_DEBUG("Num free is %d\n", blitq->num_free);
6838c2ecf20Sopenharmony_ci	spin_lock_irqsave(&blitq->blit_lock, irqsave);
6848c2ecf20Sopenharmony_ci	while (blitq->num_free == 0) {
6858c2ecf20Sopenharmony_ci		spin_unlock_irqrestore(&blitq->blit_lock, irqsave);
6868c2ecf20Sopenharmony_ci
6878c2ecf20Sopenharmony_ci		VIA_WAIT_ON(ret, blitq->busy_queue, HZ, blitq->num_free > 0);
6888c2ecf20Sopenharmony_ci		if (ret)
6898c2ecf20Sopenharmony_ci			return (-EINTR == ret) ? -EAGAIN : ret;
6908c2ecf20Sopenharmony_ci
6918c2ecf20Sopenharmony_ci		spin_lock_irqsave(&blitq->blit_lock, irqsave);
6928c2ecf20Sopenharmony_ci	}
6938c2ecf20Sopenharmony_ci
6948c2ecf20Sopenharmony_ci	blitq->num_free--;
6958c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&blitq->blit_lock, irqsave);
6968c2ecf20Sopenharmony_ci
6978c2ecf20Sopenharmony_ci	return 0;
6988c2ecf20Sopenharmony_ci}
6998c2ecf20Sopenharmony_ci
7008c2ecf20Sopenharmony_ci/*
7018c2ecf20Sopenharmony_ci * Hand back a free slot if we changed our mind.
7028c2ecf20Sopenharmony_ci */
7038c2ecf20Sopenharmony_ci
7048c2ecf20Sopenharmony_cistatic void
7058c2ecf20Sopenharmony_civia_dmablit_release_slot(drm_via_blitq_t *blitq)
7068c2ecf20Sopenharmony_ci{
7078c2ecf20Sopenharmony_ci	unsigned long irqsave;
7088c2ecf20Sopenharmony_ci
7098c2ecf20Sopenharmony_ci	spin_lock_irqsave(&blitq->blit_lock, irqsave);
7108c2ecf20Sopenharmony_ci	blitq->num_free++;
7118c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&blitq->blit_lock, irqsave);
7128c2ecf20Sopenharmony_ci	wake_up(&blitq->busy_queue);
7138c2ecf20Sopenharmony_ci}
7148c2ecf20Sopenharmony_ci
7158c2ecf20Sopenharmony_ci/*
7168c2ecf20Sopenharmony_ci * Grab a free slot. Build blit info and queue a blit.
7178c2ecf20Sopenharmony_ci */
7188c2ecf20Sopenharmony_ci
7198c2ecf20Sopenharmony_ci
7208c2ecf20Sopenharmony_cistatic int
7218c2ecf20Sopenharmony_civia_dmablit(struct drm_device *dev, drm_via_dmablit_t *xfer)
7228c2ecf20Sopenharmony_ci{
7238c2ecf20Sopenharmony_ci	drm_via_private_t *dev_priv = (drm_via_private_t *)dev->dev_private;
7248c2ecf20Sopenharmony_ci	drm_via_sg_info_t *vsg;
7258c2ecf20Sopenharmony_ci	drm_via_blitq_t *blitq;
7268c2ecf20Sopenharmony_ci	int ret;
7278c2ecf20Sopenharmony_ci	int engine;
7288c2ecf20Sopenharmony_ci	unsigned long irqsave;
7298c2ecf20Sopenharmony_ci
7308c2ecf20Sopenharmony_ci	if (dev_priv == NULL) {
7318c2ecf20Sopenharmony_ci		DRM_ERROR("Called without initialization.\n");
7328c2ecf20Sopenharmony_ci		return -EINVAL;
7338c2ecf20Sopenharmony_ci	}
7348c2ecf20Sopenharmony_ci
7358c2ecf20Sopenharmony_ci	engine = (xfer->to_fb) ? 0 : 1;
7368c2ecf20Sopenharmony_ci	blitq = dev_priv->blit_queues + engine;
7378c2ecf20Sopenharmony_ci	if (0 != (ret = via_dmablit_grab_slot(blitq, engine)))
7388c2ecf20Sopenharmony_ci		return ret;
7398c2ecf20Sopenharmony_ci	if (NULL == (vsg = kmalloc(sizeof(*vsg), GFP_KERNEL))) {
7408c2ecf20Sopenharmony_ci		via_dmablit_release_slot(blitq);
7418c2ecf20Sopenharmony_ci		return -ENOMEM;
7428c2ecf20Sopenharmony_ci	}
7438c2ecf20Sopenharmony_ci	if (0 != (ret = via_build_sg_info(dev, vsg, xfer))) {
7448c2ecf20Sopenharmony_ci		via_dmablit_release_slot(blitq);
7458c2ecf20Sopenharmony_ci		kfree(vsg);
7468c2ecf20Sopenharmony_ci		return ret;
7478c2ecf20Sopenharmony_ci	}
7488c2ecf20Sopenharmony_ci	spin_lock_irqsave(&blitq->blit_lock, irqsave);
7498c2ecf20Sopenharmony_ci
7508c2ecf20Sopenharmony_ci	blitq->blits[blitq->head++] = vsg;
7518c2ecf20Sopenharmony_ci	if (blitq->head >= VIA_NUM_BLIT_SLOTS)
7528c2ecf20Sopenharmony_ci		blitq->head = 0;
7538c2ecf20Sopenharmony_ci	blitq->num_outstanding++;
7548c2ecf20Sopenharmony_ci	xfer->sync.sync_handle = ++blitq->cur_blit_handle;
7558c2ecf20Sopenharmony_ci
7568c2ecf20Sopenharmony_ci	spin_unlock_irqrestore(&blitq->blit_lock, irqsave);
7578c2ecf20Sopenharmony_ci	xfer->sync.engine = engine;
7588c2ecf20Sopenharmony_ci
7598c2ecf20Sopenharmony_ci	via_dmablit_handler(dev, engine, 0);
7608c2ecf20Sopenharmony_ci
7618c2ecf20Sopenharmony_ci	return 0;
7628c2ecf20Sopenharmony_ci}
7638c2ecf20Sopenharmony_ci
7648c2ecf20Sopenharmony_ci/*
7658c2ecf20Sopenharmony_ci * Sync on a previously submitted blit. Note that the X server use signals extensively, and
7668c2ecf20Sopenharmony_ci * that there is a very big probability that this IOCTL will be interrupted by a signal. In that
7678c2ecf20Sopenharmony_ci * case it returns with -EAGAIN for the signal to be delivered.
7688c2ecf20Sopenharmony_ci * The caller should then reissue the IOCTL. This is similar to what is being done for drmGetLock().
7698c2ecf20Sopenharmony_ci */
7708c2ecf20Sopenharmony_ci
7718c2ecf20Sopenharmony_ciint
7728c2ecf20Sopenharmony_civia_dma_blit_sync(struct drm_device *dev, void *data, struct drm_file *file_priv)
7738c2ecf20Sopenharmony_ci{
7748c2ecf20Sopenharmony_ci	drm_via_blitsync_t *sync = data;
7758c2ecf20Sopenharmony_ci	int err;
7768c2ecf20Sopenharmony_ci
7778c2ecf20Sopenharmony_ci	if (sync->engine >= VIA_NUM_BLIT_ENGINES)
7788c2ecf20Sopenharmony_ci		return -EINVAL;
7798c2ecf20Sopenharmony_ci
7808c2ecf20Sopenharmony_ci	err = via_dmablit_sync(dev, sync->sync_handle, sync->engine);
7818c2ecf20Sopenharmony_ci
7828c2ecf20Sopenharmony_ci	if (-EINTR == err)
7838c2ecf20Sopenharmony_ci		err = -EAGAIN;
7848c2ecf20Sopenharmony_ci
7858c2ecf20Sopenharmony_ci	return err;
7868c2ecf20Sopenharmony_ci}
7878c2ecf20Sopenharmony_ci
7888c2ecf20Sopenharmony_ci
7898c2ecf20Sopenharmony_ci/*
7908c2ecf20Sopenharmony_ci * Queue a blit and hand back a handle to be used for sync. This IOCTL may be interrupted by a signal
7918c2ecf20Sopenharmony_ci * while waiting for a free slot in the blit queue. In that case it returns with -EAGAIN and should
7928c2ecf20Sopenharmony_ci * be reissued. See the above IOCTL code.
7938c2ecf20Sopenharmony_ci */
7948c2ecf20Sopenharmony_ci
7958c2ecf20Sopenharmony_ciint
7968c2ecf20Sopenharmony_civia_dma_blit(struct drm_device *dev, void *data, struct drm_file *file_priv)
7978c2ecf20Sopenharmony_ci{
7988c2ecf20Sopenharmony_ci	drm_via_dmablit_t *xfer = data;
7998c2ecf20Sopenharmony_ci	int err;
8008c2ecf20Sopenharmony_ci
8018c2ecf20Sopenharmony_ci	err = via_dmablit(dev, xfer);
8028c2ecf20Sopenharmony_ci
8038c2ecf20Sopenharmony_ci	return err;
8048c2ecf20Sopenharmony_ci}
805