| /* |
| * Copyright (C) 2006 Benjamin Herrenschmidt, IBM Corporation |
| * |
| * Provide default implementations of the DMA mapping callbacks for |
| * directly mapped busses. |
| */ |
| |
| #include <linux/device.h> |
| #include <linux/dma-mapping.h> |
| #include <linux/dma-debug.h> |
| #include <linux/gfp.h> |
| #include <linux/memblock.h> |
| #include <linux/export.h> |
| #include <linux/pci.h> |
| #include <asm/vio.h> |
| #include <asm/bug.h> |
| #include <asm/machdep.h> |
| #include <asm/swiotlb.h> |
| #include <asm/iommu.h> |
| |
| /* |
| * Generic direct DMA implementation |
| * |
| * This implementation supports a per-device offset that can be applied if |
| * the address at which memory is visible to devices is not 0. Platform code |
| * can set archdata.dma_data to an unsigned long holding the offset. By |
| * default the offset is PCI_DRAM_OFFSET. |
| */ |
| |
| static u64 __maybe_unused get_pfn_limit(struct device *dev) |
| { |
| u64 pfn = (dev->coherent_dma_mask >> PAGE_SHIFT) + 1; |
| struct dev_archdata __maybe_unused *sd = &dev->archdata; |
| |
| #ifdef CONFIG_SWIOTLB |
| if (sd->max_direct_dma_addr && dev->dma_ops == &swiotlb_dma_ops) |
| pfn = min_t(u64, pfn, sd->max_direct_dma_addr >> PAGE_SHIFT); |
| #endif |
| |
| return pfn; |
| } |
| |
| static int dma_direct_dma_supported(struct device *dev, u64 mask) |
| { |
| #ifdef CONFIG_PPC64 |
| u64 limit = get_dma_offset(dev) + (memblock_end_of_DRAM() - 1); |
| |
| /* Limit fits in the mask, we are good */ |
| if (mask >= limit) |
| return 1; |
| |
| #ifdef CONFIG_FSL_SOC |
| /* Freescale gets another chance via ZONE_DMA/ZONE_DMA32, however |
| * that will have to be refined if/when they support iommus |
| */ |
| return 1; |
| #endif |
| /* Sorry ... */ |
| return 0; |
| #else |
| return 1; |
| #endif |
| } |
| |
| void *__dma_direct_alloc_coherent(struct device *dev, size_t size, |
| dma_addr_t *dma_handle, gfp_t flag, |
| unsigned long attrs) |
| { |
| void *ret; |
| #ifdef CONFIG_NOT_COHERENT_CACHE |
| ret = __dma_alloc_coherent(dev, size, dma_handle, flag); |
| if (ret == NULL) |
| return NULL; |
| *dma_handle += get_dma_offset(dev); |
| return ret; |
| #else |
| struct page *page; |
| int node = dev_to_node(dev); |
| #ifdef CONFIG_FSL_SOC |
| u64 pfn = get_pfn_limit(dev); |
| int zone; |
| |
| /* |
| * This code should be OK on other platforms, but we have drivers that |
| * don't set coherent_dma_mask. As a workaround we just ifdef it. This |
| * whole routine needs some serious cleanup. |
| */ |
| |
| zone = dma_pfn_limit_to_zone(pfn); |
| if (zone < 0) { |
| dev_err(dev, "%s: No suitable zone for pfn %#llx\n", |
| __func__, pfn); |
| return NULL; |
| } |
| |
| switch (zone) { |
| case ZONE_DMA: |
| flag |= GFP_DMA; |
| break; |
| #ifdef CONFIG_ZONE_DMA32 |
| case ZONE_DMA32: |
| flag |= GFP_DMA32; |
| break; |
| #endif |
| }; |
| #endif /* CONFIG_FSL_SOC */ |
| |
| /* ignore region specifiers */ |
| flag &= ~(__GFP_HIGHMEM); |
| |
| page = alloc_pages_node(node, flag, get_order(size)); |
| if (page == NULL) |
| return NULL; |
| ret = page_address(page); |
| memset(ret, 0, size); |
| *dma_handle = __pa(ret) + get_dma_offset(dev); |
| |
| return ret; |
| #endif |
| } |
| |
| void __dma_direct_free_coherent(struct device *dev, size_t size, |
| void *vaddr, dma_addr_t dma_handle, |
| unsigned long attrs) |
| { |
| #ifdef CONFIG_NOT_COHERENT_CACHE |
| __dma_free_coherent(size, vaddr); |
| #else |
| free_pages((unsigned long)vaddr, get_order(size)); |
| #endif |
| } |
| |
| static void *dma_direct_alloc_coherent(struct device *dev, size_t size, |
| dma_addr_t *dma_handle, gfp_t flag, |
| unsigned long attrs) |
| { |
| struct iommu_table *iommu; |
| |
| /* The coherent mask may be smaller than the real mask, check if |
| * we can really use the direct ops |
| */ |
| if (dma_direct_dma_supported(dev, dev->coherent_dma_mask)) |
| return __dma_direct_alloc_coherent(dev, size, dma_handle, |
| flag, attrs); |
| |
| /* Ok we can't ... do we have an iommu ? If not, fail */ |
| iommu = get_iommu_table_base(dev); |
| if (!iommu) |
| return NULL; |
| |
| /* Try to use the iommu */ |
| return iommu_alloc_coherent(dev, iommu, size, dma_handle, |
| dev->coherent_dma_mask, flag, |
| dev_to_node(dev)); |
| } |
| |
| static void dma_direct_free_coherent(struct device *dev, size_t size, |
| void *vaddr, dma_addr_t dma_handle, |
| unsigned long attrs) |
| { |
| struct iommu_table *iommu; |
| |
| /* See comments in dma_direct_alloc_coherent() */ |
| if (dma_direct_dma_supported(dev, dev->coherent_dma_mask)) |
| return __dma_direct_free_coherent(dev, size, vaddr, dma_handle, |
| attrs); |
| /* Maybe we used an iommu ... */ |
| iommu = get_iommu_table_base(dev); |
| |
| /* If we hit that we should have never allocated in the first |
| * place so how come we are freeing ? |
| */ |
| if (WARN_ON(!iommu)) |
| return; |
| iommu_free_coherent(iommu, size, vaddr, dma_handle); |
| } |
| |
| int dma_direct_mmap_coherent(struct device *dev, struct vm_area_struct *vma, |
| void *cpu_addr, dma_addr_t handle, size_t size, |
| unsigned long attrs) |
| { |
| unsigned long pfn; |
| |
| #ifdef CONFIG_NOT_COHERENT_CACHE |
| vma->vm_page_prot = pgprot_noncached(vma->vm_page_prot); |
| pfn = __dma_get_coherent_pfn((unsigned long)cpu_addr); |
| #else |
| pfn = page_to_pfn(virt_to_page(cpu_addr)); |
| #endif |
| return remap_pfn_range(vma, vma->vm_start, |
| pfn + vma->vm_pgoff, |
| vma->vm_end - vma->vm_start, |
| vma->vm_page_prot); |
| } |
| |
| static int dma_direct_map_sg(struct device *dev, struct scatterlist *sgl, |
| int nents, enum dma_data_direction direction, |
| unsigned long attrs) |
| { |
| struct scatterlist *sg; |
| int i; |
| |
| for_each_sg(sgl, sg, nents, i) { |
| sg->dma_address = sg_phys(sg) + get_dma_offset(dev); |
| sg->dma_length = sg->length; |
| |
| if (attrs & DMA_ATTR_SKIP_CPU_SYNC) |
| continue; |
| |
| __dma_sync_page(sg_page(sg), sg->offset, sg->length, direction); |
| } |
| |
| return nents; |
| } |
| |
| static void dma_direct_unmap_sg(struct device *dev, struct scatterlist *sg, |
| int nents, enum dma_data_direction direction, |
| unsigned long attrs) |
| { |
| } |
| |
| static u64 dma_direct_get_required_mask(struct device *dev) |
| { |
| u64 end, mask; |
| |
| end = memblock_end_of_DRAM() + get_dma_offset(dev); |
| |
| mask = 1ULL << (fls64(end) - 1); |
| mask += mask - 1; |
| |
| return mask; |
| } |
| |
| static inline dma_addr_t dma_direct_map_page(struct device *dev, |
| struct page *page, |
| unsigned long offset, |
| size_t size, |
| enum dma_data_direction dir, |
| unsigned long attrs) |
| { |
| BUG_ON(dir == DMA_NONE); |
| |
| if (!(attrs & DMA_ATTR_SKIP_CPU_SYNC)) |
| __dma_sync_page(page, offset, size, dir); |
| |
| return page_to_phys(page) + offset + get_dma_offset(dev); |
| } |
| |
| static inline void dma_direct_unmap_page(struct device *dev, |
| dma_addr_t dma_address, |
| size_t size, |
| enum dma_data_direction direction, |
| unsigned long attrs) |
| { |
| } |
| |
| #ifdef CONFIG_NOT_COHERENT_CACHE |
| static inline void dma_direct_sync_sg(struct device *dev, |
| struct scatterlist *sgl, int nents, |
| enum dma_data_direction direction) |
| { |
| struct scatterlist *sg; |
| int i; |
| |
| for_each_sg(sgl, sg, nents, i) |
| __dma_sync_page(sg_page(sg), sg->offset, sg->length, direction); |
| } |
| |
| static inline void dma_direct_sync_single(struct device *dev, |
| dma_addr_t dma_handle, size_t size, |
| enum dma_data_direction direction) |
| { |
| __dma_sync(bus_to_virt(dma_handle), size, direction); |
| } |
| #endif |
| |
| const struct dma_map_ops dma_direct_ops = { |
| .alloc = dma_direct_alloc_coherent, |
| .free = dma_direct_free_coherent, |
| .mmap = dma_direct_mmap_coherent, |
| .map_sg = dma_direct_map_sg, |
| .unmap_sg = dma_direct_unmap_sg, |
| .dma_supported = dma_direct_dma_supported, |
| .map_page = dma_direct_map_page, |
| .unmap_page = dma_direct_unmap_page, |
| .get_required_mask = dma_direct_get_required_mask, |
| #ifdef CONFIG_NOT_COHERENT_CACHE |
| .sync_single_for_cpu = dma_direct_sync_single, |
| .sync_single_for_device = dma_direct_sync_single, |
| .sync_sg_for_cpu = dma_direct_sync_sg, |
| .sync_sg_for_device = dma_direct_sync_sg, |
| #endif |
| }; |
| EXPORT_SYMBOL(dma_direct_ops); |
| |
| int dma_set_coherent_mask(struct device *dev, u64 mask) |
| { |
| if (!dma_supported(dev, mask)) { |
| /* |
| * We need to special case the direct DMA ops which can |
| * support a fallback for coherent allocations. There |
| * is no dma_op->set_coherent_mask() so we have to do |
| * things the hard way: |
| */ |
| if (get_dma_ops(dev) != &dma_direct_ops || |
| get_iommu_table_base(dev) == NULL || |
| !dma_iommu_dma_supported(dev, mask)) |
| return -EIO; |
| } |
| dev->coherent_dma_mask = mask; |
| return 0; |
| } |
| EXPORT_SYMBOL(dma_set_coherent_mask); |
| |
| #define PREALLOC_DMA_DEBUG_ENTRIES (1 << 16) |
| |
| int __dma_set_mask(struct device *dev, u64 dma_mask) |
| { |
| const struct dma_map_ops *dma_ops = get_dma_ops(dev); |
| |
| if ((dma_ops != NULL) && (dma_ops->set_dma_mask != NULL)) |
| return dma_ops->set_dma_mask(dev, dma_mask); |
| if (!dev->dma_mask || !dma_supported(dev, dma_mask)) |
| return -EIO; |
| *dev->dma_mask = dma_mask; |
| return 0; |
| } |
| |
| int dma_set_mask(struct device *dev, u64 dma_mask) |
| { |
| if (ppc_md.dma_set_mask) |
| return ppc_md.dma_set_mask(dev, dma_mask); |
| |
| if (dev_is_pci(dev)) { |
| struct pci_dev *pdev = to_pci_dev(dev); |
| struct pci_controller *phb = pci_bus_to_host(pdev->bus); |
| if (phb->controller_ops.dma_set_mask) |
| return phb->controller_ops.dma_set_mask(pdev, dma_mask); |
| } |
| |
| return __dma_set_mask(dev, dma_mask); |
| } |
| EXPORT_SYMBOL(dma_set_mask); |
| |
| u64 __dma_get_required_mask(struct device *dev) |
| { |
| const struct dma_map_ops *dma_ops = get_dma_ops(dev); |
| |
| if (unlikely(dma_ops == NULL)) |
| return 0; |
| |
| if (dma_ops->get_required_mask) |
| return dma_ops->get_required_mask(dev); |
| |
| return DMA_BIT_MASK(8 * sizeof(dma_addr_t)); |
| } |
| |
| u64 dma_get_required_mask(struct device *dev) |
| { |
| if (ppc_md.dma_get_required_mask) |
| return ppc_md.dma_get_required_mask(dev); |
| |
| if (dev_is_pci(dev)) { |
| struct pci_dev *pdev = to_pci_dev(dev); |
| struct pci_controller *phb = pci_bus_to_host(pdev->bus); |
| if (phb->controller_ops.dma_get_required_mask) |
| return phb->controller_ops.dma_get_required_mask(pdev); |
| } |
| |
| return __dma_get_required_mask(dev); |
| } |
| EXPORT_SYMBOL_GPL(dma_get_required_mask); |
| |
| static int __init dma_init(void) |
| { |
| dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES); |
| #ifdef CONFIG_PCI |
| dma_debug_add_bus(&pci_bus_type); |
| #endif |
| #ifdef CONFIG_IBMVIO |
| dma_debug_add_bus(&vio_bus_type); |
| #endif |
| |
| return 0; |
| } |
| fs_initcall(dma_init); |
| |