Lines Matching +full:i +full:- +full:tlb +full:- +full:size
1 // SPDX-License-Identifier: GPL-2.0-only
6 * I/O TLBs (aka DMA address translation hardware).
9 * Copyright (C) 2000, 2003 Hewlett-Packard Co
10 * David Mosberger-Tang <davidm@hpl.hp.com>
12 * 03/05/07 davidm Switch from PCI-DMA to generic device DMA API.
14 * unnecessary i-cache flushing.
21 #define pr_fmt(fmt) "software IO TLB: " fmt
27 #include <linux/dma-direct.h>
28 #include <linux/dma-map-ops.h>
33 #include <linux/iommu-helper.h>
54 #define SLABS_PER_PAGE (1 << (PAGE_SHIFT - IO_TLB_SHIFT))
57 * Minimum IO TLB size to bother booting with. Systems with mainly
82 * struct io_tlb_area - IO TLB memory area descriptor
86 * @used: The number of used IO TLB block.
132 pr_info("SWIOTLB bounce buffer size roundup to %luMB", in swiotlb_adjust_nareas()
140 /* avoid tail segment of size < IO_TLB_SEGSIZE */ in setup_io_tlb_npages()
172 void __init swiotlb_adjust_size(unsigned long size) in swiotlb_adjust_size() argument
177 * adjust/expand SWIOTLB size for their use. in swiotlb_adjust_size()
182 size = ALIGN(size, IO_TLB_SIZE); in swiotlb_adjust_size()
183 default_nslabs = ALIGN(size >> IO_TLB_SHIFT, IO_TLB_SEGSIZE); in swiotlb_adjust_size()
185 size = default_nslabs << IO_TLB_SHIFT; in swiotlb_adjust_size()
186 pr_info("SWIOTLB bounce buffer size adjusted to %luMB", size >> 20); in swiotlb_adjust_size()
193 if (!mem->nslabs) { in swiotlb_print_info()
198 pr_info("mapped [mem %pa-%pa] (%luMB)\n", &mem->start, &mem->end, in swiotlb_print_info()
199 (mem->nslabs << IO_TLB_SHIFT) >> 20); in swiotlb_print_info()
204 return val & (IO_TLB_SEGSIZE - 1); in io_tlb_offset()
214 * when swiotlb_unencrypted_base is set. (e.g. for Hyper-V AMD SEV-SNP
223 phys_addr_t paddr = mem->start + swiotlb_unencrypted_base; in swiotlb_mem_remap()
227 pr_err("Failed to map the unencrypted memory %pa size %lx.\n", in swiotlb_mem_remap()
252 if (!mem->nslabs || mem->late_alloc) in swiotlb_update_mem_attributes()
254 vaddr = phys_to_virt(mem->start); in swiotlb_update_mem_attributes()
255 bytes = PAGE_ALIGN(mem->nslabs << IO_TLB_SHIFT); in swiotlb_update_mem_attributes()
258 mem->vaddr = swiotlb_mem_remap(mem, bytes); in swiotlb_update_mem_attributes()
259 if (!mem->vaddr) in swiotlb_update_mem_attributes()
260 mem->vaddr = vaddr; in swiotlb_update_mem_attributes()
268 unsigned long bytes = nslabs << IO_TLB_SHIFT, i; in swiotlb_init_io_tlb_mem() local
270 mem->nslabs = nslabs; in swiotlb_init_io_tlb_mem()
271 mem->start = start; in swiotlb_init_io_tlb_mem()
272 mem->end = mem->start + bytes; in swiotlb_init_io_tlb_mem()
273 mem->late_alloc = late_alloc; in swiotlb_init_io_tlb_mem()
274 mem->nareas = nareas; in swiotlb_init_io_tlb_mem()
275 mem->area_nslabs = nslabs / mem->nareas; in swiotlb_init_io_tlb_mem()
277 mem->force_bounce = swiotlb_force_bounce || (flags & SWIOTLB_FORCE); in swiotlb_init_io_tlb_mem()
279 for (i = 0; i < mem->nareas; i++) { in swiotlb_init_io_tlb_mem()
280 spin_lock_init(&mem->areas[i].lock); in swiotlb_init_io_tlb_mem()
281 mem->areas[i].index = 0; in swiotlb_init_io_tlb_mem()
282 mem->areas[i].used = 0; in swiotlb_init_io_tlb_mem()
285 for (i = 0; i < mem->nslabs; i++) { in swiotlb_init_io_tlb_mem()
286 mem->slots[i].list = IO_TLB_SEGSIZE - io_tlb_offset(i); in swiotlb_init_io_tlb_mem()
287 mem->slots[i].orig_addr = INVALID_PHYS_ADDR; in swiotlb_init_io_tlb_mem()
288 mem->slots[i].alloc_size = 0; in swiotlb_init_io_tlb_mem()
299 mem->vaddr = vaddr; in swiotlb_init_io_tlb_mem()
305 * structures for the software IO TLB used to implement the DMA API.
308 int (*remap)(void *tlb, unsigned long nslabs)) in swiotlb_init_remap() argument
314 void *tlb; in swiotlb_init_remap() local
337 tlb = memblock_alloc(bytes, PAGE_SIZE); in swiotlb_init_remap()
339 tlb = memblock_alloc_low(bytes, PAGE_SIZE); in swiotlb_init_remap()
340 if (!tlb) { in swiotlb_init_remap()
341 pr_warn("%s: failed to allocate tlb structure\n", __func__); in swiotlb_init_remap()
345 if (remap && remap(tlb, nslabs) < 0) { in swiotlb_init_remap()
346 memblock_free(tlb, PAGE_ALIGN(bytes)); in swiotlb_init_remap()
356 alloc_size = PAGE_ALIGN(array_size(sizeof(*mem->slots), nslabs)); in swiotlb_init_remap()
357 mem->slots = memblock_alloc(alloc_size, PAGE_SIZE); in swiotlb_init_remap()
358 if (!mem->slots) { in swiotlb_init_remap()
364 mem->areas = memblock_alloc(array_size(sizeof(struct io_tlb_area), in swiotlb_init_remap()
366 if (!mem->areas) { in swiotlb_init_remap()
367 pr_warn("%s: Failed to allocate mem->areas.\n", __func__); in swiotlb_init_remap()
371 swiotlb_init_io_tlb_mem(mem, __pa(tlb), nslabs, flags, false, in swiotlb_init_remap()
388 int swiotlb_init_late(size_t size, gfp_t gfp_mask, in swiotlb_init_late() argument
389 int (*remap)(void *tlb, unsigned long nslabs)) in swiotlb_init_late() argument
392 unsigned long nslabs = ALIGN(size >> IO_TLB_SHIFT, IO_TLB_SEGSIZE); in swiotlb_init_late()
410 order--; in swiotlb_init_late()
416 return -ENOMEM; in swiotlb_init_late()
438 area_order = get_order(array_size(sizeof(*mem->areas), in swiotlb_init_late()
440 mem->areas = (struct io_tlb_area *) in swiotlb_init_late()
442 if (!mem->areas) in swiotlb_init_late()
445 mem->slots = (void *)__get_free_pages(GFP_KERNEL | __GFP_ZERO, in swiotlb_init_late()
446 get_order(array_size(sizeof(*mem->slots), nslabs))); in swiotlb_init_late()
447 if (!mem->slots) in swiotlb_init_late()
459 free_pages((unsigned long)mem->areas, area_order); in swiotlb_init_late()
462 return -ENOMEM; in swiotlb_init_late()
475 if (!mem->nslabs) in swiotlb_exit()
479 tbl_vaddr = (unsigned long)phys_to_virt(mem->start); in swiotlb_exit()
480 tbl_size = PAGE_ALIGN(mem->end - mem->start); in swiotlb_exit()
481 slots_size = PAGE_ALIGN(array_size(sizeof(*mem->slots), mem->nslabs)); in swiotlb_exit()
484 if (mem->late_alloc) { in swiotlb_exit()
485 area_order = get_order(array_size(sizeof(*mem->areas), in swiotlb_exit()
486 mem->nareas)); in swiotlb_exit()
487 free_pages((unsigned long)mem->areas, area_order); in swiotlb_exit()
489 free_pages((unsigned long)mem->slots, get_order(slots_size)); in swiotlb_exit()
491 memblock_free_late(__pa(mem->areas), in swiotlb_exit()
492 array_size(sizeof(*mem->areas), mem->nareas)); in swiotlb_exit()
493 memblock_free_late(mem->start, tbl_size); in swiotlb_exit()
494 memblock_free_late(__pa(mem->slots), slots_size); in swiotlb_exit()
505 return addr & dma_get_min_align_mask(dev) & (IO_TLB_SIZE - 1); in swiotlb_align_offset()
511 static void swiotlb_bounce(struct device *dev, phys_addr_t tlb_addr, size_t size, in swiotlb_bounce() argument
514 struct io_tlb_mem *mem = dev->dma_io_tlb_mem; in swiotlb_bounce()
515 int index = (tlb_addr - mem->start) >> IO_TLB_SHIFT; in swiotlb_bounce()
516 phys_addr_t orig_addr = mem->slots[index].orig_addr; in swiotlb_bounce()
517 size_t alloc_size = mem->slots[index].alloc_size; in swiotlb_bounce()
519 unsigned char *vaddr = mem->vaddr + tlb_addr - mem->start; in swiotlb_bounce()
525 tlb_offset = tlb_addr & (IO_TLB_SIZE - 1); in swiotlb_bounce()
534 tlb_offset -= orig_addr_offset; in swiotlb_bounce()
537 "Buffer overflow detected. Allocation size: %zu. Mapping size: %zu+%u.\n", in swiotlb_bounce()
538 alloc_size, size, tlb_offset); in swiotlb_bounce()
543 alloc_size -= tlb_offset; in swiotlb_bounce()
545 if (size > alloc_size) { in swiotlb_bounce()
547 "Buffer overflow detected. Allocation size: %zu. Mapping size: %zu.\n", in swiotlb_bounce()
548 alloc_size, size); in swiotlb_bounce()
549 size = alloc_size; in swiotlb_bounce()
558 while (size) { in swiotlb_bounce()
559 sz = min_t(size_t, PAGE_SIZE - offset, size); in swiotlb_bounce()
569 size -= sz; in swiotlb_bounce()
575 memcpy(vaddr, phys_to_virt(orig_addr), size); in swiotlb_bounce()
577 memcpy(phys_to_virt(orig_addr), vaddr, size); in swiotlb_bounce()
592 return 1UL << (BITS_PER_LONG - IO_TLB_SHIFT); in get_max_slots()
598 if (index >= mem->area_nslabs) in wrap_area_index()
604 * Find a suitable number of IO TLB entries size that will fit this request and
605 * allocate a buffer from that IO TLB pool.
611 struct io_tlb_mem *mem = dev->dma_io_tlb_mem; in swiotlb_do_find_slots()
612 struct io_tlb_area *area = mem->areas + area_index; in swiotlb_do_find_slots()
615 phys_to_dma_unencrypted(dev, mem->start) & boundary_mask; in swiotlb_do_find_slots()
618 dma_get_min_align_mask(dev) & ~(IO_TLB_SIZE - 1); in swiotlb_do_find_slots()
620 unsigned int index, wrap, count = 0, i; in swiotlb_do_find_slots() local
627 BUG_ON(area_index >= mem->nareas); in swiotlb_do_find_slots()
636 stride = max(stride, stride << (PAGE_SHIFT - IO_TLB_SHIFT)); in swiotlb_do_find_slots()
639 spin_lock_irqsave(&area->lock, flags); in swiotlb_do_find_slots()
640 if (unlikely(nslots > mem->area_nslabs - area->used)) in swiotlb_do_find_slots()
643 slot_base = area_index * mem->area_nslabs; in swiotlb_do_find_slots()
644 index = wrap = wrap_area_index(mem, ALIGN(area->index, stride)); in swiotlb_do_find_slots()
664 if (mem->slots[slot_index].list >= nslots) in swiotlb_do_find_slots()
671 spin_unlock_irqrestore(&area->lock, flags); in swiotlb_do_find_slots()
672 return -1; in swiotlb_do_find_slots()
675 for (i = slot_index; i < slot_index + nslots; i++) { in swiotlb_do_find_slots()
676 mem->slots[i].list = 0; in swiotlb_do_find_slots()
677 mem->slots[i].alloc_size = alloc_size - (offset + in swiotlb_do_find_slots()
678 ((i - slot_index) << IO_TLB_SHIFT)); in swiotlb_do_find_slots()
680 for (i = slot_index - 1; in swiotlb_do_find_slots()
681 io_tlb_offset(i) != IO_TLB_SEGSIZE - 1 && in swiotlb_do_find_slots()
682 mem->slots[i].list; i--) in swiotlb_do_find_slots()
683 mem->slots[i].list = ++count; in swiotlb_do_find_slots()
688 if (index + nslots < mem->area_nslabs) in swiotlb_do_find_slots()
689 area->index = index + nslots; in swiotlb_do_find_slots()
691 area->index = 0; in swiotlb_do_find_slots()
692 area->used += nslots; in swiotlb_do_find_slots()
693 spin_unlock_irqrestore(&area->lock, flags); in swiotlb_do_find_slots()
700 struct io_tlb_mem *mem = dev->dma_io_tlb_mem; in swiotlb_find_slots()
701 int start = raw_smp_processor_id() & (mem->nareas - 1); in swiotlb_find_slots()
702 int i = start, index; in swiotlb_find_slots() local
705 index = swiotlb_do_find_slots(dev, i, orig_addr, alloc_size, in swiotlb_find_slots()
709 if (++i >= mem->nareas) in swiotlb_find_slots()
710 i = 0; in swiotlb_find_slots()
711 } while (i != start); in swiotlb_find_slots()
713 return -1; in swiotlb_find_slots()
718 int i; in mem_used() local
721 for (i = 0; i < mem->nareas; i++) in mem_used()
722 used += mem->areas[i].used; in mem_used()
731 struct io_tlb_mem *mem = dev->dma_io_tlb_mem; in swiotlb_tbl_map_single()
733 unsigned int i; in swiotlb_tbl_map_single() local
737 if (!mem || !mem->nslabs) { in swiotlb_tbl_map_single()
754 if (index == -1) { in swiotlb_tbl_map_single()
758 alloc_size, mem->nslabs, mem_used(mem)); in swiotlb_tbl_map_single()
767 for (i = 0; i < nr_slots(alloc_size + offset); i++) in swiotlb_tbl_map_single()
768 mem->slots[index + i].orig_addr = slot_addr(orig_addr, i); in swiotlb_tbl_map_single()
769 tlb_addr = slot_addr(mem->start, index) + offset; in swiotlb_tbl_map_single()
772 * to the tlb buffer, if we knew for sure the device will in swiotlb_tbl_map_single()
774 * unconditional bounce may prevent leaking swiotlb content (i.e. in swiotlb_tbl_map_single()
775 * kernel memory) to user-space. in swiotlb_tbl_map_single()
783 struct io_tlb_mem *mem = dev->dma_io_tlb_mem; in swiotlb_release_slots()
786 int index = (tlb_addr - offset - mem->start) >> IO_TLB_SHIFT; in swiotlb_release_slots()
787 int nslots = nr_slots(mem->slots[index].alloc_size + offset); in swiotlb_release_slots()
788 int aindex = index / mem->area_nslabs; in swiotlb_release_slots()
789 struct io_tlb_area *area = &mem->areas[aindex]; in swiotlb_release_slots()
790 int count, i; in swiotlb_release_slots() local
798 BUG_ON(aindex >= mem->nareas); in swiotlb_release_slots()
800 spin_lock_irqsave(&area->lock, flags); in swiotlb_release_slots()
802 count = mem->slots[index + nslots].list; in swiotlb_release_slots()
810 for (i = index + nslots - 1; i >= index; i--) { in swiotlb_release_slots()
811 mem->slots[i].list = ++count; in swiotlb_release_slots()
812 mem->slots[i].orig_addr = INVALID_PHYS_ADDR; in swiotlb_release_slots()
813 mem->slots[i].alloc_size = 0; in swiotlb_release_slots()
820 for (i = index - 1; in swiotlb_release_slots()
821 io_tlb_offset(i) != IO_TLB_SEGSIZE - 1 && mem->slots[i].list; in swiotlb_release_slots()
822 i--) in swiotlb_release_slots()
823 mem->slots[i].list = ++count; in swiotlb_release_slots()
824 area->used -= nslots; in swiotlb_release_slots()
825 spin_unlock_irqrestore(&area->lock, flags); in swiotlb_release_slots()
846 size_t size, enum dma_data_direction dir) in swiotlb_sync_single_for_device() argument
849 swiotlb_bounce(dev, tlb_addr, size, DMA_TO_DEVICE); in swiotlb_sync_single_for_device()
855 size_t size, enum dma_data_direction dir) in swiotlb_sync_single_for_cpu() argument
858 swiotlb_bounce(dev, tlb_addr, size, DMA_FROM_DEVICE); in swiotlb_sync_single_for_cpu()
867 dma_addr_t swiotlb_map(struct device *dev, phys_addr_t paddr, size_t size, in swiotlb_map() argument
873 trace_swiotlb_bounced(dev, phys_to_dma(dev, paddr), size); in swiotlb_map()
875 swiotlb_addr = swiotlb_tbl_map_single(dev, paddr, size, size, 0, dir, in swiotlb_map()
882 if (unlikely(!dma_capable(dev, dma_addr, size, true))) { in swiotlb_map()
883 swiotlb_tbl_unmap_single(dev, swiotlb_addr, size, dir, in swiotlb_map()
887 &dma_addr, size, *dev->dma_mask, dev->bus_dma_limit); in swiotlb_map()
892 arch_sync_dma_for_device(swiotlb_addr, size, dir); in swiotlb_map()
903 * min align mask. This affects max mapping size. in swiotlb_max_mapping_size()
909 return ((size_t)IO_TLB_SIZE) * IO_TLB_SEGSIZE - min_align; in swiotlb_max_mapping_size()
914 struct io_tlb_mem *mem = dev->dma_io_tlb_mem; in is_swiotlb_active()
916 return mem && mem->nslabs; in is_swiotlb_active()
930 mem->debugfs = debugfs_create_dir(dirname, io_tlb_default_mem.debugfs); in swiotlb_create_debugfs_files()
931 if (!mem->nslabs) in swiotlb_create_debugfs_files()
934 debugfs_create_ulong("io_tlb_nslabs", 0400, mem->debugfs, &mem->nslabs); in swiotlb_create_debugfs_files()
935 debugfs_create_file("io_tlb_used", 0400, mem->debugfs, NULL, in swiotlb_create_debugfs_files()
951 struct page *swiotlb_alloc(struct device *dev, size_t size) in swiotlb_alloc() argument
953 struct io_tlb_mem *mem = dev->dma_io_tlb_mem; in swiotlb_alloc()
960 index = swiotlb_find_slots(dev, 0, size, 0); in swiotlb_alloc()
961 if (index == -1) in swiotlb_alloc()
964 tlb_addr = slot_addr(mem->start, index); in swiotlb_alloc()
969 bool swiotlb_free(struct device *dev, struct page *page, size_t size) in swiotlb_free() argument
984 struct io_tlb_mem *mem = rmem->priv; in rmem_swiotlb_device_init()
985 unsigned long nslabs = rmem->size >> IO_TLB_SHIFT; in rmem_swiotlb_device_init()
987 /* Set Per-device io tlb area to one */ in rmem_swiotlb_device_init()
998 return -ENOMEM; in rmem_swiotlb_device_init()
1000 mem->slots = kcalloc(nslabs, sizeof(*mem->slots), GFP_KERNEL); in rmem_swiotlb_device_init()
1001 if (!mem->slots) { in rmem_swiotlb_device_init()
1003 return -ENOMEM; in rmem_swiotlb_device_init()
1006 mem->areas = kcalloc(nareas, sizeof(*mem->areas), in rmem_swiotlb_device_init()
1008 if (!mem->areas) { in rmem_swiotlb_device_init()
1009 kfree(mem->slots); in rmem_swiotlb_device_init()
1011 return -ENOMEM; in rmem_swiotlb_device_init()
1014 set_memory_decrypted((unsigned long)phys_to_virt(rmem->base), in rmem_swiotlb_device_init()
1015 rmem->size >> PAGE_SHIFT); in rmem_swiotlb_device_init()
1016 swiotlb_init_io_tlb_mem(mem, rmem->base, nslabs, SWIOTLB_FORCE, in rmem_swiotlb_device_init()
1018 mem->for_alloc = true; in rmem_swiotlb_device_init()
1020 rmem->priv = mem; in rmem_swiotlb_device_init()
1022 swiotlb_create_debugfs_files(mem, rmem->name); in rmem_swiotlb_device_init()
1025 dev->dma_io_tlb_mem = mem; in rmem_swiotlb_device_init()
1033 dev->dma_io_tlb_mem = &io_tlb_default_mem; in rmem_swiotlb_device_release()
1043 unsigned long node = rmem->fdt_node; in rmem_swiotlb_setup()
1046 of_get_flat_dt_prop(node, "linux,cma-default", NULL) || in rmem_swiotlb_setup()
1047 of_get_flat_dt_prop(node, "linux,dma-default", NULL) || in rmem_swiotlb_setup()
1048 of_get_flat_dt_prop(node, "no-map", NULL)) in rmem_swiotlb_setup()
1049 return -EINVAL; in rmem_swiotlb_setup()
1051 if (PageHighMem(pfn_to_page(PHYS_PFN(rmem->base)))) { in rmem_swiotlb_setup()
1053 return -EINVAL; in rmem_swiotlb_setup()
1056 rmem->ops = &rmem_swiotlb_ops; in rmem_swiotlb_setup()
1057 pr_info("Reserved memory: created restricted DMA pool at %pa, size %ld MiB\n", in rmem_swiotlb_setup()
1058 &rmem->base, (unsigned long)rmem->size / SZ_1M); in rmem_swiotlb_setup()
1062 RESERVEDMEM_OF_DECLARE(dma, "restricted-dma-pool", rmem_swiotlb_setup);