Commit 6c1b980a authored by Linus Torvalds's avatar Linus Torvalds

Merge tag 'dma-mapping-6.6-2023-08-29' of git://git.infradead.org/users/hch/dma-mapping

Pull dma-maping updates from Christoph Hellwig:

 - allow dynamic sizing of the swiotlb buffer, to cater for secure
   virtualization workloads that require all I/O to be bounce buffered
   (Petr Tesarik)

 - move a declaration to a header (Arnd Bergmann)

 - check for memory region overlap in dma-contiguous (Binglei Wang)

 - remove the somewhat dangerous runtime swiotlb-xen enablement and
   unexport is_swiotlb_active (Christoph Hellwig, Juergen Gross)

 - per-node CMA improvements (Yajun Deng)

* tag 'dma-mapping-6.6-2023-08-29' of git://git.infradead.org/users/hch/dma-mapping:
  swiotlb: optimize get_max_slots()
  swiotlb: move slot allocation explanation comment where it belongs
  swiotlb: search the software IO TLB only if the device makes use of it
  swiotlb: allocate a new memory pool when existing pools are full
  swiotlb: determine potential physical address limit
  swiotlb: if swiotlb is full, fall back to a transient memory pool
  swiotlb: add a flag whether SWIOTLB is allowed to grow
  swiotlb: separate memory pool data from other allocator data
  swiotlb: add documentation and rename swiotlb_do_find_slots()
  swiotlb: make io_tlb_default_mem local to swiotlb.c
  swiotlb: bail out of swiotlb_init_late() if swiotlb is already allocated
  dma-contiguous: check for memory region overlap
  dma-contiguous: support numa CMA for specified node
  dma-contiguous: support per-numa CMA for all architectures
  dma-mapping: move arch_dma_set_mask() declaration to header
  swiotlb: unexport is_swiotlb_active
  x86: always initialize xen-swiotlb when xen-pcifront is enabling
  xen/pci: add flag for PCI passthrough being possible
parents 3d3dfeb3 d069ed28
...@@ -696,7 +696,7 @@ ...@@ -696,7 +696,7 @@
kernel/dma/contiguous.c kernel/dma/contiguous.c
cma_pernuma=nn[MG] cma_pernuma=nn[MG]
[ARM64,KNL,CMA] [KNL,CMA]
Sets the size of kernel per-numa memory area for Sets the size of kernel per-numa memory area for
contiguous memory allocations. A value of 0 disables contiguous memory allocations. A value of 0 disables
per-numa CMA altogether. And If this option is not per-numa CMA altogether. And If this option is not
...@@ -706,6 +706,17 @@ ...@@ -706,6 +706,17 @@
which is located in node nid, if the allocation fails, which is located in node nid, if the allocation fails,
they will fallback to the global default memory area. they will fallback to the global default memory area.
numa_cma=<node>:nn[MG][,<node>:nn[MG]]
[KNL,CMA]
Sets the size of kernel numa memory area for
contiguous memory allocations. It will reserve CMA
area for the specified node.
With numa CMA enabled, DMA users on node nid will
first try to allocate buffer from the numa area
which is located in node nid, if the allocation fails,
they will fallback to the global default memory area.
cmo_free_hint= [PPC] Format: { yes | no } cmo_free_hint= [PPC] Format: { yes | no }
Specify whether pages are marked as being inactive Specify whether pages are marked as being inactive
when they are freed. This is used in CMO environments when they are freed. This is used in CMO environments
......
...@@ -125,12 +125,10 @@ static int __init xen_mm_init(void) ...@@ -125,12 +125,10 @@ static int __init xen_mm_init(void)
return 0; return 0;
/* we can work with the default swiotlb */ /* we can work with the default swiotlb */
if (!io_tlb_default_mem.nslabs) {
rc = swiotlb_init_late(swiotlb_size_or_default(), rc = swiotlb_init_late(swiotlb_size_or_default(),
xen_swiotlb_gfp(), NULL); xen_swiotlb_gfp(), NULL);
if (rc < 0) if (rc < 0)
return rc; return rc;
}
cflush.op = 0; cflush.op = 0;
cflush.a.dev_bus_addr = 0; cflush.a.dev_bus_addr = 0;
......
...@@ -461,8 +461,6 @@ void __init bootmem_init(void) ...@@ -461,8 +461,6 @@ void __init bootmem_init(void)
arm64_hugetlb_cma_reserve(); arm64_hugetlb_cma_reserve();
#endif #endif
dma_pernuma_cma_reserve();
kvm_hyp_reserve(); kvm_hyp_reserve();
/* /*
......
...@@ -664,7 +664,7 @@ static int __init octeon_pci_setup(void) ...@@ -664,7 +664,7 @@ static int __init octeon_pci_setup(void)
/* BAR1 movable regions contiguous to cover the swiotlb */ /* BAR1 movable regions contiguous to cover the swiotlb */
octeon_bar1_pci_phys = octeon_bar1_pci_phys =
io_tlb_default_mem.start & ~((1ull << 22) - 1); default_swiotlb_base() & ~((1ull << 22) - 1);
for (index = 0; index < 32; index++) { for (index = 0; index < 32; index++) {
union cvmx_pci_bar1_indexx bar1_index; union cvmx_pci_bar1_indexx bar1_index;
......
// SPDX-License-Identifier: GPL-2.0 // SPDX-License-Identifier: GPL-2.0
#include <linux/dma-mapping.h> #include <linux/dma-mapping.h>
#include <linux/dma-map-ops.h>
#include <linux/export.h> #include <linux/export.h>
#include <asm/machdep.h> #include <asm/machdep.h>
......
...@@ -2,12 +2,6 @@ ...@@ -2,12 +2,6 @@
#ifndef _ASM_X86_SWIOTLB_XEN_H #ifndef _ASM_X86_SWIOTLB_XEN_H
#define _ASM_X86_SWIOTLB_XEN_H #define _ASM_X86_SWIOTLB_XEN_H
#ifdef CONFIG_SWIOTLB_XEN
extern int pci_xen_swiotlb_init_late(void);
#else
static inline int pci_xen_swiotlb_init_late(void) { return -ENXIO; }
#endif
int xen_swiotlb_fixup(void *buf, unsigned long nslabs); int xen_swiotlb_fixup(void *buf, unsigned long nslabs);
int xen_create_contiguous_region(phys_addr_t pstart, unsigned int order, int xen_create_contiguous_region(phys_addr_t pstart, unsigned int order,
unsigned int address_bits, unsigned int address_bits,
......
...@@ -72,9 +72,15 @@ static inline void __init pci_swiotlb_detect(void) ...@@ -72,9 +72,15 @@ static inline void __init pci_swiotlb_detect(void)
#endif /* CONFIG_SWIOTLB */ #endif /* CONFIG_SWIOTLB */
#ifdef CONFIG_SWIOTLB_XEN #ifdef CONFIG_SWIOTLB_XEN
static bool xen_swiotlb_enabled(void)
{
return xen_initial_domain() || x86_swiotlb_enable ||
(IS_ENABLED(CONFIG_XEN_PCIDEV_FRONTEND) && xen_pv_pci_possible);
}
static void __init pci_xen_swiotlb_init(void) static void __init pci_xen_swiotlb_init(void)
{ {
if (!xen_initial_domain() && !x86_swiotlb_enable) if (!xen_swiotlb_enabled())
return; return;
x86_swiotlb_enable = true; x86_swiotlb_enable = true;
x86_swiotlb_flags |= SWIOTLB_ANY; x86_swiotlb_flags |= SWIOTLB_ANY;
...@@ -83,27 +89,6 @@ static void __init pci_xen_swiotlb_init(void) ...@@ -83,27 +89,6 @@ static void __init pci_xen_swiotlb_init(void)
if (IS_ENABLED(CONFIG_PCI)) if (IS_ENABLED(CONFIG_PCI))
pci_request_acs(); pci_request_acs();
} }
int pci_xen_swiotlb_init_late(void)
{
if (dma_ops == &xen_swiotlb_dma_ops)
return 0;
/* we can work with the default swiotlb */
if (!io_tlb_default_mem.nslabs) {
int rc = swiotlb_init_late(swiotlb_size_or_default(),
GFP_KERNEL, xen_swiotlb_fixup);
if (rc < 0)
return rc;
}
/* XXX: this switches the dma ops under live devices! */
dma_ops = &xen_swiotlb_dma_ops;
if (IS_ENABLED(CONFIG_PCI))
pci_request_acs();
return 0;
}
EXPORT_SYMBOL_GPL(pci_xen_swiotlb_init_late);
#else #else
static inline void __init pci_xen_swiotlb_init(void) static inline void __init pci_xen_swiotlb_init(void)
{ {
......
...@@ -44,6 +44,9 @@ struct xen_memory_region xen_extra_mem[XEN_EXTRA_MEM_MAX_REGIONS] __initdata; ...@@ -44,6 +44,9 @@ struct xen_memory_region xen_extra_mem[XEN_EXTRA_MEM_MAX_REGIONS] __initdata;
/* Number of pages released from the initial allocation. */ /* Number of pages released from the initial allocation. */
unsigned long xen_released_pages; unsigned long xen_released_pages;
/* Memory map would allow PCI passthrough. */
bool xen_pv_pci_possible;
/* E820 map used during setting up memory. */ /* E820 map used during setting up memory. */
static struct e820_table xen_e820_table __initdata; static struct e820_table xen_e820_table __initdata;
...@@ -814,6 +817,9 @@ char * __init xen_memory_setup(void) ...@@ -814,6 +817,9 @@ char * __init xen_memory_setup(void)
chunk_size = size; chunk_size = size;
type = xen_e820_table.entries[i].type; type = xen_e820_table.entries[i].type;
if (type == E820_TYPE_RESERVED)
xen_pv_pci_possible = true;
if (type == E820_TYPE_RAM) { if (type == E820_TYPE_RAM) {
if (addr < mem_end) { if (addr < mem_end) {
chunk_size = min(size, mem_end - addr); chunk_size = min(size, mem_end - addr);
......
...@@ -3108,9 +3108,7 @@ void device_initialize(struct device *dev) ...@@ -3108,9 +3108,7 @@ void device_initialize(struct device *dev)
defined(CONFIG_ARCH_HAS_SYNC_DMA_FOR_CPU_ALL) defined(CONFIG_ARCH_HAS_SYNC_DMA_FOR_CPU_ALL)
dev->dma_coherent = dma_default_coherent; dev->dma_coherent = dma_default_coherent;
#endif #endif
#ifdef CONFIG_SWIOTLB swiotlb_dev_init(dev);
dev->dma_io_tlb_mem = &io_tlb_default_mem;
#endif
} }
EXPORT_SYMBOL_GPL(device_initialize); EXPORT_SYMBOL_GPL(device_initialize);
......
...@@ -22,7 +22,6 @@ ...@@ -22,7 +22,6 @@
#include <linux/bitops.h> #include <linux/bitops.h>
#include <linux/time.h> #include <linux/time.h>
#include <linux/ktime.h> #include <linux/ktime.h>
#include <linux/swiotlb.h>
#include <xen/platform_pci.h> #include <xen/platform_pci.h>
#include <asm/xen/swiotlb-xen.h> #include <asm/xen/swiotlb-xen.h>
...@@ -669,11 +668,6 @@ static int pcifront_connect_and_init_dma(struct pcifront_device *pdev) ...@@ -669,11 +668,6 @@ static int pcifront_connect_and_init_dma(struct pcifront_device *pdev)
spin_unlock(&pcifront_dev_lock); spin_unlock(&pcifront_dev_lock);
if (!err && !is_swiotlb_active(&pdev->xdev->dev)) {
err = pci_xen_swiotlb_init_late();
if (err)
dev_err(&pdev->xdev->dev, "Could not setup SWIOTLB!\n");
}
return err; return err;
} }
......
...@@ -381,7 +381,7 @@ xen_swiotlb_sync_sg_for_device(struct device *dev, struct scatterlist *sgl, ...@@ -381,7 +381,7 @@ xen_swiotlb_sync_sg_for_device(struct device *dev, struct scatterlist *sgl,
static int static int
xen_swiotlb_dma_supported(struct device *hwdev, u64 mask) xen_swiotlb_dma_supported(struct device *hwdev, u64 mask)
{ {
return xen_phys_to_dma(hwdev, io_tlb_default_mem.end - 1) <= mask; return xen_phys_to_dma(hwdev, default_swiotlb_limit()) <= mask;
} }
const struct dma_map_ops xen_swiotlb_dma_ops = { const struct dma_map_ops xen_swiotlb_dma_ops = {
......
...@@ -625,7 +625,10 @@ struct device_physical_location { ...@@ -625,7 +625,10 @@ struct device_physical_location {
* @dma_pools: Dma pools (if dma'ble device). * @dma_pools: Dma pools (if dma'ble device).
* @dma_mem: Internal for coherent mem override. * @dma_mem: Internal for coherent mem override.
* @cma_area: Contiguous memory area for dma allocations * @cma_area: Contiguous memory area for dma allocations
* @dma_io_tlb_mem: Pointer to the swiotlb pool used. Not for driver use. * @dma_io_tlb_mem: Software IO TLB allocator. Not for driver use.
* @dma_io_tlb_pools: List of transient swiotlb memory pools.
* @dma_io_tlb_lock: Protects changes to the list of active pools.
* @dma_uses_io_tlb: %true if device has used the software IO TLB.
* @archdata: For arch-specific additions. * @archdata: For arch-specific additions.
* @of_node: Associated device tree node. * @of_node: Associated device tree node.
* @fwnode: Associated device node supplied by platform firmware. * @fwnode: Associated device node supplied by platform firmware.
...@@ -731,6 +734,11 @@ struct device { ...@@ -731,6 +734,11 @@ struct device {
#endif #endif
#ifdef CONFIG_SWIOTLB #ifdef CONFIG_SWIOTLB
struct io_tlb_mem *dma_io_tlb_mem; struct io_tlb_mem *dma_io_tlb_mem;
#endif
#ifdef CONFIG_SWIOTLB_DYNAMIC
struct list_head dma_io_tlb_pools;
spinlock_t dma_io_tlb_lock;
bool dma_uses_io_tlb;
#endif #endif
/* arch specific additions */ /* arch specific additions */
struct dev_archdata archdata; struct dev_archdata archdata;
......
...@@ -169,12 +169,6 @@ static inline void dma_free_contiguous(struct device *dev, struct page *page, ...@@ -169,12 +169,6 @@ static inline void dma_free_contiguous(struct device *dev, struct page *page,
} }
#endif /* CONFIG_DMA_CMA*/ #endif /* CONFIG_DMA_CMA*/
#ifdef CONFIG_DMA_PERNUMA_CMA
void dma_pernuma_cma_reserve(void);
#else
static inline void dma_pernuma_cma_reserve(void) { }
#endif /* CONFIG_DMA_PERNUMA_CMA */
#ifdef CONFIG_DMA_DECLARE_COHERENT #ifdef CONFIG_DMA_DECLARE_COHERENT
int dma_declare_coherent_memory(struct device *dev, phys_addr_t phys_addr, int dma_declare_coherent_memory(struct device *dev, phys_addr_t phys_addr,
dma_addr_t device_addr, size_t size); dma_addr_t device_addr, size_t size);
...@@ -343,6 +337,12 @@ void *arch_dma_alloc(struct device *dev, size_t size, dma_addr_t *dma_handle, ...@@ -343,6 +337,12 @@ void *arch_dma_alloc(struct device *dev, size_t size, dma_addr_t *dma_handle,
void arch_dma_free(struct device *dev, size_t size, void *cpu_addr, void arch_dma_free(struct device *dev, size_t size, void *cpu_addr,
dma_addr_t dma_addr, unsigned long attrs); dma_addr_t dma_addr, unsigned long attrs);
#ifdef CONFIG_ARCH_HAS_DMA_SET_MASK
void arch_dma_set_mask(struct device *dev, u64 mask);
#else
#define arch_dma_set_mask(dev, mask) do { } while (0)
#endif
#ifdef CONFIG_MMU #ifdef CONFIG_MMU
/* /*
* Page protection so that devices that can't snoop CPU caches can use the * Page protection so that devices that can't snoop CPU caches can use the
......
...@@ -418,6 +418,8 @@ static inline void dma_sync_sgtable_for_device(struct device *dev, ...@@ -418,6 +418,8 @@ static inline void dma_sync_sgtable_for_device(struct device *dev,
#define dma_get_sgtable(d, t, v, h, s) dma_get_sgtable_attrs(d, t, v, h, s, 0) #define dma_get_sgtable(d, t, v, h, s) dma_get_sgtable_attrs(d, t, v, h, s, 0)
#define dma_mmap_coherent(d, v, c, h, s) dma_mmap_attrs(d, v, c, h, s, 0) #define dma_mmap_coherent(d, v, c, h, s) dma_mmap_attrs(d, v, c, h, s, 0)
bool dma_coherent_ok(struct device *dev, phys_addr_t phys, size_t size);
static inline void *dma_alloc_coherent(struct device *dev, size_t size, static inline void *dma_alloc_coherent(struct device *dev, size_t size,
dma_addr_t *dma_handle, gfp_t gfp) dma_addr_t *dma_handle, gfp_t gfp)
{ {
......
...@@ -8,6 +8,7 @@ ...@@ -8,6 +8,7 @@
#include <linux/types.h> #include <linux/types.h>
#include <linux/limits.h> #include <linux/limits.h>
#include <linux/spinlock.h> #include <linux/spinlock.h>
#include <linux/workqueue.h>
struct device; struct device;
struct page; struct page;
...@@ -62,8 +63,7 @@ dma_addr_t swiotlb_map(struct device *dev, phys_addr_t phys, ...@@ -62,8 +63,7 @@ dma_addr_t swiotlb_map(struct device *dev, phys_addr_t phys,
#ifdef CONFIG_SWIOTLB #ifdef CONFIG_SWIOTLB
/** /**
* struct io_tlb_mem - IO TLB Memory Pool Descriptor * struct io_tlb_pool - IO TLB memory pool descriptor
*
* @start: The start address of the swiotlb memory pool. Used to do a quick * @start: The start address of the swiotlb memory pool. Used to do a quick
* range check to see if the memory was in fact allocated by this * range check to see if the memory was in fact allocated by this
* API. * API.
...@@ -73,19 +73,48 @@ dma_addr_t swiotlb_map(struct device *dev, phys_addr_t phys, ...@@ -73,19 +73,48 @@ dma_addr_t swiotlb_map(struct device *dev, phys_addr_t phys,
* @vaddr: The vaddr of the swiotlb memory pool. The swiotlb memory pool * @vaddr: The vaddr of the swiotlb memory pool. The swiotlb memory pool
* may be remapped in the memory encrypted case and store virtual * may be remapped in the memory encrypted case and store virtual
* address for bounce buffer operation. * address for bounce buffer operation.
* @nslabs: The number of IO TLB blocks (in groups of 64) between @start and * @nslabs: The number of IO TLB slots between @start and @end. For the
* @end. For default swiotlb, this is command line adjustable via * default swiotlb, this can be adjusted with a boot parameter,
* setup_io_tlb_npages. * see setup_io_tlb_npages().
* @list: The free list describing the number of free entries available * @late_alloc: %true if allocated using the page allocator.
* from each index. * @nareas: Number of areas in the pool.
* @orig_addr: The original address corresponding to a mapped entry. * @area_nslabs: Number of slots in each area.
* @alloc_size: Size of the allocated buffer. * @areas: Array of memory area descriptors.
* @slots: Array of slot descriptors.
* @node: Member of the IO TLB memory pool list.
* @rcu: RCU head for swiotlb_dyn_free().
* @transient: %true if transient memory pool.
*/
struct io_tlb_pool {
phys_addr_t start;
phys_addr_t end;
void *vaddr;
unsigned long nslabs;
bool late_alloc;
unsigned int nareas;
unsigned int area_nslabs;
struct io_tlb_area *areas;
struct io_tlb_slot *slots;
#ifdef CONFIG_SWIOTLB_DYNAMIC
struct list_head node;
struct rcu_head rcu;
bool transient;
#endif
};
/**
* struct io_tlb_mem - Software IO TLB allocator
* @defpool: Default (initial) IO TLB memory pool descriptor.
* @pool: IO TLB memory pool descriptor (if not dynamic).
* @nslabs: Total number of IO TLB slabs in all pools.
* @debugfs: The dentry to debugfs. * @debugfs: The dentry to debugfs.
* @late_alloc: %true if allocated using the page allocator
* @force_bounce: %true if swiotlb bouncing is forced * @force_bounce: %true if swiotlb bouncing is forced
* @for_alloc: %true if the pool is used for memory allocation * @for_alloc: %true if the pool is used for memory allocation
* @nareas: The area number in the pool. * @can_grow: %true if more pools can be allocated dynamically.
* @area_nslabs: The slot number in the area. * @phys_limit: Maximum allowed physical address.
* @lock: Lock to synchronize changes to the list.
* @pools: List of IO TLB memory pool descriptors (if dynamic).
* @dyn_alloc: Dynamic IO TLB pool allocation work.
* @total_used: The total number of slots in the pool that are currently used * @total_used: The total number of slots in the pool that are currently used
* across all areas. Used only for calculating used_hiwater in * across all areas. Used only for calculating used_hiwater in
* debugfs. * debugfs.
...@@ -93,30 +122,64 @@ dma_addr_t swiotlb_map(struct device *dev, phys_addr_t phys, ...@@ -93,30 +122,64 @@ dma_addr_t swiotlb_map(struct device *dev, phys_addr_t phys,
* in debugfs. * in debugfs.
*/ */
struct io_tlb_mem { struct io_tlb_mem {
phys_addr_t start; struct io_tlb_pool defpool;
phys_addr_t end;
void *vaddr;
unsigned long nslabs; unsigned long nslabs;
struct dentry *debugfs; struct dentry *debugfs;
bool late_alloc;
bool force_bounce; bool force_bounce;
bool for_alloc; bool for_alloc;
unsigned int nareas; #ifdef CONFIG_SWIOTLB_DYNAMIC
unsigned int area_nslabs; bool can_grow;
struct io_tlb_area *areas; u64 phys_limit;
struct io_tlb_slot *slots; spinlock_t lock;
struct list_head pools;
struct work_struct dyn_alloc;
#endif
#ifdef CONFIG_DEBUG_FS #ifdef CONFIG_DEBUG_FS
atomic_long_t total_used; atomic_long_t total_used;
atomic_long_t used_hiwater; atomic_long_t used_hiwater;
#endif #endif
}; };
extern struct io_tlb_mem io_tlb_default_mem;
#ifdef CONFIG_SWIOTLB_DYNAMIC
struct io_tlb_pool *swiotlb_find_pool(struct device *dev, phys_addr_t paddr);
#else
static inline struct io_tlb_pool *swiotlb_find_pool(struct device *dev,
phys_addr_t paddr)
{
return &dev->dma_io_tlb_mem->defpool;
}
#endif
/**
* is_swiotlb_buffer() - check if a physical address belongs to a swiotlb
* @dev: Device which has mapped the buffer.
* @paddr: Physical address within the DMA buffer.
*
* Check if @paddr points into a bounce buffer.
*
* Return:
* * %true if @paddr points into a bounce buffer
* * %false otherwise
*/
static inline bool is_swiotlb_buffer(struct device *dev, phys_addr_t paddr) static inline bool is_swiotlb_buffer(struct device *dev, phys_addr_t paddr)
{ {
struct io_tlb_mem *mem = dev->dma_io_tlb_mem; struct io_tlb_mem *mem = dev->dma_io_tlb_mem;
return mem && paddr >= mem->start && paddr < mem->end; if (!mem)
return false;
if (IS_ENABLED(CONFIG_SWIOTLB_DYNAMIC)) {
/* Pairs with smp_wmb() in swiotlb_find_slots() and
* swiotlb_dyn_alloc(), which modify the RCU lists.
*/
smp_rmb();
return swiotlb_find_pool(dev, paddr);
}
return paddr >= mem->defpool.start && paddr < mem->defpool.end;
} }
static inline bool is_swiotlb_force_bounce(struct device *dev) static inline bool is_swiotlb_force_bounce(struct device *dev)
...@@ -128,13 +191,22 @@ static inline bool is_swiotlb_force_bounce(struct device *dev) ...@@ -128,13 +191,22 @@ static inline bool is_swiotlb_force_bounce(struct device *dev)
void swiotlb_init(bool addressing_limited, unsigned int flags); void swiotlb_init(bool addressing_limited, unsigned int flags);
void __init swiotlb_exit(void); void __init swiotlb_exit(void);
void swiotlb_dev_init(struct device *dev);
size_t swiotlb_max_mapping_size(struct device *dev); size_t swiotlb_max_mapping_size(struct device *dev);
bool is_swiotlb_allocated(void);
bool is_swiotlb_active(struct device *dev); bool is_swiotlb_active(struct device *dev);
void __init swiotlb_adjust_size(unsigned long size); void __init swiotlb_adjust_size(unsigned long size);
phys_addr_t default_swiotlb_base(void);
phys_addr_t default_swiotlb_limit(void);
#else #else
static inline void swiotlb_init(bool addressing_limited, unsigned int flags) static inline void swiotlb_init(bool addressing_limited, unsigned int flags)
{ {
} }
static inline void swiotlb_dev_init(struct device *dev)
{
}
static inline bool is_swiotlb_buffer(struct device *dev, phys_addr_t paddr) static inline bool is_swiotlb_buffer(struct device *dev, phys_addr_t paddr)
{ {
return false; return false;
...@@ -151,6 +223,11 @@ static inline size_t swiotlb_max_mapping_size(struct device *dev) ...@@ -151,6 +223,11 @@ static inline size_t swiotlb_max_mapping_size(struct device *dev)
return SIZE_MAX; return SIZE_MAX;
} }
static inline bool is_swiotlb_allocated(void)
{
return false;
}
static inline bool is_swiotlb_active(struct device *dev) static inline bool is_swiotlb_active(struct device *dev)
{ {
return false; return false;
...@@ -159,6 +236,16 @@ static inline bool is_swiotlb_active(struct device *dev) ...@@ -159,6 +236,16 @@ static inline bool is_swiotlb_active(struct device *dev)
static inline void swiotlb_adjust_size(unsigned long size) static inline void swiotlb_adjust_size(unsigned long size)
{ {
} }
static inline phys_addr_t default_swiotlb_base(void)
{
return 0;
}
static inline phys_addr_t default_swiotlb_limit(void)
{
return 0;
}
#endif /* CONFIG_SWIOTLB */ #endif /* CONFIG_SWIOTLB */
extern void swiotlb_print_info(void); extern void swiotlb_print_info(void);
......
...@@ -29,6 +29,12 @@ extern bool xen_pvh; ...@@ -29,6 +29,12 @@ extern bool xen_pvh;
extern uint32_t xen_start_flags; extern uint32_t xen_start_flags;
#ifdef CONFIG_XEN_PV
extern bool xen_pv_pci_possible;
#else
#define xen_pv_pci_possible 0
#endif
#include <xen/interface/hvm/start_info.h> #include <xen/interface/hvm/start_info.h>
extern struct hvm_start_info pvh_start_info; extern struct hvm_start_info pvh_start_info;
void xen_prepare_pvh(void); void xen_prepare_pvh(void);
......
...@@ -90,6 +90,19 @@ config SWIOTLB ...@@ -90,6 +90,19 @@ config SWIOTLB
bool bool
select NEED_DMA_MAP_STATE select NEED_DMA_MAP_STATE
config SWIOTLB_DYNAMIC
bool "Dynamic allocation of DMA bounce buffers"
default n
depends on SWIOTLB
help
This enables dynamic resizing of the software IO TLB. The kernel
starts with one memory pool at boot and it will allocate additional
pools as needed. To reduce run-time kernel memory requirements, you
may have to specify a smaller size of the initial pool using
"swiotlb=" on the kernel command line.
If unsure, say N.
config DMA_BOUNCE_UNALIGNED_KMALLOC config DMA_BOUNCE_UNALIGNED_KMALLOC
bool bool
depends on SWIOTLB depends on SWIOTLB
...@@ -145,15 +158,16 @@ config DMA_CMA ...@@ -145,15 +158,16 @@ config DMA_CMA
if DMA_CMA if DMA_CMA
config DMA_PERNUMA_CMA config DMA_NUMA_CMA
bool "Enable separate DMA Contiguous Memory Area for each NUMA Node" bool "Enable separate DMA Contiguous Memory Area for NUMA Node"
default NUMA && ARM64 default NUMA
help help
Enable this option to get pernuma CMA areas so that devices like Enable this option to get numa CMA areas so that NUMA devices
ARM64 SMMU can get local memory by DMA coherent APIs. can get local memory by DMA coherent APIs.
You can set the size of pernuma CMA by specifying "cma_pernuma=size" You can set the size of pernuma CMA by specifying "cma_pernuma=size"
on the kernel's command line. or set the node id and its size of CMA by specifying "numa_cma=
<node>:size[,<node>:size]" on the kernel's command line.
comment "Default contiguous memory area size:" comment "Default contiguous memory area size:"
......
...@@ -50,6 +50,7 @@ ...@@ -50,6 +50,7 @@
#include <linux/sizes.h> #include <linux/sizes.h>
#include <linux/dma-map-ops.h> #include <linux/dma-map-ops.h>
#include <linux/cma.h> #include <linux/cma.h>
#include <linux/nospec.h>
#ifdef CONFIG_CMA_SIZE_MBYTES #ifdef CONFIG_CMA_SIZE_MBYTES
#define CMA_SIZE_MBYTES CONFIG_CMA_SIZE_MBYTES #define CMA_SIZE_MBYTES CONFIG_CMA_SIZE_MBYTES
...@@ -96,11 +97,44 @@ static int __init early_cma(char *p) ...@@ -96,11 +97,44 @@ static int __init early_cma(char *p)
} }
early_param("cma", early_cma); early_param("cma", early_cma);
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
static struct cma *dma_contiguous_numa_area[MAX_NUMNODES];
static phys_addr_t numa_cma_size[MAX_NUMNODES] __initdata;
static struct cma *dma_contiguous_pernuma_area[MAX_NUMNODES]; static struct cma *dma_contiguous_pernuma_area[MAX_NUMNODES];
static phys_addr_t pernuma_size_bytes __initdata; static phys_addr_t pernuma_size_bytes __initdata;
static int __init early_numa_cma(char *p)
{
int nid, count = 0;
unsigned long tmp;
char *s = p;
while (*s) {
if (sscanf(s, "%lu%n", &tmp, &count) != 1)
break;
if (s[count] == ':') {
if (tmp >= MAX_NUMNODES)
break;
nid = array_index_nospec(tmp, MAX_NUMNODES);
s += count + 1;
tmp = memparse(s, &s);
numa_cma_size[nid] = tmp;
if (*s == ',')
s++;
else
break;
} else
break;
}
return 0;
}
early_param("numa_cma", early_numa_cma);
static int __init early_cma_pernuma(char *p) static int __init early_cma_pernuma(char *p)
{ {
pernuma_size_bytes = memparse(p, &p); pernuma_size_bytes = memparse(p, &p);
...@@ -127,32 +161,49 @@ static inline __maybe_unused phys_addr_t cma_early_percent_memory(void) ...@@ -127,32 +161,49 @@ static inline __maybe_unused phys_addr_t cma_early_percent_memory(void)
#endif #endif
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
void __init dma_pernuma_cma_reserve(void) static void __init dma_numa_cma_reserve(void)
{ {
int nid; int nid;
if (!pernuma_size_bytes) for_each_node(nid) {
return;
for_each_online_node(nid) {
int ret; int ret;
char name[CMA_MAX_NAME]; char name[CMA_MAX_NAME];
struct cma **cma = &dma_contiguous_pernuma_area[nid]; struct cma **cma;
if (!node_online(nid)) {
if (pernuma_size_bytes || numa_cma_size[nid])
pr_warn("invalid node %d specified\n", nid);
continue;
}
if (pernuma_size_bytes) {
cma = &dma_contiguous_pernuma_area[nid];
snprintf(name, sizeof(name), "pernuma%d", nid); snprintf(name, sizeof(name), "pernuma%d", nid);
ret = cma_declare_contiguous_nid(0, pernuma_size_bytes, 0, 0, ret = cma_declare_contiguous_nid(0, pernuma_size_bytes, 0, 0,
0, false, name, cma, nid); 0, false, name, cma, nid);
if (ret) { if (ret)
pr_warn("%s: reservation failed: err %d, node %d", __func__, pr_warn("%s: reservation failed: err %d, node %d", __func__,
ret, nid); ret, nid);
continue;
} }
pr_debug("%s: reserved %llu MiB on node %d\n", __func__, if (numa_cma_size[nid]) {
(unsigned long long)pernuma_size_bytes / SZ_1M, nid);
cma = &dma_contiguous_numa_area[nid];
snprintf(name, sizeof(name), "numa%d", nid);
ret = cma_declare_contiguous_nid(0, numa_cma_size[nid], 0, 0, 0, false,
name, cma, nid);
if (ret)
pr_warn("%s: reservation failed: err %d, node %d", __func__,
ret, nid);
}
} }
} }
#else
static inline void __init dma_numa_cma_reserve(void)
{
}
#endif #endif
/** /**
...@@ -171,6 +222,8 @@ void __init dma_contiguous_reserve(phys_addr_t limit) ...@@ -171,6 +222,8 @@ void __init dma_contiguous_reserve(phys_addr_t limit)
phys_addr_t selected_limit = limit; phys_addr_t selected_limit = limit;
bool fixed = false; bool fixed = false;
dma_numa_cma_reserve();
pr_debug("%s(limit %08lx)\n", __func__, (unsigned long)limit); pr_debug("%s(limit %08lx)\n", __func__, (unsigned long)limit);
if (size_cmdline != -1) { if (size_cmdline != -1) {
...@@ -303,7 +356,7 @@ static struct page *cma_alloc_aligned(struct cma *cma, size_t size, gfp_t gfp) ...@@ -303,7 +356,7 @@ static struct page *cma_alloc_aligned(struct cma *cma, size_t size, gfp_t gfp)
*/ */
struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp) struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp)
{ {
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
int nid = dev_to_node(dev); int nid = dev_to_node(dev);
#endif #endif
...@@ -315,7 +368,7 @@ struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp) ...@@ -315,7 +368,7 @@ struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp)
if (size <= PAGE_SIZE) if (size <= PAGE_SIZE)
return NULL; return NULL;
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
if (nid != NUMA_NO_NODE && !(gfp & (GFP_DMA | GFP_DMA32))) { if (nid != NUMA_NO_NODE && !(gfp & (GFP_DMA | GFP_DMA32))) {
struct cma *cma = dma_contiguous_pernuma_area[nid]; struct cma *cma = dma_contiguous_pernuma_area[nid];
struct page *page; struct page *page;
...@@ -325,6 +378,13 @@ struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp) ...@@ -325,6 +378,13 @@ struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp)
if (page) if (page)
return page; return page;
} }
cma = dma_contiguous_numa_area[nid];
if (cma) {
page = cma_alloc_aligned(cma, size, gfp);
if (page)
return page;
}
} }
#endif #endif
if (!dma_contiguous_default_area) if (!dma_contiguous_default_area)
...@@ -356,10 +416,13 @@ void dma_free_contiguous(struct device *dev, struct page *page, size_t size) ...@@ -356,10 +416,13 @@ void dma_free_contiguous(struct device *dev, struct page *page, size_t size)
/* /*
* otherwise, page is from either per-numa cma or default cma * otherwise, page is from either per-numa cma or default cma
*/ */
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
if (cma_release(dma_contiguous_pernuma_area[page_to_nid(page)], if (cma_release(dma_contiguous_pernuma_area[page_to_nid(page)],
page, count)) page, count))
return; return;
if (cma_release(dma_contiguous_numa_area[page_to_nid(page)],
page, count))
return;
#endif #endif
if (cma_release(dma_contiguous_default_area, page, count)) if (cma_release(dma_contiguous_default_area, page, count))
return; return;
...@@ -410,6 +473,11 @@ static int __init rmem_cma_setup(struct reserved_mem *rmem) ...@@ -410,6 +473,11 @@ static int __init rmem_cma_setup(struct reserved_mem *rmem)
return -EBUSY; return -EBUSY;
} }
if (memblock_is_region_reserved(rmem->base, rmem->size)) {
pr_info("Reserved memory: overlap with other memblock reserved region\n");
return -EBUSY;
}
if (!of_get_flat_dt_prop(node, "reusable", NULL) || if (!of_get_flat_dt_prop(node, "reusable", NULL) ||
of_get_flat_dt_prop(node, "no-map", NULL)) of_get_flat_dt_prop(node, "no-map", NULL))
return -EINVAL; return -EINVAL;
......
...@@ -66,7 +66,7 @@ static gfp_t dma_direct_optimal_gfp_mask(struct device *dev, u64 *phys_limit) ...@@ -66,7 +66,7 @@ static gfp_t dma_direct_optimal_gfp_mask(struct device *dev, u64 *phys_limit)
return 0; return 0;
} }
static bool dma_coherent_ok(struct device *dev, phys_addr_t phys, size_t size) bool dma_coherent_ok(struct device *dev, phys_addr_t phys, size_t size)
{ {
dma_addr_t dma_addr = phys_to_dma_direct(dev, phys); dma_addr_t dma_addr = phys_to_dma_direct(dev, phys);
......
...@@ -760,12 +760,6 @@ bool dma_pci_p2pdma_supported(struct device *dev) ...@@ -760,12 +760,6 @@ bool dma_pci_p2pdma_supported(struct device *dev)
} }
EXPORT_SYMBOL_GPL(dma_pci_p2pdma_supported); EXPORT_SYMBOL_GPL(dma_pci_p2pdma_supported);
#ifdef CONFIG_ARCH_HAS_DMA_SET_MASK
void arch_dma_set_mask(struct device *dev, u64 mask);
#else
#define arch_dma_set_mask(dev, mask) do { } while (0)
#endif
int dma_set_mask(struct device *dev, u64 mask) int dma_set_mask(struct device *dev, u64 mask)
{ {
/* /*
......
This diff is collapsed.
...@@ -267,6 +267,9 @@ int __init cma_declare_contiguous_nid(phys_addr_t base, ...@@ -267,6 +267,9 @@ int __init cma_declare_contiguous_nid(phys_addr_t base,
if (alignment && !is_power_of_2(alignment)) if (alignment && !is_power_of_2(alignment))
return -EINVAL; return -EINVAL;
if (!IS_ENABLED(CONFIG_NUMA))
nid = NUMA_NO_NODE;
/* Sanitise input arguments. */ /* Sanitise input arguments. */
alignment = max_t(phys_addr_t, alignment, CMA_MIN_ALIGNMENT_BYTES); alignment = max_t(phys_addr_t, alignment, CMA_MIN_ALIGNMENT_BYTES);
if (fixed && base & (alignment - 1)) { if (fixed && base & (alignment - 1)) {
...@@ -372,14 +375,15 @@ int __init cma_declare_contiguous_nid(phys_addr_t base, ...@@ -372,14 +375,15 @@ int __init cma_declare_contiguous_nid(phys_addr_t base,
if (ret) if (ret)
goto free_mem; goto free_mem;
pr_info("Reserved %ld MiB at %pa\n", (unsigned long)size / SZ_1M, pr_info("Reserved %ld MiB at %pa on node %d\n", (unsigned long)size / SZ_1M,
&base); &base, nid);
return 0; return 0;
free_mem: free_mem:
memblock_phys_free(base, size); memblock_phys_free(base, size);
err: err:
pr_err("Failed to reserve %ld MiB\n", (unsigned long)size / SZ_1M); pr_err("Failed to reserve %ld MiB on node %d\n", (unsigned long)size / SZ_1M,
nid);
return ret; return ret;
} }
......
...@@ -895,10 +895,9 @@ void __init setup_kmalloc_cache_index_table(void) ...@@ -895,10 +895,9 @@ void __init setup_kmalloc_cache_index_table(void)
static unsigned int __kmalloc_minalign(void) static unsigned int __kmalloc_minalign(void)
{ {
#ifdef CONFIG_DMA_BOUNCE_UNALIGNED_KMALLOC if (IS_ENABLED(CONFIG_DMA_BOUNCE_UNALIGNED_KMALLOC) &&
if (io_tlb_default_mem.nslabs) is_swiotlb_allocated())
return ARCH_KMALLOC_MINALIGN; return ARCH_KMALLOC_MINALIGN;
#endif
return dma_get_cache_alignment(); return dma_get_cache_alignment();
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment