Commit bf29bfaa authored by Yajun Deng's avatar Yajun Deng Committed by Christoph Hellwig

dma-contiguous: support numa CMA for specified node

The kernel parameter 'cma_pernuma=' only supports reserving the same
size of CMA area for each node. We need to reserve different sizes of
CMA area for specified nodes if these devices belong to different nodes.

Adding another kernel parameter 'numa_cma=' to reserve CMA area for
the specified node. If we want to use one of these parameters, we need to
enable DMA_NUMA_CMA.

At the same time, print the node id in cma_declare_contiguous_nid() if
CONFIG_NUMA is enabled.
Signed-off-by: default avatarYajun Deng <yajun.deng@linux.dev>
Signed-off-by: default avatarChristoph Hellwig <hch@lst.de>
parent 22e4a348
...@@ -706,6 +706,17 @@ ...@@ -706,6 +706,17 @@
which is located in node nid, if the allocation fails, which is located in node nid, if the allocation fails,
they will fallback to the global default memory area. they will fallback to the global default memory area.
numa_cma=<node>:nn[MG][,<node>:nn[MG]]
[KNL,CMA]
Sets the size of kernel numa memory area for
contiguous memory allocations. It will reserve CMA
area for the specified node.
With numa CMA enabled, DMA users on node nid will
first try to allocate buffer from the numa area
which is located in node nid, if the allocation fails,
they will fallback to the global default memory area.
cmo_free_hint= [PPC] Format: { yes | no } cmo_free_hint= [PPC] Format: { yes | no }
Specify whether pages are marked as being inactive Specify whether pages are marked as being inactive
when they are freed. This is used in CMO environments when they are freed. This is used in CMO environments
......
...@@ -145,15 +145,16 @@ config DMA_CMA ...@@ -145,15 +145,16 @@ config DMA_CMA
if DMA_CMA if DMA_CMA
config DMA_PERNUMA_CMA config DMA_NUMA_CMA
bool "Enable separate DMA Contiguous Memory Area for each NUMA Node" bool "Enable separate DMA Contiguous Memory Area for NUMA Node"
default NUMA default NUMA
help help
Enable this option to get pernuma CMA areas so that NUMA devices Enable this option to get numa CMA areas so that NUMA devices
can get local memory by DMA coherent APIs. can get local memory by DMA coherent APIs.
You can set the size of pernuma CMA by specifying "cma_pernuma=size" You can set the size of pernuma CMA by specifying "cma_pernuma=size"
on the kernel's command line. or set the node id and its size of CMA by specifying "numa_cma=
<node>:size[,<node>:size]" on the kernel's command line.
comment "Default contiguous memory area size:" comment "Default contiguous memory area size:"
......
...@@ -50,6 +50,7 @@ ...@@ -50,6 +50,7 @@
#include <linux/sizes.h> #include <linux/sizes.h>
#include <linux/dma-map-ops.h> #include <linux/dma-map-ops.h>
#include <linux/cma.h> #include <linux/cma.h>
#include <linux/nospec.h>
#ifdef CONFIG_CMA_SIZE_MBYTES #ifdef CONFIG_CMA_SIZE_MBYTES
#define CMA_SIZE_MBYTES CONFIG_CMA_SIZE_MBYTES #define CMA_SIZE_MBYTES CONFIG_CMA_SIZE_MBYTES
...@@ -96,11 +97,44 @@ static int __init early_cma(char *p) ...@@ -96,11 +97,44 @@ static int __init early_cma(char *p)
} }
early_param("cma", early_cma); early_param("cma", early_cma);
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
static struct cma *dma_contiguous_numa_area[MAX_NUMNODES];
static phys_addr_t numa_cma_size[MAX_NUMNODES] __initdata;
static struct cma *dma_contiguous_pernuma_area[MAX_NUMNODES]; static struct cma *dma_contiguous_pernuma_area[MAX_NUMNODES];
static phys_addr_t pernuma_size_bytes __initdata; static phys_addr_t pernuma_size_bytes __initdata;
static int __init early_numa_cma(char *p)
{
int nid, count = 0;
unsigned long tmp;
char *s = p;
while (*s) {
if (sscanf(s, "%lu%n", &tmp, &count) != 1)
break;
if (s[count] == ':') {
if (tmp >= MAX_NUMNODES)
break;
nid = array_index_nospec(tmp, MAX_NUMNODES);
s += count + 1;
tmp = memparse(s, &s);
numa_cma_size[nid] = tmp;
if (*s == ',')
s++;
else
break;
} else
break;
}
return 0;
}
early_param("numa_cma", early_numa_cma);
static int __init early_cma_pernuma(char *p) static int __init early_cma_pernuma(char *p)
{ {
pernuma_size_bytes = memparse(p, &p); pernuma_size_bytes = memparse(p, &p);
...@@ -127,34 +161,47 @@ static inline __maybe_unused phys_addr_t cma_early_percent_memory(void) ...@@ -127,34 +161,47 @@ static inline __maybe_unused phys_addr_t cma_early_percent_memory(void)
#endif #endif
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
static void __init dma_pernuma_cma_reserve(void) static void __init dma_numa_cma_reserve(void)
{ {
int nid; int nid;
if (!pernuma_size_bytes) for_each_node(nid) {
return;
for_each_online_node(nid) {
int ret; int ret;
char name[CMA_MAX_NAME]; char name[CMA_MAX_NAME];
struct cma **cma = &dma_contiguous_pernuma_area[nid]; struct cma **cma;
if (!node_online(nid)) {
if (pernuma_size_bytes || numa_cma_size[nid])
pr_warn("invalid node %d specified\n", nid);
continue;
}
if (pernuma_size_bytes) {
cma = &dma_contiguous_pernuma_area[nid];
snprintf(name, sizeof(name), "pernuma%d", nid); snprintf(name, sizeof(name), "pernuma%d", nid);
ret = cma_declare_contiguous_nid(0, pernuma_size_bytes, 0, 0, ret = cma_declare_contiguous_nid(0, pernuma_size_bytes, 0, 0,
0, false, name, cma, nid); 0, false, name, cma, nid);
if (ret) { if (ret)
pr_warn("%s: reservation failed: err %d, node %d", __func__, pr_warn("%s: reservation failed: err %d, node %d", __func__,
ret, nid); ret, nid);
continue;
} }
pr_debug("%s: reserved %llu MiB on node %d\n", __func__, if (numa_cma_size[nid]) {
(unsigned long long)pernuma_size_bytes / SZ_1M, nid);
cma = &dma_contiguous_numa_area[nid];
snprintf(name, sizeof(name), "numa%d", nid);
ret = cma_declare_contiguous_nid(0, numa_cma_size[nid], 0, 0, 0, false,
name, cma, nid);
if (ret)
pr_warn("%s: reservation failed: err %d, node %d", __func__,
ret, nid);
}
} }
} }
#else #else
static inline void __init dma_pernuma_cma_reserve(void) static inline void __init dma_numa_cma_reserve(void)
{ {
} }
#endif #endif
...@@ -175,7 +222,7 @@ void __init dma_contiguous_reserve(phys_addr_t limit) ...@@ -175,7 +222,7 @@ void __init dma_contiguous_reserve(phys_addr_t limit)
phys_addr_t selected_limit = limit; phys_addr_t selected_limit = limit;
bool fixed = false; bool fixed = false;
dma_pernuma_cma_reserve(); dma_numa_cma_reserve();
pr_debug("%s(limit %08lx)\n", __func__, (unsigned long)limit); pr_debug("%s(limit %08lx)\n", __func__, (unsigned long)limit);
...@@ -309,7 +356,7 @@ static struct page *cma_alloc_aligned(struct cma *cma, size_t size, gfp_t gfp) ...@@ -309,7 +356,7 @@ static struct page *cma_alloc_aligned(struct cma *cma, size_t size, gfp_t gfp)
*/ */
struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp) struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp)
{ {
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
int nid = dev_to_node(dev); int nid = dev_to_node(dev);
#endif #endif
...@@ -321,7 +368,7 @@ struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp) ...@@ -321,7 +368,7 @@ struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp)
if (size <= PAGE_SIZE) if (size <= PAGE_SIZE)
return NULL; return NULL;
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
if (nid != NUMA_NO_NODE && !(gfp & (GFP_DMA | GFP_DMA32))) { if (nid != NUMA_NO_NODE && !(gfp & (GFP_DMA | GFP_DMA32))) {
struct cma *cma = dma_contiguous_pernuma_area[nid]; struct cma *cma = dma_contiguous_pernuma_area[nid];
struct page *page; struct page *page;
...@@ -331,6 +378,13 @@ struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp) ...@@ -331,6 +378,13 @@ struct page *dma_alloc_contiguous(struct device *dev, size_t size, gfp_t gfp)
if (page) if (page)
return page; return page;
} }
cma = dma_contiguous_numa_area[nid];
if (cma) {
page = cma_alloc_aligned(cma, size, gfp);
if (page)
return page;
}
} }
#endif #endif
if (!dma_contiguous_default_area) if (!dma_contiguous_default_area)
...@@ -362,10 +416,13 @@ void dma_free_contiguous(struct device *dev, struct page *page, size_t size) ...@@ -362,10 +416,13 @@ void dma_free_contiguous(struct device *dev, struct page *page, size_t size)
/* /*
* otherwise, page is from either per-numa cma or default cma * otherwise, page is from either per-numa cma or default cma
*/ */
#ifdef CONFIG_DMA_PERNUMA_CMA #ifdef CONFIG_DMA_NUMA_CMA
if (cma_release(dma_contiguous_pernuma_area[page_to_nid(page)], if (cma_release(dma_contiguous_pernuma_area[page_to_nid(page)],
page, count)) page, count))
return; return;
if (cma_release(dma_contiguous_numa_area[page_to_nid(page)],
page, count))
return;
#endif #endif
if (cma_release(dma_contiguous_default_area, page, count)) if (cma_release(dma_contiguous_default_area, page, count))
return; return;
......
...@@ -267,6 +267,9 @@ int __init cma_declare_contiguous_nid(phys_addr_t base, ...@@ -267,6 +267,9 @@ int __init cma_declare_contiguous_nid(phys_addr_t base,
if (alignment && !is_power_of_2(alignment)) if (alignment && !is_power_of_2(alignment))
return -EINVAL; return -EINVAL;
if (!IS_ENABLED(CONFIG_NUMA))
nid = NUMA_NO_NODE;
/* Sanitise input arguments. */ /* Sanitise input arguments. */
alignment = max_t(phys_addr_t, alignment, CMA_MIN_ALIGNMENT_BYTES); alignment = max_t(phys_addr_t, alignment, CMA_MIN_ALIGNMENT_BYTES);
if (fixed && base & (alignment - 1)) { if (fixed && base & (alignment - 1)) {
...@@ -372,14 +375,15 @@ int __init cma_declare_contiguous_nid(phys_addr_t base, ...@@ -372,14 +375,15 @@ int __init cma_declare_contiguous_nid(phys_addr_t base,
if (ret) if (ret)
goto free_mem; goto free_mem;
pr_info("Reserved %ld MiB at %pa\n", (unsigned long)size / SZ_1M, pr_info("Reserved %ld MiB at %pa on node %d\n", (unsigned long)size / SZ_1M,
&base); &base, nid);
return 0; return 0;
free_mem: free_mem:
memblock_phys_free(base, size); memblock_phys_free(base, size);
err: err:
pr_err("Failed to reserve %ld MiB\n", (unsigned long)size / SZ_1M); pr_err("Failed to reserve %ld MiB on node %d\n", (unsigned long)size / SZ_1M,
nid);
return ret; return ret;
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment