Thomas Gleixner | 8607a96 | 2019-05-22 09:51:44 +0200 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0-or-later |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 2 | /* |
| 3 | * Contiguous Memory Allocator |
| 4 | * |
| 5 | * Copyright (c) 2010-2011 by Samsung Electronics. |
| 6 | * Copyright IBM Corporation, 2013 |
| 7 | * Copyright LG Electronics Inc., 2014 |
| 8 | * Written by: |
| 9 | * Marek Szyprowski <m.szyprowski@samsung.com> |
| 10 | * Michal Nazarewicz <mina86@mina86.com> |
| 11 | * Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> |
| 12 | * Joonsoo Kim <iamjoonsoo.kim@lge.com> |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 13 | */ |
| 14 | |
/* pr_fmt(fmt) expands to the literal "cma: " followed by fmt. */
#define pr_fmt(fmt) "cma: " fmt

/* With CONFIG_CMA_DEBUG set, define DEBUG unless it is already defined. */
#if defined(CONFIG_CMA_DEBUG) && !defined(DEBUG)
# define DEBUG
#endif
/* Defined ahead of the <trace/events/cma.h> include further down. */
#define CREATE_TRACE_POINTS
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 23 | |
| 24 | #include <linux/memblock.h> |
| 25 | #include <linux/err.h> |
| 26 | #include <linux/mm.h> |
Sandeep Patil | 716306e | 2019-09-13 14:50:38 -0700 | [diff] [blame] | 27 | #include <linux/module.h> |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 28 | #include <linux/mutex.h> |
| 29 | #include <linux/sizes.h> |
| 30 | #include <linux/slab.h> |
| 31 | #include <linux/log2.h> |
| 32 | #include <linux/cma.h> |
Marek Szyprowski | f7426b9 | 2014-10-09 15:26:47 -0700 | [diff] [blame] | 33 | #include <linux/highmem.h> |
Thierry Reding | 620951e | 2014-12-12 16:58:31 -0800 | [diff] [blame] | 34 | #include <linux/io.h> |
Randy Dunlap | 514c603 | 2018-04-05 16:25:34 -0700 | [diff] [blame] | 35 | #include <linux/kmemleak.h> |
Chris Goldsworthy | 73eda8e | 2020-09-18 09:19:53 -0700 | [diff] [blame] | 36 | #include <linux/sched.h> |
| 37 | #include <linux/jiffies.h> |
Stefan Strogin | 99e8ea6 | 2015-04-15 16:14:50 -0700 | [diff] [blame] | 38 | #include <trace/events/cma.h> |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 39 | |
Sasha Levin | 28b24c1 | 2015-04-14 15:44:57 -0700 | [diff] [blame] | 40 | #include "cma.h" |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 41 | |
Sasha Levin | 28b24c1 | 2015-04-14 15:44:57 -0700 | [diff] [blame] | 42 | struct cma cma_areas[MAX_CMA_AREAS]; |
| 43 | unsigned cma_area_count; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 44 | |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 45 | phys_addr_t cma_get_base(const struct cma *cma) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 46 | { |
| 47 | return PFN_PHYS(cma->base_pfn); |
| 48 | } |
| 49 | |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 50 | unsigned long cma_get_size(const struct cma *cma) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 51 | { |
| 52 | return cma->count << PAGE_SHIFT; |
| 53 | } |
| 54 | |
Laura Abbott | f318dd0 | 2017-04-18 11:27:03 -0700 | [diff] [blame] | 55 | const char *cma_get_name(const struct cma *cma) |
| 56 | { |
Barry Song | 18e98e5 | 2020-08-11 18:31:57 -0700 | [diff] [blame] | 57 | return cma->name; |
Laura Abbott | f318dd0 | 2017-04-18 11:27:03 -0700 | [diff] [blame] | 58 | } |
Sandeep Patil | 716306e | 2019-09-13 14:50:38 -0700 | [diff] [blame] | 59 | EXPORT_SYMBOL_GPL(cma_get_name); |
Laura Abbott | f318dd0 | 2017-04-18 11:27:03 -0700 | [diff] [blame] | 60 | |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 61 | static unsigned long cma_bitmap_aligned_mask(const struct cma *cma, |
Doug Berger | e048cb3 | 2017-07-10 15:49:44 -0700 | [diff] [blame] | 62 | unsigned int align_order) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 63 | { |
Weijie Yang | 68faed6 | 2014-10-13 15:51:03 -0700 | [diff] [blame] | 64 | if (align_order <= cma->order_per_bit) |
| 65 | return 0; |
| 66 | return (1UL << (align_order - cma->order_per_bit)) - 1; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 67 | } |
| 68 | |
Danesh Petigara | 850fc43 | 2015-03-12 16:25:57 -0700 | [diff] [blame] | 69 | /* |
Doug Berger | e048cb3 | 2017-07-10 15:49:44 -0700 | [diff] [blame] | 70 | * Find the offset of the base PFN from the specified align_order. |
| 71 | * The value returned is represented in order_per_bits. |
Danesh Petigara | 850fc43 | 2015-03-12 16:25:57 -0700 | [diff] [blame] | 72 | */ |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 73 | static unsigned long cma_bitmap_aligned_offset(const struct cma *cma, |
Doug Berger | e048cb3 | 2017-07-10 15:49:44 -0700 | [diff] [blame] | 74 | unsigned int align_order) |
Gregory Fong | b5be83e | 2014-12-12 16:54:48 -0800 | [diff] [blame] | 75 | { |
Doug Berger | e048cb3 | 2017-07-10 15:49:44 -0700 | [diff] [blame] | 76 | return (cma->base_pfn & ((1UL << align_order) - 1)) |
| 77 | >> cma->order_per_bit; |
Gregory Fong | b5be83e | 2014-12-12 16:54:48 -0800 | [diff] [blame] | 78 | } |
| 79 | |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 80 | static unsigned long cma_bitmap_pages_to_bits(const struct cma *cma, |
| 81 | unsigned long pages) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 82 | { |
| 83 | return ALIGN(pages, 1UL << cma->order_per_bit) >> cma->order_per_bit; |
| 84 | } |
| 85 | |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 86 | static void cma_clear_bitmap(struct cma *cma, unsigned long pfn, |
| 87 | unsigned int count) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 88 | { |
| 89 | unsigned long bitmap_no, bitmap_count; |
| 90 | |
| 91 | bitmap_no = (pfn - cma->base_pfn) >> cma->order_per_bit; |
| 92 | bitmap_count = cma_bitmap_pages_to_bits(cma, count); |
| 93 | |
| 94 | mutex_lock(&cma->lock); |
| 95 | bitmap_clear(cma->bitmap, bitmap_no, bitmap_count); |
| 96 | mutex_unlock(&cma->lock); |
| 97 | } |
| 98 | |
Mike Kravetz | 3a5139f | 2020-08-11 18:32:03 -0700 | [diff] [blame] | 99 | static void __init cma_activate_area(struct cma *cma) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 100 | { |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 101 | unsigned long base_pfn = cma->base_pfn, pfn = base_pfn; |
| 102 | unsigned i = cma->count >> pageblock_order; |
| 103 | struct zone *zone; |
| 104 | |
Yunfeng Ye | 2184f99 | 2019-11-30 17:57:22 -0800 | [diff] [blame] | 105 | cma->bitmap = bitmap_zalloc(cma_bitmap_maxno(cma), GFP_KERNEL); |
Mike Kravetz | 3a5139f | 2020-08-11 18:32:03 -0700 | [diff] [blame] | 106 | if (!cma->bitmap) |
| 107 | goto out_error; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 108 | |
Joonsoo Kim | d883c6c | 2018-05-23 10:18:21 +0900 | [diff] [blame] | 109 | WARN_ON_ONCE(!pfn_valid(pfn)); |
| 110 | zone = page_zone(pfn_to_page(pfn)); |
| 111 | |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 112 | do { |
| 113 | unsigned j; |
| 114 | |
| 115 | base_pfn = pfn; |
| 116 | for (j = pageblock_nr_pages; j; --j, pfn++) { |
Joonsoo Kim | d883c6c | 2018-05-23 10:18:21 +0900 | [diff] [blame] | 117 | WARN_ON_ONCE(!pfn_valid(pfn)); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 118 | /* |
Joonsoo Kim | d883c6c | 2018-05-23 10:18:21 +0900 | [diff] [blame] | 119 | * alloc_contig_range requires the pfn range |
| 120 | * specified to be in the same zone. Make this |
| 121 | * simple by forcing the entire CMA resv range |
| 122 | * to be in the same zone. |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 123 | */ |
| 124 | if (page_zone(pfn_to_page(pfn)) != zone) |
Joonsoo Kim | d883c6c | 2018-05-23 10:18:21 +0900 | [diff] [blame] | 125 | goto not_in_zone; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 126 | } |
| 127 | init_cma_reserved_pageblock(pfn_to_page(base_pfn)); |
| 128 | } while (--i); |
| 129 | |
| 130 | mutex_init(&cma->lock); |
Sasha Levin | 26b02a1 | 2015-04-14 15:44:59 -0700 | [diff] [blame] | 131 | |
| 132 | #ifdef CONFIG_CMA_DEBUGFS |
| 133 | INIT_HLIST_HEAD(&cma->mem_head); |
| 134 | spin_lock_init(&cma->mem_head_lock); |
| 135 | #endif |
| 136 | |
Mike Kravetz | 3a5139f | 2020-08-11 18:32:03 -0700 | [diff] [blame] | 137 | return; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 138 | |
Joonsoo Kim | d883c6c | 2018-05-23 10:18:21 +0900 | [diff] [blame] | 139 | not_in_zone: |
Yunfeng Ye | 2184f99 | 2019-11-30 17:57:22 -0800 | [diff] [blame] | 140 | bitmap_free(cma->bitmap); |
Mike Kravetz | 3a5139f | 2020-08-11 18:32:03 -0700 | [diff] [blame] | 141 | out_error: |
Laurent Pinchart | f022d8c | 2014-10-24 13:18:39 +0300 | [diff] [blame] | 142 | cma->count = 0; |
Mike Kravetz | 3a5139f | 2020-08-11 18:32:03 -0700 | [diff] [blame] | 143 | pr_err("CMA area %s could not be activated\n", cma->name); |
| 144 | return; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 145 | } |
| 146 | |
| 147 | static int __init cma_init_reserved_areas(void) |
| 148 | { |
| 149 | int i; |
| 150 | |
Mike Kravetz | 3a5139f | 2020-08-11 18:32:03 -0700 | [diff] [blame] | 151 | for (i = 0; i < cma_area_count; i++) |
| 152 | cma_activate_area(&cma_areas[i]); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 153 | |
| 154 | return 0; |
| 155 | } |
Joonsoo Kim | d883c6c | 2018-05-23 10:18:21 +0900 | [diff] [blame] | 156 | core_initcall(cma_init_reserved_areas); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 157 | |
| 158 | /** |
Marek Szyprowski | de9e14e | 2014-10-13 15:51:09 -0700 | [diff] [blame] | 159 | * cma_init_reserved_mem() - create custom contiguous area from reserved memory |
| 160 | * @base: Base address of the reserved area |
| 161 | * @size: Size of the reserved area (in bytes), |
| 162 | * @order_per_bit: Order of pages represented by one bit on bitmap. |
Mike Rapoport | e8b098f | 2018-04-05 16:24:57 -0700 | [diff] [blame] | 163 | * @name: The name of the area. If this parameter is NULL, the name of |
| 164 | * the area will be set to "cmaN", where N is a running counter of |
| 165 | * used areas. |
Marek Szyprowski | de9e14e | 2014-10-13 15:51:09 -0700 | [diff] [blame] | 166 | * @res_cma: Pointer to store the created cma region. |
| 167 | * |
| 168 | * This function creates custom contiguous area from already reserved memory. |
| 169 | */ |
| 170 | int __init cma_init_reserved_mem(phys_addr_t base, phys_addr_t size, |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 171 | unsigned int order_per_bit, |
Laura Abbott | f318dd0 | 2017-04-18 11:27:03 -0700 | [diff] [blame] | 172 | const char *name, |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 173 | struct cma **res_cma) |
Marek Szyprowski | de9e14e | 2014-10-13 15:51:09 -0700 | [diff] [blame] | 174 | { |
| 175 | struct cma *cma; |
| 176 | phys_addr_t alignment; |
| 177 | |
| 178 | /* Sanity checks */ |
| 179 | if (cma_area_count == ARRAY_SIZE(cma_areas)) { |
| 180 | pr_err("Not enough slots for CMA reserved regions!\n"); |
| 181 | return -ENOSPC; |
| 182 | } |
| 183 | |
| 184 | if (!size || !memblock_is_region_reserved(base, size)) |
| 185 | return -EINVAL; |
| 186 | |
Shailendra Verma | 0f96ae2 | 2015-06-24 16:58:03 -0700 | [diff] [blame] | 187 | /* ensure minimal alignment required by mm core */ |
Stephen Rothwell | badbda5 | 2016-05-27 14:27:41 -0700 | [diff] [blame] | 188 | alignment = PAGE_SIZE << |
| 189 | max_t(unsigned long, MAX_ORDER - 1, pageblock_order); |
Marek Szyprowski | de9e14e | 2014-10-13 15:51:09 -0700 | [diff] [blame] | 190 | |
| 191 | /* alignment should be aligned with order_per_bit */ |
| 192 | if (!IS_ALIGNED(alignment >> PAGE_SHIFT, 1 << order_per_bit)) |
| 193 | return -EINVAL; |
| 194 | |
| 195 | if (ALIGN(base, alignment) != base || ALIGN(size, alignment) != size) |
| 196 | return -EINVAL; |
| 197 | |
| 198 | /* |
| 199 | * Each reserved area must be initialised later, when more kernel |
| 200 | * subsystems (like slab allocator) are available. |
| 201 | */ |
| 202 | cma = &cma_areas[cma_area_count]; |
Barry Song | 18e98e5 | 2020-08-11 18:31:57 -0700 | [diff] [blame] | 203 | |
| 204 | if (name) |
| 205 | snprintf(cma->name, CMA_MAX_NAME, name); |
| 206 | else |
| 207 | snprintf(cma->name, CMA_MAX_NAME, "cma%d\n", cma_area_count); |
| 208 | |
Marek Szyprowski | de9e14e | 2014-10-13 15:51:09 -0700 | [diff] [blame] | 209 | cma->base_pfn = PFN_DOWN(base); |
| 210 | cma->count = size >> PAGE_SHIFT; |
| 211 | cma->order_per_bit = order_per_bit; |
| 212 | *res_cma = cma; |
| 213 | cma_area_count++; |
George G. Davis | 94737a8 | 2015-02-11 15:26:27 -0800 | [diff] [blame] | 214 | totalcma_pages += (size / PAGE_SIZE); |
Marek Szyprowski | de9e14e | 2014-10-13 15:51:09 -0700 | [diff] [blame] | 215 | |
| 216 | return 0; |
| 217 | } |
| 218 | |
| 219 | /** |
Aslan Bakirov | 8676af1 | 2020-04-10 14:32:42 -0700 | [diff] [blame] | 220 | * cma_declare_contiguous_nid() - reserve custom contiguous area |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 221 | * @base: Base address of the reserved area optional, use 0 for any |
Joonsoo Kim | c1f733aa | 2014-08-06 16:05:32 -0700 | [diff] [blame] | 222 | * @size: Size of the reserved area (in bytes), |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 223 | * @limit: End address of the reserved memory (optional, 0 for any). |
| 224 | * @alignment: Alignment for the CMA area, should be power of 2 or zero |
| 225 | * @order_per_bit: Order of pages represented by one bit on bitmap. |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 226 | * @fixed: hint about where to place the reserved area |
Mike Rapoport | e8b098f | 2018-04-05 16:24:57 -0700 | [diff] [blame] | 227 | * @name: The name of the area. See function cma_init_reserved_mem() |
Joonsoo Kim | c1f733aa | 2014-08-06 16:05:32 -0700 | [diff] [blame] | 228 | * @res_cma: Pointer to store the created cma region. |
Aslan Bakirov | 8676af1 | 2020-04-10 14:32:42 -0700 | [diff] [blame] | 229 | * @nid: nid of the free area to find, %NUMA_NO_NODE for any node |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 230 | * |
| 231 | * This function reserves memory from early allocator. It should be |
| 232 | * called by arch specific code once the early allocator (memblock or bootmem) |
| 233 | * has been activated and all other subsystems have already allocated/reserved |
| 234 | * memory. This function allows to create custom reserved areas. |
| 235 | * |
| 236 | * If @fixed is true, reserve contiguous area at exactly @base. If false, |
| 237 | * reserve in range from @base to @limit. |
| 238 | */ |
Aslan Bakirov | 8676af1 | 2020-04-10 14:32:42 -0700 | [diff] [blame] | 239 | int __init cma_declare_contiguous_nid(phys_addr_t base, |
Joonsoo Kim | c1f733aa | 2014-08-06 16:05:32 -0700 | [diff] [blame] | 240 | phys_addr_t size, phys_addr_t limit, |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 241 | phys_addr_t alignment, unsigned int order_per_bit, |
Aslan Bakirov | 8676af1 | 2020-04-10 14:32:42 -0700 | [diff] [blame] | 242 | bool fixed, const char *name, struct cma **res_cma, |
| 243 | int nid) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 244 | { |
Marek Szyprowski | f7426b9 | 2014-10-09 15:26:47 -0700 | [diff] [blame] | 245 | phys_addr_t memblock_end = memblock_end_of_DRAM(); |
Joonsoo Kim | 6b101e2 | 2014-12-10 15:41:12 -0800 | [diff] [blame] | 246 | phys_addr_t highmem_start; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 247 | int ret = 0; |
| 248 | |
Joonsoo Kim | 6b101e2 | 2014-12-10 15:41:12 -0800 | [diff] [blame] | 249 | /* |
Laura Abbott | 2dece44 | 2017-01-10 13:35:41 -0800 | [diff] [blame] | 250 | * We can't use __pa(high_memory) directly, since high_memory |
| 251 | * isn't a valid direct map VA, and DEBUG_VIRTUAL will (validly) |
| 252 | * complain. Find the boundary by adding one to the last valid |
| 253 | * address. |
Joonsoo Kim | 6b101e2 | 2014-12-10 15:41:12 -0800 | [diff] [blame] | 254 | */ |
Laura Abbott | 2dece44 | 2017-01-10 13:35:41 -0800 | [diff] [blame] | 255 | highmem_start = __pa(high_memory - 1) + 1; |
Laurent Pinchart | 56fa4f6 | 2014-10-24 13:18:42 +0300 | [diff] [blame] | 256 | pr_debug("%s(size %pa, base %pa, limit %pa alignment %pa)\n", |
| 257 | __func__, &size, &base, &limit, &alignment); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 258 | |
| 259 | if (cma_area_count == ARRAY_SIZE(cma_areas)) { |
| 260 | pr_err("Not enough slots for CMA reserved regions!\n"); |
| 261 | return -ENOSPC; |
| 262 | } |
| 263 | |
| 264 | if (!size) |
| 265 | return -EINVAL; |
| 266 | |
| 267 | if (alignment && !is_power_of_2(alignment)) |
| 268 | return -EINVAL; |
| 269 | |
| 270 | /* |
| 271 | * Sanitise input arguments. |
| 272 | * Pages both ends in CMA area could be merged into adjacent unmovable |
| 273 | * migratetype page by page allocator's buddy algorithm. In the case, |
| 274 | * you couldn't get a contiguous memory, which is not what we want. |
| 275 | */ |
Stephen Rothwell | badbda5 | 2016-05-27 14:27:41 -0700 | [diff] [blame] | 276 | alignment = max(alignment, (phys_addr_t)PAGE_SIZE << |
| 277 | max_t(unsigned long, MAX_ORDER - 1, pageblock_order)); |
Doug Berger | c633324 | 2019-07-16 16:26:24 -0700 | [diff] [blame] | 278 | if (fixed && base & (alignment - 1)) { |
| 279 | ret = -EINVAL; |
| 280 | pr_err("Region at %pa must be aligned to %pa bytes\n", |
| 281 | &base, &alignment); |
| 282 | goto err; |
| 283 | } |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 284 | base = ALIGN(base, alignment); |
| 285 | size = ALIGN(size, alignment); |
| 286 | limit &= ~(alignment - 1); |
| 287 | |
Laurent Pinchart | 800a85d | 2014-10-24 13:18:40 +0300 | [diff] [blame] | 288 | if (!base) |
| 289 | fixed = false; |
| 290 | |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 291 | /* size should be aligned with order_per_bit */ |
| 292 | if (!IS_ALIGNED(size >> PAGE_SHIFT, 1 << order_per_bit)) |
| 293 | return -EINVAL; |
| 294 | |
Marek Szyprowski | f7426b9 | 2014-10-09 15:26:47 -0700 | [diff] [blame] | 295 | /* |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 296 | * If allocating at a fixed base the request region must not cross the |
| 297 | * low/high memory boundary. |
Marek Szyprowski | f7426b9 | 2014-10-09 15:26:47 -0700 | [diff] [blame] | 298 | */ |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 299 | if (fixed && base < highmem_start && base + size > highmem_start) { |
Marek Szyprowski | f7426b9 | 2014-10-09 15:26:47 -0700 | [diff] [blame] | 300 | ret = -EINVAL; |
Laurent Pinchart | 56fa4f6 | 2014-10-24 13:18:42 +0300 | [diff] [blame] | 301 | pr_err("Region at %pa defined on low/high memory boundary (%pa)\n", |
| 302 | &base, &highmem_start); |
Marek Szyprowski | f7426b9 | 2014-10-09 15:26:47 -0700 | [diff] [blame] | 303 | goto err; |
| 304 | } |
| 305 | |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 306 | /* |
| 307 | * If the limit is unspecified or above the memblock end, its effective |
| 308 | * value will be the memblock end. Set it explicitly to simplify further |
| 309 | * checks. |
| 310 | */ |
| 311 | if (limit == 0 || limit > memblock_end) |
| 312 | limit = memblock_end; |
| 313 | |
Doug Berger | c633324 | 2019-07-16 16:26:24 -0700 | [diff] [blame] | 314 | if (base + size > limit) { |
| 315 | ret = -EINVAL; |
| 316 | pr_err("Size (%pa) of region at %pa exceeds limit (%pa)\n", |
| 317 | &size, &base, &limit); |
| 318 | goto err; |
| 319 | } |
| 320 | |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 321 | /* Reserve memory */ |
Laurent Pinchart | 800a85d | 2014-10-24 13:18:40 +0300 | [diff] [blame] | 322 | if (fixed) { |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 323 | if (memblock_is_region_reserved(base, size) || |
| 324 | memblock_reserve(base, size) < 0) { |
| 325 | ret = -EBUSY; |
| 326 | goto err; |
| 327 | } |
| 328 | } else { |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 329 | phys_addr_t addr = 0; |
| 330 | |
| 331 | /* |
| 332 | * All pages in the reserved area must come from the same zone. |
| 333 | * If the requested region crosses the low/high memory boundary, |
| 334 | * try allocating from high memory first and fall back to low |
| 335 | * memory in case of failure. |
| 336 | */ |
| 337 | if (base < highmem_start && limit > highmem_start) { |
Aslan Bakirov | 8676af1 | 2020-04-10 14:32:42 -0700 | [diff] [blame] | 338 | addr = memblock_alloc_range_nid(size, alignment, |
Barry Song | 40366bd | 2020-07-03 15:15:24 -0700 | [diff] [blame] | 339 | highmem_start, limit, nid, true); |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 340 | limit = highmem_start; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 341 | } |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 342 | |
Roman Gushchin | 0e0bfc4 | 2021-02-25 17:16:33 -0800 | [diff] [blame^] | 343 | /* |
| 344 | * If there is enough memory, try a bottom-up allocation first. |
| 345 | * It will place the new cma area close to the start of the node |
| 346 | * and guarantee that the compaction is moving pages out of the |
| 347 | * cma area and not into it. |
| 348 | * Avoid using first 4GB to not interfere with constrained zones |
| 349 | * like DMA/DMA32. |
| 350 | */ |
| 351 | #ifdef CONFIG_PHYS_ADDR_T_64BIT |
| 352 | if (!memblock_bottom_up() && memblock_end >= SZ_4G + size) { |
| 353 | memblock_set_bottom_up(true); |
| 354 | addr = memblock_alloc_range_nid(size, alignment, SZ_4G, |
| 355 | limit, nid, true); |
| 356 | memblock_set_bottom_up(false); |
| 357 | } |
| 358 | #endif |
| 359 | |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 360 | if (!addr) { |
Aslan Bakirov | 8676af1 | 2020-04-10 14:32:42 -0700 | [diff] [blame] | 361 | addr = memblock_alloc_range_nid(size, alignment, base, |
Barry Song | 40366bd | 2020-07-03 15:15:24 -0700 | [diff] [blame] | 362 | limit, nid, true); |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 363 | if (!addr) { |
| 364 | ret = -ENOMEM; |
| 365 | goto err; |
| 366 | } |
| 367 | } |
| 368 | |
Thierry Reding | 620951e | 2014-12-12 16:58:31 -0800 | [diff] [blame] | 369 | /* |
| 370 | * kmemleak scans/reads tracked objects for pointers to other |
| 371 | * objects but this address isn't mapped and accessible |
| 372 | */ |
Catalin Marinas | 9099dae | 2016-10-11 13:55:11 -0700 | [diff] [blame] | 373 | kmemleak_ignore_phys(addr); |
Laurent Pinchart | 16195dd | 2014-10-24 13:18:41 +0300 | [diff] [blame] | 374 | base = addr; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 375 | } |
| 376 | |
Laura Abbott | f318dd0 | 2017-04-18 11:27:03 -0700 | [diff] [blame] | 377 | ret = cma_init_reserved_mem(base, size, order_per_bit, name, res_cma); |
Marek Szyprowski | de9e14e | 2014-10-13 15:51:09 -0700 | [diff] [blame] | 378 | if (ret) |
Peng Fan | 0d3bd18 | 2019-03-05 15:49:50 -0800 | [diff] [blame] | 379 | goto free_mem; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 380 | |
Laurent Pinchart | 56fa4f6 | 2014-10-24 13:18:42 +0300 | [diff] [blame] | 381 | pr_info("Reserved %ld MiB at %pa\n", (unsigned long)size / SZ_1M, |
| 382 | &base); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 383 | return 0; |
| 384 | |
Peng Fan | 0d3bd18 | 2019-03-05 15:49:50 -0800 | [diff] [blame] | 385 | free_mem: |
| 386 | memblock_free(base, size); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 387 | err: |
Joonsoo Kim | 0de9d2e | 2014-08-06 16:05:34 -0700 | [diff] [blame] | 388 | pr_err("Failed to reserve %ld MiB\n", (unsigned long)size / SZ_1M); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 389 | return ret; |
| 390 | } |
| 391 | |
#ifdef CONFIG_CMA_DEBUG
/*
 * Log every run of clear bits in the area's bitmap as "<pages>@<first bit>",
 * joined by '+', followed by the free and total page counts. The bitmap is
 * walked under cma->lock.
 */
static void cma_debug_show_areas(struct cma *cma)
{
	unsigned long nbits = cma_bitmap_maxno(cma);
	unsigned long run_start, run_end, run_pages;
	unsigned long nr_free = 0;

	mutex_lock(&cma->lock);
	pr_info("number of available pages: ");
	run_start = find_next_zero_bit(cma->bitmap, nbits, 0);
	while (run_start < nbits) {
		/* The run of clear bits ends at the next set bit (or at nbits). */
		run_end = find_next_bit(cma->bitmap, nbits, run_start);
		run_pages = (run_end - run_start) << cma->order_per_bit;
		pr_cont("%s%lu@%lu", nr_free ? "+" : "", run_pages,
			run_start);
		nr_free += run_pages;
		run_start = find_next_zero_bit(cma->bitmap, nbits, run_end);
	}
	pr_cont("=> %lu free of %lu total pages\n", nr_free, cma->count);
	mutex_unlock(&cma->lock);
}
#else
/* Without CONFIG_CMA_DEBUG this is an empty stub. */
static inline void cma_debug_show_areas(struct cma *cma) { }
#endif
| 420 | |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 421 | /** |
| 422 | * cma_alloc() - allocate pages from contiguous area |
| 423 | * @cma: Contiguous memory region for which the allocation is performed. |
| 424 | * @count: Requested number of pages. |
| 425 | * @align: Requested alignment of pages (in PAGE_SIZE order). |
Minchan Kim | 23ba990 | 2021-01-21 12:09:34 -0800 | [diff] [blame] | 426 | * @gfp_mask: GFP mask to use during the cma allocation. |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 427 | * |
| 428 | * This function allocates part of contiguous memory on specific |
| 429 | * contiguous memory area. |
| 430 | */ |
Lucas Stach | e2f466e | 2017-02-24 14:58:41 -0800 | [diff] [blame] | 431 | struct page *cma_alloc(struct cma *cma, size_t count, unsigned int align, |
Minchan Kim | 23ba990 | 2021-01-21 12:09:34 -0800 | [diff] [blame] | 432 | gfp_t gfp_mask) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 433 | { |
Andrew Morton | 3acaea6 | 2015-11-05 18:50:08 -0800 | [diff] [blame] | 434 | unsigned long mask, offset; |
| 435 | unsigned long pfn = -1; |
| 436 | unsigned long start = 0; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 437 | unsigned long bitmap_maxno, bitmap_no, bitmap_count; |
Andrey Konovalov | 2813b9c | 2018-12-28 00:30:57 -0800 | [diff] [blame] | 438 | size_t i; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 439 | struct page *page = NULL; |
Jaewon Kim | dbe43d4 | 2017-02-24 14:58:50 -0800 | [diff] [blame] | 440 | int ret = -ENOMEM; |
Chris Goldsworthy | 73eda8e | 2020-09-18 09:19:53 -0700 | [diff] [blame] | 441 | int num_attempts = 0; |
| 442 | int max_retries = 5; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 443 | |
Jianqun Xu | 835832b | 2020-08-11 18:31:54 -0700 | [diff] [blame] | 444 | if (!cma || !cma->count || !cma->bitmap) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 445 | return NULL; |
| 446 | |
Minchan Kim | 23ba990 | 2021-01-21 12:09:34 -0800 | [diff] [blame] | 447 | pr_debug("%s(cma %p, count %zu, align %d gfp_mask 0x%x)\n", __func__, |
| 448 | (void *)cma, count, align, gfp_mask); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 449 | |
| 450 | if (!count) |
| 451 | return NULL; |
| 452 | |
| 453 | mask = cma_bitmap_aligned_mask(cma, align); |
Gregory Fong | b5be83e | 2014-12-12 16:54:48 -0800 | [diff] [blame] | 454 | offset = cma_bitmap_aligned_offset(cma, align); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 455 | bitmap_maxno = cma_bitmap_maxno(cma); |
| 456 | bitmap_count = cma_bitmap_pages_to_bits(cma, count); |
| 457 | |
Shiraz Hashim | 6b36ba5 | 2016-11-10 10:46:16 -0800 | [diff] [blame] | 458 | if (bitmap_count > bitmap_maxno) |
| 459 | return NULL; |
| 460 | |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 461 | for (;;) { |
| 462 | mutex_lock(&cma->lock); |
Gregory Fong | b5be83e | 2014-12-12 16:54:48 -0800 | [diff] [blame] | 463 | bitmap_no = bitmap_find_next_zero_area_off(cma->bitmap, |
| 464 | bitmap_maxno, start, bitmap_count, mask, |
| 465 | offset); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 466 | if (bitmap_no >= bitmap_maxno) { |
Chris Goldsworthy | 73eda8e | 2020-09-18 09:19:53 -0700 | [diff] [blame] | 467 | if ((num_attempts < max_retries) && (ret == -EBUSY)) { |
| 468 | mutex_unlock(&cma->lock); |
| 469 | |
| 470 | if (fatal_signal_pending(current)) |
| 471 | break; |
| 472 | |
| 473 | /* |
| 474 | * Page may be momentarily pinned by some other |
| 475 | * process which has been scheduled out, e.g. |
| 476 | * in exit path, during unmap call, or process |
| 477 | * fork and so cannot be freed there. Sleep |
| 478 | * for 100ms and retry the allocation. |
| 479 | */ |
| 480 | start = 0; |
| 481 | ret = -ENOMEM; |
| 482 | schedule_timeout_killable(msecs_to_jiffies(100)); |
| 483 | num_attempts++; |
| 484 | continue; |
| 485 | } else { |
| 486 | mutex_unlock(&cma->lock); |
| 487 | break; |
| 488 | } |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 489 | } |
| 490 | bitmap_set(cma->bitmap, bitmap_no, bitmap_count); |
| 491 | /* |
| 492 | * It's safe to drop the lock here. We've marked this region for |
| 493 | * our exclusive use. If the migration fails we will take the |
| 494 | * lock again and unmark it. |
| 495 | */ |
| 496 | mutex_unlock(&cma->lock); |
| 497 | |
| 498 | pfn = cma->base_pfn + (bitmap_no << cma->order_per_bit); |
Minchan Kim | 23ba990 | 2021-01-21 12:09:34 -0800 | [diff] [blame] | 499 | ret = alloc_contig_range(pfn, pfn + count, MIGRATE_CMA, gfp_mask); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 500 | if (ret == 0) { |
| 501 | page = pfn_to_page(pfn); |
| 502 | break; |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 503 | } |
Joonsoo Kim | b7155e7 | 2014-08-06 16:05:30 -0700 | [diff] [blame] | 504 | |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 505 | cma_clear_bitmap(cma, pfn, count); |
Joonsoo Kim | b7155e7 | 2014-08-06 16:05:30 -0700 | [diff] [blame] | 506 | if (ret != -EBUSY) |
| 507 | break; |
| 508 | |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 509 | pr_debug("%s(): memory range at %p is busy, retrying\n", |
| 510 | __func__, pfn_to_page(pfn)); |
| 511 | /* try again with a bit different memory target */ |
| 512 | start = bitmap_no + mask + 1; |
| 513 | } |
| 514 | |
Andrew Morton | 3acaea6 | 2015-11-05 18:50:08 -0800 | [diff] [blame] | 515 | trace_cma_alloc(pfn, page, count, align); |
Stefan Strogin | 99e8ea6 | 2015-04-15 16:14:50 -0700 | [diff] [blame] | 516 | |
Andrey Konovalov | 2813b9c | 2018-12-28 00:30:57 -0800 | [diff] [blame] | 517 | /* |
| 518 | * CMA can allocate multiple page blocks, which results in different |
| 519 | * blocks being marked with different tags. Reset the tags to ignore |
| 520 | * those page blocks. |
| 521 | */ |
| 522 | if (page) { |
| 523 | for (i = 0; i < count; i++) |
| 524 | page_kasan_tag_reset(page + i); |
| 525 | } |
| 526 | |
Minchan Kim | 23ba990 | 2021-01-21 12:09:34 -0800 | [diff] [blame] | 527 | if (ret && !(gfp_mask & __GFP_NOWARN)) { |
Pintu Agarwal | 5984af108 | 2017-11-15 17:34:26 -0800 | [diff] [blame] | 528 | pr_err("%s: alloc failed, req-size: %zu pages, ret: %d\n", |
Jaewon Kim | dbe43d4 | 2017-02-24 14:58:50 -0800 | [diff] [blame] | 529 | __func__, count, ret); |
| 530 | cma_debug_show_areas(cma); |
| 531 | } |
| 532 | |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 533 | pr_debug("%s(): returned %p\n", __func__, page); |
| 534 | return page; |
| 535 | } |
Sandeep Patil | 716306e | 2019-09-13 14:50:38 -0700 | [diff] [blame] | 536 | EXPORT_SYMBOL_GPL(cma_alloc); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 537 | |
| 538 | /** |
| 539 | * cma_release() - release allocated pages |
| 540 | * @cma: Contiguous memory region for which the allocation is performed. |
| 541 | * @pages: Allocated pages. |
| 542 | * @count: Number of allocated pages. |
| 543 | * |
Ryohei Suzuki | 929f92f | 2019-07-16 16:26:00 -0700 | [diff] [blame] | 544 | * This function releases memory allocated by cma_alloc(). |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 545 | * It returns false when provided pages do not belong to contiguous area and |
| 546 | * true otherwise. |
| 547 | */ |
Sasha Levin | ac17382 | 2015-04-14 15:47:04 -0700 | [diff] [blame] | 548 | bool cma_release(struct cma *cma, const struct page *pages, unsigned int count) |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 549 | { |
| 550 | unsigned long pfn; |
| 551 | |
| 552 | if (!cma || !pages) |
| 553 | return false; |
| 554 | |
Charan Teja Reddy | bfb68bd | 2020-12-14 19:13:26 -0800 | [diff] [blame] | 555 | pr_debug("%s(page %p, count %u)\n", __func__, (void *)pages, count); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 556 | |
| 557 | pfn = page_to_pfn(pages); |
| 558 | |
| 559 | if (pfn < cma->base_pfn || pfn >= cma->base_pfn + cma->count) |
| 560 | return false; |
| 561 | |
| 562 | VM_BUG_ON(pfn + count > cma->base_pfn + cma->count); |
| 563 | |
| 564 | free_contig_range(pfn, count); |
| 565 | cma_clear_bitmap(cma, pfn, count); |
Stefan Strogin | 99e8ea6 | 2015-04-15 16:14:50 -0700 | [diff] [blame] | 566 | trace_cma_release(pfn, pages, count); |
Joonsoo Kim | a254129 | 2014-08-06 16:05:25 -0700 | [diff] [blame] | 567 | |
| 568 | return true; |
| 569 | } |
Sandeep Patil | 716306e | 2019-09-13 14:50:38 -0700 | [diff] [blame] | 570 | EXPORT_SYMBOL_GPL(cma_release); |
Laura Abbott | e4231bc | 2017-04-18 11:27:04 -0700 | [diff] [blame] | 571 | |
| 572 | int cma_for_each_area(int (*it)(struct cma *cma, void *data), void *data) |
| 573 | { |
| 574 | int i; |
| 575 | |
| 576 | for (i = 0; i < cma_area_count; i++) { |
| 577 | int ret = it(&cma_areas[i], data); |
| 578 | |
| 579 | if (ret) |
| 580 | return ret; |
| 581 | } |
| 582 | |
| 583 | return 0; |
| 584 | } |
Sandeep Patil | 716306e | 2019-09-13 14:50:38 -0700 | [diff] [blame] | 585 | EXPORT_SYMBOL_GPL(cma_for_each_area); |