/* SPDX-License-Identifier: GPL-2.0 */
#ifndef _LINUX_MIGRATE_H
#define _LINUX_MIGRATE_H

#include <linux/mm.h>
#include <linux/mempolicy.h>
#include <linux/migrate_mode.h>
#include <linux/hugetlb.h>

typedef struct page *new_page_t(struct page *page, unsigned long private,
				int **reason);
typedef void free_page_t(struct page *page, unsigned long private);

/*
 * Return values from address_space_operations.migratepage():
 *   - negative errno on page migration failure;
 *   - zero on page migration success;
 */
#define MIGRATEPAGE_SUCCESS		0

enum migrate_reason {
	MR_COMPACTION,
	MR_MEMORY_FAILURE,
	MR_MEMORY_HOTPLUG,
	MR_SYSCALL,		/* also applies to cpusets */
	MR_MEMPOLICY_MBIND,
	MR_NUMA_MISPLACED,
	MR_CMA,
	MR_TYPES
};

/* In mm/debug.c; also keep in sync with include/trace/events/migrate.h */
extern char *migrate_reason_names[MR_TYPES];

static inline struct page *new_page_nodemask(struct page *page,
				int preferred_nid, nodemask_t *nodemask)
{
	gfp_t gfp_mask = GFP_USER | __GFP_MOVABLE | __GFP_RETRY_MAYFAIL;
	unsigned int order = 0;
	struct page *new_page = NULL;

	if (PageHuge(page))
		return alloc_huge_page_nodemask(page_hstate(compound_head(page)),
				preferred_nid, nodemask);

	if (thp_migration_supported() && PageTransHuge(page)) {
		order = HPAGE_PMD_ORDER;
		gfp_mask |= GFP_TRANSHUGE;
	}

	if (PageHighMem(page) || (zone_idx(page_zone(page)) == ZONE_MOVABLE))
		gfp_mask |= __GFP_HIGHMEM;

	new_page = __alloc_pages_nodemask(gfp_mask, order,
				preferred_nid, nodemask);

	if (new_page && PageTransHuge(page))
		prep_transhuge_page(new_page);

	return new_page;
}

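/*
 * Illustrative only (a simplified sketch, not a required calling convention):
 * callers such as memory offlining typically build a nodemask and ask
 * new_page_nodemask() for a replacement page near the original, e.g.
 *
 *	nodemask_t nmask = node_states[N_MEMORY];
 *
 *	new = new_page_nodemask(page, page_to_nid(page), &nmask);
 */
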
#ifdef CONFIG_MIGRATION

extern void putback_movable_pages(struct list_head *l);
extern int migrate_page(struct address_space *mapping,
			struct page *newpage, struct page *page,
			enum migrate_mode mode);
extern int migrate_pages(struct list_head *l, new_page_t new, free_page_t free,
		unsigned long private, enum migrate_mode mode, int reason);
extern int isolate_movable_page(struct page *page, isolate_mode_t mode);
extern void putback_movable_page(struct page *page);

extern int migrate_prep(void);
extern int migrate_prep_local(void);
extern void migrate_page_states(struct page *newpage, struct page *page);
extern void migrate_page_copy(struct page *newpage, struct page *page);
extern int migrate_huge_page_move_mapping(struct address_space *mapping,
				  struct page *newpage, struct page *page);
extern int migrate_page_move_mapping(struct address_space *mapping,
		struct page *newpage, struct page *page,
		struct buffer_head *head, enum migrate_mode mode,
		int extra_count);
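
/*
 * Illustrative only: a filesystem whose pages carry no private state can
 * usually point its address_space_operations at the generic migrate_page()
 * helper directly (example_aops is a hypothetical name), e.g.
 *
 *	static const struct address_space_operations example_aops = {
 *		.migratepage	= migrate_page,
 *	};
 */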
#else

static inline void putback_movable_pages(struct list_head *l) {}
static inline int migrate_pages(struct list_head *l, new_page_t new,
		free_page_t free, unsigned long private, enum migrate_mode mode,
		int reason)
	{ return -ENOSYS; }
static inline int isolate_movable_page(struct page *page, isolate_mode_t mode)
	{ return -EBUSY; }

static inline int migrate_prep(void) { return -ENOSYS; }
static inline int migrate_prep_local(void) { return -ENOSYS; }

static inline void migrate_page_states(struct page *newpage, struct page *page)
{
}

static inline void migrate_page_copy(struct page *newpage,
				     struct page *page) {}

static inline int migrate_huge_page_move_mapping(struct address_space *mapping,
				  struct page *newpage, struct page *page)
{
	return -ENOSYS;
}

#endif /* CONFIG_MIGRATION */

#ifdef CONFIG_COMPACTION
extern int PageMovable(struct page *page);
extern void __SetPageMovable(struct page *page, struct address_space *mapping);
extern void __ClearPageMovable(struct page *page);
#else
static inline int PageMovable(struct page *page) { return 0; }
static inline void __SetPageMovable(struct page *page,
				struct address_space *mapping)
{
}
static inline void __ClearPageMovable(struct page *page)
{
}
#endif

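/*
 * Illustrative only (a sketch of the non-LRU movable page convention, with a
 * hypothetical "mapping" whose a_ops provide isolate_page/migratepage/
 * putback_page): a driver typically tags such pages under the page lock, e.g.
 *
 *	lock_page(page);
 *	__SetPageMovable(page, mapping);
 *	unlock_page(page);
 */
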
#ifdef CONFIG_NUMA_BALANCING
extern bool pmd_trans_migrating(pmd_t pmd);
extern int migrate_misplaced_page(struct page *page,
				  struct vm_area_struct *vma, int node);
#else
static inline bool pmd_trans_migrating(pmd_t pmd)
{
	return false;
}
static inline int migrate_misplaced_page(struct page *page,
					 struct vm_area_struct *vma, int node)
{
	return -EAGAIN; /* can't migrate now */
}
#endif /* CONFIG_NUMA_BALANCING */

#if defined(CONFIG_NUMA_BALANCING) && defined(CONFIG_TRANSPARENT_HUGEPAGE)
extern int migrate_misplaced_transhuge_page(struct mm_struct *mm,
			struct vm_area_struct *vma,
			pmd_t *pmd, pmd_t entry,
			unsigned long address,
			struct page *page, int node);
#else
static inline int migrate_misplaced_transhuge_page(struct mm_struct *mm,
			struct vm_area_struct *vma,
			pmd_t *pmd, pmd_t entry,
			unsigned long address,
			struct page *page, int node)
{
	return -EAGAIN;
}
#endif /* CONFIG_NUMA_BALANCING && CONFIG_TRANSPARENT_HUGEPAGE */

#ifdef CONFIG_MIGRATION

/*
 * Watch out for PAE architectures, where an unsigned long might not have
 * enough bits to store both the physical address and the flags. So far we
 * have enough room for all our flags.
 */
#define MIGRATE_PFN_VALID	(1UL << 0)
#define MIGRATE_PFN_MIGRATE	(1UL << 1)
#define MIGRATE_PFN_LOCKED	(1UL << 2)
#define MIGRATE_PFN_WRITE	(1UL << 3)
#define MIGRATE_PFN_DEVICE	(1UL << 4)
#define MIGRATE_PFN_ERROR	(1UL << 5)
#define MIGRATE_PFN_SHIFT	6

static inline struct page *migrate_pfn_to_page(unsigned long mpfn)
{
	if (!(mpfn & MIGRATE_PFN_VALID))
		return NULL;
	return pfn_to_page(mpfn >> MIGRATE_PFN_SHIFT);
}

static inline unsigned long migrate_pfn(unsigned long pfn)
{
	return (pfn << MIGRATE_PFN_SHIFT) | MIGRATE_PFN_VALID;
}

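/*
 * Illustrative only (a minimal sketch, not required by the API): an entry in
 * the src/dst arrays packs the pfn above MIGRATE_PFN_SHIFT and keeps the low
 * bits for flags, so building and decoding an entry looks like
 *
 *	unsigned long mpfn = migrate_pfn(page_to_pfn(page)) |
 *			     MIGRATE_PFN_MIGRATE;
 *	struct page *p = migrate_pfn_to_page(mpfn);
 *
 * where p is the original page again, and migrate_pfn_to_page() returns NULL
 * for entries without MIGRATE_PFN_VALID set.
 */
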
/*
 * struct migrate_vma_ops - migrate operation callbacks
 *
 * @alloc_and_copy: allocate destination memory and copy source memory to it
 * @finalize_and_map: allow the caller to map the successfully migrated pages
 *
 *
 * The alloc_and_copy() callback happens once all source pages have been
 * locked, unmapped and checked (checked whether pinned or not). All pages
 * that can be migrated will have an entry in the src array set with the pfn
 * value of the page and with the MIGRATE_PFN_VALID and MIGRATE_PFN_MIGRATE
 * flags set (other flags might be set but should be ignored by the callback).
 *
 * The alloc_and_copy() callback can then allocate destination memory and
 * copy source memory to it for all those entries (ie the ones with both
 * MIGRATE_PFN_VALID and MIGRATE_PFN_MIGRATE set). Once these are allocated
 * and copied, the callback must update each corresponding entry in the dst
 * array with the pfn value of the destination page and with the
 * MIGRATE_PFN_VALID and MIGRATE_PFN_LOCKED flags set (destination pages must
 * have their struct pages locked, via lock_page()).
 *
 * At this point the alloc_and_copy() callback is done and returns.
 *
 * Note that the callback does not have to migrate all the pages that are
 * marked with the MIGRATE_PFN_MIGRATE flag in the src array, unless this is
 * a migration from device memory to system memory (ie the MIGRATE_PFN_DEVICE
 * flag is also set in the src array entry). If the device driver cannot
 * migrate a device page back to system memory, then it must set the
 * corresponding dst array entry to MIGRATE_PFN_ERROR. This will trigger a
 * SIGBUS if the CPU tries to access any of the virtual addresses originally
 * backed by this page. Because a SIGBUS is such a severe result for the
 * userspace process, the device driver should avoid setting
 * MIGRATE_PFN_ERROR unless it is really in an unrecoverable state.
 *
 * For empty entries in the CPU page table (ie pte_none() or pmd_none() is
 * true) we do set the MIGRATE_PFN_MIGRATE flag in the corresponding src
 * array entry, thus allowing the device driver to allocate device memory for
 * those unbacked virtual addresses. For this the device driver simply has to
 * allocate device memory and properly set the destination entry just like
 * for regular migration. Note that this can still fail, so the device driver
 * must check whether the migration was successful for those entries inside
 * the finalize_and_map() callback, just like for regular migration.
 *
 * THE alloc_and_copy() CALLBACK MUST NOT CHANGE ANY OF THE SRC ARRAY ENTRIES
 * OR BAD THINGS WILL HAPPEN !
 *
 *
 * The finalize_and_map() callback happens after struct page migration from
 * source to destination (destination struct pages are the struct pages for
 * the memory allocated by the alloc_and_copy() callback). Migration can
 * fail, and thus the finalize_and_map() callback allows the driver to
 * inspect which pages were successfully migrated, and which were not.
 * Successfully migrated pages will have the MIGRATE_PFN_MIGRATE flag set for
 * their src array entry.
 *
 * It is safe to update the device page table from within the
 * finalize_and_map() callback because both destination and source pages are
 * still locked, and the mmap_sem is held in read mode (hence no one can
 * unmap the range being migrated).
 *
 * Once the callback is done cleaning up and updating its page table (if it
 * chose to do so; this is not an obligation), it returns. At this point, the
 * HMM core will finish up the final steps, and the migration is complete.
 *
 * THE finalize_and_map() CALLBACK MUST NOT CHANGE ANY OF THE SRC OR DST
 * ARRAY ENTRIES OR BAD THINGS WILL HAPPEN !
 */
struct migrate_vma_ops {
	void (*alloc_and_copy)(struct vm_area_struct *vma,
			       const unsigned long *src,
			       unsigned long *dst,
			       unsigned long start,
			       unsigned long end,
			       void *private);
	void (*finalize_and_map)(struct vm_area_struct *vma,
				 const unsigned long *src,
				 const unsigned long *dst,
				 unsigned long start,
				 unsigned long end,
				 void *private);
};

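/*
 * Illustrative only: a minimal sketch of how a driver might wire these
 * callbacks up, assuming the hypothetical example_* names below and a
 * destination in ordinary system memory (real drivers typically allocate
 * device memory instead). Destination slots left at 0 simply mean "not
 * migrated"; in finalize_and_map() the driver would update its device page
 * table for entries whose src slot still has MIGRATE_PFN_MIGRATE set, which
 * the empty stub below leaves out.
 *
 *	static void example_alloc_and_copy(struct vm_area_struct *vma,
 *			const unsigned long *src, unsigned long *dst,
 *			unsigned long start, unsigned long end, void *private)
 *	{
 *		unsigned long addr, i;
 *
 *		for (i = 0, addr = start; addr < end; i++, addr += PAGE_SIZE) {
 *			struct page *spage = migrate_pfn_to_page(src[i]);
 *			struct page *dpage;
 *
 *			if (!(src[i] & MIGRATE_PFN_MIGRATE))
 *				continue;
 *			dpage = alloc_page_vma(GFP_HIGHUSER_MOVABLE, vma, addr);
 *			if (!dpage)
 *				continue;
 *			lock_page(dpage);
 *			if (spage)
 *				copy_highpage(dpage, spage);
 *			dst[i] = migrate_pfn(page_to_pfn(dpage)) |
 *				 MIGRATE_PFN_LOCKED;
 *		}
 *	}
 *
 *	static void example_finalize_and_map(struct vm_area_struct *vma,
 *			const unsigned long *src, const unsigned long *dst,
 *			unsigned long start, unsigned long end, void *private)
 *	{
 *	}
 *
 *	static const struct migrate_vma_ops example_ops = {
 *		.alloc_and_copy		= example_alloc_and_copy,
 *		.finalize_and_map	= example_finalize_and_map,
 *	};
 *
 *	ret = migrate_vma(&example_ops, vma, start, end, src, dst, NULL);
 */
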
#if defined(CONFIG_MIGRATE_VMA_HELPER)
int migrate_vma(const struct migrate_vma_ops *ops,
		struct vm_area_struct *vma,
		unsigned long start,
		unsigned long end,
		unsigned long *src,
		unsigned long *dst,
		void *private);
#else
static inline int migrate_vma(const struct migrate_vma_ops *ops,
			      struct vm_area_struct *vma,
			      unsigned long start,
			      unsigned long end,
			      unsigned long *src,
			      unsigned long *dst,
			      void *private)
{
	return -EINVAL;
}
#endif /* CONFIG_MIGRATE_VMA_HELPER */

#endif /* CONFIG_MIGRATION */

#endif /* _LINUX_MIGRATE_H */