blob: ad807d5a314109fb813bf911ad9ee882444d7b5b [file] [log] [blame]
Nadav Amit8b4770e2018-06-19 16:00:29 -07001// SPDX-License-Identifier: GPL-2.0
Dmitry Torokhov453dc652010-04-23 13:18:08 -04002/*
3 * VMware Balloon driver.
4 *
Nadav Amit8b4770e2018-06-19 16:00:29 -07005 * Copyright (C) 2000-2018, VMware, Inc. All Rights Reserved.
Dmitry Torokhov453dc652010-04-23 13:18:08 -04006 *
Dmitry Torokhov453dc652010-04-23 13:18:08 -04007 * This is VMware physical memory management driver for Linux. The driver
8 * acts like a "balloon" that can be inflated to reclaim physical pages by
9 * reserving them in the guest and invalidating them in the monitor,
10 * freeing up the underlying machine pages so they can be allocated to
11 * other guests. The balloon can also be deflated to allow the guest to
12 * use more physical memory. Higher level policies can control the sizes
13 * of balloons in VMs in order to manage physical memory resources.
14 */
15
16//#define DEBUG
17#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
18
19#include <linux/types.h>
20#include <linux/kernel.h>
21#include <linux/mm.h>
Xavier Deguillardf220a802015-08-06 15:17:58 -070022#include <linux/vmalloc.h>
Dmitry Torokhov453dc652010-04-23 13:18:08 -040023#include <linux/sched.h>
24#include <linux/module.h>
25#include <linux/workqueue.h>
26#include <linux/debugfs.h>
27#include <linux/seq_file.h>
Nadav Amitc7b36902018-09-20 10:30:17 -070028#include <linux/rwsem.h>
29#include <linux/slab.h>
Nadav Amit6e4453b2018-09-20 10:30:18 -070030#include <linux/spinlock.h>
Philip P. Moltmann48e3d662015-08-06 15:18:01 -070031#include <linux/vmw_vmci_defs.h>
32#include <linux/vmw_vmci_api.h>
H. Peter Anvina10a5692010-05-09 01:13:42 -070033#include <asm/hypervisor.h>
Dmitry Torokhov453dc652010-04-23 13:18:08 -040034
35MODULE_AUTHOR("VMware, Inc.");
36MODULE_DESCRIPTION("VMware Memory Control (Balloon) Driver");
Dmitry Torokhov453dc652010-04-23 13:18:08 -040037MODULE_ALIAS("dmi:*:svnVMware*:*");
38MODULE_ALIAS("vmware_vmmemctl");
39MODULE_LICENSE("GPL");
40
/*
 * Allocation flags for 2MB (huge) balloon pages.
 *
 * __GFP_HIGHMEM allows pages from the HIGHMEM zone, __GFP_NOWARN suppresses
 * page allocation failure warnings and __GFP_NOMEMALLOC disallows access to
 * the emergency low-memory pools. No __GFP_RECLAIM bit is set: we do not
 * allow waiting for huge page allocations.
 */
#define VMW_HUGE_PAGE_ALLOC_FLAGS	(__GFP_HIGHMEM | __GFP_NOWARN | \
					 __GFP_NOMEMALLOC)

/*
 * Allocation flags for regular (4k) balloon pages.
 *
 * Identical to the huge page flags, with __GFP_NORETRY added so that only
 * lightweight reclamation is attempted.
 */
#define VMW_PAGE_ALLOC_FLAGS		(VMW_HUGE_PAGE_ALLOC_FLAGS | \
					 __GFP_NORETRY)
Dmitry Torokhov453dc652010-04-23 13:18:08 -040056
/* Upper bound on the refused pages accumulated during an inflation cycle */
#define VMW_BALLOON_MAX_REFUSED		16

/*
 * Hypervisor communication definitions: the I/O port through which commands
 * are issued, the magic value that accompanies every command and the guest
 * type identifier reported to the host.
 */
#define VMW_BALLOON_HV_PORT		0x5670
#define VMW_BALLOON_HV_MAGIC		0x456c6d6f
#define VMW_BALLOON_GUEST_ID		1	/* Linux */
66
/*
 * Capability bits exchanged with the hypervisor. Bit 0 is reserved and is not
 * associated with any capability.
 */
enum vmwballoon_capabilities {
	VMW_BALLOON_BASIC_CMDS			= (1 << 1),
	VMW_BALLOON_BATCHED_CMDS		= (1 << 2),
	VMW_BALLOON_BATCHED_2M_CMDS		= (1 << 3),
	VMW_BALLOON_SIGNALLED_WAKEUP_CMD	= (1 << 4),
	VMW_BALLOON_64_BIT_TARGET		= (1 << 5)
};
77
/* Capability bits that do not depend on the word size of the kernel. */
#define VMW_BALLOON_CAPABILITIES_COMMON	(VMW_BALLOON_BASIC_CMDS | \
					 VMW_BALLOON_BATCHED_CMDS | \
					 VMW_BALLOON_BATCHED_2M_CMDS | \
					 VMW_BALLOON_SIGNALLED_WAKEUP_CMD)

/* Allocation order of a 2MB page, expressed in basic pages. */
#define VMW_BALLOON_2M_ORDER		(PMD_SHIFT - PAGE_SHIFT)

/*
 * 64-bit targets are only supported on 64-bit kernels, so the corresponding
 * capability bit is only included there.
 */
#ifdef CONFIG_64BIT
#define VMW_BALLOON_CAPABILITIES	(VMW_BALLOON_CAPABILITIES_COMMON | \
					 VMW_BALLOON_64_BIT_TARGET)
#else
#define VMW_BALLOON_CAPABILITIES	VMW_BALLOON_CAPABILITIES_COMMON
#endif
94
/* Page sizes that the balloon can hold. */
enum vmballoon_page_size_type {
	VMW_BALLOON_4K_PAGE,
	VMW_BALLOON_2M_PAGE,
	VMW_BALLOON_LAST_SIZE = VMW_BALLOON_2M_PAGE
};

/* Number of distinct page sizes; usable as an array dimension. */
#define VMW_BALLOON_NUM_PAGE_SIZES	(VMW_BALLOON_LAST_SIZE + 1)
102
Nadav Amit6e4453b2018-09-20 10:30:18 -0700103static const char * const vmballoon_page_size_names[] = {
104 [VMW_BALLOON_4K_PAGE] = "4k",
105 [VMW_BALLOON_2M_PAGE] = "2M"
106};
107
/*
 * Direction of a balloon operation: inflating is reported to the hypervisor
 * with the lock commands, deflating with the unlock commands.
 */
enum vmballoon_op {
	VMW_BALLOON_INFLATE,
	VMW_BALLOON_DEFLATE
};
112
/*
 * Per-command statistic kinds: the number of times a command was issued and
 * the number of times it failed.
 */
enum vmballoon_op_stat_type {
	VMW_BALLOON_OP_STAT,
	VMW_BALLOON_OP_FAIL_STAT
};

/* Number of per-command statistic kinds; usable as an array dimension. */
#define VMW_BALLOON_OP_STAT_TYPES	(VMW_BALLOON_OP_FAIL_STAT + 1)
119
/**
 * enum vmballoon_cmd_type - backdoor commands.
 *
 * Availability of the commands is as follows:
 *
 * %VMW_BALLOON_CMD_START, %VMW_BALLOON_CMD_GET_TARGET and
 * %VMW_BALLOON_CMD_GUEST_ID are always available.
 *
 * If the host reports %VMW_BALLOON_BASIC_CMDS are supported then
 * %VMW_BALLOON_CMD_LOCK and %VMW_BALLOON_CMD_UNLOCK commands are available.
 *
 * If the host reports %VMW_BALLOON_BATCHED_CMDS are supported then
 * %VMW_BALLOON_CMD_BATCHED_LOCK and %VMW_BALLOON_CMD_BATCHED_UNLOCK commands
 * are available.
 *
 * If the host reports %VMW_BALLOON_BATCHED_2M_CMDS are supported then
 * %VMW_BALLOON_CMD_BATCHED_2M_LOCK and %VMW_BALLOON_CMD_BATCHED_2M_UNLOCK
 * are supported.
 *
 * If the host reports %VMW_BALLOON_SIGNALLED_WAKEUP_CMD is supported then
 * %VMW_BALLOON_CMD_VMCI_DOORBELL_SET command is supported.
 *
 * The numeric values are listed explicitly; note that there is no command 5.
 *
 * @VMW_BALLOON_CMD_START: Communicating supported version with the hypervisor.
 * @VMW_BALLOON_CMD_GET_TARGET: Gets the balloon target size.
 * @VMW_BALLOON_CMD_LOCK: Informs the hypervisor about a ballooned page.
 * @VMW_BALLOON_CMD_UNLOCK: Informs the hypervisor about a page that is about
 *			    to be deflated from the balloon.
 * @VMW_BALLOON_CMD_GUEST_ID: Informs the hypervisor about the type of OS that
 *			      runs in the VM.
 * @VMW_BALLOON_CMD_BATCHED_LOCK: Inform the hypervisor about a batch of
 *				  ballooned pages (up to 512).
 * @VMW_BALLOON_CMD_BATCHED_UNLOCK: Inform the hypervisor about a batch of
 *				    pages that are about to be deflated from
 *				    the balloon (up to 512).
 * @VMW_BALLOON_CMD_BATCHED_2M_LOCK: Similar to @VMW_BALLOON_CMD_BATCHED_LOCK
 *				     for 2MB pages.
 * @VMW_BALLOON_CMD_BATCHED_2M_UNLOCK: Similar to
 *				       @VMW_BALLOON_CMD_BATCHED_UNLOCK for 2MB
 *				       pages.
 * @VMW_BALLOON_CMD_VMCI_DOORBELL_SET: A command to set doorbell notification
 *				       that would be invoked when the balloon
 *				       size changes.
 * @VMW_BALLOON_CMD_LAST: Value of the last command.
 */
enum vmballoon_cmd_type {
	VMW_BALLOON_CMD_START			= 0,
	VMW_BALLOON_CMD_GET_TARGET		= 1,
	VMW_BALLOON_CMD_LOCK			= 2,
	VMW_BALLOON_CMD_UNLOCK			= 3,
	VMW_BALLOON_CMD_GUEST_ID		= 4,
	/* No command 5 */
	VMW_BALLOON_CMD_BATCHED_LOCK		= 6,
	VMW_BALLOON_CMD_BATCHED_UNLOCK		= 7,
	VMW_BALLOON_CMD_BATCHED_2M_LOCK		= 8,
	VMW_BALLOON_CMD_BATCHED_2M_UNLOCK	= 9,
	VMW_BALLOON_CMD_VMCI_DOORBELL_SET	= 10,
	VMW_BALLOON_CMD_LAST = VMW_BALLOON_CMD_VMCI_DOORBELL_SET,
};

/* Size of a table indexed by command number (includes the unused slot 5). */
#define VMW_BALLOON_CMD_NUM	(VMW_BALLOON_CMD_LAST + 1)
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400180
/* Status codes reported by the hypervisor in response to a command. */
enum vmballoon_error_codes {
	VMW_BALLOON_SUCCESS			= 0,
	VMW_BALLOON_ERROR_CMD_INVALID		= 1,
	VMW_BALLOON_ERROR_PPN_INVALID		= 2,
	VMW_BALLOON_ERROR_PPN_LOCKED		= 3,
	VMW_BALLOON_ERROR_PPN_UNLOCKED		= 4,
	VMW_BALLOON_ERROR_PPN_PINNED		= 5,
	VMW_BALLOON_ERROR_PPN_NOTNEEDED		= 6,
	VMW_BALLOON_ERROR_RESET			= 7,
	VMW_BALLOON_ERROR_BUSY			= 8
};

/*
 * Status of a successful "start" command for which the hypervisor also
 * reported its capabilities.
 */
#define VMW_BALLOON_SUCCESS_WITH_CAPABILITIES	(0x03000000)
194
/*
 * Bitmask (indexed by command number) of the commands whose successful
 * completion also reports the balloon target: "get target" and every variant
 * of lock and unlock.
 */
#define VMW_BALLOON_CMD_WITH_TARGET_MASK			\
	((1UL << VMW_BALLOON_CMD_GET_TARGET)		|	\
	 (1UL << VMW_BALLOON_CMD_LOCK)			|	\
	 (1UL << VMW_BALLOON_CMD_BATCHED_LOCK)		|	\
	 (1UL << VMW_BALLOON_CMD_BATCHED_2M_LOCK)	|	\
	 (1UL << VMW_BALLOON_CMD_UNLOCK)		|	\
	 (1UL << VMW_BALLOON_CMD_BATCHED_UNLOCK)	|	\
	 (1UL << VMW_BALLOON_CMD_BATCHED_2M_UNLOCK))
203
Nadav Amit68131182018-09-20 10:30:08 -0700204static const char * const vmballoon_cmd_names[] = {
205 [VMW_BALLOON_CMD_START] = "start",
206 [VMW_BALLOON_CMD_GET_TARGET] = "target",
207 [VMW_BALLOON_CMD_LOCK] = "lock",
208 [VMW_BALLOON_CMD_UNLOCK] = "unlock",
209 [VMW_BALLOON_CMD_GUEST_ID] = "guestType",
210 [VMW_BALLOON_CMD_BATCHED_LOCK] = "batchLock",
211 [VMW_BALLOON_CMD_BATCHED_UNLOCK] = "batchUnlock",
212 [VMW_BALLOON_CMD_BATCHED_2M_LOCK] = "2m-lock",
213 [VMW_BALLOON_CMD_BATCHED_2M_UNLOCK] = "2m-unlock",
214 [VMW_BALLOON_CMD_VMCI_DOORBELL_SET] = "doorbellSet"
215};
216
/* Per-page-size statistics counters. */
enum vmballoon_stat_page {
	VMW_BALLOON_PAGE_STAT_ALLOC,
	VMW_BALLOON_PAGE_STAT_ALLOC_FAIL,
	VMW_BALLOON_PAGE_STAT_REFUSED_ALLOC,
	VMW_BALLOON_PAGE_STAT_REFUSED_FREE,
	VMW_BALLOON_PAGE_STAT_FREE,
	VMW_BALLOON_PAGE_STAT_LAST = VMW_BALLOON_PAGE_STAT_FREE
};

/* Number of per-page-size counters; usable as an array dimension. */
#define VMW_BALLOON_PAGE_STAT_NUM	(VMW_BALLOON_PAGE_STAT_LAST + 1)
227
/* General (not page-size specific) statistics counters. */
enum vmballoon_stat_general {
	VMW_BALLOON_STAT_TIMER,
	VMW_BALLOON_STAT_DOORBELL,
	VMW_BALLOON_STAT_RESET,
	VMW_BALLOON_STAT_LAST = VMW_BALLOON_STAT_RESET
};

/* Number of general counters; usable as an array dimension. */
#define VMW_BALLOON_STAT_NUM	(VMW_BALLOON_STAT_LAST + 1)
236
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400237
/* Selects batching vs. single-page communication; batching by default. */
static DEFINE_STATIC_KEY_TRUE(vmw_balloon_batching);

/* Gates the statistics counters; statistics are off by default. */
static DEFINE_STATIC_KEY_FALSE(balloon_stat_enabled);
Xavier Deguillardf220a802015-08-06 15:17:58 -0700240
Nadav Amit6e4453b2018-09-20 10:30:18 -0700241struct vmballoon_ctl {
242 struct list_head pages;
243 struct list_head refused_pages;
244 unsigned int n_refused_pages;
245 unsigned int n_pages;
246 enum vmballoon_page_size_type page_size;
247 enum vmballoon_op op;
248};
249
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700250struct vmballoon_page_size {
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400251 /* list of reserved physical pages */
252 struct list_head pages;
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700253};
254
Nadav Amit6c948752018-09-20 10:30:10 -0700255/**
256 * struct vmballoon_batch_entry - a batch entry for lock or unlock.
257 *
258 * @status: the status of the operation, which is written by the hypervisor.
259 * @reserved: reserved for future use. Must be set to zero.
260 * @pfn: the physical frame number of the page to be locked or unlocked.
261 */
262struct vmballoon_batch_entry {
263 u64 status : 5;
264 u64 reserved : PAGE_SHIFT - 5;
265 u64 pfn : 52;
266} __packed;
267
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700268struct vmballoon {
269 struct vmballoon_page_size page_sizes[VMW_BALLOON_NUM_PAGE_SIZES];
270
Nadav Amit6e4453b2018-09-20 10:30:18 -0700271 /**
272 * @max_page_size: maximum supported page size for ballooning.
273 *
274 * Protected by @conf_sem
275 */
276 enum vmballoon_page_size_type max_page_size;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400277
Nadav Amit6e4453b2018-09-20 10:30:18 -0700278 /**
279 * @size: balloon actual size in basic page size (frames).
280 *
281 * While we currently do not support size which is bigger than 32-bit,
282 * in preparation for future support, use 64-bits.
283 */
284 atomic64_t size;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400285
Nadav Amit6e4453b2018-09-20 10:30:18 -0700286 /**
287 * @target: balloon target size in basic page size (frames).
288 *
289 * We do not protect the target under the assumption that setting the
290 * value is always done through a single write. If this assumption ever
291 * breaks, we would have to use X_ONCE for accesses, and suffer the less
292 * optimized code. Although we may read stale target value if multiple
293 * accesses happen at once, the performance impact should be minor.
294 */
295 unsigned long target;
296
297 /**
298 * @reset_required: reset flag
299 *
300 * Setting this flag may introduce races, but the code is expected to
301 * handle them gracefully. In the worst case, another operation will
302 * fail as reset did not take place. Clearing the flag is done while
303 * holding @conf_sem for write.
304 */
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400305 bool reset_required;
306
Nadav Amit6e4453b2018-09-20 10:30:18 -0700307 /**
308 * @capabilities: hypervisor balloon capabilities.
309 *
310 * Protected by @conf_sem.
311 */
Xavier Deguillardf220a802015-08-06 15:17:58 -0700312 unsigned long capabilities;
313
Nadav Amit6c948752018-09-20 10:30:10 -0700314 /**
315 * @batch_page: pointer to communication batch page.
316 *
317 * When batching is used, batch_page points to a page, which holds up to
318 * %VMW_BALLOON_BATCH_MAX_PAGES entries for locking or unlocking.
319 */
320 struct vmballoon_batch_entry *batch_page;
321
Nadav Amit6e4453b2018-09-20 10:30:18 -0700322 /**
323 * @batch_max_pages: maximum pages that can be locked/unlocked.
324 *
325 * Indicates the number of pages that the hypervisor can lock or unlock
326 * at once, according to whether batching is enabled. If batching is
327 * disabled, only a single page can be locked/unlock on each operation.
328 *
329 * Protected by @conf_sem.
330 */
Xavier Deguillardf220a802015-08-06 15:17:58 -0700331 unsigned int batch_max_pages;
Nadav Amit6e4453b2018-09-20 10:30:18 -0700332
333 /**
334 * @page: page to be locked/unlocked by the hypervisor
335 *
336 * @page is only used when batching is disabled and a single page is
337 * reclaimed on each iteration.
338 *
339 * Protected by @comm_lock.
340 */
Xavier Deguillardf220a802015-08-06 15:17:58 -0700341 struct page *page;
342
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400343 /* statistics */
Nadav Amitc7b36902018-09-20 10:30:17 -0700344 struct vmballoon_stats *stats;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400345
Nadav Amitc7b36902018-09-20 10:30:17 -0700346#ifdef CONFIG_DEBUG_FS
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400347 /* debugfs file exporting statistics */
348 struct dentry *dbg_entry;
349#endif
350
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400351 struct delayed_work dwork;
Philip P. Moltmann48e3d662015-08-06 15:18:01 -0700352
Nadav Amit6e4453b2018-09-20 10:30:18 -0700353 /**
354 * @vmci_doorbell.
355 *
356 * Protected by @conf_sem.
357 */
Philip P. Moltmann48e3d662015-08-06 15:18:01 -0700358 struct vmci_handle vmci_doorbell;
Nadav Amitc7b36902018-09-20 10:30:17 -0700359
360 /**
361 * @conf_sem: semaphore to protect the configuration and the statistics.
362 */
363 struct rw_semaphore conf_sem;
Nadav Amit6e4453b2018-09-20 10:30:18 -0700364
365 /**
366 * @comm_lock: lock to protect the communication with the host.
367 *
368 * Lock ordering: @conf_sem -> @comm_lock .
369 */
370 spinlock_t comm_lock;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400371};
372
373static struct vmballoon balloon;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400374
Nadav Amitc7b36902018-09-20 10:30:17 -0700375struct vmballoon_stats {
376 /* timer / doorbell operations */
377 atomic64_t general_stat[VMW_BALLOON_STAT_NUM];
378
379 /* allocation statistics for huge and small pages */
380 atomic64_t
381 page_stat[VMW_BALLOON_PAGE_STAT_NUM][VMW_BALLOON_NUM_PAGE_SIZES];
382
383 /* Monitor operations: total operations, and failures */
384 atomic64_t ops[VMW_BALLOON_CMD_NUM][VMW_BALLOON_OP_STAT_TYPES];
385};
386
387static inline bool is_vmballoon_stats_on(void)
388{
389 return IS_ENABLED(CONFIG_DEBUG_FS) &&
390 static_branch_unlikely(&balloon_stat_enabled);
391}
392
393static inline void vmballoon_stats_op_inc(struct vmballoon *b, unsigned int op,
394 enum vmballoon_op_stat_type type)
395{
396 if (is_vmballoon_stats_on())
397 atomic64_inc(&b->stats->ops[op][type]);
398}
399
400static inline void vmballoon_stats_gen_inc(struct vmballoon *b,
401 enum vmballoon_stat_general stat)
402{
403 if (is_vmballoon_stats_on())
404 atomic64_inc(&b->stats->general_stat[stat]);
405}
406
407static inline void vmballoon_stats_gen_add(struct vmballoon *b,
408 enum vmballoon_stat_general stat,
409 unsigned int val)
410{
411 if (is_vmballoon_stats_on())
412 atomic64_add(val, &b->stats->general_stat[stat]);
413}
414
415static inline void vmballoon_stats_page_inc(struct vmballoon *b,
416 enum vmballoon_stat_page stat,
Nadav Amit6e4453b2018-09-20 10:30:18 -0700417 enum vmballoon_page_size_type size)
Nadav Amitc7b36902018-09-20 10:30:17 -0700418{
419 if (is_vmballoon_stats_on())
Nadav Amit6e4453b2018-09-20 10:30:18 -0700420 atomic64_inc(&b->stats->page_stat[stat][size]);
421}
422
423static inline void vmballoon_stats_page_add(struct vmballoon *b,
424 enum vmballoon_stat_page stat,
425 enum vmballoon_page_size_type size,
426 unsigned int val)
427{
428 if (is_vmballoon_stats_on())
429 atomic64_add(val, &b->stats->page_stat[stat][size]);
Nadav Amitc7b36902018-09-20 10:30:17 -0700430}
431
Nadav Amit10a95d52018-09-20 10:30:07 -0700432static inline unsigned long
433__vmballoon_cmd(struct vmballoon *b, unsigned long cmd, unsigned long arg1,
434 unsigned long arg2, unsigned long *result)
435{
436 unsigned long status, dummy1, dummy2, dummy3, local_result;
437
Nadav Amitc7b36902018-09-20 10:30:17 -0700438 vmballoon_stats_op_inc(b, cmd, VMW_BALLOON_OP_STAT);
Nadav Amit68131182018-09-20 10:30:08 -0700439
Nadav Amit10a95d52018-09-20 10:30:07 -0700440 asm volatile ("inl %%dx" :
441 "=a"(status),
442 "=c"(dummy1),
443 "=d"(dummy2),
444 "=b"(local_result),
445 "=S"(dummy3) :
446 "0"(VMW_BALLOON_HV_MAGIC),
447 "1"(cmd),
448 "2"(VMW_BALLOON_HV_PORT),
449 "3"(arg1),
450 "4"(arg2) :
451 "memory");
452
453 /* update the result if needed */
454 if (result)
455 *result = (cmd == VMW_BALLOON_CMD_START) ? dummy1 :
456 local_result;
457
458 /* update target when applicable */
459 if (status == VMW_BALLOON_SUCCESS &&
460 ((1ul << cmd) & VMW_BALLOON_CMD_WITH_TARGET_MASK))
Nadav Amit6e4453b2018-09-20 10:30:18 -0700461 WRITE_ONCE(b->target, local_result);
Nadav Amit10a95d52018-09-20 10:30:07 -0700462
Nadav Amit68131182018-09-20 10:30:08 -0700463 if (status != VMW_BALLOON_SUCCESS &&
464 status != VMW_BALLOON_SUCCESS_WITH_CAPABILITIES) {
Nadav Amitc7b36902018-09-20 10:30:17 -0700465 vmballoon_stats_op_inc(b, cmd, VMW_BALLOON_OP_FAIL_STAT);
Nadav Amit68131182018-09-20 10:30:08 -0700466 pr_debug("%s: %s [0x%lx,0x%lx) failed, returned %ld\n",
467 __func__, vmballoon_cmd_names[cmd], arg1, arg2,
468 status);
469 }
470
Nadav Amit10a95d52018-09-20 10:30:07 -0700471 /* mark reset required accordingly */
472 if (status == VMW_BALLOON_ERROR_RESET)
473 b->reset_required = true;
474
475 return status;
476}
477
478static __always_inline unsigned long
479vmballoon_cmd(struct vmballoon *b, unsigned long cmd, unsigned long arg1,
480 unsigned long arg2)
481{
482 unsigned long dummy;
483
484 return __vmballoon_cmd(b, cmd, arg1, arg2, &dummy);
485}
486
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400487/*
488 * Send "start" command to the host, communicating supported version
489 * of the protocol.
490 */
Nadav Amit22d293e2018-09-20 10:30:19 -0700491static int vmballoon_send_start(struct vmballoon *b, unsigned long req_caps)
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400492{
Nadav Amit10a95d52018-09-20 10:30:07 -0700493 unsigned long status, capabilities;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400494
Nadav Amit10a95d52018-09-20 10:30:07 -0700495 status = __vmballoon_cmd(b, VMW_BALLOON_CMD_START, req_caps, 0,
496 &capabilities);
Xavier Deguillardf220a802015-08-06 15:17:58 -0700497
498 switch (status) {
499 case VMW_BALLOON_SUCCESS_WITH_CAPABILITIES:
500 b->capabilities = capabilities;
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700501 break;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700502 case VMW_BALLOON_SUCCESS:
503 b->capabilities = VMW_BALLOON_BASIC_CMDS;
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700504 break;
505 default:
Nadav Amit22d293e2018-09-20 10:30:19 -0700506 return -EIO;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700507 }
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400508
Nadav Amit5081efd2018-06-19 16:00:25 -0700509 /*
510 * 2MB pages are only supported with batching. If batching is for some
511 * reason disabled, do not use 2MB pages, since otherwise the legacy
512 * mechanism is used with 2MB pages, causing a failure.
513 */
Nadav Amit6e4453b2018-09-20 10:30:18 -0700514 b->max_page_size = VMW_BALLOON_4K_PAGE;
Nadav Amit5081efd2018-06-19 16:00:25 -0700515 if ((b->capabilities & VMW_BALLOON_BATCHED_2M_CMDS) &&
516 (b->capabilities & VMW_BALLOON_BATCHED_CMDS))
Nadav Amit6e4453b2018-09-20 10:30:18 -0700517 b->max_page_size = VMW_BALLOON_2M_PAGE;
518
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700519
Nadav Amit22d293e2018-09-20 10:30:19 -0700520 return 0;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400521}
522
Nadav Amit22d293e2018-09-20 10:30:19 -0700523/**
524 * vmballoon_send_guest_id - communicate guest type to the host.
525 *
526 * @b: pointer to the balloon.
527 *
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400528 * Communicate guest type to the host so that it can adjust ballooning
529 * algorithm to the one most appropriate for the guest. This command
530 * is normally issued after sending "start" command and is part of
531 * standard reset sequence.
Nadav Amit22d293e2018-09-20 10:30:19 -0700532 *
533 * Return: zero on success or appropriate error code.
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400534 */
Nadav Amit22d293e2018-09-20 10:30:19 -0700535static int vmballoon_send_guest_id(struct vmballoon *b)
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400536{
Nadav Amit10a95d52018-09-20 10:30:07 -0700537 unsigned long status;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400538
Nadav Amit10a95d52018-09-20 10:30:07 -0700539 status = vmballoon_cmd(b, VMW_BALLOON_CMD_GUEST_ID,
540 VMW_BALLOON_GUEST_ID, 0);
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400541
Nadav Amit22d293e2018-09-20 10:30:19 -0700542 return status == VMW_BALLOON_SUCCESS ? 0 : -EIO;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400543}
544
Nadav Amit6e4453b2018-09-20 10:30:18 -0700545/**
546 * vmballoon_page_order() - return the order of the page
547 * @page_size: the size of the page.
548 *
549 * Return: the allocation order.
550 */
551static inline
552unsigned int vmballoon_page_order(enum vmballoon_page_size_type page_size)
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700553{
Nadav Amit6e4453b2018-09-20 10:30:18 -0700554 return page_size == VMW_BALLOON_2M_PAGE ? VMW_BALLOON_2M_ORDER : 0;
555}
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700556
Nadav Amit6e4453b2018-09-20 10:30:18 -0700557/**
558 * vmballoon_page_in_frames() - returns the number of frames in a page.
559 * @page_size: the size of the page.
560 *
561 * Return: the number of 4k frames.
562 */
563static inline unsigned int
564vmballoon_page_in_frames(enum vmballoon_page_size_type page_size)
565{
566 return 1 << vmballoon_page_order(page_size);
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700567}
568
Nadav Amit0395be32018-09-20 10:30:16 -0700569/**
David Hildenbrand81655402019-03-05 15:42:41 -0800570 * vmballoon_mark_page_offline() - mark a page as offline
571 * @page: pointer for the page.
572 * @page_size: the size of the page.
573 */
574static void
575vmballoon_mark_page_offline(struct page *page,
576 enum vmballoon_page_size_type page_size)
577{
578 int i;
579
580 for (i = 0; i < vmballoon_page_in_frames(page_size); i++)
581 __SetPageOffline(page + i);
582}
583
584/**
585 * vmballoon_mark_page_online() - mark a page as online
586 * @page: pointer for the page.
587 * @page_size: the size of the page.
588 */
589static void
590vmballoon_mark_page_online(struct page *page,
591 enum vmballoon_page_size_type page_size)
592{
593 int i;
594
595 for (i = 0; i < vmballoon_page_in_frames(page_size); i++)
596 __ClearPageOffline(page + i);
597}
598
599/**
Nadav Amit0395be32018-09-20 10:30:16 -0700600 * vmballoon_send_get_target() - Retrieve desired balloon size from the host.
601 *
602 * @b: pointer to the balloon.
603 *
604 * Return: zero on success, EINVAL if limit does not fit in 32-bit, as required
605 * by the host-guest protocol and EIO if an error occurred in communicating with
606 * the host.
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400607 */
Nadav Amit0395be32018-09-20 10:30:16 -0700608static int vmballoon_send_get_target(struct vmballoon *b)
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400609{
610 unsigned long status;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400611 unsigned long limit;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400612
Arun KSca79b0c2018-12-28 00:34:29 -0800613 limit = totalram_pages();
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400614
Xavier Deguillard55398302019-02-06 15:57:02 -0800615 /* Ensure limit fits in 32-bits if 64-bit targets are not supported */
616 if (!(b->capabilities & VMW_BALLOON_64_BIT_TARGET) &&
617 limit != (u32)limit)
Nadav Amit0395be32018-09-20 10:30:16 -0700618 return -EINVAL;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400619
Nadav Amit10a95d52018-09-20 10:30:07 -0700620 status = vmballoon_cmd(b, VMW_BALLOON_CMD_GET_TARGET, limit, 0);
621
Nadav Amit0395be32018-09-20 10:30:16 -0700622 return status == VMW_BALLOON_SUCCESS ? 0 : -EIO;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400623}
624
Nadav Amit6e4453b2018-09-20 10:30:18 -0700625/**
626 * vmballoon_alloc_page_list - allocates a list of pages.
627 *
628 * @b: pointer to the balloon.
629 * @ctl: pointer for the %struct vmballoon_ctl, which defines the operation.
630 * @req_n_pages: the number of requested pages.
631 *
632 * Tries to allocate @req_n_pages. Add them to the list of balloon pages in
633 * @ctl.pages and updates @ctl.n_pages to reflect the number of pages.
634 *
635 * Return: zero on success or error code otherwise.
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400636 */
Nadav Amit6e4453b2018-09-20 10:30:18 -0700637static int vmballoon_alloc_page_list(struct vmballoon *b,
638 struct vmballoon_ctl *ctl,
639 unsigned int req_n_pages)
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400640{
Nadav Amit6e4453b2018-09-20 10:30:18 -0700641 struct page *page;
642 unsigned int i;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400643
Nadav Amit6e4453b2018-09-20 10:30:18 -0700644 for (i = 0; i < req_n_pages; i++) {
645 if (ctl->page_size == VMW_BALLOON_2M_PAGE)
646 page = alloc_pages(VMW_HUGE_PAGE_ALLOC_FLAGS,
647 VMW_BALLOON_2M_ORDER);
648 else
649 page = alloc_page(VMW_PAGE_ALLOC_FLAGS);
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700650
Nadav Amit6e4453b2018-09-20 10:30:18 -0700651 /* Update statistics */
652 vmballoon_stats_page_inc(b, VMW_BALLOON_PAGE_STAT_ALLOC,
653 ctl->page_size);
654
655 if (page) {
David Hildenbrand81655402019-03-05 15:42:41 -0800656 vmballoon_mark_page_offline(page, ctl->page_size);
Nadav Amit6e4453b2018-09-20 10:30:18 -0700657 /* Success. Add the page to the list and continue. */
658 list_add(&page->lru, &ctl->pages);
659 continue;
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700660 }
Nadav Amit6e4453b2018-09-20 10:30:18 -0700661
662 /* Allocation failed. Update statistics and stop. */
663 vmballoon_stats_page_inc(b, VMW_BALLOON_PAGE_STAT_ALLOC_FAIL,
664 ctl->page_size);
665 break;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400666 }
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400667
Nadav Amit6e4453b2018-09-20 10:30:18 -0700668 ctl->n_pages = i;
669
670 return req_n_pages == ctl->n_pages ? 0 : -ENOMEM;
671}
672
673/**
674 * vmballoon_handle_one_result - Handle lock/unlock result for a single page.
675 *
676 * @b: pointer for %struct vmballoon.
677 * @page: pointer for the page whose result should be handled.
678 * @page_size: size of the page.
679 * @status: status of the operation as provided by the hypervisor.
680 */
681static int vmballoon_handle_one_result(struct vmballoon *b, struct page *page,
682 enum vmballoon_page_size_type page_size,
683 unsigned long status)
684{
685 /* On success do nothing. The page is already on the balloon list. */
686 if (likely(status == VMW_BALLOON_SUCCESS))
687 return 0;
688
689 pr_debug("%s: failed comm pfn %lx status %lu page_size %s\n", __func__,
690 page_to_pfn(page), status,
691 vmballoon_page_size_names[page_size]);
692
693 /* Error occurred */
694 vmballoon_stats_page_inc(b, VMW_BALLOON_PAGE_STAT_REFUSED_ALLOC,
695 page_size);
696
697 return -EIO;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400698}
699
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700700/**
701 * vmballoon_status_page - returns the status of (un)lock operation
702 *
703 * @b: pointer to the balloon.
704 * @idx: index for the page for which the operation is performed.
705 * @p: pointer to where the page struct is returned.
706 *
707 * Following a lock or unlock operation, returns the status of the operation for
708 * an individual page. Provides the page that the operation was performed on on
709 * the @page argument.
710 *
711 * Returns: The status of a lock or unlock operation for an individual page.
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400712 */
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700713static unsigned long vmballoon_status_page(struct vmballoon *b, int idx,
714 struct page **p)
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400715{
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700716 if (static_branch_likely(&vmw_balloon_batching)) {
717 /* batching mode */
718 *p = pfn_to_page(b->batch_page[idx].pfn);
719 return b->batch_page[idx].status;
Xavier Deguillardef0f8f12015-06-12 11:43:22 -0700720 }
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400721
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700722 /* non-batching mode */
723 *p = b->page;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400724
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700725 /*
726 * If a failure occurs, the indication will be provided in the status
727 * of the entire operation, which is considered before the individual
728 * page status. So for non-batching mode, the indication is always of
729 * success.
730 */
731 return VMW_BALLOON_SUCCESS;
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400732}
733
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700734/**
735 * vmballoon_lock_op - notifies the host about inflated/deflated pages.
736 * @b: pointer to the balloon.
737 * @num_pages: number of inflated/deflated pages.
Nadav Amit6e4453b2018-09-20 10:30:18 -0700738 * @page_size: size of the page.
739 * @op: the type of operation (lock or unlock).
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700740 *
741 * Notify the host about page(s) that were ballooned (or removed from the
742 * balloon) so that host can use it without fear that guest will need it (or
743 * stop using them since the VM does). Host may reject some pages, we need to
744 * check the return value and maybe submit a different page. The pages that are
745 * inflated/deflated are pointed by @b->page.
746 *
747 * Return: result as provided by the hypervisor.
748 */
749static unsigned long vmballoon_lock_op(struct vmballoon *b,
750 unsigned int num_pages,
Nadav Amit6e4453b2018-09-20 10:30:18 -0700751 enum vmballoon_page_size_type page_size,
752 enum vmballoon_op op)
Xavier Deguillardf220a802015-08-06 15:17:58 -0700753{
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700754 unsigned long cmd, pfn;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700755
Nadav Amit6e4453b2018-09-20 10:30:18 -0700756 lockdep_assert_held(&b->comm_lock);
757
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700758 if (static_branch_likely(&vmw_balloon_batching)) {
Nadav Amit6e4453b2018-09-20 10:30:18 -0700759 if (op == VMW_BALLOON_INFLATE)
760 cmd = page_size == VMW_BALLOON_2M_PAGE ?
761 VMW_BALLOON_CMD_BATCHED_2M_LOCK :
762 VMW_BALLOON_CMD_BATCHED_LOCK;
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700763 else
Nadav Amit6e4453b2018-09-20 10:30:18 -0700764 cmd = page_size == VMW_BALLOON_2M_PAGE ?
765 VMW_BALLOON_CMD_BATCHED_2M_UNLOCK :
766 VMW_BALLOON_CMD_BATCHED_UNLOCK;
Nadav Amit10a95d52018-09-20 10:30:07 -0700767
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700768 pfn = PHYS_PFN(virt_to_phys(b->batch_page));
769 } else {
Nadav Amit6e4453b2018-09-20 10:30:18 -0700770 cmd = op == VMW_BALLOON_INFLATE ? VMW_BALLOON_CMD_LOCK :
771 VMW_BALLOON_CMD_UNLOCK;
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700772 pfn = page_to_pfn(b->page);
Xavier Deguillardf220a802015-08-06 15:17:58 -0700773
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700774 /* In non-batching mode, PFNs must fit in 32-bit */
775 if (unlikely(pfn != (u32)pfn))
776 return VMW_BALLOON_ERROR_PPN_INVALID;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700777 }
778
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700779 return vmballoon_cmd(b, cmd, pfn, num_pages);
780}
781
Nadav Amit6e4453b2018-09-20 10:30:18 -0700782/**
783 * vmballoon_add_page - adds a page towards lock/unlock operation.
784 *
785 * @b: pointer to the balloon.
786 * @idx: index of the page to be ballooned in this batch.
787 * @p: pointer to the page that is about to be ballooned.
788 *
789 * Adds the page to be ballooned. Must be called while holding @comm_lock.
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400790 */
Nadav Amit6e4453b2018-09-20 10:30:18 -0700791static void vmballoon_add_page(struct vmballoon *b, unsigned int idx,
792 struct page *p)
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400793{
Nadav Amit6e4453b2018-09-20 10:30:18 -0700794 lockdep_assert_held(&b->comm_lock);
795
796 if (static_branch_likely(&vmw_balloon_batching))
797 b->batch_page[idx] = (struct vmballoon_batch_entry)
798 { .pfn = page_to_pfn(p) };
799 else
800 b->page = p;
801}
802
803/**
804 * vmballoon_lock - lock or unlock a batch of pages.
805 *
806 * @b: pointer to the balloon.
807 * @ctl: pointer for the %struct vmballoon_ctl, which defines the operation.
808 *
809 * Notifies the host of about ballooned pages (after inflation or deflation,
810 * according to @ctl). If the host rejects the page put it on the
811 * @ctl refuse list. These refused page are then released when moving to the
812 * next size of pages.
813 *
814 * Note that we neither free any @page here nor put them back on the ballooned
815 * pages list. Instead we queue it for later processing. We do that for several
816 * reasons. First, we do not want to free the page under the lock. Second, it
817 * allows us to unify the handling of lock and unlock. In the inflate case, the
818 * caller will check if there are too many refused pages and release them.
819 * Although it is not identical to the past behavior, it should not affect
820 * performance.
821 */
822static int vmballoon_lock(struct vmballoon *b, struct vmballoon_ctl *ctl)
823{
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700824 unsigned long batch_status;
Nadav Amit6e4453b2018-09-20 10:30:18 -0700825 struct page *page;
826 unsigned int i, num_pages;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700827
Nadav Amit6e4453b2018-09-20 10:30:18 -0700828 num_pages = ctl->n_pages;
829 if (num_pages == 0)
830 return 0;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700831
Nadav Amit6e4453b2018-09-20 10:30:18 -0700832 /* communication with the host is done under the communication lock */
833 spin_lock(&b->comm_lock);
834
835 i = 0;
836 list_for_each_entry(page, &ctl->pages, lru)
837 vmballoon_add_page(b, i++, page);
838
839 batch_status = vmballoon_lock_op(b, ctl->n_pages, ctl->page_size,
840 ctl->op);
841
842 /*
843 * Iterate over the pages in the provided list. Since we are changing
844 * @ctl->n_pages we are saving the original value in @num_pages and
845 * use this value to bound the loop.
846 */
Xavier Deguillardf220a802015-08-06 15:17:58 -0700847 for (i = 0; i < num_pages; i++) {
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700848 unsigned long status;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700849
Nadav Amit6e4453b2018-09-20 10:30:18 -0700850 status = vmballoon_status_page(b, i, &page);
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700851
852 /*
853 * Failure of the whole batch overrides a single operation
854 * results.
855 */
856 if (batch_status != VMW_BALLOON_SUCCESS)
857 status = batch_status;
858
Nadav Amit6e4453b2018-09-20 10:30:18 -0700859 /* Continue if no error happened */
860 if (!vmballoon_handle_one_result(b, page, ctl->page_size,
861 status))
862 continue;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700863
Nadav Amit6e4453b2018-09-20 10:30:18 -0700864 /*
865 * Error happened. Move the pages to the refused list and update
866 * the pages number.
867 */
868 list_move(&page->lru, &ctl->refused_pages);
869 ctl->n_pages--;
870 ctl->n_refused_pages++;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700871 }
872
Nadav Amit6e4453b2018-09-20 10:30:18 -0700873 spin_unlock(&b->comm_lock);
874
Nadav Amitdf8d0d42018-09-20 10:30:12 -0700875 return batch_status == VMW_BALLOON_SUCCESS ? 0 : -EIO;
Xavier Deguillardf220a802015-08-06 15:17:58 -0700876}
877
Nadav Amit6e4453b2018-09-20 10:30:18 -0700878/**
879 * vmballoon_release_page_list() - Releases a page list
880 *
881 * @page_list: list of pages to release.
882 * @n_pages: pointer to the number of pages.
883 * @page_size: whether the pages in the list are 2MB (or else 4KB).
884 *
885 * Releases the list of pages and zeros the number of pages.
886 */
887static void vmballoon_release_page_list(struct list_head *page_list,
888 int *n_pages,
889 enum vmballoon_page_size_type page_size)
890{
891 struct page *page, *tmp;
892
893 list_for_each_entry_safe(page, tmp, page_list, lru) {
894 list_del(&page->lru);
David Hildenbrand81655402019-03-05 15:42:41 -0800895 vmballoon_mark_page_online(page, page_size);
Nadav Amit6e4453b2018-09-20 10:30:18 -0700896 __free_pages(page, vmballoon_page_order(page_size));
897 }
898
899 *n_pages = 0;
900}
901
902
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400903/*
904 * Release pages that were allocated while attempting to inflate the
905 * balloon but were refused by the host for one reason or another.
906 */
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -0700907static void vmballoon_release_refused_pages(struct vmballoon *b,
Nadav Amit6e4453b2018-09-20 10:30:18 -0700908 struct vmballoon_ctl *ctl)
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400909{
Nadav Amit6e4453b2018-09-20 10:30:18 -0700910 vmballoon_stats_page_inc(b, VMW_BALLOON_PAGE_STAT_REFUSED_FREE,
911 ctl->page_size);
Dmitry Torokhov453dc652010-04-23 13:18:08 -0400912
Nadav Amit6e4453b2018-09-20 10:30:18 -0700913 vmballoon_release_page_list(&ctl->refused_pages, &ctl->n_refused_pages,
914 ctl->page_size);
Xavier Deguillardf220a802015-08-06 15:17:58 -0700915}
916
Nadav Amit8b079cd2018-09-20 10:30:15 -0700917/**
918 * vmballoon_change - retrieve the required balloon change
919 *
920 * @b: pointer for the balloon.
921 *
922 * Return: the required change for the balloon size. A positive number
923 * indicates inflation, a negative number indicates a deflation.
924 */
925static int64_t vmballoon_change(struct vmballoon *b)
926{
927 int64_t size, target;
928
Nadav Amit6e4453b2018-09-20 10:30:18 -0700929 size = atomic64_read(&b->size);
930 target = READ_ONCE(b->target);
Nadav Amit8b079cd2018-09-20 10:30:15 -0700931
932 /*
933 * We must cast first because of int sizes
934 * Otherwise we might get huge positives instead of negatives
935 */
936
937 if (b->reset_required)
938 return 0;
939
940 /* consider a 2MB slack on deflate, unless the balloon is emptied */
Nadav Amit6e4453b2018-09-20 10:30:18 -0700941 if (target < size && target != 0 &&
942 size - target < vmballoon_page_in_frames(VMW_BALLOON_2M_PAGE))
Nadav Amit8b079cd2018-09-20 10:30:15 -0700943 return 0;
944
945 return target - size;
946}
947
Nadav Amit6e4453b2018-09-20 10:30:18 -0700948/**
949 * vmballoon_enqueue_page_list() - Enqueues list of pages after inflation.
950 *
951 * @b: pointer to balloon.
952 * @pages: list of pages to enqueue.
953 * @n_pages: pointer to number of pages in list. The value is zeroed.
954 * @page_size: whether the pages are 2MB or 4KB pages.
955 *
956 * Enqueues the provides list of pages in the ballooned page list, clears the
957 * list and zeroes the number of pages that was provided.
958 */
959static void vmballoon_enqueue_page_list(struct vmballoon *b,
960 struct list_head *pages,
961 unsigned int *n_pages,
962 enum vmballoon_page_size_type page_size)
963{
964 struct vmballoon_page_size *page_size_info = &b->page_sizes[page_size];
965
966 list_splice_init(pages, &page_size_info->pages);
967 *n_pages = 0;
968}
969
970/**
971 * vmballoon_dequeue_page_list() - Dequeues page lists for deflation.
972 *
973 * @b: pointer to balloon.
974 * @pages: list of pages to enqueue.
975 * @n_pages: pointer to number of pages in list. The value is zeroed.
976 * @page_size: whether the pages are 2MB or 4KB pages.
977 * @n_req_pages: the number of requested pages.
978 *
979 * Dequeues the number of requested pages from the balloon for deflation. The
980 * number of dequeued pages may be lower, if not enough pages in the requested
981 * size are available.
982 */
983static void vmballoon_dequeue_page_list(struct vmballoon *b,
984 struct list_head *pages,
985 unsigned int *n_pages,
986 enum vmballoon_page_size_type page_size,
987 unsigned int n_req_pages)
988{
989 struct vmballoon_page_size *page_size_info = &b->page_sizes[page_size];
990 struct page *page, *tmp;
991 unsigned int i = 0;
992
993 list_for_each_entry_safe(page, tmp, &page_size_info->pages, lru) {
994 list_move(&page->lru, pages);
995 if (++i == n_req_pages)
996 break;
997 }
998 *n_pages = i;
999}
1000
1001/**
1002 * vmballoon_inflate() - Inflate the balloon towards its target size.
1003 *
1004 * @b: pointer to the balloon.
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001005 */
1006static void vmballoon_inflate(struct vmballoon *b)
1007{
Nadav Amit6e4453b2018-09-20 10:30:18 -07001008 int64_t to_inflate_frames;
1009 struct vmballoon_ctl ctl = {
1010 .pages = LIST_HEAD_INIT(ctl.pages),
1011 .refused_pages = LIST_HEAD_INIT(ctl.refused_pages),
1012 .page_size = b->max_page_size,
1013 .op = VMW_BALLOON_INFLATE
1014 };
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001015
Nadav Amit6e4453b2018-09-20 10:30:18 -07001016 while ((to_inflate_frames = vmballoon_change(b)) > 0) {
1017 unsigned int to_inflate_pages, page_in_frames;
1018 int alloc_error, lock_error = 0;
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001019
Nadav Amit6e4453b2018-09-20 10:30:18 -07001020 VM_BUG_ON(!list_empty(&ctl.pages));
1021 VM_BUG_ON(ctl.n_pages != 0);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001022
Nadav Amit6e4453b2018-09-20 10:30:18 -07001023 page_in_frames = vmballoon_page_in_frames(ctl.page_size);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001024
Nadav Amit6e4453b2018-09-20 10:30:18 -07001025 to_inflate_pages = min_t(unsigned long, b->batch_max_pages,
1026 DIV_ROUND_UP_ULL(to_inflate_frames,
1027 page_in_frames));
Nadav Amitc7b36902018-09-20 10:30:17 -07001028
Nadav Amit6e4453b2018-09-20 10:30:18 -07001029 /* Start by allocating */
1030 alloc_error = vmballoon_alloc_page_list(b, &ctl,
1031 to_inflate_pages);
Nadav Amitc7b36902018-09-20 10:30:17 -07001032
Nadav Amit6e4453b2018-09-20 10:30:18 -07001033 /* Actually lock the pages by telling the hypervisor */
1034 lock_error = vmballoon_lock(b, &ctl);
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -07001035
Nadav Amit6e4453b2018-09-20 10:30:18 -07001036 /*
1037 * If an error indicates that something serious went wrong,
1038 * stop the inflation.
1039 */
1040 if (lock_error)
Nadav Amit622074a2018-09-20 10:30:11 -07001041 break;
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001042
Nadav Amit6e4453b2018-09-20 10:30:18 -07001043 /* Update the balloon size */
1044 atomic64_add(ctl.n_pages * page_in_frames, &b->size);
Nadav Amit8fa3c612018-09-20 10:30:13 -07001045
Nadav Amit6e4453b2018-09-20 10:30:18 -07001046 vmballoon_enqueue_page_list(b, &ctl.pages, &ctl.n_pages,
1047 ctl.page_size);
Nadav Amit10a95d52018-09-20 10:30:07 -07001048
Nadav Amit6e4453b2018-09-20 10:30:18 -07001049 /*
1050 * If allocation failed or the number of refused pages exceeds
1051 * the maximum allowed, move to the next page size.
1052 */
1053 if (alloc_error ||
1054 ctl.n_refused_pages >= VMW_BALLOON_MAX_REFUSED) {
1055 if (ctl.page_size == VMW_BALLOON_4K_PAGE)
1056 break;
Nadav Amit8fa3c612018-09-20 10:30:13 -07001057
1058 /*
Nadav Amit6e4453b2018-09-20 10:30:18 -07001059 * Ignore errors from locking as we now switch to 4k
1060 * pages and we might get different errors.
Nadav Amit8fa3c612018-09-20 10:30:13 -07001061 */
Nadav Amit6e4453b2018-09-20 10:30:18 -07001062 vmballoon_release_refused_pages(b, &ctl);
1063 ctl.page_size--;
Xavier Deguillardf220a802015-08-06 15:17:58 -07001064 }
Xavier Deguillardef0f8f12015-06-12 11:43:22 -07001065
Philip P. Moltmann33d268e2015-08-06 15:18:01 -07001066 cond_resched();
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001067 }
1068
Nadav Amit6e4453b2018-09-20 10:30:18 -07001069 /*
1070 * Release pages that were allocated while attempting to inflate the
1071 * balloon but were refused by the host for one reason or another,
1072 * and update the statistics.
1073 */
1074 if (ctl.n_refused_pages != 0)
1075 vmballoon_release_refused_pages(b, &ctl);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001076}
1077
Nadav Amit6e4453b2018-09-20 10:30:18 -07001078/**
1079 * vmballoon_deflate() - Decrease the size of the balloon.
1080 *
1081 * @b: pointer to the balloon
1082 * @n_frames: the number of frames to deflate. If zero, automatically
1083 * calculated according to the target size.
1084 * @coordinated: whether to coordinate with the host
1085 *
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001086 * Decrease the size of the balloon allowing guest to use more memory.
Nadav Amit6e4453b2018-09-20 10:30:18 -07001087 *
1088 * Return: The number of deflated frames (i.e., basic page size units)
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001089 */
Nadav Amit6e4453b2018-09-20 10:30:18 -07001090static unsigned long vmballoon_deflate(struct vmballoon *b, uint64_t n_frames,
1091 bool coordinated)
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001092{
Nadav Amit6e4453b2018-09-20 10:30:18 -07001093 unsigned long deflated_frames = 0;
1094 unsigned long tried_frames = 0;
1095 struct vmballoon_ctl ctl = {
1096 .pages = LIST_HEAD_INIT(ctl.pages),
1097 .refused_pages = LIST_HEAD_INIT(ctl.refused_pages),
1098 .page_size = VMW_BALLOON_4K_PAGE,
1099 .op = VMW_BALLOON_DEFLATE
1100 };
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001101
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001102 /* free pages to reach target */
Nadav Amit6e4453b2018-09-20 10:30:18 -07001103 while (true) {
1104 unsigned int to_deflate_pages, n_unlocked_frames;
1105 unsigned int page_in_frames;
1106 int64_t to_deflate_frames;
1107 bool deflated_all;
Xavier Deguillardf220a802015-08-06 15:17:58 -07001108
Nadav Amit6e4453b2018-09-20 10:30:18 -07001109 page_in_frames = vmballoon_page_in_frames(ctl.page_size);
1110
1111 VM_BUG_ON(!list_empty(&ctl.pages));
1112 VM_BUG_ON(ctl.n_pages);
1113 VM_BUG_ON(!list_empty(&ctl.refused_pages));
1114 VM_BUG_ON(ctl.n_refused_pages);
1115
1116 /*
1117 * If we were requested a specific number of frames, we try to
1118 * deflate this number of frames. Otherwise, deflation is
1119 * performed according to the target and balloon size.
1120 */
1121 to_deflate_frames = n_frames ? n_frames - tried_frames :
1122 -vmballoon_change(b);
1123
1124 /* break if no work to do */
1125 if (to_deflate_frames <= 0)
1126 break;
1127
1128 /*
1129 * Calculate the number of frames based on current page size,
1130 * but limit the deflated frames to a single chunk
1131 */
1132 to_deflate_pages = min_t(unsigned long, b->batch_max_pages,
1133 DIV_ROUND_UP_ULL(to_deflate_frames,
1134 page_in_frames));
1135
1136 /* First take the pages from the balloon pages. */
1137 vmballoon_dequeue_page_list(b, &ctl.pages, &ctl.n_pages,
1138 ctl.page_size, to_deflate_pages);
1139
1140 /*
1141 * Before pages are moving to the refused list, count their
1142 * frames as frames that we tried to deflate.
1143 */
1144 tried_frames += ctl.n_pages * page_in_frames;
1145
1146 /*
1147 * Unlock the pages by communicating with the hypervisor if the
1148 * communication is coordinated (i.e., not pop). We ignore the
1149 * return code. Instead we check if all the pages we manage to
1150 * unlock all the pages. If we failed, we will move to the next
1151 * page size, and would eventually try again later.
1152 */
1153 if (coordinated)
1154 vmballoon_lock(b, &ctl);
1155
1156 /*
1157 * Check if we deflated enough. We will move to the next page
1158 * size if we did not manage to do so. This calculation takes
1159 * place now, as once the pages are released, the number of
1160 * pages is zeroed.
1161 */
1162 deflated_all = (ctl.n_pages == to_deflate_pages);
1163
1164 /* Update local and global counters */
1165 n_unlocked_frames = ctl.n_pages * page_in_frames;
1166 atomic64_sub(n_unlocked_frames, &b->size);
1167 deflated_frames += n_unlocked_frames;
1168
1169 vmballoon_stats_page_add(b, VMW_BALLOON_PAGE_STAT_FREE,
1170 ctl.page_size, ctl.n_pages);
1171
1172 /* free the ballooned pages */
1173 vmballoon_release_page_list(&ctl.pages, &ctl.n_pages,
1174 ctl.page_size);
1175
1176 /* Return the refused pages to the ballooned list. */
1177 vmballoon_enqueue_page_list(b, &ctl.refused_pages,
1178 &ctl.n_refused_pages,
1179 ctl.page_size);
1180
1181 /* If we failed to unlock all the pages, move to next size. */
1182 if (!deflated_all) {
1183 if (ctl.page_size == b->max_page_size)
Philip P. Moltmann365bd7e2015-08-06 15:18:01 -07001184 break;
Nadav Amit6e4453b2018-09-20 10:30:18 -07001185 ctl.page_size++;
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001186 }
1187
Nadav Amit6e4453b2018-09-20 10:30:18 -07001188 cond_resched();
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001189 }
Nadav Amit6e4453b2018-09-20 10:30:18 -07001190
1191 return deflated_frames;
Xavier Deguillardf220a802015-08-06 15:17:58 -07001192}
1193
Nadav Amitdf8d0d42018-09-20 10:30:12 -07001194/**
1195 * vmballoon_deinit_batching - disables batching mode.
1196 *
1197 * @b: pointer to &struct vmballoon.
1198 *
1199 * Disables batching, by deallocating the page for communication with the
1200 * hypervisor and disabling the static key to indicate that batching is off.
1201 */
1202static void vmballoon_deinit_batching(struct vmballoon *b)
1203{
1204 free_page((unsigned long)b->batch_page);
1205 b->batch_page = NULL;
1206 static_branch_disable(&vmw_balloon_batching);
1207 b->batch_max_pages = 1;
1208}
Xavier Deguillardf220a802015-08-06 15:17:58 -07001209
Nadav Amitdf8d0d42018-09-20 10:30:12 -07001210/**
1211 * vmballoon_init_batching - enable batching mode.
1212 *
1213 * @b: pointer to &struct vmballoon.
1214 *
1215 * Enables batching, by allocating a page for communication with the hypervisor
1216 * and enabling the static_key to use batching.
1217 *
1218 * Return: zero on success or an appropriate error-code.
1219 */
1220static int vmballoon_init_batching(struct vmballoon *b)
Xavier Deguillardf220a802015-08-06 15:17:58 -07001221{
Gil Kupferb23220f2018-06-01 00:47:47 -07001222 struct page *page;
1223
1224 page = alloc_page(GFP_KERNEL | __GFP_ZERO);
1225 if (!page)
Nadav Amitdf8d0d42018-09-20 10:30:12 -07001226 return -ENOMEM;
Xavier Deguillardf220a802015-08-06 15:17:58 -07001227
Gil Kupferb23220f2018-06-01 00:47:47 -07001228 b->batch_page = page_address(page);
Nadav Amitdf8d0d42018-09-20 10:30:12 -07001229 b->batch_max_pages = PAGE_SIZE / sizeof(struct vmballoon_batch_entry);
1230
1231 static_branch_enable(&vmw_balloon_batching);
1232
1233 return 0;
Xavier Deguillardf220a802015-08-06 15:17:58 -07001234}
1235
1236/*
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001237 * Receive notification and resize balloon
1238 */
1239static void vmballoon_doorbell(void *client_data)
1240{
1241 struct vmballoon *b = client_data;
1242
Nadav Amitc7b36902018-09-20 10:30:17 -07001243 vmballoon_stats_gen_inc(b, VMW_BALLOON_STAT_DOORBELL);
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001244
1245 mod_delayed_work(system_freezable_wq, &b->dwork, 0);
1246}
1247
1248/*
1249 * Clean up vmci doorbell
1250 */
1251static void vmballoon_vmci_cleanup(struct vmballoon *b)
1252{
Nadav Amit10a95d52018-09-20 10:30:07 -07001253 vmballoon_cmd(b, VMW_BALLOON_CMD_VMCI_DOORBELL_SET,
1254 VMCI_INVALID_ID, VMCI_INVALID_ID);
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001255
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001256 if (!vmci_handle_is_invalid(b->vmci_doorbell)) {
1257 vmci_doorbell_destroy(b->vmci_doorbell);
1258 b->vmci_doorbell = VMCI_INVALID_HANDLE;
1259 }
1260}
1261
Nadav Amit22d293e2018-09-20 10:30:19 -07001262/**
1263 * vmballoon_vmci_init - Initialize vmci doorbell.
1264 *
1265 * @b: pointer to the balloon.
1266 *
1267 * Return: zero on success or when wakeup command not supported. Error-code
1268 * otherwise.
1269 *
1270 * Initialize vmci doorbell, to get notified as soon as balloon changes.
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001271 */
1272static int vmballoon_vmci_init(struct vmballoon *b)
1273{
Nadav Amit10a95d52018-09-20 10:30:07 -07001274 unsigned long error;
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001275
Nadav Amitce664332018-06-19 16:00:26 -07001276 if ((b->capabilities & VMW_BALLOON_SIGNALLED_WAKEUP_CMD) == 0)
1277 return 0;
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001278
Nadav Amitce664332018-06-19 16:00:26 -07001279 error = vmci_doorbell_create(&b->vmci_doorbell, VMCI_FLAG_DELAYED_CB,
1280 VMCI_PRIVILEGE_FLAG_RESTRICTED,
1281 vmballoon_doorbell, b);
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001282
Nadav Amitce664332018-06-19 16:00:26 -07001283 if (error != VMCI_SUCCESS)
1284 goto fail;
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001285
Nadav Amit10a95d52018-09-20 10:30:07 -07001286 error = __vmballoon_cmd(b, VMW_BALLOON_CMD_VMCI_DOORBELL_SET,
1287 b->vmci_doorbell.context,
1288 b->vmci_doorbell.resource, NULL);
Nadav Amitce664332018-06-19 16:00:26 -07001289
Nadav Amitce664332018-06-19 16:00:26 -07001290 if (error != VMW_BALLOON_SUCCESS)
1291 goto fail;
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001292
1293 return 0;
Nadav Amitce664332018-06-19 16:00:26 -07001294fail:
1295 vmballoon_vmci_cleanup(b);
1296 return -EIO;
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001297}
1298
Nadav Amit6e4453b2018-09-20 10:30:18 -07001299/**
1300 * vmballoon_pop - Quickly release all pages allocate for the balloon.
1301 *
1302 * @b: pointer to the balloon.
1303 *
1304 * This function is called when host decides to "reset" balloon for one reason
1305 * or another. Unlike normal "deflate" we do not (shall not) notify host of the
1306 * pages being released.
1307 */
1308static void vmballoon_pop(struct vmballoon *b)
1309{
1310 unsigned long size;
1311
1312 while ((size = atomic64_read(&b->size)))
1313 vmballoon_deflate(b, size, false);
1314}
1315
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001316/*
Xavier Deguillardf220a802015-08-06 15:17:58 -07001317 * Perform standard reset sequence by popping the balloon (in case it
1318 * is not empty) and then restarting protocol. This operation normally
1319 * happens when host responds with VMW_BALLOON_ERROR_RESET to a command.
1320 */
1321static void vmballoon_reset(struct vmballoon *b)
1322{
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001323 int error;
1324
Nadav Amitc7b36902018-09-20 10:30:17 -07001325 down_write(&b->conf_sem);
1326
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001327 vmballoon_vmci_cleanup(b);
1328
Xavier Deguillardf220a802015-08-06 15:17:58 -07001329 /* free all pages, skipping monitor unlock */
1330 vmballoon_pop(b);
1331
Nadav Amit22d293e2018-09-20 10:30:19 -07001332 if (vmballoon_send_start(b, VMW_BALLOON_CAPABILITIES))
Dan Carpenterd04071a2019-02-11 21:45:45 +03001333 goto unlock;
Xavier Deguillardf220a802015-08-06 15:17:58 -07001334
1335 if ((b->capabilities & VMW_BALLOON_BATCHED_CMDS) != 0) {
Nadav Amitdf8d0d42018-09-20 10:30:12 -07001336 if (vmballoon_init_batching(b)) {
Xavier Deguillardf220a802015-08-06 15:17:58 -07001337 /*
1338 * We failed to initialize batching, inform the monitor
1339 * about it by sending a null capability.
1340 *
1341 * The guest will retry in one second.
1342 */
1343 vmballoon_send_start(b, 0);
Dan Carpenterd04071a2019-02-11 21:45:45 +03001344 goto unlock;
Xavier Deguillardf220a802015-08-06 15:17:58 -07001345 }
1346 } else if ((b->capabilities & VMW_BALLOON_BASIC_CMDS) != 0) {
Nadav Amitdf8d0d42018-09-20 10:30:12 -07001347 vmballoon_deinit_batching(b);
Xavier Deguillardf220a802015-08-06 15:17:58 -07001348 }
1349
Nadav Amit8840a6f2018-09-20 10:30:20 -07001350 vmballoon_stats_gen_inc(b, VMW_BALLOON_STAT_RESET);
Xavier Deguillardf220a802015-08-06 15:17:58 -07001351 b->reset_required = false;
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001352
1353 error = vmballoon_vmci_init(b);
1354 if (error)
1355 pr_err("failed to initialize vmci doorbell\n");
1356
Nadav Amit22d293e2018-09-20 10:30:19 -07001357 if (vmballoon_send_guest_id(b))
Xavier Deguillardf220a802015-08-06 15:17:58 -07001358 pr_err("failed to send guest ID to the host\n");
Nadav Amitc7b36902018-09-20 10:30:17 -07001359
Dan Carpenterd04071a2019-02-11 21:45:45 +03001360unlock:
Nadav Amitc7b36902018-09-20 10:30:17 -07001361 up_write(&b->conf_sem);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001362}
1363
Nadav Amit8b079cd2018-09-20 10:30:15 -07001364/**
1365 * vmballoon_work - periodic balloon worker for reset, inflation and deflation.
1366 *
1367 * @work: pointer to the &work_struct which is provided by the workqueue.
1368 *
1369 * Resets the protocol if needed, gets the new size and adjusts balloon as
1370 * needed. Repeat in 1 sec.
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001371 */
1372static void vmballoon_work(struct work_struct *work)
1373{
1374 struct delayed_work *dwork = to_delayed_work(work);
1375 struct vmballoon *b = container_of(dwork, struct vmballoon, dwork);
Nadav Amit8b079cd2018-09-20 10:30:15 -07001376 int64_t change = 0;
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001377
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001378 if (b->reset_required)
1379 vmballoon_reset(b);
1380
Nadav Amitc7b36902018-09-20 10:30:17 -07001381 down_read(&b->conf_sem);
1382
1383 /*
1384 * Update the stats while holding the semaphore to ensure that
1385 * @stats_enabled is consistent with whether the stats are actually
1386 * enabled
1387 */
1388 vmballoon_stats_gen_inc(b, VMW_BALLOON_STAT_TIMER);
1389
Nadav Amit0395be32018-09-20 10:30:16 -07001390 if (!vmballoon_send_get_target(b))
Nadav Amit8b079cd2018-09-20 10:30:15 -07001391 change = vmballoon_change(b);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001392
Nadav Amit8b079cd2018-09-20 10:30:15 -07001393 if (change != 0) {
Nadav Amit6e4453b2018-09-20 10:30:18 -07001394 pr_debug("%s - size: %llu, target %lu\n", __func__,
1395 atomic64_read(&b->size), READ_ONCE(b->target));
Nadav Amit8b079cd2018-09-20 10:30:15 -07001396
1397 if (change > 0)
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001398 vmballoon_inflate(b);
Nadav Amit8b079cd2018-09-20 10:30:15 -07001399 else /* (change < 0) */
Nadav Amit6e4453b2018-09-20 10:30:18 -07001400 vmballoon_deflate(b, 0, true);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001401 }
1402
Nadav Amitc7b36902018-09-20 10:30:17 -07001403 up_read(&b->conf_sem);
1404
Dmitry Torokhovbeda94d2011-07-26 16:08:56 -07001405 /*
1406 * We are using a freezable workqueue so that balloon operations are
1407 * stopped while the system transitions to/from sleep/hibernation.
1408 */
1409 queue_delayed_work(system_freezable_wq,
1410 dwork, round_jiffies_relative(HZ));
Nadav Amitc7b36902018-09-20 10:30:17 -07001411
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001412}
1413
1414/*
1415 * DEBUGFS Interface
1416 */
1417#ifdef CONFIG_DEBUG_FS
1418
Nadav Amitc7b36902018-09-20 10:30:17 -07001419static const char * const vmballoon_stat_page_names[] = {
1420 [VMW_BALLOON_PAGE_STAT_ALLOC] = "alloc",
1421 [VMW_BALLOON_PAGE_STAT_ALLOC_FAIL] = "allocFail",
1422 [VMW_BALLOON_PAGE_STAT_REFUSED_ALLOC] = "errAlloc",
1423 [VMW_BALLOON_PAGE_STAT_REFUSED_FREE] = "errFree",
1424 [VMW_BALLOON_PAGE_STAT_FREE] = "free"
1425};
1426
1427static const char * const vmballoon_stat_names[] = {
1428 [VMW_BALLOON_STAT_TIMER] = "timer",
Nadav Amit8840a6f2018-09-20 10:30:20 -07001429 [VMW_BALLOON_STAT_DOORBELL] = "doorbell",
1430 [VMW_BALLOON_STAT_RESET] = "reset",
Nadav Amitc7b36902018-09-20 10:30:17 -07001431};
1432
Nadav Amitc7b36902018-09-20 10:30:17 -07001433static int vmballoon_enable_stats(struct vmballoon *b)
1434{
1435 int r = 0;
1436
1437 down_write(&b->conf_sem);
1438
1439 /* did we somehow race with another reader which enabled stats? */
1440 if (b->stats)
1441 goto out;
1442
1443 b->stats = kzalloc(sizeof(*b->stats), GFP_KERNEL);
1444
1445 if (!b->stats) {
1446 /* allocation failed */
1447 r = -ENOMEM;
1448 goto out;
1449 }
1450 static_key_enable(&balloon_stat_enabled.key);
1451out:
1452 up_write(&b->conf_sem);
1453 return r;
1454}
1455
1456/**
1457 * vmballoon_debug_show - shows statistics of balloon operations.
1458 * @f: pointer to the &struct seq_file.
1459 * @offset: ignored.
1460 *
1461 * Provides the statistics that can be accessed in vmmemctl in the debugfs.
1462 * To avoid the overhead - mainly that of memory - of collecting the statistics,
1463 * we only collect statistics after the first time the counters are read.
1464 *
1465 * Return: zero on success or an error code.
1466 */
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001467static int vmballoon_debug_show(struct seq_file *f, void *offset)
1468{
1469 struct vmballoon *b = f->private;
Nadav Amitc7b36902018-09-20 10:30:17 -07001470 int i, j;
1471
1472 /* enables stats if they are disabled */
1473 if (!b->stats) {
1474 int r = vmballoon_enable_stats(b);
1475
1476 if (r)
1477 return r;
1478 }
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001479
Philip P. Moltmannb36e89d2015-08-06 15:18:00 -07001480 /* format capabilities info */
Nadav Amit6e4453b2018-09-20 10:30:18 -07001481 seq_printf(f, "%-22s: %#16x\n", "balloon capabilities",
Nadav Amitc7b36902018-09-20 10:30:17 -07001482 VMW_BALLOON_CAPABILITIES);
Nadav Amit6e4453b2018-09-20 10:30:18 -07001483 seq_printf(f, "%-22s: %#16lx\n", "used capabilities", b->capabilities);
Nadav Amitc7b36902018-09-20 10:30:17 -07001484 seq_printf(f, "%-22s: %16s\n", "is resetting",
1485 b->reset_required ? "y" : "n");
Philip P. Moltmannb36e89d2015-08-06 15:18:00 -07001486
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001487 /* format size info */
Nadav Amit6e4453b2018-09-20 10:30:18 -07001488 seq_printf(f, "%-22s: %16lu\n", "target", READ_ONCE(b->target));
1489 seq_printf(f, "%-22s: %16llu\n", "current", atomic64_read(&b->size));
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001490
Nadav Amit68131182018-09-20 10:30:08 -07001491 for (i = 0; i < VMW_BALLOON_CMD_NUM; i++) {
1492 if (vmballoon_cmd_names[i] == NULL)
1493 continue;
1494
Nadav Amitc7b36902018-09-20 10:30:17 -07001495 seq_printf(f, "%-22s: %16llu (%llu failed)\n",
1496 vmballoon_cmd_names[i],
1497 atomic64_read(&b->stats->ops[i][VMW_BALLOON_OP_STAT]),
1498 atomic64_read(&b->stats->ops[i][VMW_BALLOON_OP_FAIL_STAT]));
Nadav Amit68131182018-09-20 10:30:08 -07001499 }
1500
Nadav Amitc7b36902018-09-20 10:30:17 -07001501 for (i = 0; i < VMW_BALLOON_STAT_NUM; i++)
1502 seq_printf(f, "%-22s: %16llu\n",
1503 vmballoon_stat_names[i],
1504 atomic64_read(&b->stats->general_stat[i]));
1505
1506 for (i = 0; i < VMW_BALLOON_PAGE_STAT_NUM; i++) {
1507 for (j = 0; j < VMW_BALLOON_NUM_PAGE_SIZES; j++)
1508 seq_printf(f, "%-18s(%s): %16llu\n",
1509 vmballoon_stat_page_names[i],
1510 vmballoon_page_size_names[j],
1511 atomic64_read(&b->stats->page_stat[i][j]));
1512 }
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001513
1514 return 0;
1515}
1516
Yangtao Li2796b432018-12-01 12:05:30 -05001517DEFINE_SHOW_ATTRIBUTE(vmballoon_debug);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001518
1519static int __init vmballoon_debugfs_init(struct vmballoon *b)
1520{
1521 int error;
1522
1523 b->dbg_entry = debugfs_create_file("vmmemctl", S_IRUGO, NULL, b,
1524 &vmballoon_debug_fops);
1525 if (IS_ERR(b->dbg_entry)) {
1526 error = PTR_ERR(b->dbg_entry);
1527 pr_err("failed to create debugfs entry, error: %d\n", error);
1528 return error;
1529 }
1530
1531 return 0;
1532}
1533
1534static void __exit vmballoon_debugfs_exit(struct vmballoon *b)
1535{
Nadav Amitc7b36902018-09-20 10:30:17 -07001536 static_key_disable(&balloon_stat_enabled.key);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001537 debugfs_remove(b->dbg_entry);
Nadav Amitc7b36902018-09-20 10:30:17 -07001538 kfree(b->stats);
1539 b->stats = NULL;
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001540}
1541
1542#else
1543
/*
 * Stub for kernels built without CONFIG_DEBUG_FS: there is no file to
 * create, so report success.
 */
static inline int vmballoon_debugfs_init(struct vmballoon *b)
{
	return 0;
}
1548
/*
 * Stub for kernels built without CONFIG_DEBUG_FS: nothing was created, so
 * there is nothing to tear down.
 */
static inline void vmballoon_debugfs_exit(struct vmballoon *b)
{
}
1552
1553#endif /* CONFIG_DEBUG_FS */
1554
1555static int __init vmballoon_init(void)
1556{
Nadav Amit6e4453b2018-09-20 10:30:18 -07001557 enum vmballoon_page_size_type page_size;
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001558 int error;
Nadav Amit6e4453b2018-09-20 10:30:18 -07001559
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001560 /*
1561 * Check if we are running on VMware's hypervisor and bail out
1562 * if we are not.
1563 */
Juergen Gross03b2a322017-11-09 14:27:36 +01001564 if (x86_hyper_type != X86_HYPER_VMWARE)
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001565 return -ENODEV;
1566
Nadav Amit6e4453b2018-09-20 10:30:18 -07001567 for (page_size = VMW_BALLOON_4K_PAGE;
1568 page_size <= VMW_BALLOON_LAST_SIZE; page_size++)
1569 INIT_LIST_HEAD(&balloon.page_sizes[page_size].pages);
1570
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001571
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001572 INIT_DELAYED_WORK(&balloon.dwork, vmballoon_work);
1573
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001574 error = vmballoon_debugfs_init(&balloon);
1575 if (error)
Dmitry Torokhovbeda94d2011-07-26 16:08:56 -07001576 return error;
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001577
Nadav Amit6e4453b2018-09-20 10:30:18 -07001578 spin_lock_init(&balloon.comm_lock);
Nadav Amitc7b36902018-09-20 10:30:17 -07001579 init_rwsem(&balloon.conf_sem);
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001580 balloon.vmci_doorbell = VMCI_INVALID_HANDLE;
Philip P. Moltmannd7568c12015-08-06 15:18:01 -07001581 balloon.batch_page = NULL;
1582 balloon.page = NULL;
1583 balloon.reset_required = true;
1584
Dmitry Torokhovbeda94d2011-07-26 16:08:56 -07001585 queue_delayed_work(system_freezable_wq, &balloon.dwork, 0);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001586
1587 return 0;
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001588}
Nadav Amitc3cc1b02018-06-19 16:00:27 -07001589
1590/*
1591 * Using late_initcall() instead of module_init() allows the balloon to use the
1592 * VMCI doorbell even when the balloon is built into the kernel. Otherwise the
1593 * VMCI is probed only after the balloon is initialized. If the balloon is used
1594 * as a module, late_initcall() is equivalent to module_init().
1595 */
1596late_initcall(vmballoon_init);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001597
1598static void __exit vmballoon_exit(void)
1599{
Philip P. Moltmann48e3d662015-08-06 15:18:01 -07001600 vmballoon_vmci_cleanup(&balloon);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001601 cancel_delayed_work_sync(&balloon.dwork);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001602
1603 vmballoon_debugfs_exit(&balloon);
1604
1605 /*
1606 * Deallocate all reserved memory, and reset connection with monitor.
1607 * Reset connection before deallocating memory to avoid potential for
1608 * additional spurious resets from guest touching deallocated pages.
1609 */
Philip P. Moltmannd7568c12015-08-06 15:18:01 -07001610 vmballoon_send_start(&balloon, 0);
Dmitry Torokhov453dc652010-04-23 13:18:08 -04001611 vmballoon_pop(&balloon);
1612}
1613module_exit(vmballoon_exit);