]>
Commit | Line | Data |
---|---|---|
bd322087 | 1 | /* |
d4443cb6 | 2 | * Virtio Balloon Device |
bd322087 AL |
3 | * |
4 | * Copyright IBM, Corp. 2008 | |
d4443cb6 AS |
5 | * Copyright (C) 2011 Red Hat, Inc. |
6 | * Copyright (C) 2011 Amit Shah <[email protected]> | |
bd322087 AL |
7 | * |
8 | * Authors: | |
9 | * Anthony Liguori <[email protected]> | |
10 | * | |
11 | * This work is licensed under the terms of the GNU GPL, version 2. See | |
12 | * the COPYING file in the top-level directory. | |
13 | * | |
14 | */ | |
15 | ||
1de7afc9 | 16 | #include "qemu/iov.h" |
bd322087 AL |
17 | #include "qemu-common.h" |
18 | #include "virtio.h" | |
19 | #include "pc.h" | |
bd322087 | 20 | #include "cpu.h" |
9c17d615 | 21 | #include "sysemu/balloon.h" |
bd322087 | 22 | #include "virtio-balloon.h" |
9c17d615 | 23 | #include "sysemu/kvm.h" |
022c62cb | 24 | #include "exec/address-spaces.h" |
bd322087 AL |
25 | |
26 | #if defined(__linux__) | |
27 | #include <sys/mman.h> | |
28 | #endif | |
29 | ||
30 | typedef struct VirtIOBalloon | |
31 | { | |
32 | VirtIODevice vdev; | |
625a5bef | 33 | VirtQueue *ivq, *dvq, *svq; |
bd322087 AL |
34 | uint32_t num_pages; |
35 | uint32_t actual; | |
625a5bef AL |
36 | uint64_t stats[VIRTIO_BALLOON_S_NR]; |
37 | VirtQueueElement stats_vq_elem; | |
38 | size_t stats_vq_offset; | |
ac720400 | 39 | DeviceState *qdev; |
bd322087 AL |
40 | } VirtIOBalloon; |
41 | ||
42 | static VirtIOBalloon *to_virtio_balloon(VirtIODevice *vdev) | |
43 | { | |
44 | return (VirtIOBalloon *)vdev; | |
45 | } | |
46 | ||
47 | static void balloon_page(void *addr, int deflate) | |
48 | { | |
49 | #if defined(__linux__) | |
50 | if (!kvm_enabled() || kvm_has_sync_mmu()) | |
e78815a5 AF |
51 | qemu_madvise(addr, TARGET_PAGE_SIZE, |
52 | deflate ? QEMU_MADV_WILLNEED : QEMU_MADV_DONTNEED); | |
bd322087 AL |
53 | #endif |
54 | } | |
55 | ||
625a5bef AL |
56 | /* |
57 | * reset_stats - Mark all items in the stats array as unset | |
58 | * | |
59 | * This function needs to be called at device initialization and | |
60 | * before updating to a set of newly-generated stats. This will ensure that no | |
61 | * stale values stick around in case the guest reports a subset of the supported | |
62 | * statistics. | |
63 | */ | |
64 | static inline void reset_stats(VirtIOBalloon *dev) | |
65 | { | |
66 | int i; | |
67 | for (i = 0; i < VIRTIO_BALLOON_S_NR; dev->stats[i++] = -1); | |
68 | } | |
69 | ||
bd322087 AL |
70 | static void virtio_balloon_handle_output(VirtIODevice *vdev, VirtQueue *vq) |
71 | { | |
72 | VirtIOBalloon *s = to_virtio_balloon(vdev); | |
73 | VirtQueueElement elem; | |
b7c28c74 | 74 | MemoryRegionSection section; |
bd322087 AL |
75 | |
76 | while (virtqueue_pop(vq, &elem)) { | |
77 | size_t offset = 0; | |
78 | uint32_t pfn; | |
79 | ||
dcf6f5e1 | 80 | while (iov_to_buf(elem.out_sg, elem.out_num, offset, &pfn, 4) == 4) { |
c227f099 AL |
81 | ram_addr_t pa; |
82 | ram_addr_t addr; | |
bd322087 | 83 | |
c227f099 | 84 | pa = (ram_addr_t)ldl_p(&pfn) << VIRTIO_BALLOON_PFN_SHIFT; |
bd322087 AL |
85 | offset += 4; |
86 | ||
b7c28c74 AK |
87 | /* FIXME: remove get_system_memory(), but how? */ |
88 | section = memory_region_find(get_system_memory(), pa, 1); | |
89 | if (!section.size || !memory_region_is_ram(section.mr)) | |
bd322087 AL |
90 | continue; |
91 | ||
b7c28c74 | 92 | /* Using memory_region_get_ram_ptr is bending the rules a bit, but |
5c130f65 | 93 | should be OK because we only want a single page. */ |
b7c28c74 AK |
94 | addr = section.offset_within_region; |
95 | balloon_page(memory_region_get_ram_ptr(section.mr) + addr, | |
96 | !!(vq == s->dvq)); | |
bd322087 AL |
97 | } |
98 | ||
99 | virtqueue_push(vq, &elem, offset); | |
100 | virtio_notify(vdev, vq); | |
101 | } | |
102 | } | |
103 | ||
625a5bef AL |
104 | static void virtio_balloon_receive_stats(VirtIODevice *vdev, VirtQueue *vq) |
105 | { | |
106 | VirtIOBalloon *s = DO_UPCAST(VirtIOBalloon, vdev, vdev); | |
107 | VirtQueueElement *elem = &s->stats_vq_elem; | |
108 | VirtIOBalloonStat stat; | |
109 | size_t offset = 0; | |
110 | ||
111 | if (!virtqueue_pop(vq, elem)) { | |
112 | return; | |
113 | } | |
114 | ||
115 | /* Initialize the stats to get rid of any stale values. This is only | |
116 | * needed to handle the case where a guest supports fewer stats than it | |
117 | * used to (ie. it has booted into an old kernel). | |
118 | */ | |
119 | reset_stats(s); | |
120 | ||
dcf6f5e1 | 121 | while (iov_to_buf(elem->out_sg, elem->out_num, offset, &stat, sizeof(stat)) |
fa6111f2 | 122 | == sizeof(stat)) { |
625a5bef AL |
123 | uint16_t tag = tswap16(stat.tag); |
124 | uint64_t val = tswap64(stat.val); | |
125 | ||
126 | offset += sizeof(stat); | |
127 | if (tag < VIRTIO_BALLOON_S_NR) | |
128 | s->stats[tag] = val; | |
129 | } | |
130 | s->stats_vq_offset = offset; | |
625a5bef AL |
131 | } |
132 | ||
bd322087 AL |
133 | static void virtio_balloon_get_config(VirtIODevice *vdev, uint8_t *config_data) |
134 | { | |
135 | VirtIOBalloon *dev = to_virtio_balloon(vdev); | |
136 | struct virtio_balloon_config config; | |
137 | ||
138 | config.num_pages = cpu_to_le32(dev->num_pages); | |
139 | config.actual = cpu_to_le32(dev->actual); | |
140 | ||
141 | memcpy(config_data, &config, 8); | |
142 | } | |
143 | ||
144 | static void virtio_balloon_set_config(VirtIODevice *vdev, | |
145 | const uint8_t *config_data) | |
146 | { | |
147 | VirtIOBalloon *dev = to_virtio_balloon(vdev); | |
148 | struct virtio_balloon_config config; | |
973603a8 | 149 | uint32_t oldactual = dev->actual; |
bd322087 | 150 | memcpy(&config, config_data, 8); |
e54f1771 | 151 | dev->actual = le32_to_cpu(config.actual); |
973603a8 DB |
152 | if (dev->actual != oldactual) { |
153 | qemu_balloon_changed(ram_size - | |
154 | (dev->actual << VIRTIO_BALLOON_PFN_SHIFT)); | |
155 | } | |
bd322087 AL |
156 | } |
157 | ||
8172539d | 158 | static uint32_t virtio_balloon_get_features(VirtIODevice *vdev, uint32_t f) |
bd322087 | 159 | { |
625a5bef | 160 | f |= (1 << VIRTIO_BALLOON_F_STATS_VQ); |
8172539d | 161 | return f; |
bd322087 AL |
162 | } |
163 | ||
96637bcd | 164 | static void virtio_balloon_stat(void *opaque, BalloonInfo *info) |
dce911c7 AS |
165 | { |
166 | VirtIOBalloon *dev = opaque; | |
167 | ||
96637bcd LC |
168 | #if 0 |
169 | /* Disable guest-provided stats for now. For more details please check: | |
170 | * https://bugzilla.redhat.com/show_bug.cgi?id=623903 | |
171 | * | |
172 | * If you do enable it (which is probably not going to happen as we | |
173 | * need a new command for it), remember that you also need to fill the | |
174 | * appropriate members of the BalloonInfo structure so that the stats | |
175 | * are returned to the client. | |
dce911c7 | 176 | */ |
96637bcd | 177 | if (dev->vdev.guest_features & (1 << VIRTIO_BALLOON_F_STATS_VQ)) { |
dce911c7 AS |
178 | virtqueue_push(dev->svq, &dev->stats_vq_elem, dev->stats_vq_offset); |
179 | virtio_notify(&dev->vdev, dev->svq); | |
180 | return; | |
181 | } | |
96637bcd | 182 | #endif |
dce911c7 AS |
183 | |
184 | /* Stats are not supported. Clear out any stale values that might | |
185 | * have been set by a more featureful guest kernel. | |
186 | */ | |
187 | reset_stats(dev); | |
96637bcd LC |
188 | |
189 | info->actual = ram_size - ((uint64_t) dev->actual << | |
190 | VIRTIO_BALLOON_PFN_SHIFT); | |
dce911c7 AS |
191 | } |
192 | ||
30fb2ca6 | 193 | static void virtio_balloon_to_target(void *opaque, ram_addr_t target) |
bd322087 AL |
194 | { |
195 | VirtIOBalloon *dev = opaque; | |
196 | ||
dce911c7 | 197 | if (target > ram_size) { |
bd322087 | 198 | target = ram_size; |
dce911c7 | 199 | } |
bd322087 AL |
200 | if (target) { |
201 | dev->num_pages = (ram_size - target) >> VIRTIO_BALLOON_PFN_SHIFT; | |
202 | virtio_notify_config(&dev->vdev); | |
203 | } | |
bd322087 AL |
204 | } |
205 | ||
206 | static void virtio_balloon_save(QEMUFile *f, void *opaque) | |
207 | { | |
208 | VirtIOBalloon *s = opaque; | |
209 | ||
210 | virtio_save(&s->vdev, f); | |
211 | ||
212 | qemu_put_be32(f, s->num_pages); | |
213 | qemu_put_be32(f, s->actual); | |
214 | } | |
215 | ||
216 | static int virtio_balloon_load(QEMUFile *f, void *opaque, int version_id) | |
217 | { | |
218 | VirtIOBalloon *s = opaque; | |
2a633c46 | 219 | int ret; |
bd322087 AL |
220 | |
221 | if (version_id != 1) | |
222 | return -EINVAL; | |
223 | ||
2a633c46 OW |
224 | ret = virtio_load(&s->vdev, f); |
225 | if (ret) { | |
226 | return ret; | |
227 | } | |
bd322087 AL |
228 | |
229 | s->num_pages = qemu_get_be32(f); | |
230 | s->actual = qemu_get_be32(f); | |
bd322087 AL |
231 | return 0; |
232 | } | |
233 | ||
53c25cea | 234 | VirtIODevice *virtio_balloon_init(DeviceState *dev) |
bd322087 AL |
235 | { |
236 | VirtIOBalloon *s; | |
f76f6655 | 237 | int ret; |
bd322087 | 238 | |
53c25cea PB |
239 | s = (VirtIOBalloon *)virtio_common_init("virtio-balloon", |
240 | VIRTIO_ID_BALLOON, | |
241 | 8, sizeof(VirtIOBalloon)); | |
bd322087 AL |
242 | |
243 | s->vdev.get_config = virtio_balloon_get_config; | |
244 | s->vdev.set_config = virtio_balloon_set_config; | |
245 | s->vdev.get_features = virtio_balloon_get_features; | |
246 | ||
f76f6655 AS |
247 | ret = qemu_add_balloon_handler(virtio_balloon_to_target, |
248 | virtio_balloon_stat, s); | |
249 | if (ret < 0) { | |
250 | virtio_cleanup(&s->vdev); | |
251 | return NULL; | |
252 | } | |
253 | ||
bd322087 AL |
254 | s->ivq = virtio_add_queue(&s->vdev, 128, virtio_balloon_handle_output); |
255 | s->dvq = virtio_add_queue(&s->vdev, 128, virtio_balloon_handle_output); | |
625a5bef | 256 | s->svq = virtio_add_queue(&s->vdev, 128, virtio_balloon_receive_stats); |
bd322087 | 257 | |
625a5bef | 258 | reset_stats(s); |
bd322087 | 259 | |
ac720400 | 260 | s->qdev = dev; |
0be71e32 AW |
261 | register_savevm(dev, "virtio-balloon", -1, 1, |
262 | virtio_balloon_save, virtio_balloon_load, s); | |
bd322087 | 263 | |
53c25cea | 264 | return &s->vdev; |
bd322087 | 265 | } |
855d7e25 AS |
266 | |
267 | void virtio_balloon_exit(VirtIODevice *vdev) | |
268 | { | |
ac720400 | 269 | VirtIOBalloon *s = DO_UPCAST(VirtIOBalloon, vdev, vdev); |
3b86b13a AS |
270 | |
271 | qemu_remove_balloon_handler(s); | |
ac720400 | 272 | unregister_savevm(s->qdev, "virtio-balloon", s); |
855d7e25 AS |
273 | virtio_cleanup(vdev); |
274 | } |