1 /*
2 * QEMU Guest Agent Linux-specific command implementations
3 *
4 * Copyright IBM Corp. 2011
5 *
6 * Authors:
7 * Michael Roth <mdroth@linux.vnet.ibm.com>
8 * Michal Privoznik <mprivozn@redhat.com>
9 *
10 * This work is licensed under the terms of the GNU GPL, version 2 or later.
11 * See the COPYING file in the top-level directory.
12 */
13
14 #include "qemu/osdep.h"
15 #include "qapi/error.h"
16 #include "qga-qapi-commands.h"
17 #include "qapi/error.h"
18 #include "commands-common.h"
19 #include "cutils.h"
20 #include <mntent.h>
21 #include <sys/ioctl.h>
22 #include <mntent.h>
23 #include <linux/nvme_ioctl.h>
24 #include "block/nvme.h"
25
26 #ifdef CONFIG_LIBUDEV
27 #include <libudev.h>
28 #endif
29
30 #ifdef HAVE_GETIFADDRS
31 #include <net/if.h>
32 #endif
33
34 #include <sys/statvfs.h>
35
36 #if defined(CONFIG_FSFREEZE) || defined(CONFIG_FSTRIM)
/*
 * Look up the major/minor numbers of the device node at @devpath.
 *
 * @devmajor and @devminor are zeroed first and are only filled in when
 * @devpath names a block device.
 *
 * Returns: 0 if @devpath is a block device,
 *          -2 if @devpath is a directory (treated as a bind mount),
 *          -1 if stat() fails or @devpath is any other kind of file.
 */
static int dev_major_minor(const char *devpath,
                           unsigned int *devmajor, unsigned int *devminor)
{
    struct stat sb;
    int rc = -1;

    *devmajor = 0;
    *devminor = 0;

    if (stat(devpath, &sb) < 0) {
        slog("failed to stat device file '%s': %s", devpath, strerror(errno));
    } else if (S_ISDIR(sb.st_mode)) {
        /* It is bind mount */
        rc = -2;
    } else if (S_ISBLK(sb.st_mode)) {
        *devmajor = major(sb.st_rdev);
        *devminor = minor(sb.st_rdev);
        rc = 0;
    }

    return rc;
}
60
build_fs_mount_list_from_mtab(FsMountList * mounts,Error ** errp)61 static bool build_fs_mount_list_from_mtab(FsMountList *mounts, Error **errp)
62 {
63 struct mntent *ment;
64 FsMount *mount;
65 char const *mtab = "/proc/self/mounts";
66 FILE *fp;
67 unsigned int devmajor, devminor;
68
69 fp = setmntent(mtab, "r");
70 if (!fp) {
71 error_setg(errp, "failed to open mtab file: '%s'", mtab);
72 return false;
73 }
74
75 while ((ment = getmntent(fp))) {
76 /*
77 * An entry which device name doesn't start with a '/' is
78 * either a dummy file system or a network file system.
79 * Add special handling for smbfs and cifs as is done by
80 * coreutils as well.
81 */
82 if ((ment->mnt_fsname[0] != '/') ||
83 (strcmp(ment->mnt_type, "smbfs") == 0) ||
84 (strcmp(ment->mnt_type, "cifs") == 0)) {
85 continue;
86 }
87 if (dev_major_minor(ment->mnt_fsname, &devmajor, &devminor) == -2) {
88 /* Skip bind mounts */
89 continue;
90 }
91
92 mount = g_new0(FsMount, 1);
93 mount->dirname = g_strdup(ment->mnt_dir);
94 mount->devtype = g_strdup(ment->mnt_type);
95 mount->devmajor = devmajor;
96 mount->devminor = devminor;
97
98 QTAILQ_INSERT_TAIL(mounts, mount, next);
99 }
100
101 endmntent(fp);
102 return true;
103 }
104
/*
 * Decode, in place, the backslash escapes found in a mount table field:
 * "\\" becomes a single backslash and "\NNN" (octal, first digit 0-3)
 * becomes the byte with that value.  Any other backslash is copied as is.
 *
 * @name: buffer to decode
 * @len:  number of characters to process before the terminator; the byte
 *        at name[len] is copied too, so the result stays terminated
 */
static void decode_mntname(char *name, int len)
{
    int rd = 0;
    int wr = 0;

    while (rd <= len) {
        char ch = name[rd];

        if (ch == '\\') {
            const char *esc = &name[rd + 1];

            if (esc[0] == '\\') {
                /* escaped backslash: emit one, consume two */
                rd += 1;
            } else if (esc[0] >= '0' && esc[0] <= '3' &&
                       esc[1] >= '0' && esc[1] <= '7' &&
                       esc[2] >= '0' && esc[2] <= '7') {
                /* three-digit octal escape */
                ch = (esc[0] - '0') * 64 +
                     (esc[1] - '0') * 8 +
                     (esc[2] - '0');
                rd += 3;
            }
        }

        name[wr++] = ch;
        rd++;
    }
}
126
127 /*
128 * Walk the mount table and build a list of local file systems
129 */
build_fs_mount_list(FsMountList * mounts,Error ** errp)130 bool build_fs_mount_list(FsMountList *mounts, Error **errp)
131 {
132 FsMount *mount;
133 char const *mountinfo = "/proc/self/mountinfo";
134 FILE *fp;
135 char *line = NULL, *dash;
136 size_t n;
137 char check;
138 unsigned int devmajor, devminor;
139 int ret, dir_s, dir_e, type_s, type_e, dev_s, dev_e;
140
141 fp = fopen(mountinfo, "r");
142 if (!fp) {
143 return build_fs_mount_list_from_mtab(mounts, errp);
144 }
145
146 while (getline(&line, &n, fp) != -1) {
147 ret = sscanf(line, "%*u %*u %u:%u %*s %n%*s%n%c",
148 &devmajor, &devminor, &dir_s, &dir_e, &check);
149 if (ret < 3) {
150 continue;
151 }
152 dash = strstr(line + dir_e, " - ");
153 if (!dash) {
154 continue;
155 }
156 ret = sscanf(dash, " - %n%*s%n %n%*s%n%c",
157 &type_s, &type_e, &dev_s, &dev_e, &check);
158 if (ret < 1) {
159 continue;
160 }
161 line[dir_e] = 0;
162 dash[type_e] = 0;
163 dash[dev_e] = 0;
164 decode_mntname(line + dir_s, dir_e - dir_s);
165 decode_mntname(dash + dev_s, dev_e - dev_s);
166 if (devmajor == 0) {
167 /* btrfs reports major number = 0 */
168 if (strcmp("btrfs", dash + type_s) != 0 ||
169 dev_major_minor(dash + dev_s, &devmajor, &devminor) < 0) {
170 continue;
171 }
172 }
173
174 mount = g_new0(FsMount, 1);
175 mount->dirname = g_strdup(line + dir_s);
176 mount->devtype = g_strdup(dash + type_s);
177 mount->devmajor = devmajor;
178 mount->devminor = devminor;
179
180 QTAILQ_INSERT_TAIL(mounts, mount, next);
181 }
182 free(line);
183
184 fclose(fp);
185 return true;
186 }
187 #endif /* CONFIG_FSFREEZE || CONFIG_FSTRIM */
188
189 #ifdef CONFIG_FSFREEZE
190 /*
191 * Walk list of mounted file systems in the guest, and freeze the ones which
192 * are real local file systems.
193 */
qmp_guest_fsfreeze_do_freeze_list(bool has_mountpoints,strList * mountpoints,FsMountList mounts,Error ** errp)194 int64_t qmp_guest_fsfreeze_do_freeze_list(bool has_mountpoints,
195 strList *mountpoints,
196 FsMountList mounts,
197 Error **errp)
198 {
199 struct FsMount *mount;
200 strList *list;
201 int fd, ret, i = 0;
202
203 QTAILQ_FOREACH_REVERSE(mount, &mounts, next) {
204 /* To issue fsfreeze in the reverse order of mounts, check if the
205 * mount is listed in the list here */
206 if (has_mountpoints) {
207 for (list = mountpoints; list; list = list->next) {
208 if (strcmp(list->value, mount->dirname) == 0) {
209 break;
210 }
211 }
212 if (!list) {
213 continue;
214 }
215 }
216
217 fd = qga_open_cloexec(mount->dirname, O_RDONLY, 0);
218 if (fd == -1) {
219 error_setg_errno(errp, errno, "failed to open %s", mount->dirname);
220 return -1;
221 }
222
223 /* we try to cull filesystems we know won't work in advance, but other
224 * filesystems may not implement fsfreeze for less obvious reasons.
225 * these will report EOPNOTSUPP. we simply ignore these when tallying
226 * the number of frozen filesystems.
227 * if a filesystem is mounted more than once (aka bind mount) a
228 * consecutive attempt to freeze an already frozen filesystem will
229 * return EBUSY.
230 *
231 * any other error means a failure to freeze a filesystem we
232 * expect to be freezable, so return an error in those cases
233 * and return system to thawed state.
234 */
235 ret = ioctl(fd, FIFREEZE);
236 if (ret == -1) {
237 if (errno != EOPNOTSUPP && errno != EBUSY) {
238 error_setg_errno(errp, errno, "failed to freeze %s",
239 mount->dirname);
240 close(fd);
241 return -1;
242 }
243 } else {
244 i++;
245 }
246 close(fd);
247 }
248 return i;
249 }
250
qmp_guest_fsfreeze_do_thaw(Error ** errp)251 int qmp_guest_fsfreeze_do_thaw(Error **errp)
252 {
253 int ret;
254 FsMountList mounts;
255 FsMount *mount;
256 int fd, i = 0, logged;
257 Error *local_err = NULL;
258
259 QTAILQ_INIT(&mounts);
260 if (!build_fs_mount_list(&mounts, &local_err)) {
261 error_propagate(errp, local_err);
262 return -1;
263 }
264
265 QTAILQ_FOREACH(mount, &mounts, next) {
266 logged = false;
267 fd = qga_open_cloexec(mount->dirname, O_RDONLY, 0);
268 if (fd == -1) {
269 continue;
270 }
271 /* we have no way of knowing whether a filesystem was actually unfrozen
272 * as a result of a successful call to FITHAW, only that if an error
273 * was returned the filesystem was *not* unfrozen by that particular
274 * call.
275 *
276 * since multiple preceding FIFREEZEs require multiple calls to FITHAW
277 * to unfreeze, continuing issuing FITHAW until an error is returned,
278 * in which case either the filesystem is in an unfreezable state, or,
279 * more likely, it was thawed previously (and remains so afterward).
280 *
281 * also, since the most recent successful call is the one that did
282 * the actual unfreeze, we can use this to provide an accurate count
283 * of the number of filesystems unfrozen by guest-fsfreeze-thaw, which
284 * may * be useful for determining whether a filesystem was unfrozen
285 * during the freeze/thaw phase by a process other than qemu-ga.
286 */
287 do {
288 ret = ioctl(fd, FITHAW);
289 if (ret == 0 && !logged) {
290 i++;
291 logged = true;
292 }
293 } while (ret == 0);
294 close(fd);
295 }
296
297 free_fs_mount_list(&mounts);
298
299 return i;
300 }
301 #endif /* CONFIG_FSFREEZE */
302
303 #if defined(CONFIG_FSFREEZE)
304
get_pci_driver(char const * syspath,int pathlen,Error ** errp)305 static char *get_pci_driver(char const *syspath, int pathlen, Error **errp)
306 {
307 char *path;
308 char *dpath;
309 char *driver = NULL;
310 char buf[PATH_MAX];
311 ssize_t len;
312
313 path = g_strndup(syspath, pathlen);
314 dpath = g_strdup_printf("%s/driver", path);
315 len = readlink(dpath, buf, sizeof(buf) - 1);
316 if (len != -1) {
317 buf[len] = 0;
318 driver = g_path_get_basename(buf);
319 }
320 g_free(dpath);
321 g_free(path);
322 return driver;
323 }
324
/*
 * qsort() comparator for unsigned int: returns -1, 0 or 1 when *_a is
 * smaller than, equal to or greater than *_b.
 */
static int compare_uint(const void *_a, const void *_b)
{
    unsigned int lhs = *(unsigned int *)_a;
    unsigned int rhs = *(unsigned int *)_b;

    if (lhs < rhs) {
        return -1;
    }
    if (lhs > rhs) {
        return 1;
    }
    return 0;
}
332
333 /* Walk the specified sysfs and build a sorted list of host or ata numbers */
build_hosts(char const * syspath,char const * host,bool ata,unsigned int * hosts,int hosts_max,Error ** errp)334 static int build_hosts(char const *syspath, char const *host, bool ata,
335 unsigned int *hosts, int hosts_max, Error **errp)
336 {
337 char *path;
338 DIR *dir;
339 struct dirent *entry;
340 int i = 0;
341
342 path = g_strndup(syspath, host - syspath);
343 dir = opendir(path);
344 if (!dir) {
345 error_setg_errno(errp, errno, "opendir(\"%s\")", path);
346 g_free(path);
347 return -1;
348 }
349
350 while (i < hosts_max) {
351 entry = readdir(dir);
352 if (!entry) {
353 break;
354 }
355 if (ata && sscanf(entry->d_name, "ata%d", hosts + i) == 1) {
356 ++i;
357 } else if (!ata && sscanf(entry->d_name, "host%d", hosts + i) == 1) {
358 ++i;
359 }
360 }
361
362 qsort(hosts, i, sizeof(hosts[0]), compare_uint);
363
364 g_free(path);
365 closedir(dir);
366 return i;
367 }
368
369 /*
370 * Store disk device info for devices on the PCI bus.
371 * Returns true if information has been stored, or false for failure.
372 */
build_guest_fsinfo_for_pci_dev(char const * syspath,GuestDiskAddress * disk,Error ** errp)373 static bool build_guest_fsinfo_for_pci_dev(char const *syspath,
374 GuestDiskAddress *disk,
375 Error **errp)
376 {
377 unsigned int pci[4], host, hosts[8], tgt[3];
378 int i, nhosts = 0, pcilen;
379 GuestPCIAddress *pciaddr = disk->pci_controller;
380 bool has_ata = false, has_host = false, has_tgt = false;
381 char *p, *q, *driver = NULL;
382 bool ret = false;
383
384 p = strstr(syspath, "/devices/pci");
385 if (!p || sscanf(p + 12, "%*x:%*x/%x:%x:%x.%x%n",
386 pci, pci + 1, pci + 2, pci + 3, &pcilen) < 4) {
387 g_debug("only pci device is supported: sysfs path '%s'", syspath);
388 return false;
389 }
390
391 p += 12 + pcilen;
392 while (true) {
393 driver = get_pci_driver(syspath, p - syspath, errp);
394 if (driver && (g_str_equal(driver, "ata_piix") ||
395 g_str_equal(driver, "sym53c8xx") ||
396 g_str_equal(driver, "virtio-pci") ||
397 g_str_equal(driver, "ahci") ||
398 g_str_equal(driver, "nvme") ||
399 g_str_equal(driver, "xhci_hcd") ||
400 g_str_equal(driver, "ehci-pci"))) {
401 break;
402 }
403
404 g_free(driver);
405 if (sscanf(p, "/%x:%x:%x.%x%n",
406 pci, pci + 1, pci + 2, pci + 3, &pcilen) == 4) {
407 p += pcilen;
408 continue;
409 }
410
411 g_debug("unsupported driver or sysfs path '%s'", syspath);
412 return false;
413 }
414
415 p = strstr(syspath, "/target");
416 if (p && sscanf(p + 7, "%*u:%*u:%*u/%*u:%u:%u:%u",
417 tgt, tgt + 1, tgt + 2) == 3) {
418 has_tgt = true;
419 }
420
421 p = strstr(syspath, "/ata");
422 if (p) {
423 q = p + 4;
424 has_ata = true;
425 } else {
426 p = strstr(syspath, "/host");
427 q = p + 5;
428 }
429 if (p && sscanf(q, "%u", &host) == 1) {
430 has_host = true;
431 nhosts = build_hosts(syspath, p, has_ata, hosts,
432 ARRAY_SIZE(hosts), errp);
433 if (nhosts < 0) {
434 goto cleanup;
435 }
436 }
437
438 pciaddr->domain = pci[0];
439 pciaddr->bus = pci[1];
440 pciaddr->slot = pci[2];
441 pciaddr->function = pci[3];
442
443 if (strcmp(driver, "ata_piix") == 0) {
444 /* a host per ide bus, target*:0:<unit>:0 */
445 if (!has_host || !has_tgt) {
446 g_debug("invalid sysfs path '%s' (driver '%s')", syspath, driver);
447 goto cleanup;
448 }
449 for (i = 0; i < nhosts; i++) {
450 if (host == hosts[i]) {
451 disk->bus_type = GUEST_DISK_BUS_TYPE_IDE;
452 disk->bus = i;
453 disk->unit = tgt[1];
454 break;
455 }
456 }
457 if (i >= nhosts) {
458 g_debug("no host for '%s' (driver '%s')", syspath, driver);
459 goto cleanup;
460 }
461 } else if (strcmp(driver, "sym53c8xx") == 0) {
462 /* scsi(LSI Logic): target*:0:<unit>:0 */
463 if (!has_tgt) {
464 g_debug("invalid sysfs path '%s' (driver '%s')", syspath, driver);
465 goto cleanup;
466 }
467 disk->bus_type = GUEST_DISK_BUS_TYPE_SCSI;
468 disk->unit = tgt[1];
469 } else if (strcmp(driver, "virtio-pci") == 0) {
470 if (has_tgt) {
471 /* virtio-scsi: target*:0:0:<unit> */
472 disk->bus_type = GUEST_DISK_BUS_TYPE_SCSI;
473 disk->unit = tgt[2];
474 } else {
475 /* virtio-blk: 1 disk per 1 device */
476 disk->bus_type = GUEST_DISK_BUS_TYPE_VIRTIO;
477 }
478 } else if (strcmp(driver, "ahci") == 0) {
479 /* ahci: 1 host per 1 unit */
480 if (!has_host || !has_tgt) {
481 g_debug("invalid sysfs path '%s' (driver '%s')", syspath, driver);
482 goto cleanup;
483 }
484 for (i = 0; i < nhosts; i++) {
485 if (host == hosts[i]) {
486 disk->unit = i;
487 disk->bus_type = GUEST_DISK_BUS_TYPE_SATA;
488 break;
489 }
490 }
491 if (i >= nhosts) {
492 g_debug("no host for '%s' (driver '%s')", syspath, driver);
493 goto cleanup;
494 }
495 } else if (strcmp(driver, "nvme") == 0) {
496 disk->bus_type = GUEST_DISK_BUS_TYPE_NVME;
497 } else if (strcmp(driver, "ehci-pci") == 0 || strcmp(driver, "xhci_hcd") == 0) {
498 disk->bus_type = GUEST_DISK_BUS_TYPE_USB;
499 } else {
500 g_debug("unknown driver '%s' (sysfs path '%s')", driver, syspath);
501 goto cleanup;
502 }
503
504 ret = true;
505
506 cleanup:
507 g_free(driver);
508 return ret;
509 }
510
511 /*
512 * Store disk device info for non-PCI virtio devices (for example s390x
513 * channel I/O devices). Returns true if information has been stored, or
514 * false for failure.
515 */
build_guest_fsinfo_for_nonpci_virtio(char const * syspath,GuestDiskAddress * disk,Error ** errp)516 static bool build_guest_fsinfo_for_nonpci_virtio(char const *syspath,
517 GuestDiskAddress *disk,
518 Error **errp)
519 {
520 unsigned int tgt[3];
521 char *p;
522
523 if (!strstr(syspath, "/virtio") || !strstr(syspath, "/block")) {
524 g_debug("Unsupported virtio device '%s'", syspath);
525 return false;
526 }
527
528 p = strstr(syspath, "/target");
529 if (p && sscanf(p + 7, "%*u:%*u:%*u/%*u:%u:%u:%u",
530 &tgt[0], &tgt[1], &tgt[2]) == 3) {
531 /* virtio-scsi: target*:0:<target>:<unit> */
532 disk->bus_type = GUEST_DISK_BUS_TYPE_SCSI;
533 disk->bus = tgt[0];
534 disk->target = tgt[1];
535 disk->unit = tgt[2];
536 } else {
537 /* virtio-blk: 1 disk per 1 device */
538 disk->bus_type = GUEST_DISK_BUS_TYPE_VIRTIO;
539 }
540
541 return true;
542 }
543
544 /*
545 * Store disk device info for CCW devices (s390x channel I/O devices).
546 * Returns true if information has been stored, or false for failure.
547 */
build_guest_fsinfo_for_ccw_dev(char const * syspath,GuestDiskAddress * disk,Error ** errp)548 static bool build_guest_fsinfo_for_ccw_dev(char const *syspath,
549 GuestDiskAddress *disk,
550 Error **errp)
551 {
552 unsigned int cssid, ssid, subchno, devno;
553 char *p;
554
555 p = strstr(syspath, "/devices/css");
556 if (!p || sscanf(p + 12, "%*x/%x.%x.%x/%*x.%*x.%x/",
557 &cssid, &ssid, &subchno, &devno) < 4) {
558 g_debug("could not parse ccw device sysfs path: %s", syspath);
559 return false;
560 }
561
562 disk->ccw_address = g_new0(GuestCCWAddress, 1);
563 disk->ccw_address->cssid = cssid;
564 disk->ccw_address->ssid = ssid;
565 disk->ccw_address->subchno = subchno;
566 disk->ccw_address->devno = devno;
567
568 if (strstr(p, "/virtio")) {
569 build_guest_fsinfo_for_nonpci_virtio(syspath, disk, errp);
570 }
571
572 return true;
573 }
574
575 /* Store disk device info specified by @sysfs into @fs */
build_guest_fsinfo_for_real_device(char const * syspath,GuestFilesystemInfo * fs,Error ** errp)576 static void build_guest_fsinfo_for_real_device(char const *syspath,
577 GuestFilesystemInfo *fs,
578 Error **errp)
579 {
580 GuestDiskAddress *disk;
581 GuestPCIAddress *pciaddr;
582 bool has_hwinf;
583 #ifdef CONFIG_LIBUDEV
584 struct udev *udev = NULL;
585 struct udev_device *udevice = NULL;
586 #endif
587
588 pciaddr = g_new0(GuestPCIAddress, 1);
589 pciaddr->domain = -1; /* -1 means field is invalid */
590 pciaddr->bus = -1;
591 pciaddr->slot = -1;
592 pciaddr->function = -1;
593
594 disk = g_new0(GuestDiskAddress, 1);
595 disk->pci_controller = pciaddr;
596 disk->bus_type = GUEST_DISK_BUS_TYPE_UNKNOWN;
597
598 #ifdef CONFIG_LIBUDEV
599 udev = udev_new();
600 udevice = udev_device_new_from_syspath(udev, syspath);
601 if (udev == NULL || udevice == NULL) {
602 g_debug("failed to query udev");
603 } else {
604 const char *devnode, *serial;
605 devnode = udev_device_get_devnode(udevice);
606 if (devnode != NULL) {
607 disk->dev = g_strdup(devnode);
608 }
609 serial = udev_device_get_property_value(udevice, "ID_SERIAL");
610 if (serial != NULL && *serial != 0) {
611 disk->serial = g_strdup(serial);
612 }
613 }
614
615 udev_unref(udev);
616 udev_device_unref(udevice);
617 #endif
618
619 if (strstr(syspath, "/devices/pci")) {
620 has_hwinf = build_guest_fsinfo_for_pci_dev(syspath, disk, errp);
621 } else if (strstr(syspath, "/devices/css")) {
622 has_hwinf = build_guest_fsinfo_for_ccw_dev(syspath, disk, errp);
623 } else if (strstr(syspath, "/virtio")) {
624 has_hwinf = build_guest_fsinfo_for_nonpci_virtio(syspath, disk, errp);
625 } else {
626 g_debug("Unsupported device type for '%s'", syspath);
627 has_hwinf = false;
628 }
629
630 if (has_hwinf || disk->dev || disk->serial) {
631 QAPI_LIST_PREPEND(fs->disk, disk);
632 } else {
633 qapi_free_GuestDiskAddress(disk);
634 }
635 }
636
637 static void build_guest_fsinfo_for_device(char const *devpath,
638 GuestFilesystemInfo *fs,
639 Error **errp);
640
641 /* Store a list of slave devices of virtual volume specified by @syspath into
642 * @fs */
build_guest_fsinfo_for_virtual_device(char const * syspath,GuestFilesystemInfo * fs,Error ** errp)643 static void build_guest_fsinfo_for_virtual_device(char const *syspath,
644 GuestFilesystemInfo *fs,
645 Error **errp)
646 {
647 Error *err = NULL;
648 DIR *dir;
649 char *dirpath;
650 struct dirent *entry;
651
652 dirpath = g_strdup_printf("%s/slaves", syspath);
653 dir = opendir(dirpath);
654 if (!dir) {
655 if (errno != ENOENT) {
656 error_setg_errno(errp, errno, "opendir(\"%s\")", dirpath);
657 }
658 g_free(dirpath);
659 return;
660 }
661
662 for (;;) {
663 errno = 0;
664 entry = readdir(dir);
665 if (entry == NULL) {
666 if (errno) {
667 error_setg_errno(errp, errno, "readdir(\"%s\")", dirpath);
668 }
669 break;
670 }
671
672 if (entry->d_type == DT_LNK) {
673 char *path;
674
675 g_debug(" slave device '%s'", entry->d_name);
676 path = g_strdup_printf("%s/slaves/%s", syspath, entry->d_name);
677 build_guest_fsinfo_for_device(path, fs, &err);
678 g_free(path);
679
680 if (err) {
681 error_propagate(errp, err);
682 break;
683 }
684 }
685 }
686
687 g_free(dirpath);
688 closedir(dir);
689 }
690
is_disk_virtual(const char * devpath,Error ** errp)691 static bool is_disk_virtual(const char *devpath, Error **errp)
692 {
693 g_autofree char *syspath = realpath(devpath, NULL);
694
695 if (!syspath) {
696 error_setg_errno(errp, errno, "realpath(\"%s\")", devpath);
697 return false;
698 }
699 return strstr(syspath, "/devices/virtual/block/") != NULL;
700 }
701
702 /* Dispatch to functions for virtual/real device */
build_guest_fsinfo_for_device(char const * devpath,GuestFilesystemInfo * fs,Error ** errp)703 static void build_guest_fsinfo_for_device(char const *devpath,
704 GuestFilesystemInfo *fs,
705 Error **errp)
706 {
707 ERRP_GUARD();
708 g_autofree char *syspath = NULL;
709 bool is_virtual = false;
710
711 syspath = realpath(devpath, NULL);
712 if (!syspath) {
713 if (errno != ENOENT) {
714 error_setg_errno(errp, errno, "realpath(\"%s\")", devpath);
715 return;
716 }
717
718 /* ENOENT: This devpath may not exist because of container config */
719 if (!fs->name) {
720 fs->name = g_path_get_basename(devpath);
721 }
722 return;
723 }
724
725 if (!fs->name) {
726 fs->name = g_path_get_basename(syspath);
727 }
728
729 g_debug(" parse sysfs path '%s'", syspath);
730 is_virtual = is_disk_virtual(syspath, errp);
731 if (*errp != NULL) {
732 return;
733 }
734 if (is_virtual) {
735 build_guest_fsinfo_for_virtual_device(syspath, fs, errp);
736 } else {
737 build_guest_fsinfo_for_real_device(syspath, fs, errp);
738 }
739 }
740
741 #ifdef CONFIG_LIBUDEV
742
743 /*
744 * Wrapper around build_guest_fsinfo_for_device() for getting just
745 * the disk address.
746 */
get_disk_address(const char * syspath,Error ** errp)747 static GuestDiskAddress *get_disk_address(const char *syspath, Error **errp)
748 {
749 g_autoptr(GuestFilesystemInfo) fs = NULL;
750
751 fs = g_new0(GuestFilesystemInfo, 1);
752 build_guest_fsinfo_for_device(syspath, fs, errp);
753 if (fs->disk != NULL) {
754 return g_steal_pointer(&fs->disk->value);
755 }
756 return NULL;
757 }
758
/*
 * Return a newly allocated copy of the udev "DM_NAME" property of the
 * device at @syspath, or NULL if udev cannot be queried, the property is
 * missing, or it is empty.
 */
static char *get_alias_for_syspath(const char *syspath)
{
    struct udev *udev = udev_new();
    struct udev_device *udevice = NULL;
    char *ret = NULL;

    if (udev == NULL) {
        g_debug("failed to query udev");
    } else if ((udevice = udev_device_new_from_syspath(udev, syspath))
               == NULL) {
        g_debug("failed to query udev for path: %s", syspath);
    } else {
        const char *alias = udev_device_get_property_value(udevice,
                                                           "DM_NAME");

        /*
         * NULL means there was an error and empty string means there is no
         * alias. In case of no alias we return NULL instead of empty string.
         */
        if (alias == NULL) {
            g_debug("failed to query udev for device alias for: %s",
                    syspath);
        } else if (*alias != 0) {
            ret = g_strdup(alias);
        }
    }

    udev_unref(udev);
    udev_device_unref(udevice);
    return ret;
}
794
/*
 * Return a newly allocated copy of the device node reported by udev for
 * the device at @syspath, or NULL if udev cannot be queried or reports no
 * node.
 */
static char *get_device_for_syspath(const char *syspath)
{
    struct udev *udev = udev_new();
    struct udev_device *udevice = NULL;
    char *ret = NULL;

    if (udev == NULL) {
        g_debug("failed to query udev");
    } else if ((udevice = udev_device_new_from_syspath(udev, syspath))
               == NULL) {
        g_debug("failed to query udev for path: %s", syspath);
    } else {
        ret = g_strdup(udev_device_get_devnode(udevice));
    }

    udev_unref(udev);
    udev_device_unref(udevice);
    return ret;
}
819
/*
 * Fill disk->dependencies with the device nodes of the entries found in
 * "<disk_dir>/slaves".
 *
 * disk->has_dependencies is set as soon as the directory can be opened,
 * even if it turns out to be empty.  Entries for which no device node can
 * be determined are skipped.
 */
static void get_disk_deps(const char *disk_dir, GuestDiskInfo *disk)
{
    g_autofree char *slaves_path = g_strdup_printf("%s/slaves", disk_dir);
    const gchar *entry;
    GDir *slaves;

    /* List dependent disks */
    g_debug(" listing entries in: %s", slaves_path);
    slaves = g_dir_open(slaves_path, 0, NULL);
    if (slaves == NULL) {
        g_debug("failed to list entries in %s", slaves_path);
        return;
    }

    disk->has_dependencies = true;
    for (entry = g_dir_read_name(slaves); entry != NULL;
         entry = g_dir_read_name(slaves)) {
        g_autofree char *entry_path = g_strdup_printf("%s/%s",
                                                      slaves_path, entry);
        char *node = get_device_for_syspath(entry_path);

        /* Add dependent disks */
        if (node == NULL) {
            continue;
        }
        g_debug(" adding dependent device: %s", node);
        QAPI_LIST_PREPEND(disk->dependencies, node);
    }
    g_dir_close(slaves);
}
849
850 /*
851 * Detect partitions subdirectory, name is "<disk_name><number>" or
852 * "<disk_name>p<number>"
853 *
854 * @disk_name -- last component of /sys path (e.g. sda)
855 * @disk_dir -- sys path of the disk (e.g. /sys/block/sda)
856 * @disk_dev -- device node of the disk (e.g. /dev/sda)
857 */
get_disk_partitions(GuestDiskInfoList * list,const char * disk_name,const char * disk_dir,const char * disk_dev)858 static GuestDiskInfoList *get_disk_partitions(
859 GuestDiskInfoList *list,
860 const char *disk_name, const char *disk_dir,
861 const char *disk_dev)
862 {
863 GuestDiskInfoList *ret = list;
864 struct dirent *de_disk;
865 DIR *dp_disk = NULL;
866 size_t len = strlen(disk_name);
867
868 dp_disk = opendir(disk_dir);
869 while ((de_disk = readdir(dp_disk)) != NULL) {
870 g_autofree char *partition_dir = NULL;
871 char *dev_name;
872 GuestDiskInfo *partition;
873
874 if (!(de_disk->d_type & DT_DIR)) {
875 continue;
876 }
877
878 if (!(strncmp(disk_name, de_disk->d_name, len) == 0 &&
879 ((*(de_disk->d_name + len) == 'p' &&
880 isdigit(*(de_disk->d_name + len + 1))) ||
881 isdigit(*(de_disk->d_name + len))))) {
882 continue;
883 }
884
885 partition_dir = g_strdup_printf("%s/%s",
886 disk_dir, de_disk->d_name);
887 dev_name = get_device_for_syspath(partition_dir);
888 if (dev_name == NULL) {
889 g_debug("Failed to get device name for syspath: %s",
890 disk_dir);
891 continue;
892 }
893 partition = g_new0(GuestDiskInfo, 1);
894 partition->name = dev_name;
895 partition->partition = true;
896 partition->has_dependencies = true;
897 /* Add parent disk as dependent for easier tracking of hierarchy */
898 QAPI_LIST_PREPEND(partition->dependencies, g_strdup(disk_dev));
899
900 QAPI_LIST_PREPEND(ret, partition);
901 }
902 closedir(dp_disk);
903
904 return ret;
905 }
906
/*
 * Read the SMART log page of the NVMe device named by disk->name with a
 * Get Log Page admin command and store it in a newly allocated
 * disk->smart.
 *
 * Failures to open the device or to issue the command are only logged;
 * disk->smart is left untouched in that case.
 */
static void get_nvme_smart(GuestDiskInfo *disk)
{
    NvmeSmartLog log = {0};
    struct nvme_admin_cmd cmd = {
        .opcode = NVME_ADM_CMD_GET_LOG_PAGE,
        .nsid = NVME_NSID_BROADCAST,
        .addr = (uintptr_t)&log,
        .data_len = sizeof(log),
        .cdw10 = NVME_LOG_SMART_INFO | (1 << 15) /* RAE bit */
                 | (((sizeof(log) >> 2) - 1) << 16)
    };
    GuestNVMeSmart *nvme;
    int fd = qga_open_cloexec(disk->name, O_RDONLY, 0);

    if (fd == -1) {
        g_debug("Failed to open device: %s: %s", disk->name, g_strerror(errno));
        return;
    }

    if (ioctl(fd, NVME_IOCTL_ADMIN_CMD, &cmd)) {
        g_debug("Failed to get smart: %s: %s", disk->name, g_strerror(errno));
        goto out;
    }

    disk->smart = g_new0(GuestDiskSmart, 1);
    disk->smart->type = GUEST_DISK_BUS_TYPE_NVME;
    nvme = &disk->smart->u.nvme;

    /* single-byte fields need no byte swapping */
    nvme->critical_warning = log.critical_warning;
    nvme->available_spare = log.available_spare;
    nvme->available_spare_threshold = log.available_spare_threshold;
    nvme->percentage_used = log.percentage_used;

    nvme->temperature = lduw_le_p(&log.temperature); /* unaligned field */

    /* each counter is split into a low [0] and a high [1] 64-bit half */
    nvme->data_units_read_lo = le64_to_cpu(log.data_units_read[0]);
    nvme->data_units_read_hi = le64_to_cpu(log.data_units_read[1]);
    nvme->data_units_written_lo = le64_to_cpu(log.data_units_written[0]);
    nvme->data_units_written_hi = le64_to_cpu(log.data_units_written[1]);
    nvme->host_read_commands_lo = le64_to_cpu(log.host_read_commands[0]);
    nvme->host_read_commands_hi = le64_to_cpu(log.host_read_commands[1]);
    nvme->host_write_commands_lo = le64_to_cpu(log.host_write_commands[0]);
    nvme->host_write_commands_hi = le64_to_cpu(log.host_write_commands[1]);
    nvme->controller_busy_time_lo = le64_to_cpu(log.controller_busy_time[0]);
    nvme->controller_busy_time_hi = le64_to_cpu(log.controller_busy_time[1]);
    nvme->power_cycles_lo = le64_to_cpu(log.power_cycles[0]);
    nvme->power_cycles_hi = le64_to_cpu(log.power_cycles[1]);
    nvme->power_on_hours_lo = le64_to_cpu(log.power_on_hours[0]);
    nvme->power_on_hours_hi = le64_to_cpu(log.power_on_hours[1]);
    nvme->unsafe_shutdowns_lo = le64_to_cpu(log.unsafe_shutdowns[0]);
    nvme->unsafe_shutdowns_hi = le64_to_cpu(log.unsafe_shutdowns[1]);
    nvme->media_errors_lo = le64_to_cpu(log.media_errors[0]);
    nvme->media_errors_hi = le64_to_cpu(log.media_errors[1]);
    nvme->number_of_error_log_entries_lo =
        le64_to_cpu(log.number_of_error_log_entries[0]);
    nvme->number_of_error_log_entries_hi =
        le64_to_cpu(log.number_of_error_log_entries[1]);

out:
    close(fd);
}
967
/*
 * Collect SMART data for @disk.  Only disks with a known address on the
 * NVMe bus are handled; anything else is left untouched.
 */
static void get_disk_smart(GuestDiskInfo *disk)
{
    if (!disk->address) {
        return;
    }
    if (disk->address->bus_type != GUEST_DISK_BUS_TYPE_NVME) {
        return;
    }
    get_nvme_smart(disk);
}
975
qmp_guest_get_disks(Error ** errp)976 GuestDiskInfoList *qmp_guest_get_disks(Error **errp)
977 {
978 GuestDiskInfoList *ret = NULL;
979 GuestDiskInfo *disk;
980 DIR *dp = NULL;
981 struct dirent *de = NULL;
982
983 g_debug("listing /sys/block directory");
984 dp = opendir("/sys/block");
985 if (dp == NULL) {
986 error_setg_errno(errp, errno, "Can't open directory \"/sys/block\"");
987 return NULL;
988 }
989 while ((de = readdir(dp)) != NULL) {
990 g_autofree char *disk_dir = NULL, *line = NULL,
991 *size_path = NULL;
992 char *dev_name;
993 Error *local_err = NULL;
994 if (de->d_type != DT_LNK) {
995 g_debug(" skipping entry: %s", de->d_name);
996 continue;
997 }
998
999 /* Check size and skip zero-sized disks */
1000 g_debug(" checking disk size");
1001 size_path = g_strdup_printf("/sys/block/%s/size", de->d_name);
1002 if (!g_file_get_contents(size_path, &line, NULL, NULL)) {
1003 g_debug(" failed to read disk size");
1004 continue;
1005 }
1006 if (g_strcmp0(line, "0\n") == 0) {
1007 g_debug(" skipping zero-sized disk");
1008 continue;
1009 }
1010
1011 g_debug(" adding %s", de->d_name);
1012 disk_dir = g_strdup_printf("/sys/block/%s", de->d_name);
1013 dev_name = get_device_for_syspath(disk_dir);
1014 if (dev_name == NULL) {
1015 g_debug("Failed to get device name for syspath: %s",
1016 disk_dir);
1017 continue;
1018 }
1019 disk = g_new0(GuestDiskInfo, 1);
1020 disk->name = dev_name;
1021 disk->partition = false;
1022 disk->alias = get_alias_for_syspath(disk_dir);
1023 QAPI_LIST_PREPEND(ret, disk);
1024
1025 /* Get address for non-virtual devices */
1026 bool is_virtual = is_disk_virtual(disk_dir, &local_err);
1027 if (local_err != NULL) {
1028 g_debug(" failed to check disk path, ignoring error: %s",
1029 error_get_pretty(local_err));
1030 error_free(local_err);
1031 local_err = NULL;
1032 /* Don't try to get the address */
1033 is_virtual = true;
1034 }
1035 if (!is_virtual) {
1036 disk->address = get_disk_address(disk_dir, &local_err);
1037 if (local_err != NULL) {
1038 g_debug(" failed to get device info, ignoring error: %s",
1039 error_get_pretty(local_err));
1040 error_free(local_err);
1041 local_err = NULL;
1042 }
1043 }
1044
1045 get_disk_deps(disk_dir, disk);
1046 get_disk_smart(disk);
1047 ret = get_disk_partitions(ret, de->d_name, disk_dir, dev_name);
1048 }
1049
1050 closedir(dp);
1051
1052 return ret;
1053 }
1054
1055 #endif
1056
1057 /* Return a list of the disk device(s)' info which @mount lies on */
build_guest_fsinfo(struct FsMount * mount,Error ** errp)1058 static GuestFilesystemInfo *build_guest_fsinfo(struct FsMount *mount,
1059 Error **errp)
1060 {
1061 GuestFilesystemInfo *fs = g_malloc0(sizeof(*fs));
1062 struct statvfs buf;
1063 unsigned long used, nonroot_total, fr_size;
1064 char *devpath = g_strdup_printf("/sys/dev/block/%u:%u",
1065 mount->devmajor, mount->devminor);
1066
1067 fs->mountpoint = g_strdup(mount->dirname);
1068 fs->type = g_strdup(mount->devtype);
1069 build_guest_fsinfo_for_device(devpath, fs, errp);
1070
1071 if (statvfs(fs->mountpoint, &buf) == 0) {
1072 fr_size = buf.f_frsize;
1073 used = buf.f_blocks - buf.f_bfree;
1074 nonroot_total = used + buf.f_bavail;
1075 fs->used_bytes = used * fr_size;
1076 fs->total_bytes = nonroot_total * fr_size;
1077 fs->total_bytes_privileged = buf.f_blocks * fr_size;
1078
1079 fs->has_total_bytes = true;
1080 fs->has_total_bytes_privileged = true;
1081 fs->has_used_bytes = true;
1082 }
1083
1084 g_free(devpath);
1085
1086 return fs;
1087 }
1088
qmp_guest_get_fsinfo(Error ** errp)1089 GuestFilesystemInfoList *qmp_guest_get_fsinfo(Error **errp)
1090 {
1091 FsMountList mounts;
1092 struct FsMount *mount;
1093 GuestFilesystemInfoList *ret = NULL;
1094 Error *local_err = NULL;
1095
1096 QTAILQ_INIT(&mounts);
1097 if (!build_fs_mount_list(&mounts, &local_err)) {
1098 error_propagate(errp, local_err);
1099 return NULL;
1100 }
1101
1102 QTAILQ_FOREACH(mount, &mounts, next) {
1103 g_debug("Building guest fsinfo for '%s'", mount->dirname);
1104
1105 QAPI_LIST_PREPEND(ret, build_guest_fsinfo(mount, &local_err));
1106 if (local_err) {
1107 error_propagate(errp, local_err);
1108 qapi_free_GuestFilesystemInfoList(ret);
1109 ret = NULL;
1110 break;
1111 }
1112 }
1113
1114 free_fs_mount_list(&mounts);
1115 return ret;
1116 }
1117 #endif /* CONFIG_FSFREEZE */
1118
1119 #if defined(CONFIG_FSTRIM)
1120 /*
1121 * Walk list of mounted file systems in the guest, and trim them.
1122 */
1123 GuestFilesystemTrimResponse *
qmp_guest_fstrim(bool has_minimum,int64_t minimum,Error ** errp)1124 qmp_guest_fstrim(bool has_minimum, int64_t minimum, Error **errp)
1125 {
1126 GuestFilesystemTrimResponse *response;
1127 GuestFilesystemTrimResult *result;
1128 int ret = 0;
1129 FsMountList mounts;
1130 struct FsMount *mount;
1131 int fd;
1132 struct fstrim_range r;
1133
1134 slog("guest-fstrim called");
1135
1136 QTAILQ_INIT(&mounts);
1137 if (!build_fs_mount_list(&mounts, errp)) {
1138 return NULL;
1139 }
1140
1141 response = g_malloc0(sizeof(*response));
1142
1143 QTAILQ_FOREACH(mount, &mounts, next) {
1144 result = g_malloc0(sizeof(*result));
1145 result->path = g_strdup(mount->dirname);
1146
1147 QAPI_LIST_PREPEND(response->paths, result);
1148
1149 fd = qga_open_cloexec(mount->dirname, O_RDONLY, 0);
1150 if (fd == -1) {
1151 result->error = g_strdup_printf("failed to open: %s",
1152 strerror(errno));
1153 continue;
1154 }
1155
1156 /* We try to cull filesystems we know won't work in advance, but other
1157 * filesystems may not implement fstrim for less obvious reasons.
1158 * These will report EOPNOTSUPP; while in some other cases ENOTTY
1159 * will be reported (e.g. CD-ROMs).
1160 * Any other error means an unexpected error.
1161 */
1162 r.start = 0;
1163 r.len = -1;
1164 r.minlen = has_minimum ? minimum : 0;
1165 ret = ioctl(fd, FITRIM, &r);
1166 if (ret == -1) {
1167 if (errno == ENOTTY || errno == EOPNOTSUPP) {
1168 result->error = g_strdup("trim not supported");
1169 } else {
1170 result->error = g_strdup_printf("failed to trim: %s",
1171 strerror(errno));
1172 }
1173 close(fd);
1174 continue;
1175 }
1176
1177 result->has_minimum = true;
1178 result->minimum = r.minlen;
1179 result->has_trimmed = true;
1180 result->trimmed = r.len;
1181 close(fd);
1182 }
1183
1184 free_fs_mount_list(&mounts);
1185 return response;
1186 }
1187 #endif /* CONFIG_FSTRIM */
1188
/*
 * sysfs file that linux_sys_state_supports_mode() reads to look for a
 * sleep-state keyword and that linux_sys_state_suspend() writes to.
 */
#define LINUX_SYS_STATE_FILE "/sys/power/state"
/*
 * Exit status values for the 'pm-is-supported' helper;
 * pmutils_supports_mode() compares its status against SUSPEND_SUPPORTED.
 */
#define SUSPEND_SUPPORTED 0
#define SUSPEND_NOT_SUPPORTED 1

/*
 * Suspend flavours handled by guest_suspend().
 *
 * The numeric values index the per-mode string tables in the
 * systemd/pm-utils/sysfs helpers, so they must stay 0, 1, 2 in this order.
 */
typedef enum {
    SUSPEND_MODE_DISK = 0,
    SUSPEND_MODE_RAM = 1,
    SUSPEND_MODE_HYBRID = 2,
} SuspendMode;
1198
1199 /*
1200 * Executes a command in a child process using g_spawn_sync,
1201 * returning an int >= 0 representing the exit status of the
1202 * process.
1203 *
1204 * If the program wasn't found in path, returns -1.
1205 *
1206 * If a problem happened when creating the child process,
1207 * returns -1 and errp is set.
1208 */
run_process_child(const char * command[],Error ** errp)1209 static int run_process_child(const char *command[], Error **errp)
1210 {
1211 int exit_status, spawn_flag;
1212 GError *g_err = NULL;
1213 bool success;
1214
1215 spawn_flag = G_SPAWN_SEARCH_PATH | G_SPAWN_STDOUT_TO_DEV_NULL |
1216 G_SPAWN_STDERR_TO_DEV_NULL;
1217
1218 success = g_spawn_sync(NULL, (char **)command, NULL, spawn_flag,
1219 NULL, NULL, NULL, NULL,
1220 &exit_status, &g_err);
1221
1222 if (success) {
1223 return WEXITSTATUS(exit_status);
1224 }
1225
1226 if (g_err && (g_err->code != G_SPAWN_ERROR_NOENT)) {
1227 error_setg(errp, "failed to create child process, error '%s'",
1228 g_err->message);
1229 }
1230
1231 g_error_free(g_err);
1232 return -1;
1233 }
1234
systemd_supports_mode(SuspendMode mode,Error ** errp)1235 static bool systemd_supports_mode(SuspendMode mode, Error **errp)
1236 {
1237 const char *systemctl_args[3] = {"systemd-hibernate", "systemd-suspend",
1238 "systemd-hybrid-sleep"};
1239 const char *cmd[4] = {"systemctl", "status", systemctl_args[mode], NULL};
1240 int status;
1241
1242 status = run_process_child(cmd, errp);
1243
1244 /*
1245 * systemctl status uses LSB return codes so we can expect
1246 * status > 0 and be ok. To assert if the guest has support
1247 * for the selected suspend mode, status should be < 4. 4 is
1248 * the code for unknown service status, the return value when
1249 * the service does not exist. A common value is status = 3
1250 * (program is not running).
1251 */
1252 if (status > 0 && status < 4) {
1253 return true;
1254 }
1255
1256 return false;
1257 }
1258
systemd_suspend(SuspendMode mode,Error ** errp)1259 static void systemd_suspend(SuspendMode mode, Error **errp)
1260 {
1261 Error *local_err = NULL;
1262 const char *systemctl_args[3] = {"hibernate", "suspend", "hybrid-sleep"};
1263 const char *cmd[3] = {"systemctl", systemctl_args[mode], NULL};
1264 int status;
1265
1266 status = run_process_child(cmd, &local_err);
1267
1268 if (status == 0) {
1269 return;
1270 }
1271
1272 if ((status == -1) && !local_err) {
1273 error_setg(errp, "the helper program 'systemctl %s' was not found",
1274 systemctl_args[mode]);
1275 return;
1276 }
1277
1278 if (local_err) {
1279 error_propagate(errp, local_err);
1280 } else {
1281 error_setg(errp, "the helper program 'systemctl %s' returned an "
1282 "unexpected exit status code (%d)",
1283 systemctl_args[mode], status);
1284 }
1285 }
1286
pmutils_supports_mode(SuspendMode mode,Error ** errp)1287 static bool pmutils_supports_mode(SuspendMode mode, Error **errp)
1288 {
1289 Error *local_err = NULL;
1290 const char *pmutils_args[3] = {"--hibernate", "--suspend",
1291 "--suspend-hybrid"};
1292 const char *cmd[3] = {"pm-is-supported", pmutils_args[mode], NULL};
1293 int status;
1294
1295 status = run_process_child(cmd, &local_err);
1296
1297 if (status == SUSPEND_SUPPORTED) {
1298 return true;
1299 }
1300
1301 if ((status == -1) && !local_err) {
1302 return false;
1303 }
1304
1305 if (local_err) {
1306 error_propagate(errp, local_err);
1307 } else {
1308 error_setg(errp,
1309 "the helper program '%s' returned an unexpected exit"
1310 " status code (%d)", "pm-is-supported", status);
1311 }
1312
1313 return false;
1314 }
1315
pmutils_suspend(SuspendMode mode,Error ** errp)1316 static void pmutils_suspend(SuspendMode mode, Error **errp)
1317 {
1318 Error *local_err = NULL;
1319 const char *pmutils_binaries[3] = {"pm-hibernate", "pm-suspend",
1320 "pm-suspend-hybrid"};
1321 const char *cmd[2] = {pmutils_binaries[mode], NULL};
1322 int status;
1323
1324 status = run_process_child(cmd, &local_err);
1325
1326 if (status == 0) {
1327 return;
1328 }
1329
1330 if ((status == -1) && !local_err) {
1331 error_setg(errp, "the helper program '%s' was not found",
1332 pmutils_binaries[mode]);
1333 return;
1334 }
1335
1336 if (local_err) {
1337 error_propagate(errp, local_err);
1338 } else {
1339 error_setg(errp,
1340 "the helper program '%s' returned an unexpected exit"
1341 " status code (%d)", pmutils_binaries[mode], status);
1342 }
1343 }
1344
linux_sys_state_supports_mode(SuspendMode mode,Error ** errp)1345 static bool linux_sys_state_supports_mode(SuspendMode mode, Error **errp)
1346 {
1347 const char *sysfile_strs[3] = {"disk", "mem", NULL};
1348 const char *sysfile_str = sysfile_strs[mode];
1349 char buf[32]; /* hopefully big enough */
1350 int fd;
1351 ssize_t ret;
1352
1353 if (!sysfile_str) {
1354 error_setg(errp, "unknown guest suspend mode");
1355 return false;
1356 }
1357
1358 fd = open(LINUX_SYS_STATE_FILE, O_RDONLY);
1359 if (fd < 0) {
1360 return false;
1361 }
1362
1363 ret = read(fd, buf, sizeof(buf) - 1);
1364 close(fd);
1365 if (ret <= 0) {
1366 return false;
1367 }
1368 buf[ret] = '\0';
1369
1370 if (strstr(buf, sysfile_str)) {
1371 return true;
1372 }
1373 return false;
1374 }
1375
linux_sys_state_suspend(SuspendMode mode,Error ** errp)1376 static void linux_sys_state_suspend(SuspendMode mode, Error **errp)
1377 {
1378 g_autoptr(GError) local_gerr = NULL;
1379 const char *sysfile_strs[3] = {"disk", "mem", NULL};
1380 const char *sysfile_str = sysfile_strs[mode];
1381
1382 if (!sysfile_str) {
1383 error_setg(errp, "unknown guest suspend mode");
1384 return;
1385 }
1386
1387 if (!g_file_set_contents(LINUX_SYS_STATE_FILE, sysfile_str,
1388 -1, &local_gerr)) {
1389 error_setg(errp, "suspend: cannot write to '%s': %s",
1390 LINUX_SYS_STATE_FILE, local_gerr->message);
1391 return;
1392 }
1393 }
1394
guest_suspend(SuspendMode mode,Error ** errp)1395 static void guest_suspend(SuspendMode mode, Error **errp)
1396 {
1397 Error *local_err = NULL;
1398 bool mode_supported = false;
1399
1400 if (systemd_supports_mode(mode, &local_err)) {
1401 mode_supported = true;
1402 systemd_suspend(mode, &local_err);
1403
1404 if (!local_err) {
1405 return;
1406 }
1407 }
1408
1409 error_free(local_err);
1410 local_err = NULL;
1411
1412 if (pmutils_supports_mode(mode, &local_err)) {
1413 mode_supported = true;
1414 pmutils_suspend(mode, &local_err);
1415
1416 if (!local_err) {
1417 return;
1418 }
1419 }
1420
1421 error_free(local_err);
1422 local_err = NULL;
1423
1424 if (linux_sys_state_supports_mode(mode, &local_err)) {
1425 mode_supported = true;
1426 linux_sys_state_suspend(mode, &local_err);
1427 }
1428
1429 if (!mode_supported) {
1430 error_free(local_err);
1431 error_setg(errp,
1432 "the requested suspend mode is not supported by the guest");
1433 } else {
1434 error_propagate(errp, local_err);
1435 }
1436 }
1437
/*
 * Ask guest_suspend() for SUSPEND_MODE_DISK; any failure is reported
 * through @errp.
 */
void qmp_guest_suspend_disk(Error **errp)
{
    guest_suspend(SUSPEND_MODE_DISK, errp);
}
1442
/*
 * Ask guest_suspend() for SUSPEND_MODE_RAM; any failure is reported
 * through @errp.
 */
void qmp_guest_suspend_ram(Error **errp)
{
    guest_suspend(SUSPEND_MODE_RAM, errp);
}
1447
/*
 * Ask guest_suspend() for SUSPEND_MODE_HYBRID; any failure is reported
 * through @errp.
 */
void qmp_guest_suspend_hybrid(Error **errp)
{
    guest_suspend(SUSPEND_MODE_HYBRID, errp);
}
1452
1453 /* Transfer online/offline status between @vcpu and the guest system.
1454 *
1455 * On input either @errp or *@errp must be NULL.
1456 *
1457 * In system-to-@vcpu direction, the following @vcpu fields are accessed:
1458 * - R: vcpu->logical_id
1459 * - W: vcpu->online
1460 * - W: vcpu->can_offline
1461 *
1462 * In @vcpu-to-system direction, the following @vcpu fields are accessed:
1463 * - R: vcpu->logical_id
1464 * - R: vcpu->online
1465 *
1466 * Written members remain unmodified on error.
1467 */
transfer_vcpu(GuestLogicalProcessor * vcpu,bool sys2vcpu,char * dirpath,Error ** errp)1468 static void transfer_vcpu(GuestLogicalProcessor *vcpu, bool sys2vcpu,
1469 char *dirpath, Error **errp)
1470 {
1471 int fd;
1472 int res;
1473 int dirfd;
1474 static const char fn[] = "online";
1475
1476 dirfd = open(dirpath, O_RDONLY | O_DIRECTORY);
1477 if (dirfd == -1) {
1478 error_setg_errno(errp, errno, "open(\"%s\")", dirpath);
1479 return;
1480 }
1481
1482 fd = openat(dirfd, fn, sys2vcpu ? O_RDONLY : O_RDWR);
1483 if (fd == -1) {
1484 if (errno != ENOENT) {
1485 error_setg_errno(errp, errno, "open(\"%s/%s\")", dirpath, fn);
1486 } else if (sys2vcpu) {
1487 vcpu->online = true;
1488 vcpu->can_offline = false;
1489 } else if (!vcpu->online) {
1490 error_setg(errp, "logical processor #%" PRId64 " can't be "
1491 "offlined", vcpu->logical_id);
1492 } /* otherwise pretend successful re-onlining */
1493 } else {
1494 unsigned char status;
1495
1496 res = pread(fd, &status, 1, 0);
1497 if (res == -1) {
1498 error_setg_errno(errp, errno, "pread(\"%s/%s\")", dirpath, fn);
1499 } else if (res == 0) {
1500 error_setg(errp, "pread(\"%s/%s\"): unexpected EOF", dirpath,
1501 fn);
1502 } else if (sys2vcpu) {
1503 vcpu->online = (status != '0');
1504 vcpu->can_offline = true;
1505 } else if (vcpu->online != (status != '0')) {
1506 status = '0' + vcpu->online;
1507 if (pwrite(fd, &status, 1, 0) == -1) {
1508 error_setg_errno(errp, errno, "pwrite(\"%s/%s\")", dirpath,
1509 fn);
1510 }
1511 } /* otherwise pretend successful re-(on|off)-lining */
1512
1513 res = close(fd);
1514 g_assert(res == 0);
1515 }
1516
1517 res = close(dirfd);
1518 g_assert(res == 0);
1519 }
1520
qmp_guest_get_vcpus(Error ** errp)1521 GuestLogicalProcessorList *qmp_guest_get_vcpus(Error **errp)
1522 {
1523 GuestLogicalProcessorList *head, **tail;
1524 const char *cpu_dir = "/sys/devices/system/cpu";
1525 const gchar *line;
1526 g_autoptr(GDir) cpu_gdir = NULL;
1527 Error *local_err = NULL;
1528
1529 head = NULL;
1530 tail = &head;
1531 cpu_gdir = g_dir_open(cpu_dir, 0, NULL);
1532
1533 if (cpu_gdir == NULL) {
1534 error_setg_errno(errp, errno, "failed to list entries: %s", cpu_dir);
1535 return NULL;
1536 }
1537
1538 while (local_err == NULL && (line = g_dir_read_name(cpu_gdir)) != NULL) {
1539 GuestLogicalProcessor *vcpu;
1540 int64_t id;
1541 if (sscanf(line, "cpu%" PRId64, &id)) {
1542 g_autofree char *path = g_strdup_printf("/sys/devices/system/cpu/"
1543 "cpu%" PRId64 "/", id);
1544 vcpu = g_malloc0(sizeof *vcpu);
1545 vcpu->logical_id = id;
1546 vcpu->has_can_offline = true; /* lolspeak ftw */
1547 transfer_vcpu(vcpu, true, path, &local_err);
1548 QAPI_LIST_APPEND(tail, vcpu);
1549 }
1550 }
1551
1552 if (local_err == NULL) {
1553 /* there's no guest with zero VCPUs */
1554 g_assert(head != NULL);
1555 return head;
1556 }
1557
1558 qapi_free_GuestLogicalProcessorList(head);
1559 error_propagate(errp, local_err);
1560 return NULL;
1561 }
1562
qmp_guest_set_vcpus(GuestLogicalProcessorList * vcpus,Error ** errp)1563 int64_t qmp_guest_set_vcpus(GuestLogicalProcessorList *vcpus, Error **errp)
1564 {
1565 int64_t processed;
1566 Error *local_err = NULL;
1567
1568 processed = 0;
1569 while (vcpus != NULL) {
1570 char *path = g_strdup_printf("/sys/devices/system/cpu/cpu%" PRId64 "/",
1571 vcpus->value->logical_id);
1572
1573 transfer_vcpu(vcpus->value, false, path, &local_err);
1574 g_free(path);
1575 if (local_err != NULL) {
1576 break;
1577 }
1578 ++processed;
1579 vcpus = vcpus->next;
1580 }
1581
1582 if (local_err != NULL) {
1583 if (processed == 0) {
1584 error_propagate(errp, local_err);
1585 } else {
1586 error_free(local_err);
1587 }
1588 }
1589
1590 return processed;
1591 }
1592
1593
ga_read_sysfs_file(int dirfd,const char * pathname,char * buf,int size,Error ** errp)1594 static void ga_read_sysfs_file(int dirfd, const char *pathname, char *buf,
1595 int size, Error **errp)
1596 {
1597 int fd;
1598 int res;
1599
1600 errno = 0;
1601 fd = openat(dirfd, pathname, O_RDONLY);
1602 if (fd == -1) {
1603 error_setg_errno(errp, errno, "open sysfs file \"%s\"", pathname);
1604 return;
1605 }
1606
1607 res = pread(fd, buf, size, 0);
1608 if (res == -1) {
1609 error_setg_errno(errp, errno, "pread sysfs file \"%s\"", pathname);
1610 } else if (res == 0) {
1611 error_setg(errp, "pread sysfs file \"%s\": unexpected EOF", pathname);
1612 }
1613 close(fd);
1614 }
1615
ga_write_sysfs_file(int dirfd,const char * pathname,const char * buf,int size,Error ** errp)1616 static void ga_write_sysfs_file(int dirfd, const char *pathname,
1617 const char *buf, int size, Error **errp)
1618 {
1619 int fd;
1620
1621 errno = 0;
1622 fd = openat(dirfd, pathname, O_WRONLY);
1623 if (fd == -1) {
1624 error_setg_errno(errp, errno, "open sysfs file \"%s\"", pathname);
1625 return;
1626 }
1627
1628 if (pwrite(fd, buf, size, 0) == -1) {
1629 error_setg_errno(errp, errno, "pwrite sysfs file \"%s\"", pathname);
1630 }
1631
1632 close(fd);
1633 }
1634
/* Transfer online/offline status between @mem_blk and the guest system.
 *
 * On input either @errp or *@errp must be NULL.
 *
 * In system-to-@mem_blk direction, the following @mem_blk fields are accessed:
 * - R: mem_blk->phys_index
 * - W: mem_blk->online
 * - W: mem_blk->can_offline
 *
 * In @mem_blk-to-system direction, the following @mem_blk fields are accessed:
 * - R: mem_blk->phys_index
 * - R: mem_blk->online
 * (mem_blk->can_offline is not consulted in this direction.)
 *
 * @result is used only in @mem_blk-to-system direction, where it must not
 * be NULL: the outcome is stored in result->response and, on the failure
 * paths, errno is stored in result->error_code. In that direction @errp is
 * set only for a NULL @result. In system-to-@mem_blk direction failures
 * are reported through @errp and @result is ignored.
 *
 * Written members remain unmodified on error.
 */
static void transfer_memory_block(GuestMemoryBlock *mem_blk, bool sys2memblk,
                                  GuestMemoryBlockResponse *result,
                                  Error **errp)
{
    char *dirpath;
    int dirfd;
    char *status;
    Error *local_err = NULL;

    if (!sys2memblk) {
        DIR *dp;

        if (!result) {
            error_setg(errp, "Internal error, 'result' should not be NULL");
            return;
        }
        errno = 0;
        dp = opendir("/sys/devices/system/memory/");
        /*
         * Without a 'memory' directory in sysfs the guest is taken not to
         * support onlining/offlining of memory blocks.
         * NOTE(review): for any other opendir() failure result->response is
         * left as the caller initialized it; only the error code is set at
         * out1 - confirm this is intended.
         */
        if (!dp) {
            if (errno == ENOENT) {
                result->response =
                    GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_NOT_SUPPORTED;
            }
            goto out1;
        }
        closedir(dp);
    }

    /* per-block directory: .../memory/memory<phys_index>/ */
    dirpath = g_strdup_printf("/sys/devices/system/memory/memory%" PRId64 "/",
                              mem_blk->phys_index);
    dirfd = open(dirpath, O_RDONLY | O_DIRECTORY);
    if (dirfd == -1) {
        if (sys2memblk) {
            error_setg_errno(errp, errno, "open(\"%s\")", dirpath);
        } else {
            if (errno == ENOENT) {
                result->response = GUEST_MEMORY_BLOCK_RESPONSE_TYPE_NOT_FOUND;
            } else {
                result->response =
                    GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_FAILED;
            }
        }
        g_free(dirpath);
        goto out1;
    }
    g_free(dirpath);

    /* zero-filled buffer; only its first 6 bytes are compared below */
    status = g_malloc0(10);
    ga_read_sysfs_file(dirfd, "state", status, 10, &local_err);
    if (local_err) {
        /*
         * A missing 'state' file is tolerated (the original comment
         * attributes it to older kernels): the block is reported as online
         * and not offlinable, and only a request to offline it is refused.
         */
        if (errno == ENOENT) {
            error_free(local_err);
            if (sys2memblk) {
                mem_blk->online = true;
                mem_blk->can_offline = false;
            } else if (!mem_blk->online) {
                result->response =
                    GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_NOT_SUPPORTED;
            }
        } else {
            if (sys2memblk) {
                error_propagate(errp, local_err);
            } else {
                error_free(local_err);
                result->response =
                    GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_FAILED;
            }
        }
        goto out2;
    }

    if (sys2memblk) {
        char removable = '0';

        mem_blk->online = (strncmp(status, "online", 6) == 0);

        ga_read_sysfs_file(dirfd, "removable", &removable, 1, &local_err);
        if (local_err) {
            /* if no 'removable' file, it doesn't support offline mem blk */
            if (errno == ENOENT) {
                error_free(local_err);
                mem_blk->can_offline = false;
            } else {
                error_propagate(errp, local_err);
            }
        } else {
            mem_blk->can_offline = (removable != '0');
        }
    } else {
        /* write to sysfs only when the requested state differs */
        if (mem_blk->online != (strncmp(status, "online", 6) == 0)) {
            const char *new_state = mem_blk->online ? "online" : "offline";

            ga_write_sysfs_file(dirfd, "state", new_state, strlen(new_state),
                                &local_err);
            if (local_err) {
                error_free(local_err);
                result->response =
                    GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_FAILED;
                goto out2;
            }

            result->response = GUEST_MEMORY_BLOCK_RESPONSE_TYPE_SUCCESS;
            result->has_error_code = false;
        } /* otherwise pretend successful re-(on|off)-lining */
    }
    g_free(status);
    close(dirfd);
    return;

out2:
    g_free(status);
    close(dirfd);
out1:
    /*
     * NOTE(review): errno is sampled here, after g_free()/close() on the
     * out2 path; this relies on those calls leaving errno untouched.
     */
    if (!sys2memblk) {
        result->has_error_code = true;
        result->error_code = errno;
    }
}
1773
qmp_guest_get_memory_blocks(Error ** errp)1774 GuestMemoryBlockList *qmp_guest_get_memory_blocks(Error **errp)
1775 {
1776 GuestMemoryBlockList *head, **tail;
1777 Error *local_err = NULL;
1778 struct dirent *de;
1779 DIR *dp;
1780
1781 head = NULL;
1782 tail = &head;
1783
1784 dp = opendir("/sys/devices/system/memory/");
1785 if (!dp) {
1786 /* it's ok if this happens to be a system that doesn't expose
1787 * memory blocks via sysfs, but otherwise we should report
1788 * an error
1789 */
1790 if (errno != ENOENT) {
1791 error_setg_errno(errp, errno, "Can't open directory"
1792 "\"/sys/devices/system/memory/\"");
1793 }
1794 return NULL;
1795 }
1796
1797 /* Note: the phys_index of memory block may be discontinuous,
1798 * this is because a memblk is the unit of the Sparse Memory design, which
1799 * allows discontinuous memory ranges (ex. NUMA), so here we should
1800 * traverse the memory block directory.
1801 */
1802 while ((de = readdir(dp)) != NULL) {
1803 GuestMemoryBlock *mem_blk;
1804
1805 if ((strncmp(de->d_name, "memory", 6) != 0) ||
1806 !(de->d_type & DT_DIR)) {
1807 continue;
1808 }
1809
1810 mem_blk = g_malloc0(sizeof *mem_blk);
1811 /* The d_name is "memoryXXX", phys_index is block id, same as XXX */
1812 mem_blk->phys_index = strtoul(&de->d_name[6], NULL, 10);
1813 mem_blk->has_can_offline = true; /* lolspeak ftw */
1814 transfer_memory_block(mem_blk, true, NULL, &local_err);
1815 if (local_err) {
1816 break;
1817 }
1818
1819 QAPI_LIST_APPEND(tail, mem_blk);
1820 }
1821
1822 closedir(dp);
1823 if (local_err == NULL) {
1824 /* there's no guest with zero memory blocks */
1825 if (head == NULL) {
1826 error_setg(errp, "guest reported zero memory blocks!");
1827 }
1828 return head;
1829 }
1830
1831 qapi_free_GuestMemoryBlockList(head);
1832 error_propagate(errp, local_err);
1833 return NULL;
1834 }
1835
1836 GuestMemoryBlockResponseList *
qmp_guest_set_memory_blocks(GuestMemoryBlockList * mem_blks,Error ** errp)1837 qmp_guest_set_memory_blocks(GuestMemoryBlockList *mem_blks, Error **errp)
1838 {
1839 GuestMemoryBlockResponseList *head, **tail;
1840 Error *local_err = NULL;
1841
1842 head = NULL;
1843 tail = &head;
1844
1845 while (mem_blks != NULL) {
1846 GuestMemoryBlockResponse *result;
1847 GuestMemoryBlock *current_mem_blk = mem_blks->value;
1848
1849 result = g_malloc0(sizeof(*result));
1850 result->phys_index = current_mem_blk->phys_index;
1851 transfer_memory_block(current_mem_blk, false, result, &local_err);
1852 if (local_err) { /* should never happen */
1853 goto err;
1854 }
1855
1856 QAPI_LIST_APPEND(tail, result);
1857 mem_blks = mem_blks->next;
1858 }
1859
1860 return head;
1861 err:
1862 qapi_free_GuestMemoryBlockResponseList(head);
1863 error_propagate(errp, local_err);
1864 return NULL;
1865 }
1866
qmp_guest_get_memory_block_info(Error ** errp)1867 GuestMemoryBlockInfo *qmp_guest_get_memory_block_info(Error **errp)
1868 {
1869 Error *local_err = NULL;
1870 char *dirpath;
1871 int dirfd;
1872 char *buf;
1873 GuestMemoryBlockInfo *info;
1874
1875 dirpath = g_strdup_printf("/sys/devices/system/memory/");
1876 dirfd = open(dirpath, O_RDONLY | O_DIRECTORY);
1877 if (dirfd == -1) {
1878 error_setg_errno(errp, errno, "open(\"%s\")", dirpath);
1879 g_free(dirpath);
1880 return NULL;
1881 }
1882 g_free(dirpath);
1883
1884 buf = g_malloc0(20);
1885 ga_read_sysfs_file(dirfd, "block_size_bytes", buf, 20, &local_err);
1886 close(dirfd);
1887 if (local_err) {
1888 g_free(buf);
1889 error_propagate(errp, local_err);
1890 return NULL;
1891 }
1892
1893 info = g_new0(GuestMemoryBlockInfo, 1);
1894 info->size = strtol(buf, NULL, 16); /* the unit is bytes */
1895
1896 g_free(buf);
1897
1898 return info;
1899 }
1900
1901 #define MAX_NAME_LEN 128
guest_get_diskstats(Error ** errp)1902 static GuestDiskStatsInfoList *guest_get_diskstats(Error **errp)
1903 {
1904 GuestDiskStatsInfoList *head = NULL, **tail = &head;
1905 const char *diskstats = "/proc/diskstats";
1906 FILE *fp;
1907 size_t n;
1908 char *line = NULL;
1909
1910 fp = fopen(diskstats, "r");
1911 if (fp == NULL) {
1912 error_setg_errno(errp, errno, "open(\"%s\")", diskstats);
1913 return NULL;
1914 }
1915
1916 while (getline(&line, &n, fp) != -1) {
1917 g_autofree GuestDiskStatsInfo *diskstatinfo = NULL;
1918 g_autofree GuestDiskStats *diskstat = NULL;
1919 char dev_name[MAX_NAME_LEN];
1920 unsigned int ios_pgr, tot_ticks, rq_ticks, wr_ticks, dc_ticks, fl_ticks;
1921 unsigned long rd_ios, rd_merges_or_rd_sec, rd_ticks_or_wr_sec, wr_ios;
1922 unsigned long wr_merges, rd_sec_or_wr_ios, wr_sec;
1923 unsigned long dc_ios, dc_merges, dc_sec, fl_ios;
1924 unsigned int major, minor;
1925 int i;
1926
1927 i = sscanf(line, "%u %u %s %lu %lu %lu"
1928 "%lu %lu %lu %lu %u %u %u %u"
1929 "%lu %lu %lu %u %lu %u",
1930 &major, &minor, dev_name,
1931 &rd_ios, &rd_merges_or_rd_sec, &rd_sec_or_wr_ios,
1932 &rd_ticks_or_wr_sec, &wr_ios, &wr_merges, &wr_sec,
1933 &wr_ticks, &ios_pgr, &tot_ticks, &rq_ticks,
1934 &dc_ios, &dc_merges, &dc_sec, &dc_ticks,
1935 &fl_ios, &fl_ticks);
1936
1937 if (i < 7) {
1938 continue;
1939 }
1940
1941 diskstatinfo = g_new0(GuestDiskStatsInfo, 1);
1942 diskstatinfo->name = g_strdup(dev_name);
1943 diskstatinfo->major = major;
1944 diskstatinfo->minor = minor;
1945
1946 diskstat = g_new0(GuestDiskStats, 1);
1947 if (i == 7) {
1948 diskstat->has_read_ios = true;
1949 diskstat->read_ios = rd_ios;
1950 diskstat->has_read_sectors = true;
1951 diskstat->read_sectors = rd_merges_or_rd_sec;
1952 diskstat->has_write_ios = true;
1953 diskstat->write_ios = rd_sec_or_wr_ios;
1954 diskstat->has_write_sectors = true;
1955 diskstat->write_sectors = rd_ticks_or_wr_sec;
1956 }
1957 if (i >= 14) {
1958 diskstat->has_read_ios = true;
1959 diskstat->read_ios = rd_ios;
1960 diskstat->has_read_sectors = true;
1961 diskstat->read_sectors = rd_sec_or_wr_ios;
1962 diskstat->has_read_merges = true;
1963 diskstat->read_merges = rd_merges_or_rd_sec;
1964 diskstat->has_read_ticks = true;
1965 diskstat->read_ticks = rd_ticks_or_wr_sec;
1966 diskstat->has_write_ios = true;
1967 diskstat->write_ios = wr_ios;
1968 diskstat->has_write_sectors = true;
1969 diskstat->write_sectors = wr_sec;
1970 diskstat->has_write_merges = true;
1971 diskstat->write_merges = wr_merges;
1972 diskstat->has_write_ticks = true;
1973 diskstat->write_ticks = wr_ticks;
1974 diskstat->has_ios_pgr = true;
1975 diskstat->ios_pgr = ios_pgr;
1976 diskstat->has_total_ticks = true;
1977 diskstat->total_ticks = tot_ticks;
1978 diskstat->has_weight_ticks = true;
1979 diskstat->weight_ticks = rq_ticks;
1980 }
1981 if (i >= 18) {
1982 diskstat->has_discard_ios = true;
1983 diskstat->discard_ios = dc_ios;
1984 diskstat->has_discard_merges = true;
1985 diskstat->discard_merges = dc_merges;
1986 diskstat->has_discard_sectors = true;
1987 diskstat->discard_sectors = dc_sec;
1988 diskstat->has_discard_ticks = true;
1989 diskstat->discard_ticks = dc_ticks;
1990 }
1991 if (i >= 20) {
1992 diskstat->has_flush_ios = true;
1993 diskstat->flush_ios = fl_ios;
1994 diskstat->has_flush_ticks = true;
1995 diskstat->flush_ticks = fl_ticks;
1996 }
1997
1998 diskstatinfo->stats = g_steal_pointer(&diskstat);
1999 QAPI_LIST_APPEND(tail, diskstatinfo);
2000 diskstatinfo = NULL;
2001 }
2002 free(line);
2003 fclose(fp);
2004 return head;
2005 }
2006
qmp_guest_get_diskstats(Error ** errp)2007 GuestDiskStatsInfoList *qmp_guest_get_diskstats(Error **errp)
2008 {
2009 return guest_get_diskstats(errp);
2010 }
2011
qmp_guest_get_cpustats(Error ** errp)2012 GuestCpuStatsList *qmp_guest_get_cpustats(Error **errp)
2013 {
2014 GuestCpuStatsList *head = NULL, **tail = &head;
2015 const char *cpustats = "/proc/stat";
2016 int clk_tck = sysconf(_SC_CLK_TCK);
2017 FILE *fp;
2018 size_t n;
2019 char *line = NULL;
2020
2021 fp = fopen(cpustats, "r");
2022 if (fp == NULL) {
2023 error_setg_errno(errp, errno, "open(\"%s\")", cpustats);
2024 return NULL;
2025 }
2026
2027 while (getline(&line, &n, fp) != -1) {
2028 GuestCpuStats *cpustat = NULL;
2029 GuestLinuxCpuStats *linuxcpustat;
2030 int i;
2031 unsigned long user, system, idle, iowait, irq, softirq, steal, guest;
2032 unsigned long nice, guest_nice;
2033 char name[64];
2034
2035 i = sscanf(line, "%s %lu %lu %lu %lu %lu %lu %lu %lu %lu %lu",
2036 name, &user, &nice, &system, &idle, &iowait, &irq, &softirq,
2037 &steal, &guest, &guest_nice);
2038
2039 /* drop "cpu 1 2 3 ...", get "cpuX 1 2 3 ..." only */
2040 if ((i == EOF) || strncmp(name, "cpu", 3) || (name[3] == '\0')) {
2041 continue;
2042 }
2043
2044 if (i < 5) {
2045 slog("Parsing cpu stat from %s failed, see \"man proc\"", cpustats);
2046 break;
2047 }
2048
2049 cpustat = g_new0(GuestCpuStats, 1);
2050 cpustat->type = GUEST_CPU_STATS_TYPE_LINUX;
2051
2052 linuxcpustat = &cpustat->u.q_linux;
2053 linuxcpustat->cpu = atoi(&name[3]);
2054 linuxcpustat->user = user * 1000 / clk_tck;
2055 linuxcpustat->nice = nice * 1000 / clk_tck;
2056 linuxcpustat->system = system * 1000 / clk_tck;
2057 linuxcpustat->idle = idle * 1000 / clk_tck;
2058
2059 if (i > 5) {
2060 linuxcpustat->has_iowait = true;
2061 linuxcpustat->iowait = iowait * 1000 / clk_tck;
2062 }
2063
2064 if (i > 6) {
2065 linuxcpustat->has_irq = true;
2066 linuxcpustat->irq = irq * 1000 / clk_tck;
2067 linuxcpustat->has_softirq = true;
2068 linuxcpustat->softirq = softirq * 1000 / clk_tck;
2069 }
2070
2071 if (i > 8) {
2072 linuxcpustat->has_steal = true;
2073 linuxcpustat->steal = steal * 1000 / clk_tck;
2074 }
2075
2076 if (i > 9) {
2077 linuxcpustat->has_guest = true;
2078 linuxcpustat->guest = guest * 1000 / clk_tck;
2079 }
2080
2081 if (i > 10) {
2082 linuxcpustat->has_guest = true;
2083 linuxcpustat->guest = guest * 1000 / clk_tck;
2084 linuxcpustat->has_guestnice = true;
2085 linuxcpustat->guestnice = guest_nice * 1000 / clk_tck;
2086 }
2087
2088 QAPI_LIST_APPEND(tail, cpustat);
2089 }
2090
2091 free(line);
2092 fclose(fp);
2093 return head;
2094 }
2095
/*
 * Convert a raw address into a newly allocated printable string.
 *
 * @is_ipv6 != 0: @hex_value points to a string of hexadecimal digits;
 *   16 byte values are scanned from it, two digits at a time, and
 *   formatted with inet_ntop(). Returns NULL if a byte cannot be scanned.
 * @is_ipv6 == 0: @hex_value points to an unsigned int, which is printed
 *   as a dotted quad starting with its least significant byte.
 *
 * The caller frees the returned string.
 */
static char *hex_to_ip_address(const void *hex_value, int is_ipv6)
{
    char text[INET6_ADDRSTRLEN];
    struct in6_addr addr6;
    const char *digits;
    unsigned int raw;
    int idx;

    if (!is_ipv6) {
        raw = *(const unsigned int *)hex_value;

        return g_strdup_printf("%u.%u.%u.%u",
                               raw & 0xFF,
                               (raw >> 8) & 0xFF,
                               (raw >> 16) & 0xFF,
                               (raw >> 24) & 0xFF);
    }

    digits = (const char *)hex_value;
    for (idx = 0; idx < 16; idx++) {
        /* two hex digits per address byte */
        if (sscanf(&digits[idx * 2], "%02hhx", &addr6.s6_addr[idx]) != 1) {
            return NULL;
        }
    }
    inet_ntop(AF_INET6, &addr6, text, INET6_ADDRSTRLEN);

    return g_strdup(text);
}
2122
qmp_guest_network_get_route(Error ** errp)2123 GuestNetworkRouteList *qmp_guest_network_get_route(Error **errp)
2124 {
2125 GuestNetworkRouteList *head = NULL, **tail = &head;
2126 const char *route_files[] = {"/proc/net/route", "/proc/net/ipv6_route"};
2127 FILE *fp;
2128 size_t n = 0;
2129 char *line = NULL;
2130 int firstLine;
2131 int is_ipv6;
2132 int i;
2133 char iface[IFNAMSIZ];
2134
2135 for (i = 0; i < 2; i++) {
2136 firstLine = 1;
2137 is_ipv6 = (i == 1);
2138 fp = fopen(route_files[i], "r");
2139 if (fp == NULL) {
2140 error_setg_errno(errp, errno, "open(\"%s\")", route_files[i]);
2141 continue;
2142 }
2143
2144 while (getline(&line, &n, fp) != -1) {
2145 if (firstLine && !is_ipv6) {
2146 firstLine = 0;
2147 continue;
2148 }
2149 g_autoptr(GuestNetworkRoute) route = g_new0(GuestNetworkRoute, 1);
2150
2151 if (is_ipv6) {
2152 char destination[33], source[33], next_hop[33];
2153 int des_prefixlen, src_prefixlen, metric, refcnt, use, flags;
2154 if (sscanf(line, "%32s %x %32s %x %32s %x %x %x %x %s",
2155 destination, &des_prefixlen, source,
2156 &src_prefixlen, next_hop, &metric, &refcnt,
2157 &use, &flags, iface) != 10) {
2158 continue;
2159 }
2160
2161 route->destination = hex_to_ip_address(destination, 1);
2162 if (route->destination == NULL) {
2163 continue;
2164 }
2165 route->iface = g_strdup(iface);
2166 route->source = hex_to_ip_address(source, 1);
2167 route->nexthop = hex_to_ip_address(next_hop, 1);
2168 route->desprefixlen = g_strdup_printf("%d", des_prefixlen);
2169 route->srcprefixlen = g_strdup_printf("%d", src_prefixlen);
2170 route->metric = metric;
2171 route->has_flags = true;
2172 route->flags = flags;
2173 route->has_refcnt = true;
2174 route->refcnt = refcnt;
2175 route->has_use = true;
2176 route->use = use;
2177 route->version = 6;
2178 } else {
2179 unsigned int destination, gateway, mask, flags;
2180 int refcnt, use, metric, mtu, window, irtt;
2181 if (sscanf(line, "%s %X %X %x %d %d %d %X %d %d %d",
2182 iface, &destination, &gateway, &flags, &refcnt,
2183 &use, &metric, &mask, &mtu, &window, &irtt) != 11) {
2184 continue;
2185 }
2186
2187 route->destination = hex_to_ip_address(&destination, 0);
2188 if (route->destination == NULL) {
2189 continue;
2190 }
2191 route->iface = g_strdup(iface);
2192 route->gateway = hex_to_ip_address(&gateway, 0);
2193 route->mask = hex_to_ip_address(&mask, 0);
2194 route->metric = metric;
2195 route->has_flags = true;
2196 route->flags = flags;
2197 route->has_refcnt = true;
2198 route->refcnt = refcnt;
2199 route->has_use = true;
2200 route->use = use;
2201 route->has_mtu = true;
2202 route->mtu = mtu;
2203 route->has_window = true;
2204 route->window = window;
2205 route->has_irtt = true;
2206 route->irtt = irtt;
2207 route->version = 4;
2208 }
2209
2210 QAPI_LIST_APPEND(tail, route);
2211 route = NULL;
2212 }
2213
2214 fclose(fp);
2215 }
2216
2217 free(line);
2218 return head;
2219 }
2220