]> git.proxmox.com Git - mirror_qemu.git/blob - qga/commands-posix.c
hw/fsi: Introduce IBM's fsi-slave model
[mirror_qemu.git] / qga / commands-posix.c
1 /*
2 * QEMU Guest Agent POSIX-specific command implementations
3 *
4 * Copyright IBM Corp. 2011
5 *
6 * Authors:
7 * Michael Roth <mdroth@linux.vnet.ibm.com>
8 * Michal Privoznik <mprivozn@redhat.com>
9 *
10 * This work is licensed under the terms of the GNU GPL, version 2 or later.
11 * See the COPYING file in the top-level directory.
12 */
13
14 #include "qemu/osdep.h"
15 #include <sys/ioctl.h>
16 #include <sys/utsname.h>
17 #include <sys/wait.h>
18 #include <dirent.h>
19 #include "qga-qapi-commands.h"
20 #include "qapi/error.h"
21 #include "qapi/qmp/qerror.h"
22 #include "qemu/host-utils.h"
23 #include "qemu/sockets.h"
24 #include "qemu/base64.h"
25 #include "qemu/cutils.h"
26 #include "commands-common.h"
27 #include "block/nvme.h"
28 #include "cutils.h"
29
30 #ifdef HAVE_UTMPX
31 #include <utmpx.h>
32 #endif
33
34 #if defined(__linux__)
35 #include <mntent.h>
36 #include <sys/statvfs.h>
37 #include <linux/nvme_ioctl.h>
38
39 #ifdef CONFIG_LIBUDEV
40 #include <libudev.h>
41 #endif
42 #endif
43
44 #ifdef HAVE_GETIFADDRS
45 #include <arpa/inet.h>
46 #include <sys/socket.h>
47 #include <net/if.h>
48 #if defined(__NetBSD__) || defined(__OpenBSD__) || defined(CONFIG_SOLARIS)
49 #include <net/if_arp.h>
50 #include <netinet/if_ether.h>
51 #if !defined(ETHER_ADDR_LEN) && defined(ETHERADDRL)
52 #define ETHER_ADDR_LEN ETHERADDRL
53 #endif
54 #else
55 #include <net/ethernet.h>
56 #endif
57 #ifdef CONFIG_SOLARIS
58 #include <sys/sockio.h>
59 #endif
60 #endif
61
62 static void ga_wait_child(pid_t pid, int *status, Error **errp)
63 {
64 pid_t rpid;
65
66 *status = 0;
67
68 rpid = RETRY_ON_EINTR(waitpid(pid, status, 0));
69
70 if (rpid == -1) {
71 error_setg_errno(errp, errno, "failed to wait for child (pid: %d)",
72 pid);
73 return;
74 }
75
76 g_assert(rpid == pid);
77 }
78
79 void qmp_guest_shutdown(const char *mode, Error **errp)
80 {
81 const char *shutdown_flag;
82 Error *local_err = NULL;
83 pid_t pid;
84 int status;
85
86 #ifdef CONFIG_SOLARIS
87 const char *powerdown_flag = "-i5";
88 const char *halt_flag = "-i0";
89 const char *reboot_flag = "-i6";
90 #elif defined(CONFIG_BSD)
91 const char *powerdown_flag = "-p";
92 const char *halt_flag = "-h";
93 const char *reboot_flag = "-r";
94 #else
95 const char *powerdown_flag = "-P";
96 const char *halt_flag = "-H";
97 const char *reboot_flag = "-r";
98 #endif
99
100 slog("guest-shutdown called, mode: %s", mode);
101 if (!mode || strcmp(mode, "powerdown") == 0) {
102 shutdown_flag = powerdown_flag;
103 } else if (strcmp(mode, "halt") == 0) {
104 shutdown_flag = halt_flag;
105 } else if (strcmp(mode, "reboot") == 0) {
106 shutdown_flag = reboot_flag;
107 } else {
108 error_setg(errp,
109 "mode is invalid (valid values are: halt|powerdown|reboot");
110 return;
111 }
112
113 pid = fork();
114 if (pid == 0) {
115 /* child, start the shutdown */
116 setsid();
117 reopen_fd_to_null(0);
118 reopen_fd_to_null(1);
119 reopen_fd_to_null(2);
120
121 #ifdef CONFIG_SOLARIS
122 execl("/sbin/shutdown", "shutdown", shutdown_flag, "-g0", "-y",
123 "hypervisor initiated shutdown", (char *)NULL);
124 #elif defined(CONFIG_BSD)
125 execl("/sbin/shutdown", "shutdown", shutdown_flag, "+0",
126 "hypervisor initiated shutdown", (char *)NULL);
127 #else
128 execl("/sbin/shutdown", "shutdown", "-h", shutdown_flag, "+0",
129 "hypervisor initiated shutdown", (char *)NULL);
130 #endif
131 _exit(EXIT_FAILURE);
132 } else if (pid < 0) {
133 error_setg_errno(errp, errno, "failed to create child process");
134 return;
135 }
136
137 ga_wait_child(pid, &status, &local_err);
138 if (local_err) {
139 error_propagate(errp, local_err);
140 return;
141 }
142
143 if (!WIFEXITED(status)) {
144 error_setg(errp, "child process has terminated abnormally");
145 return;
146 }
147
148 if (WEXITSTATUS(status)) {
149 error_setg(errp, "child process has failed to shutdown");
150 return;
151 }
152
153 /* succeeded */
154 }
155
156 void qmp_guest_set_time(bool has_time, int64_t time_ns, Error **errp)
157 {
158 int ret;
159 int status;
160 pid_t pid;
161 Error *local_err = NULL;
162 struct timeval tv;
163 static const char hwclock_path[] = "/sbin/hwclock";
164 static int hwclock_available = -1;
165
166 if (hwclock_available < 0) {
167 hwclock_available = (access(hwclock_path, X_OK) == 0);
168 }
169
170 if (!hwclock_available) {
171 error_setg(errp, QERR_UNSUPPORTED);
172 return;
173 }
174
175 /* If user has passed a time, validate and set it. */
176 if (has_time) {
177 GDate date = { 0, };
178
179 /* year-2038 will overflow in case time_t is 32bit */
180 if (time_ns / 1000000000 != (time_t)(time_ns / 1000000000)) {
181 error_setg(errp, "Time %" PRId64 " is too large", time_ns);
182 return;
183 }
184
185 tv.tv_sec = time_ns / 1000000000;
186 tv.tv_usec = (time_ns % 1000000000) / 1000;
187 g_date_set_time_t(&date, tv.tv_sec);
188 if (date.year < 1970 || date.year >= 2070) {
189 error_setg_errno(errp, errno, "Invalid time");
190 return;
191 }
192
193 ret = settimeofday(&tv, NULL);
194 if (ret < 0) {
195 error_setg_errno(errp, errno, "Failed to set time to guest");
196 return;
197 }
198 }
199
200 /* Now, if user has passed a time to set and the system time is set, we
201 * just need to synchronize the hardware clock. However, if no time was
202 * passed, user is requesting the opposite: set the system time from the
203 * hardware clock (RTC). */
204 pid = fork();
205 if (pid == 0) {
206 setsid();
207 reopen_fd_to_null(0);
208 reopen_fd_to_null(1);
209 reopen_fd_to_null(2);
210
211 /* Use '/sbin/hwclock -w' to set RTC from the system time,
212 * or '/sbin/hwclock -s' to set the system time from RTC. */
213 execl(hwclock_path, "hwclock", has_time ? "-w" : "-s", NULL);
214 _exit(EXIT_FAILURE);
215 } else if (pid < 0) {
216 error_setg_errno(errp, errno, "failed to create child process");
217 return;
218 }
219
220 ga_wait_child(pid, &status, &local_err);
221 if (local_err) {
222 error_propagate(errp, local_err);
223 return;
224 }
225
226 if (!WIFEXITED(status)) {
227 error_setg(errp, "child process has terminated abnormally");
228 return;
229 }
230
231 if (WEXITSTATUS(status)) {
232 error_setg(errp, "hwclock failed to set hardware clock to system time");
233 return;
234 }
235 }
236
/*
 * Direction of the last stdio operation on a guest file handle. The file
 * I/O commands consult it to flush or reposition the stream when switching
 * between writing and reading.
 */
typedef enum {
    RW_STATE_NEW = 0,       /* no pending read or write on the stream */
    RW_STATE_READING = 1,   /* last operation was a read */
    RW_STATE_WRITING = 2,   /* last operation was a write */
} RwState;
242
243 struct GuestFileHandle {
244 uint64_t id;
245 FILE *fh;
246 RwState state;
247 QTAILQ_ENTRY(GuestFileHandle) next;
248 };
249
250 static struct {
251 QTAILQ_HEAD(, GuestFileHandle) filehandles;
252 } guest_file_state = {
253 .filehandles = QTAILQ_HEAD_INITIALIZER(guest_file_state.filehandles),
254 };
255
256 static int64_t guest_file_handle_add(FILE *fh, Error **errp)
257 {
258 GuestFileHandle *gfh;
259 int64_t handle;
260
261 handle = ga_get_fd_handle(ga_state, errp);
262 if (handle < 0) {
263 return -1;
264 }
265
266 gfh = g_new0(GuestFileHandle, 1);
267 gfh->id = handle;
268 gfh->fh = fh;
269 QTAILQ_INSERT_TAIL(&guest_file_state.filehandles, gfh, next);
270
271 return handle;
272 }
273
274 GuestFileHandle *guest_file_handle_find(int64_t id, Error **errp)
275 {
276 GuestFileHandle *gfh;
277
278 QTAILQ_FOREACH(gfh, &guest_file_state.filehandles, next)
279 {
280 if (gfh->id == id) {
281 return gfh;
282 }
283 }
284
285 error_setg(errp, "handle '%" PRId64 "' has not been found", id);
286 return NULL;
287 }
288
typedef const char * const ccpc;

/* platforms without a text/binary distinction do not define O_BINARY */
#ifndef O_BINARY
#define O_BINARY 0
#endif

/*
 * Mapping from fopen()-style mode strings to open() flags. Each entry
 * lists the accepted spellings (NULL-terminated) and the flags they share.
 *
 * http://pubs.opengroup.org/onlinepubs/9699919799/functions/fopen.html
 */
static const struct {
    ccpc *forms;
    int oflag_base;
} guest_file_open_modes[] = {
    { .forms = (ccpc[]){ "r", NULL },
      .oflag_base = O_RDONLY },
    { .forms = (ccpc[]){ "rb", NULL },
      .oflag_base = O_RDONLY | O_BINARY },
    { .forms = (ccpc[]){ "w", NULL },
      .oflag_base = O_WRONLY | O_CREAT | O_TRUNC },
    { .forms = (ccpc[]){ "wb", NULL },
      .oflag_base = O_WRONLY | O_CREAT | O_TRUNC | O_BINARY },
    { .forms = (ccpc[]){ "a", NULL },
      .oflag_base = O_WRONLY | O_CREAT | O_APPEND },
    { .forms = (ccpc[]){ "ab", NULL },
      .oflag_base = O_WRONLY | O_CREAT | O_APPEND | O_BINARY },
    { .forms = (ccpc[]){ "r+", NULL },
      .oflag_base = O_RDWR },
    { .forms = (ccpc[]){ "rb+", "r+b", NULL },
      .oflag_base = O_RDWR | O_BINARY },
    { .forms = (ccpc[]){ "w+", NULL },
      .oflag_base = O_RDWR | O_CREAT | O_TRUNC },
    { .forms = (ccpc[]){ "wb+", "w+b", NULL },
      .oflag_base = O_RDWR | O_CREAT | O_TRUNC | O_BINARY },
    { .forms = (ccpc[]){ "a+", NULL },
      .oflag_base = O_RDWR | O_CREAT | O_APPEND },
    { .forms = (ccpc[]){ "ab+", "a+b", NULL },
      .oflag_base = O_RDWR | O_CREAT | O_APPEND | O_BINARY }
};
313
314 static int
315 find_open_flag(const char *mode_str, Error **errp)
316 {
317 unsigned mode;
318
319 for (mode = 0; mode < ARRAY_SIZE(guest_file_open_modes); ++mode) {
320 ccpc *form;
321
322 form = guest_file_open_modes[mode].forms;
323 while (*form != NULL && strcmp(*form, mode_str) != 0) {
324 ++form;
325 }
326 if (*form != NULL) {
327 break;
328 }
329 }
330
331 if (mode == ARRAY_SIZE(guest_file_open_modes)) {
332 error_setg(errp, "invalid file open mode '%s'", mode_str);
333 return -1;
334 }
335 return guest_file_open_modes[mode].oflag_base | O_NOCTTY | O_NONBLOCK;
336 }
337
/* Permission bits for newly created files: read and write for everyone. */
#define DEFAULT_NEW_FILE_MODE (S_IRUSR | S_IRGRP | S_IROTH | \
                               S_IWUSR | S_IWGRP | S_IWOTH)
341
342 static FILE *
343 safe_open_or_create(const char *path, const char *mode, Error **errp)
344 {
345 int oflag;
346 int fd = -1;
347 FILE *f = NULL;
348
349 oflag = find_open_flag(mode, errp);
350 if (oflag < 0) {
351 goto end;
352 }
353
354 /* If the caller wants / allows creation of a new file, we implement it
355 * with a two step process: open() + (open() / fchmod()).
356 *
357 * First we insist on creating the file exclusively as a new file. If
358 * that succeeds, we're free to set any file-mode bits on it. (The
359 * motivation is that we want to set those file-mode bits independently
360 * of the current umask.)
361 *
362 * If the exclusive creation fails because the file already exists
363 * (EEXIST is not possible for any other reason), we just attempt to
364 * open the file, but in this case we won't be allowed to change the
365 * file-mode bits on the preexistent file.
366 *
367 * The pathname should never disappear between the two open()s in
368 * practice. If it happens, then someone very likely tried to race us.
369 * In this case just go ahead and report the ENOENT from the second
370 * open() to the caller.
371 *
372 * If the caller wants to open a preexistent file, then the first
373 * open() is decisive and its third argument is ignored, and the second
374 * open() and the fchmod() are never called.
375 */
376 fd = qga_open_cloexec(path, oflag | ((oflag & O_CREAT) ? O_EXCL : 0), 0);
377 if (fd == -1 && errno == EEXIST) {
378 oflag &= ~(unsigned)O_CREAT;
379 fd = qga_open_cloexec(path, oflag, 0);
380 }
381 if (fd == -1) {
382 error_setg_errno(errp, errno,
383 "failed to open file '%s' (mode: '%s')",
384 path, mode);
385 goto end;
386 }
387
388 if ((oflag & O_CREAT) && fchmod(fd, DEFAULT_NEW_FILE_MODE) == -1) {
389 error_setg_errno(errp, errno, "failed to set permission "
390 "0%03o on new file '%s' (mode: '%s')",
391 (unsigned)DEFAULT_NEW_FILE_MODE, path, mode);
392 goto end;
393 }
394
395 f = fdopen(fd, mode);
396 if (f == NULL) {
397 error_setg_errno(errp, errno, "failed to associate stdio stream with "
398 "file descriptor %d, file '%s' (mode: '%s')",
399 fd, path, mode);
400 }
401
402 end:
403 if (f == NULL && fd != -1) {
404 close(fd);
405 if (oflag & O_CREAT) {
406 unlink(path);
407 }
408 }
409 return f;
410 }
411
412 int64_t qmp_guest_file_open(const char *path, const char *mode,
413 Error **errp)
414 {
415 FILE *fh;
416 Error *local_err = NULL;
417 int64_t handle;
418
419 if (!mode) {
420 mode = "r";
421 }
422 slog("guest-file-open called, filepath: %s, mode: %s", path, mode);
423 fh = safe_open_or_create(path, mode, &local_err);
424 if (local_err != NULL) {
425 error_propagate(errp, local_err);
426 return -1;
427 }
428
429 /* set fd non-blocking to avoid common use cases (like reading from a
430 * named pipe) from hanging the agent
431 */
432 if (!g_unix_set_fd_nonblocking(fileno(fh), true, NULL)) {
433 fclose(fh);
434 error_setg_errno(errp, errno, "Failed to set FD nonblocking");
435 return -1;
436 }
437
438 handle = guest_file_handle_add(fh, errp);
439 if (handle < 0) {
440 fclose(fh);
441 return -1;
442 }
443
444 slog("guest-file-open, handle: %" PRId64, handle);
445 return handle;
446 }
447
448 void qmp_guest_file_close(int64_t handle, Error **errp)
449 {
450 GuestFileHandle *gfh = guest_file_handle_find(handle, errp);
451 int ret;
452
453 slog("guest-file-close called, handle: %" PRId64, handle);
454 if (!gfh) {
455 return;
456 }
457
458 ret = fclose(gfh->fh);
459 if (ret == EOF) {
460 error_setg_errno(errp, errno, "failed to close handle");
461 return;
462 }
463
464 QTAILQ_REMOVE(&guest_file_state.filehandles, gfh, next);
465 g_free(gfh);
466 }
467
468 GuestFileRead *guest_file_read_unsafe(GuestFileHandle *gfh,
469 int64_t count, Error **errp)
470 {
471 GuestFileRead *read_data = NULL;
472 guchar *buf;
473 FILE *fh = gfh->fh;
474 size_t read_count;
475
476 /* explicitly flush when switching from writing to reading */
477 if (gfh->state == RW_STATE_WRITING) {
478 int ret = fflush(fh);
479 if (ret == EOF) {
480 error_setg_errno(errp, errno, "failed to flush file");
481 return NULL;
482 }
483 gfh->state = RW_STATE_NEW;
484 }
485
486 buf = g_malloc0(count + 1);
487 read_count = fread(buf, 1, count, fh);
488 if (ferror(fh)) {
489 error_setg_errno(errp, errno, "failed to read file");
490 } else {
491 buf[read_count] = 0;
492 read_data = g_new0(GuestFileRead, 1);
493 read_data->count = read_count;
494 read_data->eof = feof(fh);
495 if (read_count) {
496 read_data->buf_b64 = g_base64_encode(buf, read_count);
497 }
498 gfh->state = RW_STATE_READING;
499 }
500 g_free(buf);
501 clearerr(fh);
502
503 return read_data;
504 }
505
506 GuestFileWrite *qmp_guest_file_write(int64_t handle, const char *buf_b64,
507 bool has_count, int64_t count,
508 Error **errp)
509 {
510 GuestFileWrite *write_data = NULL;
511 guchar *buf;
512 gsize buf_len;
513 int write_count;
514 GuestFileHandle *gfh = guest_file_handle_find(handle, errp);
515 FILE *fh;
516
517 if (!gfh) {
518 return NULL;
519 }
520
521 fh = gfh->fh;
522
523 if (gfh->state == RW_STATE_READING) {
524 int ret = fseek(fh, 0, SEEK_CUR);
525 if (ret == -1) {
526 error_setg_errno(errp, errno, "failed to seek file");
527 return NULL;
528 }
529 gfh->state = RW_STATE_NEW;
530 }
531
532 buf = qbase64_decode(buf_b64, -1, &buf_len, errp);
533 if (!buf) {
534 return NULL;
535 }
536
537 if (!has_count) {
538 count = buf_len;
539 } else if (count < 0 || count > buf_len) {
540 error_setg(errp, "value '%" PRId64 "' is invalid for argument count",
541 count);
542 g_free(buf);
543 return NULL;
544 }
545
546 write_count = fwrite(buf, 1, count, fh);
547 if (ferror(fh)) {
548 error_setg_errno(errp, errno, "failed to write to file");
549 slog("guest-file-write failed, handle: %" PRId64, handle);
550 } else {
551 write_data = g_new0(GuestFileWrite, 1);
552 write_data->count = write_count;
553 write_data->eof = feof(fh);
554 gfh->state = RW_STATE_WRITING;
555 }
556 g_free(buf);
557 clearerr(fh);
558
559 return write_data;
560 }
561
562 struct GuestFileSeek *qmp_guest_file_seek(int64_t handle, int64_t offset,
563 GuestFileWhence *whence_code,
564 Error **errp)
565 {
566 GuestFileHandle *gfh = guest_file_handle_find(handle, errp);
567 GuestFileSeek *seek_data = NULL;
568 FILE *fh;
569 int ret;
570 int whence;
571 Error *err = NULL;
572
573 if (!gfh) {
574 return NULL;
575 }
576
577 /* We stupidly exposed 'whence':'int' in our qapi */
578 whence = ga_parse_whence(whence_code, &err);
579 if (err) {
580 error_propagate(errp, err);
581 return NULL;
582 }
583
584 fh = gfh->fh;
585 ret = fseek(fh, offset, whence);
586 if (ret == -1) {
587 error_setg_errno(errp, errno, "failed to seek file");
588 if (errno == ESPIPE) {
589 /* file is non-seekable, stdio shouldn't be buffering anyways */
590 gfh->state = RW_STATE_NEW;
591 }
592 } else {
593 seek_data = g_new0(GuestFileSeek, 1);
594 seek_data->position = ftell(fh);
595 seek_data->eof = feof(fh);
596 gfh->state = RW_STATE_NEW;
597 }
598 clearerr(fh);
599
600 return seek_data;
601 }
602
603 void qmp_guest_file_flush(int64_t handle, Error **errp)
604 {
605 GuestFileHandle *gfh = guest_file_handle_find(handle, errp);
606 FILE *fh;
607 int ret;
608
609 if (!gfh) {
610 return;
611 }
612
613 fh = gfh->fh;
614 ret = fflush(fh);
615 if (ret == EOF) {
616 error_setg_errno(errp, errno, "failed to flush file");
617 } else {
618 gfh->state = RW_STATE_NEW;
619 }
620 }
621
622 #if defined(CONFIG_FSFREEZE) || defined(CONFIG_FSTRIM)
623 void free_fs_mount_list(FsMountList *mounts)
624 {
625 FsMount *mount, *temp;
626
627 if (!mounts) {
628 return;
629 }
630
631 QTAILQ_FOREACH_SAFE(mount, mounts, next, temp) {
632 QTAILQ_REMOVE(mounts, mount, next);
633 g_free(mount->dirname);
634 g_free(mount->devtype);
635 g_free(mount);
636 }
637 }
638 #endif
639
640 #if defined(CONFIG_FSFREEZE)
/* Which phase the fsfreeze hook script is invoked for. */
typedef enum {
    FSFREEZE_HOOK_THAW = 0,
    FSFREEZE_HOOK_FREEZE,
} FsfreezeHookArg;

/* Command-line argument passed to the hook, indexed by FsfreezeHookArg. */
static const char *fsfreeze_hook_arg_string[] = {
    [FSFREEZE_HOOK_THAW] = "thaw",
    [FSFREEZE_HOOK_FREEZE] = "freeze",
};
650
651 static void execute_fsfreeze_hook(FsfreezeHookArg arg, Error **errp)
652 {
653 int status;
654 pid_t pid;
655 const char *hook;
656 const char *arg_str = fsfreeze_hook_arg_string[arg];
657 Error *local_err = NULL;
658
659 hook = ga_fsfreeze_hook(ga_state);
660 if (!hook) {
661 return;
662 }
663 if (access(hook, X_OK) != 0) {
664 error_setg_errno(errp, errno, "can't access fsfreeze hook '%s'", hook);
665 return;
666 }
667
668 slog("executing fsfreeze hook with arg '%s'", arg_str);
669 pid = fork();
670 if (pid == 0) {
671 setsid();
672 reopen_fd_to_null(0);
673 reopen_fd_to_null(1);
674 reopen_fd_to_null(2);
675
676 execl(hook, hook, arg_str, NULL);
677 _exit(EXIT_FAILURE);
678 } else if (pid < 0) {
679 error_setg_errno(errp, errno, "failed to create child process");
680 return;
681 }
682
683 ga_wait_child(pid, &status, &local_err);
684 if (local_err) {
685 error_propagate(errp, local_err);
686 return;
687 }
688
689 if (!WIFEXITED(status)) {
690 error_setg(errp, "fsfreeze hook has terminated abnormally");
691 return;
692 }
693
694 status = WEXITSTATUS(status);
695 if (status) {
696 error_setg(errp, "fsfreeze hook has failed with status %d", status);
697 return;
698 }
699 }
700
701 /*
702 * Return status of freeze/thaw
703 */
704 GuestFsfreezeStatus qmp_guest_fsfreeze_status(Error **errp)
705 {
706 if (ga_is_frozen(ga_state)) {
707 return GUEST_FSFREEZE_STATUS_FROZEN;
708 }
709
710 return GUEST_FSFREEZE_STATUS_THAWED;
711 }
712
713 int64_t qmp_guest_fsfreeze_freeze(Error **errp)
714 {
715 return qmp_guest_fsfreeze_freeze_list(false, NULL, errp);
716 }
717
718 int64_t qmp_guest_fsfreeze_freeze_list(bool has_mountpoints,
719 strList *mountpoints,
720 Error **errp)
721 {
722 int ret;
723 FsMountList mounts;
724 Error *local_err = NULL;
725
726 slog("guest-fsfreeze called");
727
728 execute_fsfreeze_hook(FSFREEZE_HOOK_FREEZE, &local_err);
729 if (local_err) {
730 error_propagate(errp, local_err);
731 return -1;
732 }
733
734 QTAILQ_INIT(&mounts);
735 if (!build_fs_mount_list(&mounts, &local_err)) {
736 error_propagate(errp, local_err);
737 return -1;
738 }
739
740 /* cannot risk guest agent blocking itself on a write in this state */
741 ga_set_frozen(ga_state);
742
743 ret = qmp_guest_fsfreeze_do_freeze_list(has_mountpoints, mountpoints,
744 mounts, errp);
745
746 free_fs_mount_list(&mounts);
747 /* We may not issue any FIFREEZE here.
748 * Just unset ga_state here and ready for the next call.
749 */
750 if (ret == 0) {
751 ga_unset_frozen(ga_state);
752 } else if (ret < 0) {
753 qmp_guest_fsfreeze_thaw(NULL);
754 }
755 return ret;
756 }
757
758 int64_t qmp_guest_fsfreeze_thaw(Error **errp)
759 {
760 int ret;
761
762 ret = qmp_guest_fsfreeze_do_thaw(errp);
763 if (ret >= 0) {
764 ga_unset_frozen(ga_state);
765 execute_fsfreeze_hook(FSFREEZE_HOOK_THAW, errp);
766 } else {
767 ret = 0;
768 }
769
770 return ret;
771 }
772
773 static void guest_fsfreeze_cleanup(void)
774 {
775 Error *err = NULL;
776
777 if (ga_is_frozen(ga_state) == GUEST_FSFREEZE_STATUS_FROZEN) {
778 qmp_guest_fsfreeze_thaw(&err);
779 if (err) {
780 slog("failed to clean up frozen filesystems: %s",
781 error_get_pretty(err));
782 error_free(err);
783 }
784 }
785 }
786 #endif
787
788 /* linux-specific implementations. avoid this if at all possible. */
789 #if defined(__linux__)
790 #if defined(CONFIG_FSFREEZE)
791
792 static char *get_pci_driver(char const *syspath, int pathlen, Error **errp)
793 {
794 char *path;
795 char *dpath;
796 char *driver = NULL;
797 char buf[PATH_MAX];
798 ssize_t len;
799
800 path = g_strndup(syspath, pathlen);
801 dpath = g_strdup_printf("%s/driver", path);
802 len = readlink(dpath, buf, sizeof(buf) - 1);
803 if (len != -1) {
804 buf[len] = 0;
805 driver = g_path_get_basename(buf);
806 }
807 g_free(dpath);
808 g_free(path);
809 return driver;
810 }
811
/*
 * qsort() comparator for unsigned int elements, ascending order.
 * Returns -1, 0 or 1.
 */
static int compare_uint(const void *_a, const void *_b)
{
    const unsigned int lhs = *(const unsigned int *)_a;
    const unsigned int rhs = *(const unsigned int *)_b;

    if (lhs < rhs) {
        return -1;
    }
    if (lhs > rhs) {
        return 1;
    }
    return 0;
}
819
820 /* Walk the specified sysfs and build a sorted list of host or ata numbers */
821 static int build_hosts(char const *syspath, char const *host, bool ata,
822 unsigned int *hosts, int hosts_max, Error **errp)
823 {
824 char *path;
825 DIR *dir;
826 struct dirent *entry;
827 int i = 0;
828
829 path = g_strndup(syspath, host - syspath);
830 dir = opendir(path);
831 if (!dir) {
832 error_setg_errno(errp, errno, "opendir(\"%s\")", path);
833 g_free(path);
834 return -1;
835 }
836
837 while (i < hosts_max) {
838 entry = readdir(dir);
839 if (!entry) {
840 break;
841 }
842 if (ata && sscanf(entry->d_name, "ata%d", hosts + i) == 1) {
843 ++i;
844 } else if (!ata && sscanf(entry->d_name, "host%d", hosts + i) == 1) {
845 ++i;
846 }
847 }
848
849 qsort(hosts, i, sizeof(hosts[0]), compare_uint);
850
851 g_free(path);
852 closedir(dir);
853 return i;
854 }
855
856 /*
857 * Store disk device info for devices on the PCI bus.
858 * Returns true if information has been stored, or false for failure.
859 */
860 static bool build_guest_fsinfo_for_pci_dev(char const *syspath,
861 GuestDiskAddress *disk,
862 Error **errp)
863 {
864 unsigned int pci[4], host, hosts[8], tgt[3];
865 int i, nhosts = 0, pcilen;
866 GuestPCIAddress *pciaddr = disk->pci_controller;
867 bool has_ata = false, has_host = false, has_tgt = false;
868 char *p, *q, *driver = NULL;
869 bool ret = false;
870
871 p = strstr(syspath, "/devices/pci");
872 if (!p || sscanf(p + 12, "%*x:%*x/%x:%x:%x.%x%n",
873 pci, pci + 1, pci + 2, pci + 3, &pcilen) < 4) {
874 g_debug("only pci device is supported: sysfs path '%s'", syspath);
875 return false;
876 }
877
878 p += 12 + pcilen;
879 while (true) {
880 driver = get_pci_driver(syspath, p - syspath, errp);
881 if (driver && (g_str_equal(driver, "ata_piix") ||
882 g_str_equal(driver, "sym53c8xx") ||
883 g_str_equal(driver, "virtio-pci") ||
884 g_str_equal(driver, "ahci") ||
885 g_str_equal(driver, "nvme") ||
886 g_str_equal(driver, "xhci_hcd") ||
887 g_str_equal(driver, "ehci-pci"))) {
888 break;
889 }
890
891 g_free(driver);
892 if (sscanf(p, "/%x:%x:%x.%x%n",
893 pci, pci + 1, pci + 2, pci + 3, &pcilen) == 4) {
894 p += pcilen;
895 continue;
896 }
897
898 g_debug("unsupported driver or sysfs path '%s'", syspath);
899 return false;
900 }
901
902 p = strstr(syspath, "/target");
903 if (p && sscanf(p + 7, "%*u:%*u:%*u/%*u:%u:%u:%u",
904 tgt, tgt + 1, tgt + 2) == 3) {
905 has_tgt = true;
906 }
907
908 p = strstr(syspath, "/ata");
909 if (p) {
910 q = p + 4;
911 has_ata = true;
912 } else {
913 p = strstr(syspath, "/host");
914 q = p + 5;
915 }
916 if (p && sscanf(q, "%u", &host) == 1) {
917 has_host = true;
918 nhosts = build_hosts(syspath, p, has_ata, hosts,
919 ARRAY_SIZE(hosts), errp);
920 if (nhosts < 0) {
921 goto cleanup;
922 }
923 }
924
925 pciaddr->domain = pci[0];
926 pciaddr->bus = pci[1];
927 pciaddr->slot = pci[2];
928 pciaddr->function = pci[3];
929
930 if (strcmp(driver, "ata_piix") == 0) {
931 /* a host per ide bus, target*:0:<unit>:0 */
932 if (!has_host || !has_tgt) {
933 g_debug("invalid sysfs path '%s' (driver '%s')", syspath, driver);
934 goto cleanup;
935 }
936 for (i = 0; i < nhosts; i++) {
937 if (host == hosts[i]) {
938 disk->bus_type = GUEST_DISK_BUS_TYPE_IDE;
939 disk->bus = i;
940 disk->unit = tgt[1];
941 break;
942 }
943 }
944 if (i >= nhosts) {
945 g_debug("no host for '%s' (driver '%s')", syspath, driver);
946 goto cleanup;
947 }
948 } else if (strcmp(driver, "sym53c8xx") == 0) {
949 /* scsi(LSI Logic): target*:0:<unit>:0 */
950 if (!has_tgt) {
951 g_debug("invalid sysfs path '%s' (driver '%s')", syspath, driver);
952 goto cleanup;
953 }
954 disk->bus_type = GUEST_DISK_BUS_TYPE_SCSI;
955 disk->unit = tgt[1];
956 } else if (strcmp(driver, "virtio-pci") == 0) {
957 if (has_tgt) {
958 /* virtio-scsi: target*:0:0:<unit> */
959 disk->bus_type = GUEST_DISK_BUS_TYPE_SCSI;
960 disk->unit = tgt[2];
961 } else {
962 /* virtio-blk: 1 disk per 1 device */
963 disk->bus_type = GUEST_DISK_BUS_TYPE_VIRTIO;
964 }
965 } else if (strcmp(driver, "ahci") == 0) {
966 /* ahci: 1 host per 1 unit */
967 if (!has_host || !has_tgt) {
968 g_debug("invalid sysfs path '%s' (driver '%s')", syspath, driver);
969 goto cleanup;
970 }
971 for (i = 0; i < nhosts; i++) {
972 if (host == hosts[i]) {
973 disk->unit = i;
974 disk->bus_type = GUEST_DISK_BUS_TYPE_SATA;
975 break;
976 }
977 }
978 if (i >= nhosts) {
979 g_debug("no host for '%s' (driver '%s')", syspath, driver);
980 goto cleanup;
981 }
982 } else if (strcmp(driver, "nvme") == 0) {
983 disk->bus_type = GUEST_DISK_BUS_TYPE_NVME;
984 } else if (strcmp(driver, "ehci-pci") == 0 || strcmp(driver, "xhci_hcd") == 0) {
985 disk->bus_type = GUEST_DISK_BUS_TYPE_USB;
986 } else {
987 g_debug("unknown driver '%s' (sysfs path '%s')", driver, syspath);
988 goto cleanup;
989 }
990
991 ret = true;
992
993 cleanup:
994 g_free(driver);
995 return ret;
996 }
997
998 /*
999 * Store disk device info for non-PCI virtio devices (for example s390x
1000 * channel I/O devices). Returns true if information has been stored, or
1001 * false for failure.
1002 */
1003 static bool build_guest_fsinfo_for_nonpci_virtio(char const *syspath,
1004 GuestDiskAddress *disk,
1005 Error **errp)
1006 {
1007 unsigned int tgt[3];
1008 char *p;
1009
1010 if (!strstr(syspath, "/virtio") || !strstr(syspath, "/block")) {
1011 g_debug("Unsupported virtio device '%s'", syspath);
1012 return false;
1013 }
1014
1015 p = strstr(syspath, "/target");
1016 if (p && sscanf(p + 7, "%*u:%*u:%*u/%*u:%u:%u:%u",
1017 &tgt[0], &tgt[1], &tgt[2]) == 3) {
1018 /* virtio-scsi: target*:0:<target>:<unit> */
1019 disk->bus_type = GUEST_DISK_BUS_TYPE_SCSI;
1020 disk->bus = tgt[0];
1021 disk->target = tgt[1];
1022 disk->unit = tgt[2];
1023 } else {
1024 /* virtio-blk: 1 disk per 1 device */
1025 disk->bus_type = GUEST_DISK_BUS_TYPE_VIRTIO;
1026 }
1027
1028 return true;
1029 }
1030
1031 /*
1032 * Store disk device info for CCW devices (s390x channel I/O devices).
1033 * Returns true if information has been stored, or false for failure.
1034 */
1035 static bool build_guest_fsinfo_for_ccw_dev(char const *syspath,
1036 GuestDiskAddress *disk,
1037 Error **errp)
1038 {
1039 unsigned int cssid, ssid, subchno, devno;
1040 char *p;
1041
1042 p = strstr(syspath, "/devices/css");
1043 if (!p || sscanf(p + 12, "%*x/%x.%x.%x/%*x.%*x.%x/",
1044 &cssid, &ssid, &subchno, &devno) < 4) {
1045 g_debug("could not parse ccw device sysfs path: %s", syspath);
1046 return false;
1047 }
1048
1049 disk->ccw_address = g_new0(GuestCCWAddress, 1);
1050 disk->ccw_address->cssid = cssid;
1051 disk->ccw_address->ssid = ssid;
1052 disk->ccw_address->subchno = subchno;
1053 disk->ccw_address->devno = devno;
1054
1055 if (strstr(p, "/virtio")) {
1056 build_guest_fsinfo_for_nonpci_virtio(syspath, disk, errp);
1057 }
1058
1059 return true;
1060 }
1061
1062 /* Store disk device info specified by @sysfs into @fs */
1063 static void build_guest_fsinfo_for_real_device(char const *syspath,
1064 GuestFilesystemInfo *fs,
1065 Error **errp)
1066 {
1067 GuestDiskAddress *disk;
1068 GuestPCIAddress *pciaddr;
1069 bool has_hwinf;
1070 #ifdef CONFIG_LIBUDEV
1071 struct udev *udev = NULL;
1072 struct udev_device *udevice = NULL;
1073 #endif
1074
1075 pciaddr = g_new0(GuestPCIAddress, 1);
1076 pciaddr->domain = -1; /* -1 means field is invalid */
1077 pciaddr->bus = -1;
1078 pciaddr->slot = -1;
1079 pciaddr->function = -1;
1080
1081 disk = g_new0(GuestDiskAddress, 1);
1082 disk->pci_controller = pciaddr;
1083 disk->bus_type = GUEST_DISK_BUS_TYPE_UNKNOWN;
1084
1085 #ifdef CONFIG_LIBUDEV
1086 udev = udev_new();
1087 udevice = udev_device_new_from_syspath(udev, syspath);
1088 if (udev == NULL || udevice == NULL) {
1089 g_debug("failed to query udev");
1090 } else {
1091 const char *devnode, *serial;
1092 devnode = udev_device_get_devnode(udevice);
1093 if (devnode != NULL) {
1094 disk->dev = g_strdup(devnode);
1095 }
1096 serial = udev_device_get_property_value(udevice, "ID_SERIAL");
1097 if (serial != NULL && *serial != 0) {
1098 disk->serial = g_strdup(serial);
1099 }
1100 }
1101
1102 udev_unref(udev);
1103 udev_device_unref(udevice);
1104 #endif
1105
1106 if (strstr(syspath, "/devices/pci")) {
1107 has_hwinf = build_guest_fsinfo_for_pci_dev(syspath, disk, errp);
1108 } else if (strstr(syspath, "/devices/css")) {
1109 has_hwinf = build_guest_fsinfo_for_ccw_dev(syspath, disk, errp);
1110 } else if (strstr(syspath, "/virtio")) {
1111 has_hwinf = build_guest_fsinfo_for_nonpci_virtio(syspath, disk, errp);
1112 } else {
1113 g_debug("Unsupported device type for '%s'", syspath);
1114 has_hwinf = false;
1115 }
1116
1117 if (has_hwinf || disk->dev || disk->serial) {
1118 QAPI_LIST_PREPEND(fs->disk, disk);
1119 } else {
1120 qapi_free_GuestDiskAddress(disk);
1121 }
1122 }
1123
1124 static void build_guest_fsinfo_for_device(char const *devpath,
1125 GuestFilesystemInfo *fs,
1126 Error **errp);
1127
1128 /* Store a list of slave devices of virtual volume specified by @syspath into
1129 * @fs */
1130 static void build_guest_fsinfo_for_virtual_device(char const *syspath,
1131 GuestFilesystemInfo *fs,
1132 Error **errp)
1133 {
1134 Error *err = NULL;
1135 DIR *dir;
1136 char *dirpath;
1137 struct dirent *entry;
1138
1139 dirpath = g_strdup_printf("%s/slaves", syspath);
1140 dir = opendir(dirpath);
1141 if (!dir) {
1142 if (errno != ENOENT) {
1143 error_setg_errno(errp, errno, "opendir(\"%s\")", dirpath);
1144 }
1145 g_free(dirpath);
1146 return;
1147 }
1148
1149 for (;;) {
1150 errno = 0;
1151 entry = readdir(dir);
1152 if (entry == NULL) {
1153 if (errno) {
1154 error_setg_errno(errp, errno, "readdir(\"%s\")", dirpath);
1155 }
1156 break;
1157 }
1158
1159 if (entry->d_type == DT_LNK) {
1160 char *path;
1161
1162 g_debug(" slave device '%s'", entry->d_name);
1163 path = g_strdup_printf("%s/slaves/%s", syspath, entry->d_name);
1164 build_guest_fsinfo_for_device(path, fs, &err);
1165 g_free(path);
1166
1167 if (err) {
1168 error_propagate(errp, err);
1169 break;
1170 }
1171 }
1172 }
1173
1174 g_free(dirpath);
1175 closedir(dir);
1176 }
1177
1178 static bool is_disk_virtual(const char *devpath, Error **errp)
1179 {
1180 g_autofree char *syspath = realpath(devpath, NULL);
1181
1182 if (!syspath) {
1183 error_setg_errno(errp, errno, "realpath(\"%s\")", devpath);
1184 return false;
1185 }
1186 return strstr(syspath, "/devices/virtual/block/") != NULL;
1187 }
1188
1189 /* Dispatch to functions for virtual/real device */
1190 static void build_guest_fsinfo_for_device(char const *devpath,
1191 GuestFilesystemInfo *fs,
1192 Error **errp)
1193 {
1194 ERRP_GUARD();
1195 g_autofree char *syspath = NULL;
1196 bool is_virtual = false;
1197
1198 syspath = realpath(devpath, NULL);
1199 if (!syspath) {
1200 if (errno != ENOENT) {
1201 error_setg_errno(errp, errno, "realpath(\"%s\")", devpath);
1202 return;
1203 }
1204
1205 /* ENOENT: This devpath may not exist because of container config */
1206 if (!fs->name) {
1207 fs->name = g_path_get_basename(devpath);
1208 }
1209 return;
1210 }
1211
1212 if (!fs->name) {
1213 fs->name = g_path_get_basename(syspath);
1214 }
1215
1216 g_debug(" parse sysfs path '%s'", syspath);
1217 is_virtual = is_disk_virtual(syspath, errp);
1218 if (*errp != NULL) {
1219 return;
1220 }
1221 if (is_virtual) {
1222 build_guest_fsinfo_for_virtual_device(syspath, fs, errp);
1223 } else {
1224 build_guest_fsinfo_for_real_device(syspath, fs, errp);
1225 }
1226 }
1227
1228 #ifdef CONFIG_LIBUDEV
1229
1230 /*
1231 * Wrapper around build_guest_fsinfo_for_device() for getting just
1232 * the disk address.
1233 */
1234 static GuestDiskAddress *get_disk_address(const char *syspath, Error **errp)
1235 {
1236 g_autoptr(GuestFilesystemInfo) fs = NULL;
1237
1238 fs = g_new0(GuestFilesystemInfo, 1);
1239 build_guest_fsinfo_for_device(syspath, fs, errp);
1240 if (fs->disk != NULL) {
1241 return g_steal_pointer(&fs->disk->value);
1242 }
1243 return NULL;
1244 }
1245
/*
 * Look up the udev "DM_NAME" property of the device at @syspath.
 *
 * Returns a newly allocated copy of the alias, or NULL when udev cannot
 * be queried or the device has no (or an empty) alias.
 */
static char *get_alias_for_syspath(const char *syspath)
{
    struct udev *ctx = udev_new();
    struct udev_device *dev = NULL;
    char *alias = NULL;

    if (ctx == NULL) {
        g_debug("failed to query udev");
    } else {
        dev = udev_device_new_from_syspath(ctx, syspath);
        if (dev == NULL) {
            g_debug("failed to query udev for path: %s", syspath);
        } else {
            const char *dm_name =
                udev_device_get_property_value(dev, "DM_NAME");

            /*
             * NULL means there was an error and empty string means there
             * is no alias; in both cases NULL is returned.
             */
            if (dm_name == NULL) {
                g_debug("failed to query udev for device alias for: %s",
                        syspath);
            } else if (*dm_name != 0) {
                alias = g_strdup(dm_name);
            }
        }
    }

    udev_unref(ctx);
    udev_device_unref(dev);
    return alias;
}
1281
/*
 * Ask udev for the device node belonging to @syspath.
 *
 * Returns a newly allocated copy of the string reported by
 * udev_device_get_devnode(), or NULL when udev cannot be queried or the
 * device is unknown to it.
 */
static char *get_device_for_syspath(const char *syspath)
{
    struct udev *ctx = udev_new();
    struct udev_device *dev = NULL;
    char *devnode = NULL;

    if (ctx == NULL) {
        g_debug("failed to query udev");
    } else {
        dev = udev_device_new_from_syspath(ctx, syspath);
        if (dev == NULL) {
            g_debug("failed to query udev for path: %s", syspath);
        } else {
            devnode = g_strdup(udev_device_get_devnode(dev));
        }
    }

    udev_unref(ctx);
    udev_device_unref(dev);
    return devnode;
}
1306
1307 static void get_disk_deps(const char *disk_dir, GuestDiskInfo *disk)
1308 {
1309 g_autofree char *deps_dir = NULL;
1310 const gchar *dep;
1311 GDir *dp_deps = NULL;
1312
1313 /* List dependent disks */
1314 deps_dir = g_strdup_printf("%s/slaves", disk_dir);
1315 g_debug(" listing entries in: %s", deps_dir);
1316 dp_deps = g_dir_open(deps_dir, 0, NULL);
1317 if (dp_deps == NULL) {
1318 g_debug("failed to list entries in %s", deps_dir);
1319 return;
1320 }
1321 disk->has_dependencies = true;
1322 while ((dep = g_dir_read_name(dp_deps)) != NULL) {
1323 g_autofree char *dep_dir = NULL;
1324 char *dev_name;
1325
1326 /* Add dependent disks */
1327 dep_dir = g_strdup_printf("%s/%s", deps_dir, dep);
1328 dev_name = get_device_for_syspath(dep_dir);
1329 if (dev_name != NULL) {
1330 g_debug(" adding dependent device: %s", dev_name);
1331 QAPI_LIST_PREPEND(disk->dependencies, dev_name);
1332 }
1333 }
1334 g_dir_close(dp_deps);
1335 }
1336
1337 /*
1338 * Detect partitions subdirectory, name is "<disk_name><number>" or
1339 * "<disk_name>p<number>"
1340 *
1341 * @disk_name -- last component of /sys path (e.g. sda)
1342 * @disk_dir -- sys path of the disk (e.g. /sys/block/sda)
1343 * @disk_dev -- device node of the disk (e.g. /dev/sda)
1344 */
1345 static GuestDiskInfoList *get_disk_partitions(
1346 GuestDiskInfoList *list,
1347 const char *disk_name, const char *disk_dir,
1348 const char *disk_dev)
1349 {
1350 GuestDiskInfoList *ret = list;
1351 struct dirent *de_disk;
1352 DIR *dp_disk = NULL;
1353 size_t len = strlen(disk_name);
1354
1355 dp_disk = opendir(disk_dir);
1356 while ((de_disk = readdir(dp_disk)) != NULL) {
1357 g_autofree char *partition_dir = NULL;
1358 char *dev_name;
1359 GuestDiskInfo *partition;
1360
1361 if (!(de_disk->d_type & DT_DIR)) {
1362 continue;
1363 }
1364
1365 if (!(strncmp(disk_name, de_disk->d_name, len) == 0 &&
1366 ((*(de_disk->d_name + len) == 'p' &&
1367 isdigit(*(de_disk->d_name + len + 1))) ||
1368 isdigit(*(de_disk->d_name + len))))) {
1369 continue;
1370 }
1371
1372 partition_dir = g_strdup_printf("%s/%s",
1373 disk_dir, de_disk->d_name);
1374 dev_name = get_device_for_syspath(partition_dir);
1375 if (dev_name == NULL) {
1376 g_debug("Failed to get device name for syspath: %s",
1377 disk_dir);
1378 continue;
1379 }
1380 partition = g_new0(GuestDiskInfo, 1);
1381 partition->name = dev_name;
1382 partition->partition = true;
1383 partition->has_dependencies = true;
1384 /* Add parent disk as dependent for easier tracking of hierarchy */
1385 QAPI_LIST_PREPEND(partition->dependencies, g_strdup(disk_dev));
1386
1387 QAPI_LIST_PREPEND(ret, partition);
1388 }
1389 closedir(dp_disk);
1390
1391 return ret;
1392 }
1393
1394 static void get_nvme_smart(GuestDiskInfo *disk)
1395 {
1396 int fd;
1397 GuestNVMeSmart *smart;
1398 NvmeSmartLog log = {0};
1399 struct nvme_admin_cmd cmd = {
1400 .opcode = NVME_ADM_CMD_GET_LOG_PAGE,
1401 .nsid = NVME_NSID_BROADCAST,
1402 .addr = (uintptr_t)&log,
1403 .data_len = sizeof(log),
1404 .cdw10 = NVME_LOG_SMART_INFO | (1 << 15) /* RAE bit */
1405 | (((sizeof(log) >> 2) - 1) << 16)
1406 };
1407
1408 fd = qga_open_cloexec(disk->name, O_RDONLY, 0);
1409 if (fd == -1) {
1410 g_debug("Failed to open device: %s: %s", disk->name, g_strerror(errno));
1411 return;
1412 }
1413
1414 if (ioctl(fd, NVME_IOCTL_ADMIN_CMD, &cmd)) {
1415 g_debug("Failed to get smart: %s: %s", disk->name, g_strerror(errno));
1416 close(fd);
1417 return;
1418 }
1419
1420 disk->smart = g_new0(GuestDiskSmart, 1);
1421 disk->smart->type = GUEST_DISK_BUS_TYPE_NVME;
1422
1423 smart = &disk->smart->u.nvme;
1424 smart->critical_warning = log.critical_warning;
1425 smart->temperature = lduw_le_p(&log.temperature); /* unaligned field */
1426 smart->available_spare = log.available_spare;
1427 smart->available_spare_threshold = log.available_spare_threshold;
1428 smart->percentage_used = log.percentage_used;
1429 smart->data_units_read_lo = le64_to_cpu(log.data_units_read[0]);
1430 smart->data_units_read_hi = le64_to_cpu(log.data_units_read[1]);
1431 smart->data_units_written_lo = le64_to_cpu(log.data_units_written[0]);
1432 smart->data_units_written_hi = le64_to_cpu(log.data_units_written[1]);
1433 smart->host_read_commands_lo = le64_to_cpu(log.host_read_commands[0]);
1434 smart->host_read_commands_hi = le64_to_cpu(log.host_read_commands[1]);
1435 smart->host_write_commands_lo = le64_to_cpu(log.host_write_commands[0]);
1436 smart->host_write_commands_hi = le64_to_cpu(log.host_write_commands[1]);
1437 smart->controller_busy_time_lo = le64_to_cpu(log.controller_busy_time[0]);
1438 smart->controller_busy_time_hi = le64_to_cpu(log.controller_busy_time[1]);
1439 smart->power_cycles_lo = le64_to_cpu(log.power_cycles[0]);
1440 smart->power_cycles_hi = le64_to_cpu(log.power_cycles[1]);
1441 smart->power_on_hours_lo = le64_to_cpu(log.power_on_hours[0]);
1442 smart->power_on_hours_hi = le64_to_cpu(log.power_on_hours[1]);
1443 smart->unsafe_shutdowns_lo = le64_to_cpu(log.unsafe_shutdowns[0]);
1444 smart->unsafe_shutdowns_hi = le64_to_cpu(log.unsafe_shutdowns[1]);
1445 smart->media_errors_lo = le64_to_cpu(log.media_errors[0]);
1446 smart->media_errors_hi = le64_to_cpu(log.media_errors[1]);
1447 smart->number_of_error_log_entries_lo =
1448 le64_to_cpu(log.number_of_error_log_entries[0]);
1449 smart->number_of_error_log_entries_hi =
1450 le64_to_cpu(log.number_of_error_log_entries[1]);
1451
1452 close(fd);
1453 }
1454
1455 static void get_disk_smart(GuestDiskInfo *disk)
1456 {
1457 if (disk->address
1458 && (disk->address->bus_type == GUEST_DISK_BUS_TYPE_NVME)) {
1459 get_nvme_smart(disk);
1460 }
1461 }
1462
1463 GuestDiskInfoList *qmp_guest_get_disks(Error **errp)
1464 {
1465 GuestDiskInfoList *ret = NULL;
1466 GuestDiskInfo *disk;
1467 DIR *dp = NULL;
1468 struct dirent *de = NULL;
1469
1470 g_debug("listing /sys/block directory");
1471 dp = opendir("/sys/block");
1472 if (dp == NULL) {
1473 error_setg_errno(errp, errno, "Can't open directory \"/sys/block\"");
1474 return NULL;
1475 }
1476 while ((de = readdir(dp)) != NULL) {
1477 g_autofree char *disk_dir = NULL, *line = NULL,
1478 *size_path = NULL;
1479 char *dev_name;
1480 Error *local_err = NULL;
1481 if (de->d_type != DT_LNK) {
1482 g_debug(" skipping entry: %s", de->d_name);
1483 continue;
1484 }
1485
1486 /* Check size and skip zero-sized disks */
1487 g_debug(" checking disk size");
1488 size_path = g_strdup_printf("/sys/block/%s/size", de->d_name);
1489 if (!g_file_get_contents(size_path, &line, NULL, NULL)) {
1490 g_debug(" failed to read disk size");
1491 continue;
1492 }
1493 if (g_strcmp0(line, "0\n") == 0) {
1494 g_debug(" skipping zero-sized disk");
1495 continue;
1496 }
1497
1498 g_debug(" adding %s", de->d_name);
1499 disk_dir = g_strdup_printf("/sys/block/%s", de->d_name);
1500 dev_name = get_device_for_syspath(disk_dir);
1501 if (dev_name == NULL) {
1502 g_debug("Failed to get device name for syspath: %s",
1503 disk_dir);
1504 continue;
1505 }
1506 disk = g_new0(GuestDiskInfo, 1);
1507 disk->name = dev_name;
1508 disk->partition = false;
1509 disk->alias = get_alias_for_syspath(disk_dir);
1510 QAPI_LIST_PREPEND(ret, disk);
1511
1512 /* Get address for non-virtual devices */
1513 bool is_virtual = is_disk_virtual(disk_dir, &local_err);
1514 if (local_err != NULL) {
1515 g_debug(" failed to check disk path, ignoring error: %s",
1516 error_get_pretty(local_err));
1517 error_free(local_err);
1518 local_err = NULL;
1519 /* Don't try to get the address */
1520 is_virtual = true;
1521 }
1522 if (!is_virtual) {
1523 disk->address = get_disk_address(disk_dir, &local_err);
1524 if (local_err != NULL) {
1525 g_debug(" failed to get device info, ignoring error: %s",
1526 error_get_pretty(local_err));
1527 error_free(local_err);
1528 local_err = NULL;
1529 }
1530 }
1531
1532 get_disk_deps(disk_dir, disk);
1533 get_disk_smart(disk);
1534 ret = get_disk_partitions(ret, de->d_name, disk_dir, dev_name);
1535 }
1536
1537 closedir(dp);
1538
1539 return ret;
1540 }
1541
1542 #else
1543
1544 GuestDiskInfoList *qmp_guest_get_disks(Error **errp)
1545 {
1546 error_setg(errp, QERR_UNSUPPORTED);
1547 return NULL;
1548 }
1549
1550 #endif
1551
1552 /* Return a list of the disk device(s)' info which @mount lies on */
1553 static GuestFilesystemInfo *build_guest_fsinfo(struct FsMount *mount,
1554 Error **errp)
1555 {
1556 GuestFilesystemInfo *fs = g_malloc0(sizeof(*fs));
1557 struct statvfs buf;
1558 unsigned long used, nonroot_total, fr_size;
1559 char *devpath = g_strdup_printf("/sys/dev/block/%u:%u",
1560 mount->devmajor, mount->devminor);
1561
1562 fs->mountpoint = g_strdup(mount->dirname);
1563 fs->type = g_strdup(mount->devtype);
1564 build_guest_fsinfo_for_device(devpath, fs, errp);
1565
1566 if (statvfs(fs->mountpoint, &buf) == 0) {
1567 fr_size = buf.f_frsize;
1568 used = buf.f_blocks - buf.f_bfree;
1569 nonroot_total = used + buf.f_bavail;
1570 fs->used_bytes = used * fr_size;
1571 fs->total_bytes = nonroot_total * fr_size;
1572
1573 fs->has_total_bytes = true;
1574 fs->has_used_bytes = true;
1575 }
1576
1577 g_free(devpath);
1578
1579 return fs;
1580 }
1581
1582 GuestFilesystemInfoList *qmp_guest_get_fsinfo(Error **errp)
1583 {
1584 FsMountList mounts;
1585 struct FsMount *mount;
1586 GuestFilesystemInfoList *ret = NULL;
1587 Error *local_err = NULL;
1588
1589 QTAILQ_INIT(&mounts);
1590 if (!build_fs_mount_list(&mounts, &local_err)) {
1591 error_propagate(errp, local_err);
1592 return NULL;
1593 }
1594
1595 QTAILQ_FOREACH(mount, &mounts, next) {
1596 g_debug("Building guest fsinfo for '%s'", mount->dirname);
1597
1598 QAPI_LIST_PREPEND(ret, build_guest_fsinfo(mount, &local_err));
1599 if (local_err) {
1600 error_propagate(errp, local_err);
1601 qapi_free_GuestFilesystemInfoList(ret);
1602 ret = NULL;
1603 break;
1604 }
1605 }
1606
1607 free_fs_mount_list(&mounts);
1608 return ret;
1609 }
1610 #endif /* CONFIG_FSFREEZE */
1611
1612 #if defined(CONFIG_FSTRIM)
1613 /*
1614 * Walk list of mounted file systems in the guest, and trim them.
1615 */
1616 GuestFilesystemTrimResponse *
1617 qmp_guest_fstrim(bool has_minimum, int64_t minimum, Error **errp)
1618 {
1619 GuestFilesystemTrimResponse *response;
1620 GuestFilesystemTrimResult *result;
1621 int ret = 0;
1622 FsMountList mounts;
1623 struct FsMount *mount;
1624 int fd;
1625 struct fstrim_range r;
1626
1627 slog("guest-fstrim called");
1628
1629 QTAILQ_INIT(&mounts);
1630 if (!build_fs_mount_list(&mounts, errp)) {
1631 return NULL;
1632 }
1633
1634 response = g_malloc0(sizeof(*response));
1635
1636 QTAILQ_FOREACH(mount, &mounts, next) {
1637 result = g_malloc0(sizeof(*result));
1638 result->path = g_strdup(mount->dirname);
1639
1640 QAPI_LIST_PREPEND(response->paths, result);
1641
1642 fd = qga_open_cloexec(mount->dirname, O_RDONLY, 0);
1643 if (fd == -1) {
1644 result->error = g_strdup_printf("failed to open: %s",
1645 strerror(errno));
1646 continue;
1647 }
1648
1649 /* We try to cull filesystems we know won't work in advance, but other
1650 * filesystems may not implement fstrim for less obvious reasons.
1651 * These will report EOPNOTSUPP; while in some other cases ENOTTY
1652 * will be reported (e.g. CD-ROMs).
1653 * Any other error means an unexpected error.
1654 */
1655 r.start = 0;
1656 r.len = -1;
1657 r.minlen = has_minimum ? minimum : 0;
1658 ret = ioctl(fd, FITRIM, &r);
1659 if (ret == -1) {
1660 if (errno == ENOTTY || errno == EOPNOTSUPP) {
1661 result->error = g_strdup("trim not supported");
1662 } else {
1663 result->error = g_strdup_printf("failed to trim: %s",
1664 strerror(errno));
1665 }
1666 close(fd);
1667 continue;
1668 }
1669
1670 result->has_minimum = true;
1671 result->minimum = r.minlen;
1672 result->has_trimmed = true;
1673 result->trimmed = r.len;
1674 close(fd);
1675 }
1676
1677 free_fs_mount_list(&mounts);
1678 return response;
1679 }
1680 #endif /* CONFIG_FSTRIM */
1681
1682
/* sysfs file read to probe for, and written to enter, a sleep state */
#define LINUX_SYS_STATE_FILE "/sys/power/state"
/* exit status of 'pm-is-supported' that is treated as "mode supported" */
#define SUSPEND_SUPPORTED 0
/* presumably the matching "not supported" exit status -- TODO confirm */
#define SUSPEND_NOT_SUPPORTED 1

/*
 * Suspend flavours.  The numeric values are used directly as indices into
 * the three-element argument tables of the suspend helpers in this file,
 * so they have to stay 0, 1 and 2.
 */
typedef enum {
    SUSPEND_MODE_DISK   = 0,
    SUSPEND_MODE_RAM    = 1,
    SUSPEND_MODE_HYBRID = 2,
} SuspendMode;
1692
1693 /*
1694 * Executes a command in a child process using g_spawn_sync,
1695 * returning an int >= 0 representing the exit status of the
1696 * process.
1697 *
1698 * If the program wasn't found in path, returns -1.
1699 *
1700 * If a problem happened when creating the child process,
1701 * returns -1 and errp is set.
1702 */
1703 static int run_process_child(const char *command[], Error **errp)
1704 {
1705 int exit_status, spawn_flag;
1706 GError *g_err = NULL;
1707 bool success;
1708
1709 spawn_flag = G_SPAWN_SEARCH_PATH | G_SPAWN_STDOUT_TO_DEV_NULL |
1710 G_SPAWN_STDERR_TO_DEV_NULL;
1711
1712 success = g_spawn_sync(NULL, (char **)command, NULL, spawn_flag,
1713 NULL, NULL, NULL, NULL,
1714 &exit_status, &g_err);
1715
1716 if (success) {
1717 return WEXITSTATUS(exit_status);
1718 }
1719
1720 if (g_err && (g_err->code != G_SPAWN_ERROR_NOENT)) {
1721 error_setg(errp, "failed to create child process, error '%s'",
1722 g_err->message);
1723 }
1724
1725 g_error_free(g_err);
1726 return -1;
1727 }
1728
1729 static bool systemd_supports_mode(SuspendMode mode, Error **errp)
1730 {
1731 const char *systemctl_args[3] = {"systemd-hibernate", "systemd-suspend",
1732 "systemd-hybrid-sleep"};
1733 const char *cmd[4] = {"systemctl", "status", systemctl_args[mode], NULL};
1734 int status;
1735
1736 status = run_process_child(cmd, errp);
1737
1738 /*
1739 * systemctl status uses LSB return codes so we can expect
1740 * status > 0 and be ok. To assert if the guest has support
1741 * for the selected suspend mode, status should be < 4. 4 is
1742 * the code for unknown service status, the return value when
1743 * the service does not exist. A common value is status = 3
1744 * (program is not running).
1745 */
1746 if (status > 0 && status < 4) {
1747 return true;
1748 }
1749
1750 return false;
1751 }
1752
1753 static void systemd_suspend(SuspendMode mode, Error **errp)
1754 {
1755 Error *local_err = NULL;
1756 const char *systemctl_args[3] = {"hibernate", "suspend", "hybrid-sleep"};
1757 const char *cmd[3] = {"systemctl", systemctl_args[mode], NULL};
1758 int status;
1759
1760 status = run_process_child(cmd, &local_err);
1761
1762 if (status == 0) {
1763 return;
1764 }
1765
1766 if ((status == -1) && !local_err) {
1767 error_setg(errp, "the helper program 'systemctl %s' was not found",
1768 systemctl_args[mode]);
1769 return;
1770 }
1771
1772 if (local_err) {
1773 error_propagate(errp, local_err);
1774 } else {
1775 error_setg(errp, "the helper program 'systemctl %s' returned an "
1776 "unexpected exit status code (%d)",
1777 systemctl_args[mode], status);
1778 }
1779 }
1780
1781 static bool pmutils_supports_mode(SuspendMode mode, Error **errp)
1782 {
1783 Error *local_err = NULL;
1784 const char *pmutils_args[3] = {"--hibernate", "--suspend",
1785 "--suspend-hybrid"};
1786 const char *cmd[3] = {"pm-is-supported", pmutils_args[mode], NULL};
1787 int status;
1788
1789 status = run_process_child(cmd, &local_err);
1790
1791 if (status == SUSPEND_SUPPORTED) {
1792 return true;
1793 }
1794
1795 if ((status == -1) && !local_err) {
1796 return false;
1797 }
1798
1799 if (local_err) {
1800 error_propagate(errp, local_err);
1801 } else {
1802 error_setg(errp,
1803 "the helper program '%s' returned an unexpected exit"
1804 " status code (%d)", "pm-is-supported", status);
1805 }
1806
1807 return false;
1808 }
1809
1810 static void pmutils_suspend(SuspendMode mode, Error **errp)
1811 {
1812 Error *local_err = NULL;
1813 const char *pmutils_binaries[3] = {"pm-hibernate", "pm-suspend",
1814 "pm-suspend-hybrid"};
1815 const char *cmd[2] = {pmutils_binaries[mode], NULL};
1816 int status;
1817
1818 status = run_process_child(cmd, &local_err);
1819
1820 if (status == 0) {
1821 return;
1822 }
1823
1824 if ((status == -1) && !local_err) {
1825 error_setg(errp, "the helper program '%s' was not found",
1826 pmutils_binaries[mode]);
1827 return;
1828 }
1829
1830 if (local_err) {
1831 error_propagate(errp, local_err);
1832 } else {
1833 error_setg(errp,
1834 "the helper program '%s' returned an unexpected exit"
1835 " status code (%d)", pmutils_binaries[mode], status);
1836 }
1837 }
1838
1839 static bool linux_sys_state_supports_mode(SuspendMode mode, Error **errp)
1840 {
1841 const char *sysfile_strs[3] = {"disk", "mem", NULL};
1842 const char *sysfile_str = sysfile_strs[mode];
1843 char buf[32]; /* hopefully big enough */
1844 int fd;
1845 ssize_t ret;
1846
1847 if (!sysfile_str) {
1848 error_setg(errp, "unknown guest suspend mode");
1849 return false;
1850 }
1851
1852 fd = open(LINUX_SYS_STATE_FILE, O_RDONLY);
1853 if (fd < 0) {
1854 return false;
1855 }
1856
1857 ret = read(fd, buf, sizeof(buf) - 1);
1858 close(fd);
1859 if (ret <= 0) {
1860 return false;
1861 }
1862 buf[ret] = '\0';
1863
1864 if (strstr(buf, sysfile_str)) {
1865 return true;
1866 }
1867 return false;
1868 }
1869
1870 static void linux_sys_state_suspend(SuspendMode mode, Error **errp)
1871 {
1872 Error *local_err = NULL;
1873 const char *sysfile_strs[3] = {"disk", "mem", NULL};
1874 const char *sysfile_str = sysfile_strs[mode];
1875 pid_t pid;
1876 int status;
1877
1878 if (!sysfile_str) {
1879 error_setg(errp, "unknown guest suspend mode");
1880 return;
1881 }
1882
1883 pid = fork();
1884 if (!pid) {
1885 /* child */
1886 int fd;
1887
1888 setsid();
1889 reopen_fd_to_null(0);
1890 reopen_fd_to_null(1);
1891 reopen_fd_to_null(2);
1892
1893 fd = open(LINUX_SYS_STATE_FILE, O_WRONLY);
1894 if (fd < 0) {
1895 _exit(EXIT_FAILURE);
1896 }
1897
1898 if (write(fd, sysfile_str, strlen(sysfile_str)) < 0) {
1899 _exit(EXIT_FAILURE);
1900 }
1901
1902 _exit(EXIT_SUCCESS);
1903 } else if (pid < 0) {
1904 error_setg_errno(errp, errno, "failed to create child process");
1905 return;
1906 }
1907
1908 ga_wait_child(pid, &status, &local_err);
1909 if (local_err) {
1910 error_propagate(errp, local_err);
1911 return;
1912 }
1913
1914 if (WEXITSTATUS(status)) {
1915 error_setg(errp, "child process has failed to suspend");
1916 }
1917
1918 }
1919
1920 static void guest_suspend(SuspendMode mode, Error **errp)
1921 {
1922 Error *local_err = NULL;
1923 bool mode_supported = false;
1924
1925 if (systemd_supports_mode(mode, &local_err)) {
1926 mode_supported = true;
1927 systemd_suspend(mode, &local_err);
1928
1929 if (!local_err) {
1930 return;
1931 }
1932 }
1933
1934 error_free(local_err);
1935 local_err = NULL;
1936
1937 if (pmutils_supports_mode(mode, &local_err)) {
1938 mode_supported = true;
1939 pmutils_suspend(mode, &local_err);
1940
1941 if (!local_err) {
1942 return;
1943 }
1944 }
1945
1946 error_free(local_err);
1947 local_err = NULL;
1948
1949 if (linux_sys_state_supports_mode(mode, &local_err)) {
1950 mode_supported = true;
1951 linux_sys_state_suspend(mode, &local_err);
1952 }
1953
1954 if (!mode_supported) {
1955 error_free(local_err);
1956 error_setg(errp,
1957 "the requested suspend mode is not supported by the guest");
1958 } else {
1959 error_propagate(errp, local_err);
1960 }
1961 }
1962
1963 void qmp_guest_suspend_disk(Error **errp)
1964 {
1965 guest_suspend(SUSPEND_MODE_DISK, errp);
1966 }
1967
1968 void qmp_guest_suspend_ram(Error **errp)
1969 {
1970 guest_suspend(SUSPEND_MODE_RAM, errp);
1971 }
1972
1973 void qmp_guest_suspend_hybrid(Error **errp)
1974 {
1975 guest_suspend(SUSPEND_MODE_HYBRID, errp);
1976 }
1977
1978 /* Transfer online/offline status between @vcpu and the guest system.
1979 *
1980 * On input either @errp or *@errp must be NULL.
1981 *
1982 * In system-to-@vcpu direction, the following @vcpu fields are accessed:
1983 * - R: vcpu->logical_id
1984 * - W: vcpu->online
1985 * - W: vcpu->can_offline
1986 *
1987 * In @vcpu-to-system direction, the following @vcpu fields are accessed:
1988 * - R: vcpu->logical_id
1989 * - R: vcpu->online
1990 *
1991 * Written members remain unmodified on error.
1992 */
1993 static void transfer_vcpu(GuestLogicalProcessor *vcpu, bool sys2vcpu,
1994 char *dirpath, Error **errp)
1995 {
1996 int fd;
1997 int res;
1998 int dirfd;
1999 static const char fn[] = "online";
2000
2001 dirfd = open(dirpath, O_RDONLY | O_DIRECTORY);
2002 if (dirfd == -1) {
2003 error_setg_errno(errp, errno, "open(\"%s\")", dirpath);
2004 return;
2005 }
2006
2007 fd = openat(dirfd, fn, sys2vcpu ? O_RDONLY : O_RDWR);
2008 if (fd == -1) {
2009 if (errno != ENOENT) {
2010 error_setg_errno(errp, errno, "open(\"%s/%s\")", dirpath, fn);
2011 } else if (sys2vcpu) {
2012 vcpu->online = true;
2013 vcpu->can_offline = false;
2014 } else if (!vcpu->online) {
2015 error_setg(errp, "logical processor #%" PRId64 " can't be "
2016 "offlined", vcpu->logical_id);
2017 } /* otherwise pretend successful re-onlining */
2018 } else {
2019 unsigned char status;
2020
2021 res = pread(fd, &status, 1, 0);
2022 if (res == -1) {
2023 error_setg_errno(errp, errno, "pread(\"%s/%s\")", dirpath, fn);
2024 } else if (res == 0) {
2025 error_setg(errp, "pread(\"%s/%s\"): unexpected EOF", dirpath,
2026 fn);
2027 } else if (sys2vcpu) {
2028 vcpu->online = (status != '0');
2029 vcpu->can_offline = true;
2030 } else if (vcpu->online != (status != '0')) {
2031 status = '0' + vcpu->online;
2032 if (pwrite(fd, &status, 1, 0) == -1) {
2033 error_setg_errno(errp, errno, "pwrite(\"%s/%s\")", dirpath,
2034 fn);
2035 }
2036 } /* otherwise pretend successful re-(on|off)-lining */
2037
2038 res = close(fd);
2039 g_assert(res == 0);
2040 }
2041
2042 res = close(dirfd);
2043 g_assert(res == 0);
2044 }
2045
2046 GuestLogicalProcessorList *qmp_guest_get_vcpus(Error **errp)
2047 {
2048 GuestLogicalProcessorList *head, **tail;
2049 const char *cpu_dir = "/sys/devices/system/cpu";
2050 const gchar *line;
2051 g_autoptr(GDir) cpu_gdir = NULL;
2052 Error *local_err = NULL;
2053
2054 head = NULL;
2055 tail = &head;
2056 cpu_gdir = g_dir_open(cpu_dir, 0, NULL);
2057
2058 if (cpu_gdir == NULL) {
2059 error_setg_errno(errp, errno, "failed to list entries: %s", cpu_dir);
2060 return NULL;
2061 }
2062
2063 while (local_err == NULL && (line = g_dir_read_name(cpu_gdir)) != NULL) {
2064 GuestLogicalProcessor *vcpu;
2065 int64_t id;
2066 if (sscanf(line, "cpu%" PRId64, &id)) {
2067 g_autofree char *path = g_strdup_printf("/sys/devices/system/cpu/"
2068 "cpu%" PRId64 "/", id);
2069 vcpu = g_malloc0(sizeof *vcpu);
2070 vcpu->logical_id = id;
2071 vcpu->has_can_offline = true; /* lolspeak ftw */
2072 transfer_vcpu(vcpu, true, path, &local_err);
2073 QAPI_LIST_APPEND(tail, vcpu);
2074 }
2075 }
2076
2077 if (local_err == NULL) {
2078 /* there's no guest with zero VCPUs */
2079 g_assert(head != NULL);
2080 return head;
2081 }
2082
2083 qapi_free_GuestLogicalProcessorList(head);
2084 error_propagate(errp, local_err);
2085 return NULL;
2086 }
2087
2088 int64_t qmp_guest_set_vcpus(GuestLogicalProcessorList *vcpus, Error **errp)
2089 {
2090 int64_t processed;
2091 Error *local_err = NULL;
2092
2093 processed = 0;
2094 while (vcpus != NULL) {
2095 char *path = g_strdup_printf("/sys/devices/system/cpu/cpu%" PRId64 "/",
2096 vcpus->value->logical_id);
2097
2098 transfer_vcpu(vcpus->value, false, path, &local_err);
2099 g_free(path);
2100 if (local_err != NULL) {
2101 break;
2102 }
2103 ++processed;
2104 vcpus = vcpus->next;
2105 }
2106
2107 if (local_err != NULL) {
2108 if (processed == 0) {
2109 error_propagate(errp, local_err);
2110 } else {
2111 error_free(local_err);
2112 }
2113 }
2114
2115 return processed;
2116 }
2117 #endif /* __linux__ */
2118
2119 #if defined(__linux__) || defined(__FreeBSD__)
2120 void qmp_guest_set_user_password(const char *username,
2121 const char *password,
2122 bool crypted,
2123 Error **errp)
2124 {
2125 Error *local_err = NULL;
2126 char *passwd_path = NULL;
2127 pid_t pid;
2128 int status;
2129 int datafd[2] = { -1, -1 };
2130 char *rawpasswddata = NULL;
2131 size_t rawpasswdlen;
2132 char *chpasswddata = NULL;
2133 size_t chpasswdlen;
2134
2135 rawpasswddata = (char *)qbase64_decode(password, -1, &rawpasswdlen, errp);
2136 if (!rawpasswddata) {
2137 return;
2138 }
2139 rawpasswddata = g_renew(char, rawpasswddata, rawpasswdlen + 1);
2140 rawpasswddata[rawpasswdlen] = '\0';
2141
2142 if (strchr(rawpasswddata, '\n')) {
2143 error_setg(errp, "forbidden characters in raw password");
2144 goto out;
2145 }
2146
2147 if (strchr(username, '\n') ||
2148 strchr(username, ':')) {
2149 error_setg(errp, "forbidden characters in username");
2150 goto out;
2151 }
2152
2153 #ifdef __FreeBSD__
2154 chpasswddata = g_strdup(rawpasswddata);
2155 passwd_path = g_find_program_in_path("pw");
2156 #else
2157 chpasswddata = g_strdup_printf("%s:%s\n", username, rawpasswddata);
2158 passwd_path = g_find_program_in_path("chpasswd");
2159 #endif
2160
2161 chpasswdlen = strlen(chpasswddata);
2162
2163 if (!passwd_path) {
2164 error_setg(errp, "cannot find 'passwd' program in PATH");
2165 goto out;
2166 }
2167
2168 if (!g_unix_open_pipe(datafd, FD_CLOEXEC, NULL)) {
2169 error_setg(errp, "cannot create pipe FDs");
2170 goto out;
2171 }
2172
2173 pid = fork();
2174 if (pid == 0) {
2175 close(datafd[1]);
2176 /* child */
2177 setsid();
2178 dup2(datafd[0], 0);
2179 reopen_fd_to_null(1);
2180 reopen_fd_to_null(2);
2181
2182 #ifdef __FreeBSD__
2183 const char *h_arg;
2184 h_arg = (crypted) ? "-H" : "-h";
2185 execl(passwd_path, "pw", "usermod", "-n", username, h_arg, "0", NULL);
2186 #else
2187 if (crypted) {
2188 execl(passwd_path, "chpasswd", "-e", NULL);
2189 } else {
2190 execl(passwd_path, "chpasswd", NULL);
2191 }
2192 #endif
2193 _exit(EXIT_FAILURE);
2194 } else if (pid < 0) {
2195 error_setg_errno(errp, errno, "failed to create child process");
2196 goto out;
2197 }
2198 close(datafd[0]);
2199 datafd[0] = -1;
2200
2201 if (qemu_write_full(datafd[1], chpasswddata, chpasswdlen) != chpasswdlen) {
2202 error_setg_errno(errp, errno, "cannot write new account password");
2203 goto out;
2204 }
2205 close(datafd[1]);
2206 datafd[1] = -1;
2207
2208 ga_wait_child(pid, &status, &local_err);
2209 if (local_err) {
2210 error_propagate(errp, local_err);
2211 goto out;
2212 }
2213
2214 if (!WIFEXITED(status)) {
2215 error_setg(errp, "child process has terminated abnormally");
2216 goto out;
2217 }
2218
2219 if (WEXITSTATUS(status)) {
2220 error_setg(errp, "child process has failed to set user password");
2221 goto out;
2222 }
2223
2224 out:
2225 g_free(chpasswddata);
2226 g_free(rawpasswddata);
2227 g_free(passwd_path);
2228 if (datafd[0] != -1) {
2229 close(datafd[0]);
2230 }
2231 if (datafd[1] != -1) {
2232 close(datafd[1]);
2233 }
2234 }
2235 #else /* __linux__ || __FreeBSD__ */
2236 void qmp_guest_set_user_password(const char *username,
2237 const char *password,
2238 bool crypted,
2239 Error **errp)
2240 {
2241 error_setg(errp, QERR_UNSUPPORTED);
2242 }
2243 #endif /* __linux__ || __FreeBSD__ */
2244
2245 #ifdef __linux__
2246 static void ga_read_sysfs_file(int dirfd, const char *pathname, char *buf,
2247 int size, Error **errp)
2248 {
2249 int fd;
2250 int res;
2251
2252 errno = 0;
2253 fd = openat(dirfd, pathname, O_RDONLY);
2254 if (fd == -1) {
2255 error_setg_errno(errp, errno, "open sysfs file \"%s\"", pathname);
2256 return;
2257 }
2258
2259 res = pread(fd, buf, size, 0);
2260 if (res == -1) {
2261 error_setg_errno(errp, errno, "pread sysfs file \"%s\"", pathname);
2262 } else if (res == 0) {
2263 error_setg(errp, "pread sysfs file \"%s\": unexpected EOF", pathname);
2264 }
2265 close(fd);
2266 }
2267
2268 static void ga_write_sysfs_file(int dirfd, const char *pathname,
2269 const char *buf, int size, Error **errp)
2270 {
2271 int fd;
2272
2273 errno = 0;
2274 fd = openat(dirfd, pathname, O_WRONLY);
2275 if (fd == -1) {
2276 error_setg_errno(errp, errno, "open sysfs file \"%s\"", pathname);
2277 return;
2278 }
2279
2280 if (pwrite(fd, buf, size, 0) == -1) {
2281 error_setg_errno(errp, errno, "pwrite sysfs file \"%s\"", pathname);
2282 }
2283
2284 close(fd);
2285 }
2286
2287 /* Transfer online/offline status between @mem_blk and the guest system.
2288 *
2289 * On input either @errp or *@errp must be NULL.
2290 *
2291 * In system-to-@mem_blk direction, the following @mem_blk fields are accessed:
2292 * - R: mem_blk->phys_index
2293 * - W: mem_blk->online
2294 * - W: mem_blk->can_offline
2295 *
2296 * In @mem_blk-to-system direction, the following @mem_blk fields are accessed:
2297 * - R: mem_blk->phys_index
2298 * - R: mem_blk->online
2299 *- R: mem_blk->can_offline
2300 * Written members remain unmodified on error.
2301 */
2302 static void transfer_memory_block(GuestMemoryBlock *mem_blk, bool sys2memblk,
2303 GuestMemoryBlockResponse *result,
2304 Error **errp)
2305 {
2306 char *dirpath;
2307 int dirfd;
2308 char *status;
2309 Error *local_err = NULL;
2310
2311 if (!sys2memblk) {
2312 DIR *dp;
2313
2314 if (!result) {
2315 error_setg(errp, "Internal error, 'result' should not be NULL");
2316 return;
2317 }
2318 errno = 0;
2319 dp = opendir("/sys/devices/system/memory/");
2320 /* if there is no 'memory' directory in sysfs,
2321 * we think this VM does not support online/offline memory block,
2322 * any other solution?
2323 */
2324 if (!dp) {
2325 if (errno == ENOENT) {
2326 result->response =
2327 GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_NOT_SUPPORTED;
2328 }
2329 goto out1;
2330 }
2331 closedir(dp);
2332 }
2333
2334 dirpath = g_strdup_printf("/sys/devices/system/memory/memory%" PRId64 "/",
2335 mem_blk->phys_index);
2336 dirfd = open(dirpath, O_RDONLY | O_DIRECTORY);
2337 if (dirfd == -1) {
2338 if (sys2memblk) {
2339 error_setg_errno(errp, errno, "open(\"%s\")", dirpath);
2340 } else {
2341 if (errno == ENOENT) {
2342 result->response = GUEST_MEMORY_BLOCK_RESPONSE_TYPE_NOT_FOUND;
2343 } else {
2344 result->response =
2345 GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_FAILED;
2346 }
2347 }
2348 g_free(dirpath);
2349 goto out1;
2350 }
2351 g_free(dirpath);
2352
2353 status = g_malloc0(10);
2354 ga_read_sysfs_file(dirfd, "state", status, 10, &local_err);
2355 if (local_err) {
2356 /* treat with sysfs file that not exist in old kernel */
2357 if (errno == ENOENT) {
2358 error_free(local_err);
2359 if (sys2memblk) {
2360 mem_blk->online = true;
2361 mem_blk->can_offline = false;
2362 } else if (!mem_blk->online) {
2363 result->response =
2364 GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_NOT_SUPPORTED;
2365 }
2366 } else {
2367 if (sys2memblk) {
2368 error_propagate(errp, local_err);
2369 } else {
2370 error_free(local_err);
2371 result->response =
2372 GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_FAILED;
2373 }
2374 }
2375 goto out2;
2376 }
2377
2378 if (sys2memblk) {
2379 char removable = '0';
2380
2381 mem_blk->online = (strncmp(status, "online", 6) == 0);
2382
2383 ga_read_sysfs_file(dirfd, "removable", &removable, 1, &local_err);
2384 if (local_err) {
2385 /* if no 'removable' file, it doesn't support offline mem blk */
2386 if (errno == ENOENT) {
2387 error_free(local_err);
2388 mem_blk->can_offline = false;
2389 } else {
2390 error_propagate(errp, local_err);
2391 }
2392 } else {
2393 mem_blk->can_offline = (removable != '0');
2394 }
2395 } else {
2396 if (mem_blk->online != (strncmp(status, "online", 6) == 0)) {
2397 const char *new_state = mem_blk->online ? "online" : "offline";
2398
2399 ga_write_sysfs_file(dirfd, "state", new_state, strlen(new_state),
2400 &local_err);
2401 if (local_err) {
2402 error_free(local_err);
2403 result->response =
2404 GUEST_MEMORY_BLOCK_RESPONSE_TYPE_OPERATION_FAILED;
2405 goto out2;
2406 }
2407
2408 result->response = GUEST_MEMORY_BLOCK_RESPONSE_TYPE_SUCCESS;
2409 result->has_error_code = false;
2410 } /* otherwise pretend successful re-(on|off)-lining */
2411 }
2412 g_free(status);
2413 close(dirfd);
2414 return;
2415
2416 out2:
2417 g_free(status);
2418 close(dirfd);
2419 out1:
2420 if (!sys2memblk) {
2421 result->has_error_code = true;
2422 result->error_code = errno;
2423 }
2424 }
2425
2426 GuestMemoryBlockList *qmp_guest_get_memory_blocks(Error **errp)
2427 {
2428 GuestMemoryBlockList *head, **tail;
2429 Error *local_err = NULL;
2430 struct dirent *de;
2431 DIR *dp;
2432
2433 head = NULL;
2434 tail = &head;
2435
2436 dp = opendir("/sys/devices/system/memory/");
2437 if (!dp) {
2438 /* it's ok if this happens to be a system that doesn't expose
2439 * memory blocks via sysfs, but otherwise we should report
2440 * an error
2441 */
2442 if (errno != ENOENT) {
2443 error_setg_errno(errp, errno, "Can't open directory"
2444 "\"/sys/devices/system/memory/\"");
2445 }
2446 return NULL;
2447 }
2448
2449 /* Note: the phys_index of memory block may be discontinuous,
2450 * this is because a memblk is the unit of the Sparse Memory design, which
2451 * allows discontinuous memory ranges (ex. NUMA), so here we should
2452 * traverse the memory block directory.
2453 */
2454 while ((de = readdir(dp)) != NULL) {
2455 GuestMemoryBlock *mem_blk;
2456
2457 if ((strncmp(de->d_name, "memory", 6) != 0) ||
2458 !(de->d_type & DT_DIR)) {
2459 continue;
2460 }
2461
2462 mem_blk = g_malloc0(sizeof *mem_blk);
2463 /* The d_name is "memoryXXX", phys_index is block id, same as XXX */
2464 mem_blk->phys_index = strtoul(&de->d_name[6], NULL, 10);
2465 mem_blk->has_can_offline = true; /* lolspeak ftw */
2466 transfer_memory_block(mem_blk, true, NULL, &local_err);
2467 if (local_err) {
2468 break;
2469 }
2470
2471 QAPI_LIST_APPEND(tail, mem_blk);
2472 }
2473
2474 closedir(dp);
2475 if (local_err == NULL) {
2476 /* there's no guest with zero memory blocks */
2477 if (head == NULL) {
2478 error_setg(errp, "guest reported zero memory blocks!");
2479 }
2480 return head;
2481 }
2482
2483 qapi_free_GuestMemoryBlockList(head);
2484 error_propagate(errp, local_err);
2485 return NULL;
2486 }
2487
2488 GuestMemoryBlockResponseList *
2489 qmp_guest_set_memory_blocks(GuestMemoryBlockList *mem_blks, Error **errp)
2490 {
2491 GuestMemoryBlockResponseList *head, **tail;
2492 Error *local_err = NULL;
2493
2494 head = NULL;
2495 tail = &head;
2496
2497 while (mem_blks != NULL) {
2498 GuestMemoryBlockResponse *result;
2499 GuestMemoryBlock *current_mem_blk = mem_blks->value;
2500
2501 result = g_malloc0(sizeof(*result));
2502 result->phys_index = current_mem_blk->phys_index;
2503 transfer_memory_block(current_mem_blk, false, result, &local_err);
2504 if (local_err) { /* should never happen */
2505 goto err;
2506 }
2507
2508 QAPI_LIST_APPEND(tail, result);
2509 mem_blks = mem_blks->next;
2510 }
2511
2512 return head;
2513 err:
2514 qapi_free_GuestMemoryBlockResponseList(head);
2515 error_propagate(errp, local_err);
2516 return NULL;
2517 }
2518
2519 GuestMemoryBlockInfo *qmp_guest_get_memory_block_info(Error **errp)
2520 {
2521 Error *local_err = NULL;
2522 char *dirpath;
2523 int dirfd;
2524 char *buf;
2525 GuestMemoryBlockInfo *info;
2526
2527 dirpath = g_strdup_printf("/sys/devices/system/memory/");
2528 dirfd = open(dirpath, O_RDONLY | O_DIRECTORY);
2529 if (dirfd == -1) {
2530 error_setg_errno(errp, errno, "open(\"%s\")", dirpath);
2531 g_free(dirpath);
2532 return NULL;
2533 }
2534 g_free(dirpath);
2535
2536 buf = g_malloc0(20);
2537 ga_read_sysfs_file(dirfd, "block_size_bytes", buf, 20, &local_err);
2538 close(dirfd);
2539 if (local_err) {
2540 g_free(buf);
2541 error_propagate(errp, local_err);
2542 return NULL;
2543 }
2544
2545 info = g_new0(GuestMemoryBlockInfo, 1);
2546 info->size = strtol(buf, NULL, 16); /* the unit is bytes */
2547
2548 g_free(buf);
2549
2550 return info;
2551 }
2552
2553 #define MAX_NAME_LEN 128
2554 static GuestDiskStatsInfoList *guest_get_diskstats(Error **errp)
2555 {
2556 #ifdef CONFIG_LINUX
2557 GuestDiskStatsInfoList *head = NULL, **tail = &head;
2558 const char *diskstats = "/proc/diskstats";
2559 FILE *fp;
2560 size_t n;
2561 char *line = NULL;
2562
2563 fp = fopen(diskstats, "r");
2564 if (fp == NULL) {
2565 error_setg_errno(errp, errno, "open(\"%s\")", diskstats);
2566 return NULL;
2567 }
2568
2569 while (getline(&line, &n, fp) != -1) {
2570 g_autofree GuestDiskStatsInfo *diskstatinfo = NULL;
2571 g_autofree GuestDiskStats *diskstat = NULL;
2572 char dev_name[MAX_NAME_LEN];
2573 unsigned int ios_pgr, tot_ticks, rq_ticks, wr_ticks, dc_ticks, fl_ticks;
2574 unsigned long rd_ios, rd_merges_or_rd_sec, rd_ticks_or_wr_sec, wr_ios;
2575 unsigned long wr_merges, rd_sec_or_wr_ios, wr_sec;
2576 unsigned long dc_ios, dc_merges, dc_sec, fl_ios;
2577 unsigned int major, minor;
2578 int i;
2579
2580 i = sscanf(line, "%u %u %s %lu %lu %lu"
2581 "%lu %lu %lu %lu %u %u %u %u"
2582 "%lu %lu %lu %u %lu %u",
2583 &major, &minor, dev_name,
2584 &rd_ios, &rd_merges_or_rd_sec, &rd_sec_or_wr_ios,
2585 &rd_ticks_or_wr_sec, &wr_ios, &wr_merges, &wr_sec,
2586 &wr_ticks, &ios_pgr, &tot_ticks, &rq_ticks,
2587 &dc_ios, &dc_merges, &dc_sec, &dc_ticks,
2588 &fl_ios, &fl_ticks);
2589
2590 if (i < 7) {
2591 continue;
2592 }
2593
2594 diskstatinfo = g_new0(GuestDiskStatsInfo, 1);
2595 diskstatinfo->name = g_strdup(dev_name);
2596 diskstatinfo->major = major;
2597 diskstatinfo->minor = minor;
2598
2599 diskstat = g_new0(GuestDiskStats, 1);
2600 if (i == 7) {
2601 diskstat->has_read_ios = true;
2602 diskstat->read_ios = rd_ios;
2603 diskstat->has_read_sectors = true;
2604 diskstat->read_sectors = rd_merges_or_rd_sec;
2605 diskstat->has_write_ios = true;
2606 diskstat->write_ios = rd_sec_or_wr_ios;
2607 diskstat->has_write_sectors = true;
2608 diskstat->write_sectors = rd_ticks_or_wr_sec;
2609 }
2610 if (i >= 14) {
2611 diskstat->has_read_ios = true;
2612 diskstat->read_ios = rd_ios;
2613 diskstat->has_read_sectors = true;
2614 diskstat->read_sectors = rd_sec_or_wr_ios;
2615 diskstat->has_read_merges = true;
2616 diskstat->read_merges = rd_merges_or_rd_sec;
2617 diskstat->has_read_ticks = true;
2618 diskstat->read_ticks = rd_ticks_or_wr_sec;
2619 diskstat->has_write_ios = true;
2620 diskstat->write_ios = wr_ios;
2621 diskstat->has_write_sectors = true;
2622 diskstat->write_sectors = wr_sec;
2623 diskstat->has_write_merges = true;
2624 diskstat->write_merges = wr_merges;
2625 diskstat->has_write_ticks = true;
2626 diskstat->write_ticks = wr_ticks;
2627 diskstat->has_ios_pgr = true;
2628 diskstat->ios_pgr = ios_pgr;
2629 diskstat->has_total_ticks = true;
2630 diskstat->total_ticks = tot_ticks;
2631 diskstat->has_weight_ticks = true;
2632 diskstat->weight_ticks = rq_ticks;
2633 }
2634 if (i >= 18) {
2635 diskstat->has_discard_ios = true;
2636 diskstat->discard_ios = dc_ios;
2637 diskstat->has_discard_merges = true;
2638 diskstat->discard_merges = dc_merges;
2639 diskstat->has_discard_sectors = true;
2640 diskstat->discard_sectors = dc_sec;
2641 diskstat->has_discard_ticks = true;
2642 diskstat->discard_ticks = dc_ticks;
2643 }
2644 if (i >= 20) {
2645 diskstat->has_flush_ios = true;
2646 diskstat->flush_ios = fl_ios;
2647 diskstat->has_flush_ticks = true;
2648 diskstat->flush_ticks = fl_ticks;
2649 }
2650
2651 diskstatinfo->stats = g_steal_pointer(&diskstat);
2652 QAPI_LIST_APPEND(tail, diskstatinfo);
2653 diskstatinfo = NULL;
2654 }
2655 free(line);
2656 fclose(fp);
2657 return head;
2658 #else
2659 g_debug("disk stats reporting available only for Linux");
2660 return NULL;
2661 #endif
2662 }
2663
2664 GuestDiskStatsInfoList *qmp_guest_get_diskstats(Error **errp)
2665 {
2666 return guest_get_diskstats(errp);
2667 }
2668
2669 GuestCpuStatsList *qmp_guest_get_cpustats(Error **errp)
2670 {
2671 GuestCpuStatsList *head = NULL, **tail = &head;
2672 const char *cpustats = "/proc/stat";
2673 int clk_tck = sysconf(_SC_CLK_TCK);
2674 FILE *fp;
2675 size_t n;
2676 char *line = NULL;
2677
2678 fp = fopen(cpustats, "r");
2679 if (fp == NULL) {
2680 error_setg_errno(errp, errno, "open(\"%s\")", cpustats);
2681 return NULL;
2682 }
2683
2684 while (getline(&line, &n, fp) != -1) {
2685 GuestCpuStats *cpustat = NULL;
2686 GuestLinuxCpuStats *linuxcpustat;
2687 int i;
2688 unsigned long user, system, idle, iowait, irq, softirq, steal, guest;
2689 unsigned long nice, guest_nice;
2690 char name[64];
2691
2692 i = sscanf(line, "%s %lu %lu %lu %lu %lu %lu %lu %lu %lu %lu",
2693 name, &user, &nice, &system, &idle, &iowait, &irq, &softirq,
2694 &steal, &guest, &guest_nice);
2695
2696 /* drop "cpu 1 2 3 ...", get "cpuX 1 2 3 ..." only */
2697 if ((i == EOF) || strncmp(name, "cpu", 3) || (name[3] == '\0')) {
2698 continue;
2699 }
2700
2701 if (i < 5) {
2702 slog("Parsing cpu stat from %s failed, see \"man proc\"", cpustats);
2703 break;
2704 }
2705
2706 cpustat = g_new0(GuestCpuStats, 1);
2707 cpustat->type = GUEST_CPU_STATS_TYPE_LINUX;
2708
2709 linuxcpustat = &cpustat->u.q_linux;
2710 linuxcpustat->cpu = atoi(&name[3]);
2711 linuxcpustat->user = user * 1000 / clk_tck;
2712 linuxcpustat->nice = nice * 1000 / clk_tck;
2713 linuxcpustat->system = system * 1000 / clk_tck;
2714 linuxcpustat->idle = idle * 1000 / clk_tck;
2715
2716 if (i > 5) {
2717 linuxcpustat->has_iowait = true;
2718 linuxcpustat->iowait = iowait * 1000 / clk_tck;
2719 }
2720
2721 if (i > 6) {
2722 linuxcpustat->has_irq = true;
2723 linuxcpustat->irq = irq * 1000 / clk_tck;
2724 linuxcpustat->has_softirq = true;
2725 linuxcpustat->softirq = softirq * 1000 / clk_tck;
2726 }
2727
2728 if (i > 8) {
2729 linuxcpustat->has_steal = true;
2730 linuxcpustat->steal = steal * 1000 / clk_tck;
2731 }
2732
2733 if (i > 9) {
2734 linuxcpustat->has_guest = true;
2735 linuxcpustat->guest = guest * 1000 / clk_tck;
2736 }
2737
2738 if (i > 10) {
2739 linuxcpustat->has_guest = true;
2740 linuxcpustat->guest = guest * 1000 / clk_tck;
2741 linuxcpustat->has_guestnice = true;
2742 linuxcpustat->guestnice = guest_nice * 1000 / clk_tck;
2743 }
2744
2745 QAPI_LIST_APPEND(tail, cpustat);
2746 }
2747
2748 free(line);
2749 fclose(fp);
2750 return head;
2751 }
2752
2753 #else /* defined(__linux__) */
2754
2755 void qmp_guest_suspend_disk(Error **errp)
2756 {
2757 error_setg(errp, QERR_UNSUPPORTED);
2758 }
2759
2760 void qmp_guest_suspend_ram(Error **errp)
2761 {
2762 error_setg(errp, QERR_UNSUPPORTED);
2763 }
2764
2765 void qmp_guest_suspend_hybrid(Error **errp)
2766 {
2767 error_setg(errp, QERR_UNSUPPORTED);
2768 }
2769
2770 GuestLogicalProcessorList *qmp_guest_get_vcpus(Error **errp)
2771 {
2772 error_setg(errp, QERR_UNSUPPORTED);
2773 return NULL;
2774 }
2775
2776 int64_t qmp_guest_set_vcpus(GuestLogicalProcessorList *vcpus, Error **errp)
2777 {
2778 error_setg(errp, QERR_UNSUPPORTED);
2779 return -1;
2780 }
2781
2782 GuestMemoryBlockList *qmp_guest_get_memory_blocks(Error **errp)
2783 {
2784 error_setg(errp, QERR_UNSUPPORTED);
2785 return NULL;
2786 }
2787
2788 GuestMemoryBlockResponseList *
2789 qmp_guest_set_memory_blocks(GuestMemoryBlockList *mem_blks, Error **errp)
2790 {
2791 error_setg(errp, QERR_UNSUPPORTED);
2792 return NULL;
2793 }
2794
2795 GuestMemoryBlockInfo *qmp_guest_get_memory_block_info(Error **errp)
2796 {
2797 error_setg(errp, QERR_UNSUPPORTED);
2798 return NULL;
2799 }
2800
2801 #endif
2802
2803 #ifdef HAVE_GETIFADDRS
2804 static GuestNetworkInterface *
2805 guest_find_interface(GuestNetworkInterfaceList *head,
2806 const char *name)
2807 {
2808 for (; head; head = head->next) {
2809 if (strcmp(head->value->name, name) == 0) {
2810 return head->value;
2811 }
2812 }
2813
2814 return NULL;
2815 }
2816
2817 static int guest_get_network_stats(const char *name,
2818 GuestNetworkInterfaceStat *stats)
2819 {
2820 #ifdef CONFIG_LINUX
2821 int name_len;
2822 char const *devinfo = "/proc/net/dev";
2823 FILE *fp;
2824 char *line = NULL, *colon;
2825 size_t n = 0;
2826 fp = fopen(devinfo, "r");
2827 if (!fp) {
2828 g_debug("failed to open network stats %s: %s", devinfo,
2829 g_strerror(errno));
2830 return -1;
2831 }
2832 name_len = strlen(name);
2833 while (getline(&line, &n, fp) != -1) {
2834 long long dummy;
2835 long long rx_bytes;
2836 long long rx_packets;
2837 long long rx_errs;
2838 long long rx_dropped;
2839 long long tx_bytes;
2840 long long tx_packets;
2841 long long tx_errs;
2842 long long tx_dropped;
2843 char *trim_line;
2844 trim_line = g_strchug(line);
2845 if (trim_line[0] == '\0') {
2846 continue;
2847 }
2848 colon = strchr(trim_line, ':');
2849 if (!colon) {
2850 continue;
2851 }
2852 if (colon - name_len == trim_line &&
2853 strncmp(trim_line, name, name_len) == 0) {
2854 if (sscanf(colon + 1,
2855 "%lld %lld %lld %lld %lld %lld %lld %lld %lld %lld %lld %lld %lld %lld %lld %lld",
2856 &rx_bytes, &rx_packets, &rx_errs, &rx_dropped,
2857 &dummy, &dummy, &dummy, &dummy,
2858 &tx_bytes, &tx_packets, &tx_errs, &tx_dropped,
2859 &dummy, &dummy, &dummy, &dummy) != 16) {
2860 continue;
2861 }
2862 stats->rx_bytes = rx_bytes;
2863 stats->rx_packets = rx_packets;
2864 stats->rx_errs = rx_errs;
2865 stats->rx_dropped = rx_dropped;
2866 stats->tx_bytes = tx_bytes;
2867 stats->tx_packets = tx_packets;
2868 stats->tx_errs = tx_errs;
2869 stats->tx_dropped = tx_dropped;
2870 fclose(fp);
2871 g_free(line);
2872 return 0;
2873 }
2874 }
2875 fclose(fp);
2876 g_free(line);
2877 g_debug("/proc/net/dev: Interface '%s' not found", name);
2878 #else /* !CONFIG_LINUX */
2879 g_debug("Network stats reporting available only for Linux");
2880 #endif /* !CONFIG_LINUX */
2881 return -1;
2882 }
2883
2884 #ifndef CONFIG_BSD
2885 /*
2886 * Fill "buf" with MAC address by ifaddrs. Pointer buf must point to a
2887 * buffer with ETHER_ADDR_LEN length at least.
2888 *
2889 * Returns false in case of an error, otherwise true. "obtained" argument
2890 * is true if a MAC address was obtained successful, otherwise false.
2891 */
2892 bool guest_get_hw_addr(struct ifaddrs *ifa, unsigned char *buf,
2893 bool *obtained, Error **errp)
2894 {
2895 struct ifreq ifr;
2896 int sock;
2897
2898 *obtained = false;
2899
2900 /* we haven't obtained HW address yet */
2901 sock = socket(PF_INET, SOCK_STREAM, 0);
2902 if (sock == -1) {
2903 error_setg_errno(errp, errno, "failed to create socket");
2904 return false;
2905 }
2906
2907 memset(&ifr, 0, sizeof(ifr));
2908 pstrcpy(ifr.ifr_name, IF_NAMESIZE, ifa->ifa_name);
2909 if (ioctl(sock, SIOCGIFHWADDR, &ifr) == -1) {
2910 /*
2911 * We can't get the hw addr of this interface, but that's not a
2912 * fatal error.
2913 */
2914 if (errno == EADDRNOTAVAIL) {
2915 /* The interface doesn't have a hw addr (e.g. loopback). */
2916 g_debug("failed to get MAC address of %s: %s",
2917 ifa->ifa_name, strerror(errno));
2918 } else{
2919 g_warning("failed to get MAC address of %s: %s",
2920 ifa->ifa_name, strerror(errno));
2921 }
2922 } else {
2923 #ifdef CONFIG_SOLARIS
2924 memcpy(buf, &ifr.ifr_addr.sa_data, ETHER_ADDR_LEN);
2925 #else
2926 memcpy(buf, &ifr.ifr_hwaddr.sa_data, ETHER_ADDR_LEN);
2927 #endif
2928 *obtained = true;
2929 }
2930 close(sock);
2931 return true;
2932 }
2933 #endif /* CONFIG_BSD */
2934
2935 /*
2936 * Build information about guest interfaces
2937 */
2938 GuestNetworkInterfaceList *qmp_guest_network_get_interfaces(Error **errp)
2939 {
2940 GuestNetworkInterfaceList *head = NULL, **tail = &head;
2941 struct ifaddrs *ifap, *ifa;
2942
2943 if (getifaddrs(&ifap) < 0) {
2944 error_setg_errno(errp, errno, "getifaddrs failed");
2945 goto error;
2946 }
2947
2948 for (ifa = ifap; ifa; ifa = ifa->ifa_next) {
2949 GuestNetworkInterface *info;
2950 GuestIpAddressList **address_tail;
2951 GuestIpAddress *address_item = NULL;
2952 GuestNetworkInterfaceStat *interface_stat = NULL;
2953 char addr4[INET_ADDRSTRLEN];
2954 char addr6[INET6_ADDRSTRLEN];
2955 unsigned char mac_addr[ETHER_ADDR_LEN];
2956 bool obtained;
2957 void *p;
2958
2959 g_debug("Processing %s interface", ifa->ifa_name);
2960
2961 info = guest_find_interface(head, ifa->ifa_name);
2962
2963 if (!info) {
2964 info = g_malloc0(sizeof(*info));
2965 info->name = g_strdup(ifa->ifa_name);
2966
2967 QAPI_LIST_APPEND(tail, info);
2968 }
2969
2970 if (!info->hardware_address) {
2971 if (!guest_get_hw_addr(ifa, mac_addr, &obtained, errp)) {
2972 goto error;
2973 }
2974 if (obtained) {
2975 info->hardware_address =
2976 g_strdup_printf("%02x:%02x:%02x:%02x:%02x:%02x",
2977 (int) mac_addr[0], (int) mac_addr[1],
2978 (int) mac_addr[2], (int) mac_addr[3],
2979 (int) mac_addr[4], (int) mac_addr[5]);
2980 }
2981 }
2982
2983 if (ifa->ifa_addr &&
2984 ifa->ifa_addr->sa_family == AF_INET) {
2985 /* interface with IPv4 address */
2986 p = &((struct sockaddr_in *)ifa->ifa_addr)->sin_addr;
2987 if (!inet_ntop(AF_INET, p, addr4, sizeof(addr4))) {
2988 error_setg_errno(errp, errno, "inet_ntop failed");
2989 goto error;
2990 }
2991
2992 address_item = g_malloc0(sizeof(*address_item));
2993 address_item->ip_address = g_strdup(addr4);
2994 address_item->ip_address_type = GUEST_IP_ADDRESS_TYPE_IPV4;
2995
2996 if (ifa->ifa_netmask) {
2997 /* Count the number of set bits in netmask.
2998 * This is safe as '1' and '0' cannot be shuffled in netmask. */
2999 p = &((struct sockaddr_in *)ifa->ifa_netmask)->sin_addr;
3000 address_item->prefix = ctpop32(((uint32_t *) p)[0]);
3001 }
3002 } else if (ifa->ifa_addr &&
3003 ifa->ifa_addr->sa_family == AF_INET6) {
3004 /* interface with IPv6 address */
3005 p = &((struct sockaddr_in6 *)ifa->ifa_addr)->sin6_addr;
3006 if (!inet_ntop(AF_INET6, p, addr6, sizeof(addr6))) {
3007 error_setg_errno(errp, errno, "inet_ntop failed");
3008 goto error;
3009 }
3010
3011 address_item = g_malloc0(sizeof(*address_item));
3012 address_item->ip_address = g_strdup(addr6);
3013 address_item->ip_address_type = GUEST_IP_ADDRESS_TYPE_IPV6;
3014
3015 if (ifa->ifa_netmask) {
3016 /* Count the number of set bits in netmask.
3017 * This is safe as '1' and '0' cannot be shuffled in netmask. */
3018 p = &((struct sockaddr_in6 *)ifa->ifa_netmask)->sin6_addr;
3019 address_item->prefix =
3020 ctpop32(((uint32_t *) p)[0]) +
3021 ctpop32(((uint32_t *) p)[1]) +
3022 ctpop32(((uint32_t *) p)[2]) +
3023 ctpop32(((uint32_t *) p)[3]);
3024 }
3025 }
3026
3027 if (!address_item) {
3028 continue;
3029 }
3030
3031 address_tail = &info->ip_addresses;
3032 while (*address_tail) {
3033 address_tail = &(*address_tail)->next;
3034 }
3035 QAPI_LIST_APPEND(address_tail, address_item);
3036
3037 info->has_ip_addresses = true;
3038
3039 if (!info->statistics) {
3040 interface_stat = g_malloc0(sizeof(*interface_stat));
3041 if (guest_get_network_stats(info->name, interface_stat) == -1) {
3042 g_free(interface_stat);
3043 } else {
3044 info->statistics = interface_stat;
3045 }
3046 }
3047 }
3048
3049 freeifaddrs(ifap);
3050 return head;
3051
3052 error:
3053 freeifaddrs(ifap);
3054 qapi_free_GuestNetworkInterfaceList(head);
3055 return NULL;
3056 }
3057
3058 #else
3059
3060 GuestNetworkInterfaceList *qmp_guest_network_get_interfaces(Error **errp)
3061 {
3062 error_setg(errp, QERR_UNSUPPORTED);
3063 return NULL;
3064 }
3065
3066 #endif /* HAVE_GETIFADDRS */
3067
3068 #if !defined(CONFIG_FSFREEZE)
3069
3070 GuestFilesystemInfoList *qmp_guest_get_fsinfo(Error **errp)
3071 {
3072 error_setg(errp, QERR_UNSUPPORTED);
3073 return NULL;
3074 }
3075
3076 GuestFsfreezeStatus qmp_guest_fsfreeze_status(Error **errp)
3077 {
3078 error_setg(errp, QERR_UNSUPPORTED);
3079
3080 return 0;
3081 }
3082
3083 int64_t qmp_guest_fsfreeze_freeze(Error **errp)
3084 {
3085 error_setg(errp, QERR_UNSUPPORTED);
3086
3087 return 0;
3088 }
3089
3090 int64_t qmp_guest_fsfreeze_freeze_list(bool has_mountpoints,
3091 strList *mountpoints,
3092 Error **errp)
3093 {
3094 error_setg(errp, QERR_UNSUPPORTED);
3095
3096 return 0;
3097 }
3098
3099 int64_t qmp_guest_fsfreeze_thaw(Error **errp)
3100 {
3101 error_setg(errp, QERR_UNSUPPORTED);
3102
3103 return 0;
3104 }
3105
3106 GuestDiskInfoList *qmp_guest_get_disks(Error **errp)
3107 {
3108 error_setg(errp, QERR_UNSUPPORTED);
3109 return NULL;
3110 }
3111
3112 GuestDiskStatsInfoList *qmp_guest_get_diskstats(Error **errp)
3113 {
3114 error_setg(errp, QERR_UNSUPPORTED);
3115 return NULL;
3116 }
3117
3118 GuestCpuStatsList *qmp_guest_get_cpustats(Error **errp)
3119 {
3120 error_setg(errp, QERR_UNSUPPORTED);
3121 return NULL;
3122 }
3123
3124 #endif /* CONFIG_FSFREEZE */
3125
3126 #if !defined(CONFIG_FSTRIM)
3127 GuestFilesystemTrimResponse *
3128 qmp_guest_fstrim(bool has_minimum, int64_t minimum, Error **errp)
3129 {
3130 error_setg(errp, QERR_UNSUPPORTED);
3131 return NULL;
3132 }
3133 #endif
3134
3135 /* add unsupported commands to the list of blocked RPCs */
3136 GList *ga_command_init_blockedrpcs(GList *blockedrpcs)
3137 {
3138 #if !defined(__linux__)
3139 {
3140 const char *list[] = {
3141 "guest-suspend-disk", "guest-suspend-ram",
3142 "guest-suspend-hybrid", "guest-get-vcpus", "guest-set-vcpus",
3143 "guest-get-memory-blocks", "guest-set-memory-blocks",
3144 "guest-get-memory-block-size", "guest-get-memory-block-info",
3145 NULL};
3146 char **p = (char **)list;
3147
3148 while (*p) {
3149 blockedrpcs = g_list_append(blockedrpcs, g_strdup(*p++));
3150 }
3151 }
3152 #endif
3153
3154 #if !defined(HAVE_GETIFADDRS)
3155 blockedrpcs = g_list_append(blockedrpcs,
3156 g_strdup("guest-network-get-interfaces"));
3157 #endif
3158
3159 #if !defined(CONFIG_FSFREEZE)
3160 {
3161 const char *list[] = {
3162 "guest-get-fsinfo", "guest-fsfreeze-status",
3163 "guest-fsfreeze-freeze", "guest-fsfreeze-freeze-list",
3164 "guest-fsfreeze-thaw", "guest-get-fsinfo",
3165 "guest-get-disks", NULL};
3166 char **p = (char **)list;
3167
3168 while (*p) {
3169 blockedrpcs = g_list_append(blockedrpcs, g_strdup(*p++));
3170 }
3171 }
3172 #endif
3173
3174 #if !defined(CONFIG_FSTRIM)
3175 blockedrpcs = g_list_append(blockedrpcs, g_strdup("guest-fstrim"));
3176 #endif
3177
3178 blockedrpcs = g_list_append(blockedrpcs, g_strdup("guest-get-devices"));
3179
3180 return blockedrpcs;
3181 }
3182
3183 /* register init/cleanup routines for stateful command groups */
3184 void ga_command_state_init(GAState *s, GACommandState *cs)
3185 {
3186 #if defined(CONFIG_FSFREEZE)
3187 ga_command_state_add(cs, NULL, guest_fsfreeze_cleanup);
3188 #endif
3189 }
3190
3191 #ifdef HAVE_UTMPX
3192
#define QGA_MICRO_SECOND_TO_SECOND 1000000

/*
 * Convert the ut_tv timestamp of @user_info into seconds, with the
 * microsecond part as the fraction.
 */
static double ga_get_login_time(struct utmpx *user_info)
{
    double whole = (double)user_info->ut_tv.tv_sec;
    double fraction = (double)user_info->ut_tv.tv_usec;

    fraction = fraction / QGA_MICRO_SECOND_TO_SECOND;
    return whole + fraction;
}
3202
3203 GuestUserList *qmp_guest_get_users(Error **errp)
3204 {
3205 GHashTable *cache = NULL;
3206 GuestUserList *head = NULL, **tail = &head;
3207 struct utmpx *user_info = NULL;
3208 gpointer value = NULL;
3209 GuestUser *user = NULL;
3210 double login_time = 0;
3211
3212 cache = g_hash_table_new(g_str_hash, g_str_equal);
3213 setutxent();
3214
3215 for (;;) {
3216 user_info = getutxent();
3217 if (user_info == NULL) {
3218 break;
3219 } else if (user_info->ut_type != USER_PROCESS) {
3220 continue;
3221 } else if (g_hash_table_contains(cache, user_info->ut_user)) {
3222 value = g_hash_table_lookup(cache, user_info->ut_user);
3223 user = (GuestUser *)value;
3224 login_time = ga_get_login_time(user_info);
3225 /* We're ensuring the earliest login time to be sent */
3226 if (login_time < user->login_time) {
3227 user->login_time = login_time;
3228 }
3229 continue;
3230 }
3231
3232 user = g_new0(GuestUser, 1);
3233 user->user = g_strdup(user_info->ut_user);
3234 user->login_time = ga_get_login_time(user_info);
3235
3236 g_hash_table_insert(cache, user->user, user);
3237
3238 QAPI_LIST_APPEND(tail, user);
3239 }
3240 endutxent();
3241 g_hash_table_destroy(cache);
3242 return head;
3243 }
3244
3245 #else
3246
3247 GuestUserList *qmp_guest_get_users(Error **errp)
3248 {
3249 error_setg(errp, QERR_UNSUPPORTED);
3250 return NULL;
3251 }
3252
3253 #endif
3254
/* Replace escaped special characters with their real values. The replacement
 * is done in place -- returned value is in the original string.
 *
 * A value that does not start with a single or double quote is cut at its
 * first space or semicolon.  A quoted value loses its quotes; inside it a
 * backslash followed by one of $ ' " \ ` yields that character, and any
 * other backslash is kept literally.  A quoted value without a closing
 * quote is taken up to the end of the string.
 */
static void ga_osrelease_replace_special(char *value)
{
    char *p, *p2, quote;

    /* Trim the string at first space or semicolon if it is not enclosed in
     * single or double quotes. */
    if ((value[0] != '"') && (value[0] != '\'')) {
        p = strchr(value, ' ');
        if (p != NULL) {
            *p = 0;
        }
        p = strchr(value, ';');
        if (p != NULL) {
            *p = 0;
        }
        return;
    }

    quote = value[0];
    p2 = value;     /* write cursor */
    p = value + 1;  /* read cursor, starts after the opening quote */
    while (*p != 0) {
        if (*p == '\\') {
            p++;
            switch (*p) {
            case '$':
            case '\'':
            case '"':
            case '\\':
            case '`':
                break;
            default:
                /* Keep literal backslash followed by whatever is there */
                p--;
                break;
            }
        } else if (*p == quote) {
            break;
        }
        *(p2++) = *(p++);
    }
    /* terminate at the write cursor, with or without a closing quote */
    *p2 = 0;
}
3301
3302 static GKeyFile *ga_parse_osrelease(const char *fname)
3303 {
3304 gchar *content = NULL;
3305 gchar *content2 = NULL;
3306 GError *err = NULL;
3307 GKeyFile *keys = g_key_file_new();
3308 const char *group = "[os-release]\n";
3309
3310 if (!g_file_get_contents(fname, &content, NULL, &err)) {
3311 slog("failed to read '%s', error: %s", fname, err->message);
3312 goto fail;
3313 }
3314
3315 if (!g_utf8_validate(content, -1, NULL)) {
3316 slog("file is not utf-8 encoded: %s", fname);
3317 goto fail;
3318 }
3319 content2 = g_strdup_printf("%s%s", group, content);
3320
3321 if (!g_key_file_load_from_data(keys, content2, -1, G_KEY_FILE_NONE,
3322 &err)) {
3323 slog("failed to parse file '%s', error: %s", fname, err->message);
3324 goto fail;
3325 }
3326
3327 g_free(content);
3328 g_free(content2);
3329 return keys;
3330
3331 fail:
3332 g_error_free(err);
3333 g_free(content);
3334 g_free(content2);
3335 g_key_file_free(keys);
3336 return NULL;
3337 }
3338
3339 GuestOSInfo *qmp_guest_get_osinfo(Error **errp)
3340 {
3341 GuestOSInfo *info = NULL;
3342 struct utsname kinfo;
3343 GKeyFile *osrelease = NULL;
3344 const char *qga_os_release = g_getenv("QGA_OS_RELEASE");
3345
3346 info = g_new0(GuestOSInfo, 1);
3347
3348 if (uname(&kinfo) != 0) {
3349 error_setg_errno(errp, errno, "uname failed");
3350 } else {
3351 info->kernel_version = g_strdup(kinfo.version);
3352 info->kernel_release = g_strdup(kinfo.release);
3353 info->machine = g_strdup(kinfo.machine);
3354 }
3355
3356 if (qga_os_release != NULL) {
3357 osrelease = ga_parse_osrelease(qga_os_release);
3358 } else {
3359 osrelease = ga_parse_osrelease("/etc/os-release");
3360 if (osrelease == NULL) {
3361 osrelease = ga_parse_osrelease("/usr/lib/os-release");
3362 }
3363 }
3364
3365 if (osrelease != NULL) {
3366 char *value;
3367
3368 #define GET_FIELD(field, osfield) do { \
3369 value = g_key_file_get_value(osrelease, "os-release", osfield, NULL); \
3370 if (value != NULL) { \
3371 ga_osrelease_replace_special(value); \
3372 info->field = value; \
3373 } \
3374 } while (0)
3375 GET_FIELD(id, "ID");
3376 GET_FIELD(name, "NAME");
3377 GET_FIELD(pretty_name, "PRETTY_NAME");
3378 GET_FIELD(version, "VERSION");
3379 GET_FIELD(version_id, "VERSION_ID");
3380 GET_FIELD(variant, "VARIANT");
3381 GET_FIELD(variant_id, "VARIANT_ID");
3382 #undef GET_FIELD
3383
3384 g_key_file_free(osrelease);
3385 }
3386
3387 return info;
3388 }
3389
3390 GuestDeviceInfoList *qmp_guest_get_devices(Error **errp)
3391 {
3392 error_setg(errp, QERR_UNSUPPORTED);
3393
3394 return NULL;
3395 }
3396
3397 #ifndef HOST_NAME_MAX
3398 # ifdef _POSIX_HOST_NAME_MAX
3399 # define HOST_NAME_MAX _POSIX_HOST_NAME_MAX
3400 # else
3401 # define HOST_NAME_MAX 255
3402 # endif
3403 #endif
3404
3405 char *qga_get_host_name(Error **errp)
3406 {
3407 long len = -1;
3408 g_autofree char *hostname = NULL;
3409
3410 #ifdef _SC_HOST_NAME_MAX
3411 len = sysconf(_SC_HOST_NAME_MAX);
3412 #endif /* _SC_HOST_NAME_MAX */
3413
3414 if (len < 0) {
3415 len = HOST_NAME_MAX;
3416 }
3417
3418 /* Unfortunately, gethostname() below does not guarantee a
3419 * NULL terminated string. Therefore, allocate one byte more
3420 * to be sure. */
3421 hostname = g_new0(char, len + 1);
3422
3423 if (gethostname(hostname, len) < 0) {
3424 error_setg_errno(errp, errno,
3425 "cannot get hostname");
3426 return NULL;
3427 }
3428
3429 return g_steal_pointer(&hostname);
3430 }