diff options
Diffstat (limited to 'Documentation/lguest/lguest.c')
-rw-r--r-- | Documentation/lguest/lguest.c | 49 |
1 files changed, 43 insertions, 6 deletions
diff --git a/Documentation/lguest/lguest.c b/Documentation/lguest/lguest.c index 9b0e322118b5..6c8a2386cd50 100644 --- a/Documentation/lguest/lguest.c +++ b/Documentation/lguest/lguest.c | |||
@@ -79,6 +79,9 @@ static void *guest_base; | |||
79 | /* The maximum guest physical address allowed, and maximum possible. */ | 79 | /* The maximum guest physical address allowed, and maximum possible. */ |
80 | static unsigned long guest_limit, guest_max; | 80 | static unsigned long guest_limit, guest_max; |
81 | 81 | ||
82 | /* a per-cpu variable indicating whose vcpu is currently running */ | ||
83 | static unsigned int __thread cpu_id; | ||
84 | |||
82 | /* This is our list of devices. */ | 85 | /* This is our list of devices. */ |
83 | struct device_list | 86 | struct device_list |
84 | { | 87 | { |
@@ -153,6 +156,9 @@ struct virtqueue | |||
153 | void (*handle_output)(int fd, struct virtqueue *me); | 156 | void (*handle_output)(int fd, struct virtqueue *me); |
154 | }; | 157 | }; |
155 | 158 | ||
159 | /* Remember the arguments to the program so we can "reboot" */ | ||
160 | static char **main_args; | ||
161 | |||
156 | /* Since guest is UP and we don't run at the same time, we don't need barriers. | 162 | /* Since guest is UP and we don't run at the same time, we don't need barriers. |
157 | * But I include them in the code in case others copy it. */ | 163 | * But I include them in the code in case others copy it. */ |
158 | #define wmb() | 164 | #define wmb() |
@@ -554,7 +560,7 @@ static void wake_parent(int pipefd, int lguest_fd) | |||
554 | else | 560 | else |
555 | FD_CLR(-fd - 1, &devices.infds); | 561 | FD_CLR(-fd - 1, &devices.infds); |
556 | } else /* Send LHREQ_BREAK command. */ | 562 | } else /* Send LHREQ_BREAK command. */ |
557 | write(lguest_fd, args, sizeof(args)); | 563 | pwrite(lguest_fd, args, sizeof(args), cpu_id); |
558 | } | 564 | } |
559 | } | 565 | } |
560 | 566 | ||
@@ -1489,7 +1495,9 @@ static void setup_block_file(const char *filename) | |||
1489 | 1495 | ||
1490 | /* Create stack for thread and run it */ | 1496 | /* Create stack for thread and run it */ |
1491 | stack = malloc(32768); | 1497 | stack = malloc(32768); |
1492 | if (clone(io_thread, stack + 32768, CLONE_VM, dev) == -1) | 1498 | /* SIGCHLD - We dont "wait" for our cloned thread, so prevent it from |
1499 | * becoming a zombie. */ | ||
1500 | if (clone(io_thread, stack + 32768, CLONE_VM | SIGCHLD, dev) == -1) | ||
1493 | err(1, "Creating clone"); | 1501 | err(1, "Creating clone"); |
1494 | 1502 | ||
1495 | /* We don't need to keep the I/O thread's end of the pipes open. */ | 1503 | /* We don't need to keep the I/O thread's end of the pipes open. */ |
@@ -1499,7 +1507,21 @@ static void setup_block_file(const char *filename) | |||
1499 | verbose("device %u: virtblock %llu sectors\n", | 1507 | verbose("device %u: virtblock %llu sectors\n", |
1500 | devices.device_num, cap); | 1508 | devices.device_num, cap); |
1501 | } | 1509 | } |
1502 | /* That's the end of device setup. */ | 1510 | /* That's the end of device setup. :*/ |
1511 | |||
1512 | /* Reboot */ | ||
1513 | static void __attribute__((noreturn)) restart_guest(void) | ||
1514 | { | ||
1515 | unsigned int i; | ||
1516 | |||
1517 | /* Closing pipes causes the waker thread and io_threads to die, and | ||
1518 | * closing /dev/lguest cleans up the Guest. Since we don't track all | ||
1519 | * open fds, we simply close everything beyond stderr. */ | ||
1520 | for (i = 3; i < FD_SETSIZE; i++) | ||
1521 | close(i); | ||
1522 | execv(main_args[0], main_args); | ||
1523 | err(1, "Could not exec %s", main_args[0]); | ||
1524 | } | ||
1503 | 1525 | ||
1504 | /*L:220 Finally we reach the core of the Launcher, which runs the Guest, serves | 1526 | /*L:220 Finally we reach the core of the Launcher, which runs the Guest, serves |
1505 | * its input and output, and finally, lays it to rest. */ | 1527 | * its input and output, and finally, lays it to rest. */ |
@@ -1511,7 +1533,8 @@ static void __attribute__((noreturn)) run_guest(int lguest_fd) | |||
1511 | int readval; | 1533 | int readval; |
1512 | 1534 | ||
1513 | /* We read from the /dev/lguest device to run the Guest. */ | 1535 | /* We read from the /dev/lguest device to run the Guest. */ |
1514 | readval = read(lguest_fd, &notify_addr, sizeof(notify_addr)); | 1536 | readval = pread(lguest_fd, &notify_addr, |
1537 | sizeof(notify_addr), cpu_id); | ||
1515 | 1538 | ||
1516 | /* One unsigned long means the Guest did HCALL_NOTIFY */ | 1539 | /* One unsigned long means the Guest did HCALL_NOTIFY */ |
1517 | if (readval == sizeof(notify_addr)) { | 1540 | if (readval == sizeof(notify_addr)) { |
@@ -1521,16 +1544,23 @@ static void __attribute__((noreturn)) run_guest(int lguest_fd) | |||
1521 | /* ENOENT means the Guest died. Reading tells us why. */ | 1544 | /* ENOENT means the Guest died. Reading tells us why. */ |
1522 | } else if (errno == ENOENT) { | 1545 | } else if (errno == ENOENT) { |
1523 | char reason[1024] = { 0 }; | 1546 | char reason[1024] = { 0 }; |
1524 | read(lguest_fd, reason, sizeof(reason)-1); | 1547 | pread(lguest_fd, reason, sizeof(reason)-1, cpu_id); |
1525 | errx(1, "%s", reason); | 1548 | errx(1, "%s", reason); |
1549 | /* ERESTART means that we need to reboot the guest */ | ||
1550 | } else if (errno == ERESTART) { | ||
1551 | restart_guest(); | ||
1526 | /* EAGAIN means the Waker wanted us to look at some input. | 1552 | /* EAGAIN means the Waker wanted us to look at some input. |
1527 | * Anything else means a bug or incompatible change. */ | 1553 | * Anything else means a bug or incompatible change. */ |
1528 | } else if (errno != EAGAIN) | 1554 | } else if (errno != EAGAIN) |
1529 | err(1, "Running guest failed"); | 1555 | err(1, "Running guest failed"); |
1530 | 1556 | ||
1557 | /* Only service input on thread for CPU 0. */ | ||
1558 | if (cpu_id != 0) | ||
1559 | continue; | ||
1560 | |||
1531 | /* Service input, then unset the BREAK to release the Waker. */ | 1561 | /* Service input, then unset the BREAK to release the Waker. */ |
1532 | handle_input(lguest_fd); | 1562 | handle_input(lguest_fd); |
1533 | if (write(lguest_fd, args, sizeof(args)) < 0) | 1563 | if (pwrite(lguest_fd, args, sizeof(args), cpu_id) < 0) |
1534 | err(1, "Resetting break"); | 1564 | err(1, "Resetting break"); |
1535 | } | 1565 | } |
1536 | } | 1566 | } |
@@ -1571,6 +1601,12 @@ int main(int argc, char *argv[]) | |||
1571 | /* If they specify an initrd file to load. */ | 1601 | /* If they specify an initrd file to load. */ |
1572 | const char *initrd_name = NULL; | 1602 | const char *initrd_name = NULL; |
1573 | 1603 | ||
1604 | /* Save the args: we "reboot" by execing ourselves again. */ | ||
1605 | main_args = argv; | ||
1606 | /* We don't "wait" for the children, so prevent them from becoming | ||
1607 | * zombies. */ | ||
1608 | signal(SIGCHLD, SIG_IGN); | ||
1609 | |||
1574 | /* First we initialize the device list. Since console and network | 1610 | /* First we initialize the device list. Since console and network |
1575 | * device receive input from a file descriptor, we keep an fdset | 1611 | * device receive input from a file descriptor, we keep an fdset |
1576 | * (infds) and the maximum fd number (max_infd) with the head of the | 1612 | * (infds) and the maximum fd number (max_infd) with the head of the |
@@ -1582,6 +1618,7 @@ int main(int argc, char *argv[]) | |||
1582 | devices.lastdev = &devices.dev; | 1618 | devices.lastdev = &devices.dev; |
1583 | devices.next_irq = 1; | 1619 | devices.next_irq = 1; |
1584 | 1620 | ||
1621 | cpu_id = 0; | ||
1585 | /* We need to know how much memory so we can set up the device | 1622 | /* We need to know how much memory so we can set up the device |
1586 | * descriptor and memory pages for the devices as we parse the command | 1623 | * descriptor and memory pages for the devices as we parse the command |
1587 | * line. So we quickly look through the arguments to find the amount | 1624 | * line. So we quickly look through the arguments to find the amount |