diff options
author | Sasha Levin <levinsasha928@gmail.com> | 2011-07-27 09:00:48 -0400 |
---|---|---|
committer | Avi Kivity <avi@redhat.com> | 2011-09-25 12:17:59 -0400 |
commit | 743eeb0b01d2fbf4154bf87bff1ebb6fb18aeb7a (patch) | |
tree | 5392464930f7e77131d65f32ba96ce4665307629 /virt/kvm | |
parent | 0d460ffc0956d2dbe12ca9f5f6aa0f8701ea9d73 (diff) |
KVM: Intelligent device lookup on I/O bus
Currently the method of dealing with an IO operation on a bus (PIO/MMIO)
is to call the read or write callback for each device registered
on the bus until we find a device which handles it.
Since the number of devices on a bus can be significant due to ioeventfds
and coalesced MMIO zones, this leads to a lot of overhead on each IO
operation.
Instead of registering devices, we now register ranges which points to
a device. Lookup is done using an efficient bsearch instead of a linear
search.
Performance test was conducted by comparing exit count per second with
200 ioeventfds created on one byte and the guest is trying to access a
different byte continuously (triggering usermode exits).
Before the patch the guest has achieved 259k exits per second, after the
patch the guest does 274k exits per second.
Cc: Avi Kivity <avi@redhat.com>
Cc: Marcelo Tosatti <mtosatti@redhat.com>
Signed-off-by: Sasha Levin <levinsasha928@gmail.com>
Signed-off-by: Avi Kivity <avi@redhat.com>
Diffstat (limited to 'virt/kvm')
-rw-r--r-- | virt/kvm/coalesced_mmio.c | 3 | ||||
-rw-r--r-- | virt/kvm/eventfd.c | 3 | ||||
-rw-r--r-- | virt/kvm/ioapic.c | 3 | ||||
-rw-r--r-- | virt/kvm/kvm_main.c | 112 |
4 files changed, 106 insertions, 15 deletions
diff --git a/virt/kvm/coalesced_mmio.c b/virt/kvm/coalesced_mmio.c index 2316ec1aadc..a6ec206f36b 100644 --- a/virt/kvm/coalesced_mmio.c +++ b/virt/kvm/coalesced_mmio.c | |||
@@ -141,7 +141,8 @@ int kvm_vm_ioctl_register_coalesced_mmio(struct kvm *kvm, | |||
141 | dev->zone = *zone; | 141 | dev->zone = *zone; |
142 | 142 | ||
143 | mutex_lock(&kvm->slots_lock); | 143 | mutex_lock(&kvm->slots_lock); |
144 | ret = kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, &dev->dev); | 144 | ret = kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, zone->addr, |
145 | zone->size, &dev->dev); | ||
145 | if (ret < 0) | 146 | if (ret < 0) |
146 | goto out_free_dev; | 147 | goto out_free_dev; |
147 | list_add_tail(&dev->list, &kvm->coalesced_zones); | 148 | list_add_tail(&dev->list, &kvm->coalesced_zones); |
diff --git a/virt/kvm/eventfd.c b/virt/kvm/eventfd.c index 73358d256fa..f59c1e8de7a 100644 --- a/virt/kvm/eventfd.c +++ b/virt/kvm/eventfd.c | |||
@@ -586,7 +586,8 @@ kvm_assign_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args) | |||
586 | 586 | ||
587 | kvm_iodevice_init(&p->dev, &ioeventfd_ops); | 587 | kvm_iodevice_init(&p->dev, &ioeventfd_ops); |
588 | 588 | ||
589 | ret = kvm_io_bus_register_dev(kvm, bus_idx, &p->dev); | 589 | ret = kvm_io_bus_register_dev(kvm, bus_idx, p->addr, p->length, |
590 | &p->dev); | ||
590 | if (ret < 0) | 591 | if (ret < 0) |
591 | goto unlock_fail; | 592 | goto unlock_fail; |
592 | 593 | ||
diff --git a/virt/kvm/ioapic.c b/virt/kvm/ioapic.c index 8df1ca104a7..3eed61eb486 100644 --- a/virt/kvm/ioapic.c +++ b/virt/kvm/ioapic.c | |||
@@ -394,7 +394,8 @@ int kvm_ioapic_init(struct kvm *kvm) | |||
394 | kvm_iodevice_init(&ioapic->dev, &ioapic_mmio_ops); | 394 | kvm_iodevice_init(&ioapic->dev, &ioapic_mmio_ops); |
395 | ioapic->kvm = kvm; | 395 | ioapic->kvm = kvm; |
396 | mutex_lock(&kvm->slots_lock); | 396 | mutex_lock(&kvm->slots_lock); |
397 | ret = kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, &ioapic->dev); | 397 | ret = kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, ioapic->base_address, |
398 | IOAPIC_MEM_LENGTH, &ioapic->dev); | ||
398 | mutex_unlock(&kvm->slots_lock); | 399 | mutex_unlock(&kvm->slots_lock); |
399 | if (ret < 0) { | 400 | if (ret < 0) { |
400 | kvm->arch.vioapic = NULL; | 401 | kvm->arch.vioapic = NULL; |
diff --git a/virt/kvm/kvm_main.c b/virt/kvm/kvm_main.c index aefdda390f5..d9cfb782cb8 100644 --- a/virt/kvm/kvm_main.c +++ b/virt/kvm/kvm_main.c | |||
@@ -47,6 +47,8 @@ | |||
47 | #include <linux/srcu.h> | 47 | #include <linux/srcu.h> |
48 | #include <linux/hugetlb.h> | 48 | #include <linux/hugetlb.h> |
49 | #include <linux/slab.h> | 49 | #include <linux/slab.h> |
50 | #include <linux/sort.h> | ||
51 | #include <linux/bsearch.h> | ||
50 | 52 | ||
51 | #include <asm/processor.h> | 53 | #include <asm/processor.h> |
52 | #include <asm/io.h> | 54 | #include <asm/io.h> |
@@ -2391,24 +2393,92 @@ static void kvm_io_bus_destroy(struct kvm_io_bus *bus) | |||
2391 | int i; | 2393 | int i; |
2392 | 2394 | ||
2393 | for (i = 0; i < bus->dev_count; i++) { | 2395 | for (i = 0; i < bus->dev_count; i++) { |
2394 | struct kvm_io_device *pos = bus->devs[i]; | 2396 | struct kvm_io_device *pos = bus->range[i].dev; |
2395 | 2397 | ||
2396 | kvm_iodevice_destructor(pos); | 2398 | kvm_iodevice_destructor(pos); |
2397 | } | 2399 | } |
2398 | kfree(bus); | 2400 | kfree(bus); |
2399 | } | 2401 | } |
2400 | 2402 | ||
2403 | int kvm_io_bus_sort_cmp(const void *p1, const void *p2) | ||
2404 | { | ||
2405 | const struct kvm_io_range *r1 = p1; | ||
2406 | const struct kvm_io_range *r2 = p2; | ||
2407 | |||
2408 | if (r1->addr < r2->addr) | ||
2409 | return -1; | ||
2410 | if (r1->addr + r1->len > r2->addr + r2->len) | ||
2411 | return 1; | ||
2412 | return 0; | ||
2413 | } | ||
2414 | |||
2415 | int kvm_io_bus_insert_dev(struct kvm_io_bus *bus, struct kvm_io_device *dev, | ||
2416 | gpa_t addr, int len) | ||
2417 | { | ||
2418 | if (bus->dev_count == NR_IOBUS_DEVS) | ||
2419 | return -ENOSPC; | ||
2420 | |||
2421 | bus->range[bus->dev_count++] = (struct kvm_io_range) { | ||
2422 | .addr = addr, | ||
2423 | .len = len, | ||
2424 | .dev = dev, | ||
2425 | }; | ||
2426 | |||
2427 | sort(bus->range, bus->dev_count, sizeof(struct kvm_io_range), | ||
2428 | kvm_io_bus_sort_cmp, NULL); | ||
2429 | |||
2430 | return 0; | ||
2431 | } | ||
2432 | |||
2433 | int kvm_io_bus_get_first_dev(struct kvm_io_bus *bus, | ||
2434 | gpa_t addr, int len) | ||
2435 | { | ||
2436 | struct kvm_io_range *range, key; | ||
2437 | int off; | ||
2438 | |||
2439 | key = (struct kvm_io_range) { | ||
2440 | .addr = addr, | ||
2441 | .len = len, | ||
2442 | }; | ||
2443 | |||
2444 | range = bsearch(&key, bus->range, bus->dev_count, | ||
2445 | sizeof(struct kvm_io_range), kvm_io_bus_sort_cmp); | ||
2446 | if (range == NULL) | ||
2447 | return -ENOENT; | ||
2448 | |||
2449 | off = range - bus->range; | ||
2450 | |||
2451 | while (off > 0 && kvm_io_bus_sort_cmp(&key, &bus->range[off-1]) == 0) | ||
2452 | off--; | ||
2453 | |||
2454 | return off; | ||
2455 | } | ||
2456 | |||
2401 | /* kvm_io_bus_write - called under kvm->slots_lock */ | 2457 | /* kvm_io_bus_write - called under kvm->slots_lock */ |
2402 | int kvm_io_bus_write(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, | 2458 | int kvm_io_bus_write(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, |
2403 | int len, const void *val) | 2459 | int len, const void *val) |
2404 | { | 2460 | { |
2405 | int i; | 2461 | int idx; |
2406 | struct kvm_io_bus *bus; | 2462 | struct kvm_io_bus *bus; |
2463 | struct kvm_io_range range; | ||
2464 | |||
2465 | range = (struct kvm_io_range) { | ||
2466 | .addr = addr, | ||
2467 | .len = len, | ||
2468 | }; | ||
2407 | 2469 | ||
2408 | bus = srcu_dereference(kvm->buses[bus_idx], &kvm->srcu); | 2470 | bus = srcu_dereference(kvm->buses[bus_idx], &kvm->srcu); |
2409 | for (i = 0; i < bus->dev_count; i++) | 2471 | idx = kvm_io_bus_get_first_dev(bus, addr, len); |
2410 | if (!kvm_iodevice_write(bus->devs[i], addr, len, val)) | 2472 | if (idx < 0) |
2473 | return -EOPNOTSUPP; | ||
2474 | |||
2475 | while (idx < bus->dev_count && | ||
2476 | kvm_io_bus_sort_cmp(&range, &bus->range[idx]) == 0) { | ||
2477 | if (!kvm_iodevice_write(bus->range[idx].dev, addr, len, val)) | ||
2411 | return 0; | 2478 | return 0; |
2479 | idx++; | ||
2480 | } | ||
2481 | |||
2412 | return -EOPNOTSUPP; | 2482 | return -EOPNOTSUPP; |
2413 | } | 2483 | } |
2414 | 2484 | ||
@@ -2416,19 +2486,33 @@ int kvm_io_bus_write(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, | |||
2416 | int kvm_io_bus_read(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, | 2486 | int kvm_io_bus_read(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, |
2417 | int len, void *val) | 2487 | int len, void *val) |
2418 | { | 2488 | { |
2419 | int i; | 2489 | int idx; |
2420 | struct kvm_io_bus *bus; | 2490 | struct kvm_io_bus *bus; |
2491 | struct kvm_io_range range; | ||
2492 | |||
2493 | range = (struct kvm_io_range) { | ||
2494 | .addr = addr, | ||
2495 | .len = len, | ||
2496 | }; | ||
2421 | 2497 | ||
2422 | bus = srcu_dereference(kvm->buses[bus_idx], &kvm->srcu); | 2498 | bus = srcu_dereference(kvm->buses[bus_idx], &kvm->srcu); |
2423 | for (i = 0; i < bus->dev_count; i++) | 2499 | idx = kvm_io_bus_get_first_dev(bus, addr, len); |
2424 | if (!kvm_iodevice_read(bus->devs[i], addr, len, val)) | 2500 | if (idx < 0) |
2501 | return -EOPNOTSUPP; | ||
2502 | |||
2503 | while (idx < bus->dev_count && | ||
2504 | kvm_io_bus_sort_cmp(&range, &bus->range[idx]) == 0) { | ||
2505 | if (!kvm_iodevice_read(bus->range[idx].dev, addr, len, val)) | ||
2425 | return 0; | 2506 | return 0; |
2507 | idx++; | ||
2508 | } | ||
2509 | |||
2426 | return -EOPNOTSUPP; | 2510 | return -EOPNOTSUPP; |
2427 | } | 2511 | } |
2428 | 2512 | ||
2429 | /* Caller must hold slots_lock. */ | 2513 | /* Caller must hold slots_lock. */ |
2430 | int kvm_io_bus_register_dev(struct kvm *kvm, enum kvm_bus bus_idx, | 2514 | int kvm_io_bus_register_dev(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, |
2431 | struct kvm_io_device *dev) | 2515 | int len, struct kvm_io_device *dev) |
2432 | { | 2516 | { |
2433 | struct kvm_io_bus *new_bus, *bus; | 2517 | struct kvm_io_bus *new_bus, *bus; |
2434 | 2518 | ||
@@ -2440,7 +2524,7 @@ int kvm_io_bus_register_dev(struct kvm *kvm, enum kvm_bus bus_idx, | |||
2440 | if (!new_bus) | 2524 | if (!new_bus) |
2441 | return -ENOMEM; | 2525 | return -ENOMEM; |
2442 | memcpy(new_bus, bus, sizeof(struct kvm_io_bus)); | 2526 | memcpy(new_bus, bus, sizeof(struct kvm_io_bus)); |
2443 | new_bus->devs[new_bus->dev_count++] = dev; | 2527 | kvm_io_bus_insert_dev(new_bus, dev, addr, len); |
2444 | rcu_assign_pointer(kvm->buses[bus_idx], new_bus); | 2528 | rcu_assign_pointer(kvm->buses[bus_idx], new_bus); |
2445 | synchronize_srcu_expedited(&kvm->srcu); | 2529 | synchronize_srcu_expedited(&kvm->srcu); |
2446 | kfree(bus); | 2530 | kfree(bus); |
@@ -2464,9 +2548,13 @@ int kvm_io_bus_unregister_dev(struct kvm *kvm, enum kvm_bus bus_idx, | |||
2464 | 2548 | ||
2465 | r = -ENOENT; | 2549 | r = -ENOENT; |
2466 | for (i = 0; i < new_bus->dev_count; i++) | 2550 | for (i = 0; i < new_bus->dev_count; i++) |
2467 | if (new_bus->devs[i] == dev) { | 2551 | if (new_bus->range[i].dev == dev) { |
2468 | r = 0; | 2552 | r = 0; |
2469 | new_bus->devs[i] = new_bus->devs[--new_bus->dev_count]; | 2553 | new_bus->dev_count--; |
2554 | new_bus->range[i] = new_bus->range[new_bus->dev_count]; | ||
2555 | sort(new_bus->range, new_bus->dev_count, | ||
2556 | sizeof(struct kvm_io_range), | ||
2557 | kvm_io_bus_sort_cmp, NULL); | ||
2470 | break; | 2558 | break; |
2471 | } | 2559 | } |
2472 | 2560 | ||