aboutsummaryrefslogtreecommitdiffstats
path: root/drivers/gpu/drm/i915/i915_gem.c
diff options
context:
space:
mode:
Diffstat (limited to 'drivers/gpu/drm/i915/i915_gem.c')
-rw-r--r-- drivers/gpu/drm/i915/i915_gem.c 31
1 files changed, 18 insertions, 13 deletions
diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c
index 6ecfd108effa..6a89449f31d1 100644
--- a/drivers/gpu/drm/i915/i915_gem.c
+++ b/drivers/gpu/drm/i915/i915_gem.c
@@ -176,7 +176,8 @@ i915_gem_gtt_pwrite(struct drm_device *dev, struct drm_gem_object *obj,
176 ssize_t remain; 176 ssize_t remain;
177 loff_t offset; 177 loff_t offset;
178 char __user *user_data; 178 char __user *user_data;
179 char *vaddr; 179 char __iomem *vaddr;
180 char *vaddr_atomic;
180 int i, o, l; 181 int i, o, l;
181 int ret = 0; 182 int ret = 0;
182 unsigned long pfn; 183 unsigned long pfn;
@@ -219,16 +220,20 @@ i915_gem_gtt_pwrite(struct drm_device *dev, struct drm_gem_object *obj,
219 pfn = (dev->agp->base >> PAGE_SHIFT) + i; 220 pfn = (dev->agp->base >> PAGE_SHIFT) + i;
220 221
221#ifdef CONFIG_HIGHMEM 222#ifdef CONFIG_HIGHMEM
222 /* kmap_atomic can't map IO pages on non-HIGHMEM kernels 223 /* This is a workaround for the low performance of iounmap
224 * (approximate 10% cpu cost on normal 3D workloads).
225 * kmap_atomic on HIGHMEM kernels happens to let us map card
226 * memory without taking IPIs. When the vmap rework lands
227 * we should be able to dump this hack.
223 */ 228 */
224 vaddr = kmap_atomic_pfn(pfn, KM_USER0); 229 vaddr_atomic = kmap_atomic_pfn(pfn, KM_USER0);
225#if WATCH_PWRITE 230#if WATCH_PWRITE
226 DRM_INFO("pwrite i %d o %d l %d pfn %ld vaddr %p\n", 231 DRM_INFO("pwrite i %d o %d l %d pfn %ld vaddr %p\n",
227 i, o, l, pfn, vaddr); 232 i, o, l, pfn, vaddr_atomic);
228#endif 233#endif
229 unwritten = __copy_from_user_inatomic_nocache(vaddr + o, 234 unwritten = __copy_from_user_inatomic_nocache(vaddr_atomic + o,
230 user_data, l); 235 user_data, l);
231 kunmap_atomic(vaddr, KM_USER0); 236 kunmap_atomic(vaddr_atomic, KM_USER0);
232 237
233 if (unwritten) 238 if (unwritten)
234#endif /* CONFIG_HIGHMEM */ 239#endif /* CONFIG_HIGHMEM */
@@ -271,7 +276,7 @@ fail:
271 return ret; 276 return ret;
272} 277}
273 278
274int 279static int
275i915_gem_shmem_pwrite(struct drm_device *dev, struct drm_gem_object *obj, 280i915_gem_shmem_pwrite(struct drm_device *dev, struct drm_gem_object *obj,
276 struct drm_i915_gem_pwrite *args, 281 struct drm_i915_gem_pwrite *args,
277 struct drm_file *file_priv) 282 struct drm_file *file_priv)
@@ -587,7 +592,7 @@ i915_add_request(struct drm_device *dev, uint32_t flush_domains)
587 * Ensures that all commands in the ring are finished 592 * Ensures that all commands in the ring are finished
588 * before signalling the CPU 593 * before signalling the CPU
589 */ 594 */
590uint32_t 595static uint32_t
591i915_retire_commands(struct drm_device *dev) 596i915_retire_commands(struct drm_device *dev)
592{ 597{
593 drm_i915_private_t *dev_priv = dev->dev_private; 598 drm_i915_private_t *dev_priv = dev->dev_private;
@@ -734,7 +739,7 @@ i915_gem_retire_work_handler(struct work_struct *work)
734 * Waits for a sequence number to be signaled, and cleans up the 739 * Waits for a sequence number to be signaled, and cleans up the
735 * request and object lists appropriately for that event. 740 * request and object lists appropriately for that event.
736 */ 741 */
737int 742static int
738i915_wait_request(struct drm_device *dev, uint32_t seqno) 743i915_wait_request(struct drm_device *dev, uint32_t seqno)
739{ 744{
740 drm_i915_private_t *dev_priv = dev->dev_private; 745 drm_i915_private_t *dev_priv = dev->dev_private;
@@ -1483,7 +1488,7 @@ i915_gem_object_pin_and_relocate(struct drm_gem_object *obj,
1483 struct drm_i915_gem_object *obj_priv = obj->driver_private; 1488 struct drm_i915_gem_object *obj_priv = obj->driver_private;
1484 int i, ret; 1489 int i, ret;
1485 uint32_t last_reloc_offset = -1; 1490 uint32_t last_reloc_offset = -1;
1486 void *reloc_page = NULL; 1491 void __iomem *reloc_page = NULL;
1487 1492
1488 /* Choose the GTT offset for our buffer and put it there. */ 1493 /* Choose the GTT offset for our buffer and put it there. */
1489 ret = i915_gem_object_pin(obj, (uint32_t) entry->alignment); 1494 ret = i915_gem_object_pin(obj, (uint32_t) entry->alignment);
@@ -1500,8 +1505,8 @@ i915_gem_object_pin_and_relocate(struct drm_gem_object *obj,
1500 for (i = 0; i < entry->relocation_count; i++) { 1505 for (i = 0; i < entry->relocation_count; i++) {
1501 struct drm_gem_object *target_obj; 1506 struct drm_gem_object *target_obj;
1502 struct drm_i915_gem_object *target_obj_priv; 1507 struct drm_i915_gem_object *target_obj_priv;
1503 uint32_t reloc_val, reloc_offset, *reloc_entry; 1508 uint32_t reloc_val, reloc_offset;
1504 int ret; 1509 uint32_t __iomem *reloc_entry;
1505 1510
1506 ret = copy_from_user(&reloc, relocs + i, sizeof(reloc)); 1511 ret = copy_from_user(&reloc, relocs + i, sizeof(reloc));
1507 if (ret != 0) { 1512 if (ret != 0) {
@@ -1624,7 +1629,7 @@ i915_gem_object_pin_and_relocate(struct drm_gem_object *obj,
1624 } 1629 }
1625 } 1630 }
1626 1631
1627 reloc_entry = (uint32_t *)((char *)reloc_page + 1632 reloc_entry = (uint32_t __iomem *)(reloc_page +
1628 (reloc_offset & (PAGE_SIZE - 1))); 1633 (reloc_offset & (PAGE_SIZE - 1)));
1629 reloc_val = target_obj_priv->gtt_offset + reloc.delta; 1634 reloc_val = target_obj_priv->gtt_offset + reloc.delta;
1630 1635