aboutsummaryrefslogtreecommitdiffstats
path: root/drivers/gpu/drm/radeon/r600_blit.c
diff options
context:
space:
mode:
author: Linus Torvalds <torvalds@linux-foundation.org> 2012-10-04 02:29:23 -0400
committer: Linus Torvalds <torvalds@linux-foundation.org> 2012-10-04 02:29:23 -0400
commit: 612a9aab56a93533e76e3ad91642db7033e03b69 (patch)
tree: 8402096973f67af941f9392f7da06cca03e0b58a /drivers/gpu/drm/radeon/r600_blit.c
parent: 3a494318b14b1bc0f59d2d6ce84c505c74d82d2a (diff)
parent: 268d28371cd326be4dfcd7eba5917bf4b9d30c8f (diff)
Merge branch 'drm-next' of git://people.freedesktop.org/~airlied/linux
Pull drm merge (part 1) from Dave Airlie: "So first of all my tree and uapi stuff has a conflict mess, it's my fault as the nouveau stuff didn't hit -next as we were trying to rebase regressions out of it before we merged. Highlights: - SH mobile modesetting driver and associated helpers - some DRM core documentation - i915 modesetting rework, haswell hdmi, haswell and vlv fixes, write combined pte writing, ilk rc6 support, - nouveau: major driver rework into a hw core driver, makes features like SLI a lot saner to implement, - psb: add eDP/DP support for Cedarview - radeon: 2 layer page tables, async VM pte updates, better PLL selection for > 2 screens, better ACPI interactions The rest is a general grab bag of fixes. So why part 1? Well, I have the exynos pull req which came in a bit late but was waiting for me to do something they shouldn't have and it looks fairly safe, and David Howells has some more header cleanups he'd like me to pull, that seem like a good idea, but I'd like to get this merge out of the way so -next doesn't get blocked." Tons of conflicts mostly due to silly include line changes, but mostly mindless. A few other small semantic conflicts too, noted from Dave's pre-merged branch.
* 'drm-next' of git://people.freedesktop.org/~airlied/linux: (447 commits) drm/nv98/crypt: fix fuc build with latest envyas drm/nouveau/devinit: fixup various issues with subdev ctor/init ordering drm/nv41/vm: fix and enable use of "real" pciegart drm/nv44/vm: fix and enable use of "real" pciegart drm/nv04/dmaobj: fixup vm target handling in preparation for nv4x pcie drm/nouveau: store supported dma mask in vmmgr drm/nvc0/ibus: initial implementation of subdev drm/nouveau/therm: add support for fan-control modes drm/nouveau/hwmon: rename pwm0* to pmw1* to follow hwmon's rules drm/nouveau/therm: calculate the pwm divisor on nv50+ drm/nouveau/fan: rewrite the fan tachometer driver to get more precision, faster drm/nouveau/therm: move thermal-related functions to the therm subdev drm/nouveau/bios: parse the pwm divisor from the perf table drm/nouveau/therm: use the EXTDEV table to detect i2c monitoring devices drm/nouveau/therm: rework thermal table parsing drm/nouveau/gpio: expose the PWM/TOGGLE parameter found in the gpio vbios table drm/nouveau: fix pm initialization order drm/nouveau/bios: check that fixed tvdac gpio data is valid before using it drm/nouveau: log channel debug/error messages from client object rather than drm client drm/nouveau: have drm debugging macros build on top of core macros ...
Diffstat (limited to 'drivers/gpu/drm/radeon/r600_blit.c')
-rw-r--r-- drivers/gpu/drm/radeon/r600_blit.c 115
1 files changed, 60 insertions, 55 deletions
diff --git a/drivers/gpu/drm/radeon/r600_blit.c b/drivers/gpu/drm/radeon/r600_blit.c
index 26ace5623dc7..77da1f9c0b8e 100644
--- a/drivers/gpu/drm/radeon/r600_blit.c
+++ b/drivers/gpu/drm/radeon/r600_blit.c
@@ -488,31 +488,36 @@ set_default_state(drm_radeon_private_t *dev_priv)
488 ADVANCE_RING(); 488 ADVANCE_RING();
489} 489}
490 490
491static uint32_t i2f(uint32_t input) 491/* 23 bits of float fractional data */
492#define I2F_FRAC_BITS 23
493#define I2F_MASK ((1 << I2F_FRAC_BITS) - 1)
494
495/*
496 * Converts unsigned integer into 32-bit IEEE floating point representation.
497 * Will be exact from 0 to 2^24. Above that, we round towards zero
498 * as the fractional bits will not fit in a float. (It would be better to
499 * round towards even as the fpu does, but that is slower.)
500 */
501__pure uint32_t int2float(uint32_t x)
492{ 502{
493 u32 result, i, exponent, fraction; 503 uint32_t msb, exponent, fraction;
494 504
495 if ((input & 0x3fff) == 0) 505 /* Zero is special */
496 result = 0; /* 0 is a special case */ 506 if (!x) return 0;
497 else { 507
498 exponent = 140; /* exponent biased by 127; */ 508 /* Get location of the most significant bit */
499 fraction = (input & 0x3fff) << 10; /* cheat and only 509 msb = __fls(x);
500 handle numbers below 2^^15 */
501 for (i = 0; i < 14; i++) {
502 if (fraction & 0x800000)
503 break;
504 else {
505 fraction = fraction << 1; /* keep
506 shifting left until top bit = 1 */
507 exponent = exponent - 1;
508 }
509 }
510 result = exponent << 23 | (fraction & 0x7fffff); /* mask
511 off top bit; assumed 1 */
512 }
513 return result;
514}
515 510
511 /*
512 * Use a rotate instead of a shift because that works both leftwards
513 * and rightwards due to the mod(32) behaviour. This means we don't
514 * need to check to see if we are above 2^24 or not.
515 */
516 fraction = ror32(x, (msb - I2F_FRAC_BITS) & 0x1f) & I2F_MASK;
517 exponent = (127 + msb) << I2F_FRAC_BITS;
518
519 return fraction + exponent;
520}
516 521
517static int r600_nomm_get_vb(struct drm_device *dev) 522static int r600_nomm_get_vb(struct drm_device *dev)
518{ 523{
@@ -631,20 +636,20 @@ r600_blit_copy(struct drm_device *dev,
631 vb = r600_nomm_get_vb_ptr(dev); 636 vb = r600_nomm_get_vb_ptr(dev);
632 } 637 }
633 638
634 vb[0] = i2f(dst_x); 639 vb[0] = int2float(dst_x);
635 vb[1] = 0; 640 vb[1] = 0;
636 vb[2] = i2f(src_x); 641 vb[2] = int2float(src_x);
637 vb[3] = 0; 642 vb[3] = 0;
638 643
639 vb[4] = i2f(dst_x); 644 vb[4] = int2float(dst_x);
640 vb[5] = i2f(h); 645 vb[5] = int2float(h);
641 vb[6] = i2f(src_x); 646 vb[6] = int2float(src_x);
642 vb[7] = i2f(h); 647 vb[7] = int2float(h);
643 648
644 vb[8] = i2f(dst_x + cur_size); 649 vb[8] = int2float(dst_x + cur_size);
645 vb[9] = i2f(h); 650 vb[9] = int2float(h);
646 vb[10] = i2f(src_x + cur_size); 651 vb[10] = int2float(src_x + cur_size);
647 vb[11] = i2f(h); 652 vb[11] = int2float(h);
648 653
649 /* src */ 654 /* src */
650 set_tex_resource(dev_priv, FMT_8, 655 set_tex_resource(dev_priv, FMT_8,
@@ -720,20 +725,20 @@ r600_blit_copy(struct drm_device *dev,
720 vb = r600_nomm_get_vb_ptr(dev); 725 vb = r600_nomm_get_vb_ptr(dev);
721 } 726 }
722 727
723 vb[0] = i2f(dst_x / 4); 728 vb[0] = int2float(dst_x / 4);
724 vb[1] = 0; 729 vb[1] = 0;
725 vb[2] = i2f(src_x / 4); 730 vb[2] = int2float(src_x / 4);
726 vb[3] = 0; 731 vb[3] = 0;
727 732
728 vb[4] = i2f(dst_x / 4); 733 vb[4] = int2float(dst_x / 4);
729 vb[5] = i2f(h); 734 vb[5] = int2float(h);
730 vb[6] = i2f(src_x / 4); 735 vb[6] = int2float(src_x / 4);
731 vb[7] = i2f(h); 736 vb[7] = int2float(h);
732 737
733 vb[8] = i2f((dst_x + cur_size) / 4); 738 vb[8] = int2float((dst_x + cur_size) / 4);
734 vb[9] = i2f(h); 739 vb[9] = int2float(h);
735 vb[10] = i2f((src_x + cur_size) / 4); 740 vb[10] = int2float((src_x + cur_size) / 4);
736 vb[11] = i2f(h); 741 vb[11] = int2float(h);
737 742
738 /* src */ 743 /* src */
739 set_tex_resource(dev_priv, FMT_8_8_8_8, 744 set_tex_resource(dev_priv, FMT_8_8_8_8,
@@ -803,20 +808,20 @@ r600_blit_swap(struct drm_device *dev,
803 dx2 = dx + w; 808 dx2 = dx + w;
804 dy2 = dy + h; 809 dy2 = dy + h;
805 810
806 vb[0] = i2f(dx); 811 vb[0] = int2float(dx);
807 vb[1] = i2f(dy); 812 vb[1] = int2float(dy);
808 vb[2] = i2f(sx); 813 vb[2] = int2float(sx);
809 vb[3] = i2f(sy); 814 vb[3] = int2float(sy);
810 815
811 vb[4] = i2f(dx); 816 vb[4] = int2float(dx);
812 vb[5] = i2f(dy2); 817 vb[5] = int2float(dy2);
813 vb[6] = i2f(sx); 818 vb[6] = int2float(sx);
814 vb[7] = i2f(sy2); 819 vb[7] = int2float(sy2);
815 820
816 vb[8] = i2f(dx2); 821 vb[8] = int2float(dx2);
817 vb[9] = i2f(dy2); 822 vb[9] = int2float(dy2);
818 vb[10] = i2f(sx2); 823 vb[10] = int2float(sx2);
819 vb[11] = i2f(sy2); 824 vb[11] = int2float(sy2);
820 825
821 switch(cpp) { 826 switch(cpp) {
822 case 4: 827 case 4: