Merge branch 'drm-next' of git://people.freedesktop.org/~airlied/linux

Pull drm merge (part 1) from Dave Airlie: "So first of all my tree and uapi stuff has a conflict mess, it's my fault as the nouveau stuff didn't hit -next as we were trying to rebase regressions out of it before we merged. Highlights: - SH mobile modesetting driver and associated helpers - some DRM core documentation - i915 modesetting rework, haswell hdmi, haswell and vlv fixes, write combined pte writing, ilk rc6 support, - nouveau: major driver rework into a hw core driver, makes features like SLI a lot saner to implement, - psb: add eDP/DP support for Cedarview - radeon: 2 layer page tables, async VM pte updates, better PLL selection for > 2 screens, better ACPI interactions The rest is a general grab bag of fixes. So why part 1? Well, I have the exynos pull req which came in a bit late but was waiting for me to do something they shouldn't have and it looks fairly safe, and David Howells has some more header cleanups he'd like me to pull, that seem like a good idea, but I'd like to get this merge out of the way so -next doesn't get blocked." Tons of conflicts mostly due to silly include line changes, but mostly mindless. A few other small semantic conflicts too, noted from Dave's pre-merged branch. 
* 'drm-next' of git://people.freedesktop.org/~airlied/linux: (447 commits) drm/nv98/crypt: fix fuc build with latest envyas drm/nouveau/devinit: fixup various issues with subdev ctor/init ordering drm/nv41/vm: fix and enable use of "real" pciegart drm/nv44/vm: fix and enable use of "real" pciegart drm/nv04/dmaobj: fixup vm target handling in preparation for nv4x pcie drm/nouveau: store supported dma mask in vmmgr drm/nvc0/ibus: initial implementation of subdev drm/nouveau/therm: add support for fan-control modes drm/nouveau/hwmon: rename pwm0* to pmw1* to follow hwmon's rules drm/nouveau/therm: calculate the pwm divisor on nv50+ drm/nouveau/fan: rewrite the fan tachometer driver to get more precision, faster drm/nouveau/therm: move thermal-related functions to the therm subdev drm/nouveau/bios: parse the pwm divisor from the perf table drm/nouveau/therm: use the EXTDEV table to detect i2c monitoring devices drm/nouveau/therm: rework thermal table parsing drm/nouveau/gpio: expose the PWM/TOGGLE parameter found in the gpio vbios table drm/nouveau: fix pm initialization order drm/nouveau/bios: check that fixed tvdac gpio data is valid before using it drm/nouveau: log channel debug/error messages from client object rather than drm client drm/nouveau: have drm debugging macros build on top of core macros ...
author: Linus Torvalds <torvalds@linux-foundation.org> 2012-10-04 02:29:23 -0400
committer: Linus Torvalds <torvalds@linux-foundation.org> 2012-10-04 02:29:23 -0400
commit: 612a9aab56a93533e76e3ad91642db7033e03b69 (patch)
tree: 8402096973f67af941f9392f7da06cca03e0b58a /drivers/gpu/drm/radeon/r600_blit.c
parent: 3a494318b14b1bc0f59d2d6ce84c505c74d82d2a (diff)
parent: 268d28371cd326be4dfcd7eba5917bf4b9d30c8f (diff)
1 files changed, 60 insertions, 55 deletions
diff --git a/drivers/gpu/drm/radeon/r600_blit.c b/drivers/gpu/drm/radeon/r600_blit.c
index 26ace5623dc7..77da1f9c0b8e 100644
--- a/drivers/gpu/drm/radeon/r600_blit.c
+++ b/drivers/gpu/drm/radeon/r600_blit.c
@@ -488,31 +488,36 @@ set_default_state(drm_radeon_private_t *dev_priv)
        ADVANCE_RING();
 }
-static uint32_t i2f(uint32_t input)
+/* 23 bits of float fractional data */
+#define I2F_FRAC_BITS  23
+#define I2F_MASK ((1 << I2F_FRAC_BITS) - 1)
+/*
+ * Converts unsigned integer into 32-bit IEEE floating point representation.
+ * Will be exact from 0 to 2^24.  Above that, we round towards zero
+ * as the fractional bits will not fit in a float.  (It would be better to
+ * round towards even as the fpu does, but that is slower.)
+ */
+__pure uint32_t int2float(uint32_t x)
 {
-        u32 result, i, exponent, fraction;
+        uint32_t msb, exponent, fraction;
-        if ((input & 0x3fff) == 0)
+        /* Zero is special */
-                result = 0; /* 0 is a special case */
+        if (!x) return 0;
-        else {
-                exponent = 140; /* exponent biased by 127; */
+        /* Get location of the most significant bit */
-                fraction = (input & 0x3fff) << 10; /* cheat and only
+        msb = __fls(x);
-                                                      handle numbers below 2^^15 */
-                for (i = 0; i < 14; i++) {
-                        if (fraction & 0x800000)
-                                break;
-                        else {
-                                fraction = fraction << 1; /* keep
-                                                             shifting left until top bit = 1 */
-                                exponent = exponent - 1;
-                        }
-                }
-                result = exponent << 23 | (fraction & 0x7fffff); /* mask
-                                                                    off top bit; assumed 1 */
-        }
-        return result;
-}
+        /*
+         * Use a rotate instead of a shift because that works both leftwards
+         * and rightwards due to the mod(32) behaviour.  This means we don't
+         * need to check to see if we are above 2^24 or not.
+         */
+        fraction = ror32(x, (msb - I2F_FRAC_BITS) & 0x1f) & I2F_MASK;
+        exponent = (127 + msb) << I2F_FRAC_BITS;
+        return fraction + exponent;
+}
 static int r600_nomm_get_vb(struct drm_device *dev)
 {
@@ -631,20 +636,20 @@ r600_blit_copy(struct drm_device *dev,
                                vb = r600_nomm_get_vb_ptr(dev);
                        }
-                        vb[0] = i2f(dst_x);
+                        vb[0] = int2float(dst_x);
                        vb[1] = 0;
-                        vb[2] = i2f(src_x);
+                        vb[2] = int2float(src_x);
                        vb[3] = 0;
-                        vb[4] = i2f(dst_x);
+                        vb[4] = int2float(dst_x);
-                        vb[5] = i2f(h);
+                        vb[5] = int2float(h);
-                        vb[6] = i2f(src_x);
+                        vb[6] = int2float(src_x);
-                        vb[7] = i2f(h);
+                        vb[7] = int2float(h);
-                        vb[8] = i2f(dst_x + cur_size);
+                        vb[8] = int2float(dst_x + cur_size);
-                        vb[9] = i2f(h);
+                        vb[9] = int2float(h);
-                        vb[10] = i2f(src_x + cur_size);
+                        vb[10] = int2float(src_x + cur_size);
-                        vb[11] = i2f(h);
+                        vb[11] = int2float(h);
                        /* src */
                        set_tex_resource(dev_priv, FMT_8,
@@ -720,20 +725,20 @@ r600_blit_copy(struct drm_device *dev,
                                vb = r600_nomm_get_vb_ptr(dev);
                        }
-                        vb[0] = i2f(dst_x / 4);
+                        vb[0] = int2float(dst_x / 4);
                        vb[1] = 0;
-                        vb[2] = i2f(src_x / 4);
+                        vb[2] = int2float(src_x / 4);
                        vb[3] = 0;
-                        vb[4] = i2f(dst_x / 4);
+                        vb[4] = int2float(dst_x / 4);
-                        vb[5] = i2f(h);
+                        vb[5] = int2float(h);
-                        vb[6] = i2f(src_x / 4);
+                        vb[6] = int2float(src_x / 4);
-                        vb[7] = i2f(h);
+                        vb[7] = int2float(h);
-                        vb[8] = i2f((dst_x + cur_size) / 4);
+                        vb[8] = int2float((dst_x + cur_size) / 4);
-                        vb[9] = i2f(h);
+                        vb[9] = int2float(h);
-                        vb[10] = i2f((src_x + cur_size) / 4);
+                        vb[10] = int2float((src_x + cur_size) / 4);
-                        vb[11] = i2f(h);
+                        vb[11] = int2float(h);
                        /* src */
                        set_tex_resource(dev_priv, FMT_8_8_8_8,
@@ -803,20 +808,20 @@ r600_blit_swap(struct drm_device *dev,
        dx2 = dx + w;
        dy2 = dy + h;
-        vb[0] = i2f(dx);
+        vb[0] = int2float(dx);
-        vb[1] = i2f(dy);
+        vb[1] = int2float(dy);
-        vb[2] = i2f(sx);
+        vb[2] = int2float(sx);
-        vb[3] = i2f(sy);
+        vb[3] = int2float(sy);
-        vb[4] = i2f(dx);
+        vb[4] = int2float(dx);
-        vb[5] = i2f(dy2);
+        vb[5] = int2float(dy2);
-        vb[6] = i2f(sx);
+        vb[6] = int2float(sx);
-        vb[7] = i2f(sy2);
+        vb[7] = int2float(sy2);
-        vb[8] = i2f(dx2);
+        vb[8] = int2float(dx2);
-        vb[9] = i2f(dy2);
+        vb[9] = int2float(dy2);
-        vb[10] = i2f(sx2);
+        vb[10] = int2float(sx2);
-        vb[11] = i2f(sy2);
+        vb[11] = int2float(sy2);
        switch(cpp) {
        case 4:
author	Linus Torvalds <torvalds@linux-foundation.org>	2012-10-04 02:29:23 -0400
committer	Linus Torvalds <torvalds@linux-foundation.org>	2012-10-04 02:29:23 -0400
commit	612a9aab56a93533e76e3ad91642db7033e03b69 (patch)
tree	8402096973f67af941f9392f7da06cca03e0b58a /drivers/gpu/drm/radeon/r600_blit.c
parent	3a494318b14b1bc0f59d2d6ce84c505c74d82d2a (diff)
parent	268d28371cd326be4dfcd7eba5917bf4b9d30c8f (diff)

diff --git a/drivers/gpu/drm/radeon/r600_blit.c b/drivers/gpu/drm/radeon/r600_blit.c index 26ace5623dc7..77da1f9c0b8e 100644 --- a/drivers/gpu/drm/radeon/r600_blit.c +++ b/drivers/gpu/drm/radeon/r600_blit.c
@@ -488,31 +488,36 @@ set_default_state(drm_radeon_private_t *dev_priv)
488	ADVANCE_RING();	488	ADVANCE_RING();
489	}	489	}
490		490
491	static uint32_t i2f(uint32_t input)	491	/* 23 bits of float fractional data */
		492	#define I2F_FRAC_BITS 23
		493	#define I2F_MASK ((1 << I2F_FRAC_BITS) - 1)
		494
		495	/*
		496	* Converts unsigned integer into 32-bit IEEE floating point representation.
		497	* Will be exact from 0 to 2^24. Above that, we round towards zero
		498	* as the fractional bits will not fit in a float. (It would be better to
		499	* round towards even as the fpu does, but that is slower.)
		500	*/
		501	__pure uint32_t int2float(uint32_t x)
492	{	502	{
493	u32 result, i, exponent, fraction;	503	uint32_t msb, exponent, fraction;
494		504
495	if ((input & 0x3fff) == 0)	505	/* Zero is special */
496	result = 0; /* 0 is a special case */	506	if (!x) return 0;
497	else {	507
498	exponent = 140; /* exponent biased by 127; */	508	/* Get location of the most significant bit */
499	fraction = (input & 0x3fff) << 10; /* cheat and only	509	msb = __fls(x);
500	handle numbers below 2^^15 */
501	for (i = 0; i < 14; i++) {
502	if (fraction & 0x800000)
503	break;
504	else {
505	fraction = fraction << 1; /* keep
506	shifting left until top bit = 1 */
507	exponent = exponent - 1;
508	}
509	}
510	result = exponent << 23 \| (fraction & 0x7fffff); /* mask
511	off top bit; assumed 1 */
512	}
513	return result;
514	}
515		510
		511	/*
		512	* Use a rotate instead of a shift because that works both leftwards
		513	* and rightwards due to the mod(32) behaviour. This means we don't
		514	* need to check to see if we are above 2^24 or not.
		515	*/
		516	fraction = ror32(x, (msb - I2F_FRAC_BITS) & 0x1f) & I2F_MASK;
		517	exponent = (127 + msb) << I2F_FRAC_BITS;
		518
		519	return fraction + exponent;
		520	}
516		521
517	static int r600_nomm_get_vb(struct drm_device *dev)	522	static int r600_nomm_get_vb(struct drm_device *dev)
518	{	523	{
@@ -631,20 +636,20 @@ r600_blit_copy(struct drm_device *dev,
631	vb = r600_nomm_get_vb_ptr(dev);	636	vb = r600_nomm_get_vb_ptr(dev);
632	}	637	}
633		638
634	vb[0] = i2f(dst_x);	639	vb[0] = int2float(dst_x);
635	vb[1] = 0;	640	vb[1] = 0;
636	vb[2] = i2f(src_x);	641	vb[2] = int2float(src_x);
637	vb[3] = 0;	642	vb[3] = 0;
638		643
639	vb[4] = i2f(dst_x);	644	vb[4] = int2float(dst_x);
640	vb[5] = i2f(h);	645	vb[5] = int2float(h);
641	vb[6] = i2f(src_x);	646	vb[6] = int2float(src_x);
642	vb[7] = i2f(h);	647	vb[7] = int2float(h);
643		648
644	vb[8] = i2f(dst_x + cur_size);	649	vb[8] = int2float(dst_x + cur_size);
645	vb[9] = i2f(h);	650	vb[9] = int2float(h);
646	vb[10] = i2f(src_x + cur_size);	651	vb[10] = int2float(src_x + cur_size);
647	vb[11] = i2f(h);	652	vb[11] = int2float(h);
648		653
649	/* src */	654	/* src */
650	set_tex_resource(dev_priv, FMT_8,	655	set_tex_resource(dev_priv, FMT_8,
@@ -720,20 +725,20 @@ r600_blit_copy(struct drm_device *dev,
720	vb = r600_nomm_get_vb_ptr(dev);	725	vb = r600_nomm_get_vb_ptr(dev);
721	}	726	}
722		727
723	vb[0] = i2f(dst_x / 4);	728	vb[0] = int2float(dst_x / 4);
724	vb[1] = 0;	729	vb[1] = 0;
725	vb[2] = i2f(src_x / 4);	730	vb[2] = int2float(src_x / 4);
726	vb[3] = 0;	731	vb[3] = 0;
727		732
728	vb[4] = i2f(dst_x / 4);	733	vb[4] = int2float(dst_x / 4);
729	vb[5] = i2f(h);	734	vb[5] = int2float(h);
730	vb[6] = i2f(src_x / 4);	735	vb[6] = int2float(src_x / 4);
731	vb[7] = i2f(h);	736	vb[7] = int2float(h);
732		737
733	vb[8] = i2f((dst_x + cur_size) / 4);	738	vb[8] = int2float((dst_x + cur_size) / 4);
734	vb[9] = i2f(h);	739	vb[9] = int2float(h);
735	vb[10] = i2f((src_x + cur_size) / 4);	740	vb[10] = int2float((src_x + cur_size) / 4);
736	vb[11] = i2f(h);	741	vb[11] = int2float(h);
737		742
738	/* src */	743	/* src */
739	set_tex_resource(dev_priv, FMT_8_8_8_8,	744	set_tex_resource(dev_priv, FMT_8_8_8_8,
@@ -803,20 +808,20 @@ r600_blit_swap(struct drm_device *dev,
803	dx2 = dx + w;	808	dx2 = dx + w;
804	dy2 = dy + h;	809	dy2 = dy + h;
805		810
806	vb[0] = i2f(dx);	811	vb[0] = int2float(dx);
807	vb[1] = i2f(dy);	812	vb[1] = int2float(dy);
808	vb[2] = i2f(sx);	813	vb[2] = int2float(sx);
809	vb[3] = i2f(sy);	814	vb[3] = int2float(sy);
810		815
811	vb[4] = i2f(dx);	816	vb[4] = int2float(dx);
812	vb[5] = i2f(dy2);	817	vb[5] = int2float(dy2);
813	vb[6] = i2f(sx);	818	vb[6] = int2float(sx);
814	vb[7] = i2f(sy2);	819	vb[7] = int2float(sy2);
815		820
816	vb[8] = i2f(dx2);	821	vb[8] = int2float(dx2);
817	vb[9] = i2f(dy2);	822	vb[9] = int2float(dy2);
818	vb[10] = i2f(sx2);	823	vb[10] = int2float(sx2);
819	vb[11] = i2f(sy2);	824	vb[11] = int2float(sy2);
820		825
821	switch(cpp) {	826	switch(cpp) {
822	case 4:	827	case 4: