1 files changed, 60 insertions, 55 deletions
diff --git a/drivers/gpu/drm/radeon/r600_blit.c b/drivers/gpu/drm/radeon/r600_blit.c
index 3c031a48205d..661fec2a2cc1 100644
--- a/drivers/gpu/drm/radeon/r600_blit.c
+++ b/drivers/gpu/drm/radeon/r600_blit.c
@@ -489,31 +489,36 @@ set_default_state(drm_radeon_private_t *dev_priv)
        ADVANCE_RING();
 }
-static uint32_t i2f(uint32_t input)
+/* 23 bits of float fractional data */
+#define I2F_FRAC_BITS  23
+#define I2F_MASK ((1 << I2F_FRAC_BITS) - 1)
+/*
+ * Converts unsigned integer into 32-bit IEEE floating point representation.
+ * Will be exact from 0 to 2^24.  Above that, we round towards zero
+ * as the fractional bits will not fit in a float.  (It would be better to
+ * round towards even as the fpu does, but that is slower.)
+ */
+__pure uint32_t int2float(uint32_t x)
 {
-        u32 result, i, exponent, fraction;
+        uint32_t msb, exponent, fraction;
-        if ((input & 0x3fff) == 0)
+        /* Zero is special */
-                result = 0; /* 0 is a special case */
+        if (!x) return 0;
-        else {
-                exponent = 140; /* exponent biased by 127; */
+        /* Get location of the most significant bit */
-                fraction = (input & 0x3fff) << 10; /* cheat and only
+        msb = __fls(x);
-                                                      handle numbers below 2^^15 */
-                for (i = 0; i < 14; i++) {
-                        if (fraction & 0x800000)
-                                break;
-                        else {
-                                fraction = fraction << 1; /* keep
-                                                             shifting left until top bit = 1 */
-                                exponent = exponent - 1;
-                        }
-                }
-                result = exponent << 23 | (fraction & 0x7fffff); /* mask
-                                                                    off top bit; assumed 1 */
-        }
-        return result;
-}
+        /*
+         * Use a rotate instead of a shift because that works both leftwards
+         * and rightwards due to the mod(32) behaviour.  This means we don't
+         * need to check to see if we are above 2^24 or not.
+         */
+        fraction = ror32(x, (msb - I2F_FRAC_BITS) & 0x1f) & I2F_MASK;
+        exponent = (127 + msb) << I2F_FRAC_BITS;
+        return fraction + exponent;
+}
 static int r600_nomm_get_vb(struct drm_device *dev)
 {
@@ -632,20 +637,20 @@ r600_blit_copy(struct drm_device *dev,
                                vb = r600_nomm_get_vb_ptr(dev);
                        }
-                        vb[0] = i2f(dst_x);
+                        vb[0] = int2float(dst_x);
                        vb[1] = 0;
-                        vb[2] = i2f(src_x);
+                        vb[2] = int2float(src_x);
                        vb[3] = 0;
-                        vb[4] = i2f(dst_x);
+                        vb[4] = int2float(dst_x);
-                        vb[5] = i2f(h);
+                        vb[5] = int2float(h);
-                        vb[6] = i2f(src_x);
+                        vb[6] = int2float(src_x);
-                        vb[7] = i2f(h);
+                        vb[7] = int2float(h);
-                        vb[8] = i2f(dst_x + cur_size);
+                        vb[8] = int2float(dst_x + cur_size);
-                        vb[9] = i2f(h);
+                        vb[9] = int2float(h);
-                        vb[10] = i2f(src_x + cur_size);
+                        vb[10] = int2float(src_x + cur_size);
-                        vb[11] = i2f(h);
+                        vb[11] = int2float(h);
                        /* src */
                        set_tex_resource(dev_priv, FMT_8,
@@ -721,20 +726,20 @@ r600_blit_copy(struct drm_device *dev,
                                vb = r600_nomm_get_vb_ptr(dev);
                        }
-                        vb[0] = i2f(dst_x / 4);
+                        vb[0] = int2float(dst_x / 4);
                        vb[1] = 0;
-                        vb[2] = i2f(src_x / 4);
+                        vb[2] = int2float(src_x / 4);
                        vb[3] = 0;
-                        vb[4] = i2f(dst_x / 4);
+                        vb[4] = int2float(dst_x / 4);
-                        vb[5] = i2f(h);
+                        vb[5] = int2float(h);
-                        vb[6] = i2f(src_x / 4);
+                        vb[6] = int2float(src_x / 4);
-                        vb[7] = i2f(h);
+                        vb[7] = int2float(h);
-                        vb[8] = i2f((dst_x + cur_size) / 4);
+                        vb[8] = int2float((dst_x + cur_size) / 4);
-                        vb[9] = i2f(h);
+                        vb[9] = int2float(h);
-                        vb[10] = i2f((src_x + cur_size) / 4);
+                        vb[10] = int2float((src_x + cur_size) / 4);
-                        vb[11] = i2f(h);
+                        vb[11] = int2float(h);
                        /* src */
                        set_tex_resource(dev_priv, FMT_8_8_8_8,
@@ -804,20 +809,20 @@ r600_blit_swap(struct drm_device *dev,
        dx2 = dx + w;
        dy2 = dy + h;
-        vb[0] = i2f(dx);
+        vb[0] = int2float(dx);
-        vb[1] = i2f(dy);
+        vb[1] = int2float(dy);
-        vb[2] = i2f(sx);
+        vb[2] = int2float(sx);
-        vb[3] = i2f(sy);
+        vb[3] = int2float(sy);
-        vb[4] = i2f(dx);
+        vb[4] = int2float(dx);
-        vb[5] = i2f(dy2);
+        vb[5] = int2float(dy2);
-        vb[6] = i2f(sx);
+        vb[6] = int2float(sx);
-        vb[7] = i2f(sy2);
+        vb[7] = int2float(sy2);
-        vb[8] = i2f(dx2);
+        vb[8] = int2float(dx2);
-        vb[9] = i2f(dy2);
+        vb[9] = int2float(dy2);
-        vb[10] = i2f(sx2);
+        vb[10] = int2float(sx2);
-        vb[11] = i2f(sy2);
+        vb[11] = int2float(sy2);
        switch(cpp) {
        case 4:

diff --git a/drivers/gpu/drm/radeon/r600_blit.c b/drivers/gpu/drm/radeon/r600_blit.c index 3c031a48205d..661fec2a2cc1 100644 --- a/drivers/gpu/drm/radeon/r600_blit.c +++ b/drivers/gpu/drm/radeon/r600_blit.c
@@ -489,31 +489,36 @@ set_default_state(drm_radeon_private_t *dev_priv)
489	ADVANCE_RING();	489	ADVANCE_RING();
490	}	490	}
491		491
492	static uint32_t i2f(uint32_t input)	492	/* 23 bits of float fractional data */
		493	#define I2F_FRAC_BITS 23
		494	#define I2F_MASK ((1 << I2F_FRAC_BITS) - 1)
		495
		496	/*
		497	* Converts unsigned integer into 32-bit IEEE floating point representation.
		498	* Will be exact from 0 to 2^24. Above that, we round towards zero
		499	* as the fractional bits will not fit in a float. (It would be better to
		500	* round towards even as the fpu does, but that is slower.)
		501	*/
		502	__pure uint32_t int2float(uint32_t x)
493	{	503	{
494	u32 result, i, exponent, fraction;	504	uint32_t msb, exponent, fraction;
495		505
496	if ((input & 0x3fff) == 0)	506	/* Zero is special */
497	result = 0; /* 0 is a special case */	507	if (!x) return 0;
498	else {	508
499	exponent = 140; /* exponent biased by 127; */	509	/* Get location of the most significant bit */
500	fraction = (input & 0x3fff) << 10; /* cheat and only	510	msb = __fls(x);
501	handle numbers below 2^^15 */
502	for (i = 0; i < 14; i++) {
503	if (fraction & 0x800000)
504	break;
505	else {
506	fraction = fraction << 1; /* keep
507	shifting left until top bit = 1 */
508	exponent = exponent - 1;
509	}
510	}
511	result = exponent << 23 | (fraction & 0x7fffff); /* mask
512	off top bit; assumed 1 */
513	}
514	return result;
515	}
516		511
		512	/*
		513	* Use a rotate instead of a shift because that works both leftwards
		514	* and rightwards due to the mod(32) behaviour. This means we don't
		515	* need to check to see if we are above 2^24 or not.
		516	*/
		517	fraction = ror32(x, (msb - I2F_FRAC_BITS) & 0x1f) & I2F_MASK;
		518	exponent = (127 + msb) << I2F_FRAC_BITS;
		519
		520	return fraction + exponent;
		521	}
517		522
518	static int r600_nomm_get_vb(struct drm_device *dev)	523	static int r600_nomm_get_vb(struct drm_device *dev)
519	{	524	{
@@ -632,20 +637,20 @@ r600_blit_copy(struct drm_device *dev,
632	vb = r600_nomm_get_vb_ptr(dev);	637	vb = r600_nomm_get_vb_ptr(dev);
633	}	638	}
634		639
635	vb[0] = i2f(dst_x);	640	vb[0] = int2float(dst_x);
636	vb[1] = 0;	641	vb[1] = 0;
637	vb[2] = i2f(src_x);	642	vb[2] = int2float(src_x);
638	vb[3] = 0;	643	vb[3] = 0;
639		644
640	vb[4] = i2f(dst_x);	645	vb[4] = int2float(dst_x);
641	vb[5] = i2f(h);	646	vb[5] = int2float(h);
642	vb[6] = i2f(src_x);	647	vb[6] = int2float(src_x);
643	vb[7] = i2f(h);	648	vb[7] = int2float(h);
644		649
645	vb[8] = i2f(dst_x + cur_size);	650	vb[8] = int2float(dst_x + cur_size);
646	vb[9] = i2f(h);	651	vb[9] = int2float(h);
647	vb[10] = i2f(src_x + cur_size);	652	vb[10] = int2float(src_x + cur_size);
648	vb[11] = i2f(h);	653	vb[11] = int2float(h);
649		654
650	/* src */	655	/* src */
651	set_tex_resource(dev_priv, FMT_8,	656	set_tex_resource(dev_priv, FMT_8,
@@ -721,20 +726,20 @@ r600_blit_copy(struct drm_device *dev,
721	vb = r600_nomm_get_vb_ptr(dev);	726	vb = r600_nomm_get_vb_ptr(dev);
722	}	727	}
723		728
724	vb[0] = i2f(dst_x / 4);	729	vb[0] = int2float(dst_x / 4);
725	vb[1] = 0;	730	vb[1] = 0;
726	vb[2] = i2f(src_x / 4);	731	vb[2] = int2float(src_x / 4);
727	vb[3] = 0;	732	vb[3] = 0;
728		733
729	vb[4] = i2f(dst_x / 4);	734	vb[4] = int2float(dst_x / 4);
730	vb[5] = i2f(h);	735	vb[5] = int2float(h);
731	vb[6] = i2f(src_x / 4);	736	vb[6] = int2float(src_x / 4);
732	vb[7] = i2f(h);	737	vb[7] = int2float(h);
733		738
734	vb[8] = i2f((dst_x + cur_size) / 4);	739	vb[8] = int2float((dst_x + cur_size) / 4);
735	vb[9] = i2f(h);	740	vb[9] = int2float(h);
736	vb[10] = i2f((src_x + cur_size) / 4);	741	vb[10] = int2float((src_x + cur_size) / 4);
737	vb[11] = i2f(h);	742	vb[11] = int2float(h);
738		743
739	/* src */	744	/* src */
740	set_tex_resource(dev_priv, FMT_8_8_8_8,	745	set_tex_resource(dev_priv, FMT_8_8_8_8,
@@ -804,20 +809,20 @@ r600_blit_swap(struct drm_device *dev,
804	dx2 = dx + w;	809	dx2 = dx + w;
805	dy2 = dy + h;	810	dy2 = dy + h;
806		811
807	vb[0] = i2f(dx);	812	vb[0] = int2float(dx);
808	vb[1] = i2f(dy);	813	vb[1] = int2float(dy);
809	vb[2] = i2f(sx);	814	vb[2] = int2float(sx);
810	vb[3] = i2f(sy);	815	vb[3] = int2float(sy);
811		816
812	vb[4] = i2f(dx);	817	vb[4] = int2float(dx);
813	vb[5] = i2f(dy2);	818	vb[5] = int2float(dy2);
814	vb[6] = i2f(sx);	819	vb[6] = int2float(sx);
815	vb[7] = i2f(sy2);	820	vb[7] = int2float(sy2);
816		821
817	vb[8] = i2f(dx2);	822	vb[8] = int2float(dx2);
818	vb[9] = i2f(dy2);	823	vb[9] = int2float(dy2);
819	vb[10] = i2f(sx2);	824	vb[10] = int2float(sx2);
820	vb[11] = i2f(sy2);	825	vb[11] = int2float(sy2);
821		826
822	switch(cpp) {	827	switch(cpp) {
823	case 4:	828	case 4: