Merge pull request #113 from delahee/patch-2

MultiplyAlpha optimisation
2014-03-20 23:34:05 -07:00
parent 5d241f3320 22336374bd
commit d9b3e37dee
1 changed file with 13 additions and 13 deletions
--- a/project/src/renderer/common/SimpleSurface.cpp
+++ b/project/src/renderer/common/SimpleSurface.cpp
@@ -662,26 +662,26 @@ namespace lime {
 		
 		if (mPixelFormat == pfAlpha)
 			return;
-		int a;
-		double multiply;
+			
+		// 'a' converted from int to uint8
+		// 'multiply' converted from double to float
+		// got rid of the alpha < 255 branch and the per-pixel 'multiply' so that the compiler can pipeline the computation,
+		// because ARM instructions handle the multiply / load / shift sequence well
+		uint8 a;
+		float multiply = 0.0f;
+		int stride = mStride;
+		uint8 *dest = 0;
 		
 		for (int y = 0; y < r.h; y++) {
+			dest = mBase + ((r.y + y) * stride) + (r.x << 2);
 			
-			uint8 *dest = mBase + ((r.y + y) * mStride) + (r.x * 4);
 			for (int x = 0; x < r.w; x++) {
-				
 				a = *(dest + 3);
-				if (a < 255.0) {
-					
-					multiply = a / 255.0;
-					*dest = sgClamp0255[int((*dest) * multiply)];
-					*(dest + 1) = sgClamp0255[int(*(dest + 1) * multiply)];
-					*(dest + 2) = sgClamp0255[int(*(dest + 2) * multiply)];
-					
-				}
+				*dest = (uint8) (*dest * a * 0.0039215686274509803921568627451f);
+				*(dest + 1) = (uint8) (*(dest + 1) * a * 0.0039215686274509803921568627451f);
+				*(dest + 2) = (uint8) (*(dest + 2) * a * 0.0039215686274509803921568627451f);
 				
 				dest += 4;
-				
 			}
 			
 		}