Module Name:    src
Committed By:   tsutsui
Date:           Sun Sep 28 05:00:56 UTC 2014

Modified Files:
        src/sys/arch/luna68k/dev: omrasops.c

Log Message:
Add simple optimizations to avoid conditionals in the putchar drawing loops.

~10% improvement in "time cat" results on the LUNA-II 8bpp framebuffer.


To generate a diff of this commit:
cvs rdiff -u -r1.17 -r1.18 src/sys/arch/luna68k/dev/omrasops.c

Please note that diffs are not public domain; they are subject to the
copyright notices on the relevant files.

Modified files:

Index: src/sys/arch/luna68k/dev/omrasops.c
diff -u src/sys/arch/luna68k/dev/omrasops.c:1.17 src/sys/arch/luna68k/dev/omrasops.c:1.18
--- src/sys/arch/luna68k/dev/omrasops.c:1.17	Sun Sep 28 04:43:01 2014
+++ src/sys/arch/luna68k/dev/omrasops.c	Sun Sep 28 05:00:56 2014
@@ -1,4 +1,4 @@
-/* $NetBSD: omrasops.c,v 1.17 2014/09/28 04:43:01 tsutsui Exp $ */
+/* $NetBSD: omrasops.c,v 1.18 2014/09/28 05:00:56 tsutsui Exp $ */
 
 /*-
  * Copyright (c) 2000 The NetBSD Foundation, Inc.
@@ -31,7 +31,7 @@
 
 #include <sys/cdefs.h>			/* RCS ID & Copyright macro defns */
 
-__KERNEL_RCSID(0, "$NetBSD: omrasops.c,v 1.17 2014/09/28 04:43:01 tsutsui Exp $");
+__KERNEL_RCSID(0, "$NetBSD: omrasops.c,v 1.18 2014/09/28 05:00:56 tsutsui Exp $");
 
 /*
  * Designed speficically for 'm68k bitorder';
@@ -175,6 +175,8 @@ om4_putchar(void *cookie, int row, int s
 	uint8_t *p;
 	int scanspan, startx, height, width, align, y;
 	uint32_t lmask, rmask, glyph, glyphbg, fgpat, bgpat;
+	uint32_t fgmask0, fgmask1, fgmask2, fgmask3;
+	uint32_t bgmask0, bgmask1, bgmask2, bgmask3;
 	int i, fg, bg;
 	uint8_t *fb;
 
@@ -185,6 +187,14 @@ om4_putchar(void *cookie, int row, int s
 	fb = (uint8_t *)ri->ri_font->data +
 	    (uc - ri->ri_font->firstchar) * ri->ri_fontscale;
 	om4_unpack_attr(attr, &fg, &bg, NULL);
+	fgmask0 = (fg & 0x01) ? ALL1BITS : ALL0BITS;
+	fgmask1 = (fg & 0x02) ? ALL1BITS : ALL0BITS;
+	fgmask2 = (fg & 0x04) ? ALL1BITS : ALL0BITS;
+	fgmask3 = (fg & 0x08) ? ALL1BITS : ALL0BITS;
+	bgmask0 = (bg & 0x01) ? ALL1BITS : ALL0BITS;
+	bgmask1 = (bg & 0x02) ? ALL1BITS : ALL0BITS;
+	bgmask2 = (bg & 0x04) ? ALL1BITS : ALL0BITS;
+	bgmask3 = (bg & 0x08) ? ALL1BITS : ALL0BITS;
 
 	p = (uint8_t *)ri->ri_bits + y * scanspan + ((startx / 32) * 4);
 	align = startx & ALIGNMASK;
@@ -200,17 +210,17 @@ om4_putchar(void *cookie, int row, int s
 			glyph <<= (4 - ri->ri_font->stride) * NBBY;
 			glyph = (glyph >> align);
 			glyphbg = glyph ^ ALL1BITS;
-			fgpat = (fg & 0x01) ? glyph : 0;
-			bgpat = (bg & 0x01) ? glyphbg : 0;
+			fgpat = glyph   & fgmask0;
+			bgpat = glyphbg & bgmask0;
 			P0(p) = (P0(p) & ~lmask) | ((fgpat | bgpat) & lmask);
-			fgpat = (fg & 0x02) ? glyph : 0;
-			bgpat = (bg & 0x02) ? glyphbg : 0;
+			fgpat = glyph   & fgmask1;
+			bgpat = glyphbg & bgmask1;
 			P1(p) = (P1(p) & ~lmask) | ((fgpat | bgpat) & lmask);
-			fgpat = (fg & 0x04) ? glyph : 0;
-			bgpat = (bg & 0x04) ? glyphbg : 0;
+			fgpat = glyph   & fgmask2;
+			bgpat = glyphbg & bgmask2;
 			P2(p) = (P2(p) & ~lmask) | ((fgpat | bgpat) & lmask);
-			fgpat = (fg & 0x08) ? glyph : 0;
-			bgpat = (bg & 0x08) ? glyphbg : 0;
+			fgpat = glyph   & fgmask3;
+			bgpat = glyphbg & bgmask3;
 			P3(p) = (P3(p) & ~lmask) | ((fgpat | bgpat) & lmask);
 			p += scanspan;
 			height--;
@@ -227,32 +237,32 @@ om4_putchar(void *cookie, int row, int s
 			glyph <<= (4 - ri->ri_font->stride) * NBBY;
 			lhalf = (glyph >> align);
 			lhalfbg = lhalf ^ ALL1BITS;
-			fgpat = (fg & 0x01) ? lhalf : 0;
-			bgpat = (bg & 0x01) ? lhalfbg : 0;
+			fgpat = lhalf   & fgmask0;
+			bgpat = lhalfbg & bgmask0;
 			P0(p) = (P0(p) & ~lmask) | ((fgpat | bgpat) & lmask);
-			fgpat = (fg & 0x02) ? lhalf : 0;
-			bgpat = (bg & 0x02) ? lhalfbg : 0;
+			fgpat = lhalf   & fgmask1;
+			bgpat = lhalfbg & bgmask1;
 			P1(p) = (P1(p) & ~lmask) | ((fgpat | bgpat) & lmask);
-			fgpat = (fg & 0x04) ? lhalf : 0;
-			bgpat = (bg & 0x04) ? lhalfbg : 0;
+			fgpat = lhalf   & fgmask2;
+			bgpat = lhalfbg & bgmask2;
 			P2(p) = (P2(p) & ~lmask) | ((fgpat | bgpat) & lmask);
-			fgpat = (fg & 0x08) ? lhalf : 0;
-			bgpat = (bg & 0x08) ? lhalfbg : 0;
+			fgpat = lhalf   & fgmask3;
+			bgpat = lhalfbg & bgmask3;
 			P3(p) = (P3(p) & ~lmask) | ((fgpat | bgpat) & lmask);
 			p += BYTESDONE;
 			rhalf = (glyph << (BLITWIDTH - align));
 			rhalfbg = rhalf ^ ALL1BITS;
-			fgpat = (fg & 0x01) ? rhalf : 0;
-			bgpat = (bg & 0x01) ? rhalfbg : 0;
+			fgpat = rhalf   & fgmask0;
+			bgpat = rhalfbg & bgmask0;
 			P0(p) = ((fgpat | bgpat) & rmask) | (P0(p) & ~rmask);
-			fgpat = (fg & 0x02) ? rhalf : 0;
-			bgpat = (bg & 0x02) ? rhalfbg : 0;
+			fgpat = rhalf   & fgmask1;
+			bgpat = rhalfbg & bgmask1;
 			P1(p) = ((fgpat | bgpat) & rmask) | (P1(p) & ~rmask);
-			fgpat = (fg & 0x04) ? rhalf : 0;
-			bgpat = (bg & 0x04) ? rhalfbg : 0;
+			fgpat = rhalf   & fgmask2;
+			bgpat = rhalfbg & bgmask2;
 			P2(p) = ((fgpat | bgpat) & rmask) | (P2(p) & ~rmask);
-			fgpat = (fg & 0x08) ? rhalf : 0;
-			bgpat = (bg & 0x08) ? rhalfbg : 0;
+			fgpat = rhalf   & fgmask3;
+			bgpat = rhalfbg & bgmask3;
 			P3(p) = ((fgpat | bgpat) & rmask) | (P3(p) & ~rmask);
 
 			p = (q += scanspan);

Reply via email to