Source-Changes-HG archive

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index][Old Index]

[src/trunk]: src/sys/arch/sparc/dev cg14_invert():



details:   https://anonhg.NetBSD.org/src/rev/ef6e24373b56
branches:  trunk
changeset: 1027736:ef6e24373b56
user:      macallan <macallan%NetBSD.org@localhost>
date:      Fri Dec 17 18:51:02 2021 +0000

description:
cg14_invert():
- use only 32bit accesses
- use byte mask / ROPs for partial writes

diffstat:

 sys/arch/sparc/dev/cgfourteen.c |  76 ++++++++++++++++++++++++----------------
 1 files changed, 45 insertions(+), 31 deletions(-)

diffs (104 lines):

diff -r 868f52ab3343 -r ef6e24373b56 sys/arch/sparc/dev/cgfourteen.c
--- a/sys/arch/sparc/dev/cgfourteen.c   Fri Dec 17 17:27:19 2021 +0000
+++ b/sys/arch/sparc/dev/cgfourteen.c   Fri Dec 17 18:51:02 2021 +0000
@@ -1,4 +1,4 @@
-/*     $NetBSD: cgfourteen.c,v 1.90 2021/08/07 16:19:05 thorpej Exp $ */
+/*     $NetBSD: cgfourteen.c,v 1.91 2021/12/17 18:51:02 macallan Exp $ */
 
 /*
  * Copyright (c) 1996
@@ -1226,50 +1226,64 @@
            sc->sc_vd.active->scr_ri.ri_devcmap[(attr >> 24 & 0xf)]);
 }
 
+/*
+ * invert a rectangle, used only to (un)draw the cursor.
+ * - does a scanline at a time
+ * - does not handle wi > 64 or wi < 4, not that we need it for our fonts
+ * - uses all 32bit accesses
+ */ 
 static void
 cg14_invert(struct cgfourteen_softc *sc, int x, int y, int wi, int he)
 {
-       uint32_t addr, pptr;
-       int line, cnt, pre, words;
+       uint32_t addr, pptr, lmask, rmask;
+       int line, cnt, pre, words, pwrds = 0, post, reg;
        int stride = sc->sc_fb.fb_type.fb_width;
 
-       addr = sc->sc_fb_paddr + x + stride * y;
-       sx_write(sc->sc_sx, SX_ROP_CONTROL, 0x33); /* ~src a */
+       addr = (sc->sc_fb_paddr + x + stride * y) & ~3;
+       sx_write(sc->sc_sx, SX_ROP_CONTROL, 0x3C); /* ~src a / src a */
        /*
-        * Calculate the number of pixels we need to do one by one
-        * until we're 32bit aligned, then do the rest in 32bit
-        * mode. Assumes that stride is always a multiple of 4. 
-        */ 
-       /* TODO: use 32bit writes with byte mask instead */
-       pre = addr & 3;
-       if (pre != 0) pre = 4 - pre;
+        * Calculate the number of pixels we need to mask on each end of the
+        * scanline and how many we can do without mask, if any
+        */
+       pre = x & 3;
+       if (pre != 0) {
+               lmask = 0xffffffff >> pre;
+               pre = 4 - pre;
+               pwrds++;
+       }
+       post = (x + wi) & 3;
+       if (post != 0) {
+               rmask = ~(0xffffffff >> post);
+               pwrds++;
+       }
+       words = (wi + pre + 3) >> 2;
+       cnt = words - pwrds;
+       sx_write(sc->sc_sx, SX_QUEUED(7), 0xe0e0e0e0); /* four red pixels */
        for (line = 0; line < he; line++) {
                pptr = addr;
-               cnt = wi;
+               /* load a whole scanline */
+               sta(pptr & ~7, ASI_SX, SX_LD(8, words - 1, pptr & 7));
+               reg = 8;
                if (pre) {
-                       sta(pptr & ~7, ASI_SX, SX_LDB(8, pre - 1, pptr & 7));
+                       sx_write(sc->sc_sx, SX_QUEUED(R_MASK), lmask);
                        sx_write(sc->sc_sx, SX_INSTRUCTIONS,
-                           SX_ROP(8, 8, 32, pre - 1));
-                       sta(pptr & ~7, ASI_SX, SX_STB(32, pre - 1, pptr & 7));
-                       pptr += pre;
-                       cnt -= pre;
+                           SX_ROPB(8, 8, 40, 0));
+                       reg++;
                }
-               /* now do the aligned pixels in 32bit chunks */
-               while(cnt > 15) {
-                       words = uimin(16, cnt >> 2);
-                       sta(pptr & ~7, ASI_SX, SX_LD(8, words - 1, pptr & 7));
+               if (cnt > 0) {
+                       sx_write(sc->sc_sx, SX_QUEUED(R_MASK), 0xffffffff);
+                       /* XXX handle cnt > 16 */
                        sx_write(sc->sc_sx, SX_INSTRUCTIONS,
-                           SX_ROP(8, 8, 32, words - 1));
-                       sta(pptr & ~7, ASI_SX, SX_ST(32, words - 1, pptr & 7));
-                       pptr += words << 2;
-                       cnt -= words << 2;
+                           SX_ROP(reg, reg, reg + 32, cnt - 1));
+                       reg += cnt;
                }
-               /* do any remaining pixels byte-wise again */
-               if (cnt > 0)
-                       sta(pptr & ~7, ASI_SX, SX_LDB(8, cnt - 1, pptr & 7));
+               if (post) {
+                       sx_write(sc->sc_sx, SX_QUEUED(R_MASK), rmask);
                        sx_write(sc->sc_sx, SX_INSTRUCTIONS,
-                           SX_ROP(8, 8, 32, cnt - 1));
-                       sta(pptr & ~7, ASI_SX, SX_STB(32, cnt - 1, pptr & 7));
+                           SX_ROPB(reg, 7, reg + 32, 0));
+                       reg++;
+               }
+               sta(pptr & ~7, ASI_SX, SX_ST(40, words - 1, pptr & 7));         
                addr += stride;
        }
 }



Home | Main Index | Thread Index | Old Index