Author: jkim
Date: Wed Aug 21 22:27:42 2013
New Revision: 254619
URL: http://svnweb.freebsd.org/changeset/base/254619

Log:
  Reimplement atomic_load_acq_64() and atomic_store_rel_64() for i386.  These
  functions are now real functions rather than function pointers.  Supposedly,
  it is faster for modern processors.
  
  Suggested by: bde

Modified:
  head/sys/i386/i386/machdep.c
  head/sys/i386/include/atomic.h

Modified: head/sys/i386/i386/machdep.c
==============================================================================
--- head/sys/i386/i386/machdep.c        Wed Aug 21 22:05:58 2013        
(r254618)
+++ head/sys/i386/i386/machdep.c        Wed Aug 21 22:27:42 2013        
(r254619)
@@ -1548,21 +1548,6 @@ idle_sysctl(SYSCTL_HANDLER_ARGS)
 SYSCTL_PROC(_machdep, OID_AUTO, idle, CTLTYPE_STRING | CTLFLAG_RW, 0, 0,
     idle_sysctl, "A", "currently selected idle function");
 
-uint64_t (*atomic_load_acq_64)(volatile uint64_t *) =
-    atomic_load_acq_64_i386;
-void (*atomic_store_rel_64)(volatile uint64_t *, uint64_t) =
-    atomic_store_rel_64_i386;
-
-static void
-cpu_probe_cmpxchg8b(void)
-{
-
-       if ((cpu_feature & CPUID_CX8) != 0) {
-               atomic_load_acq_64 = atomic_load_acq_64_i586;
-               atomic_store_rel_64 = atomic_store_rel_64_i586;
-       }
-}
-
 /*
  * Reset registers to default values on exec.
  */
@@ -2824,7 +2809,6 @@ init386(first)
        thread0.td_pcb->pcb_gsd = PCPU_GET(fsgs_gdt)[1];
 
        cpu_probe_amdc1e();
-       cpu_probe_cmpxchg8b();
 }
 
 #else
@@ -3115,7 +3099,6 @@ init386(first)
        thread0.td_frame = &proc0_tf;
 
        cpu_probe_amdc1e();
-       cpu_probe_cmpxchg8b();
 
 #ifdef FDT
        x86_init_fdt();

Modified: head/sys/i386/include/atomic.h
==============================================================================
--- head/sys/i386/include/atomic.h      Wed Aug 21 22:05:58 2013        
(r254618)
+++ head/sys/i386/include/atomic.h      Wed Aug 21 22:27:42 2013        
(r254619)
@@ -32,6 +32,11 @@
 #error this file needs sys/cdefs.h as a prerequisite
 #endif
 
+#ifdef _KERNEL
+#include <machine/md_var.h>
+#include <machine/specialreg.h>
+#endif
+
 #define        mb()    __asm __volatile("lock; addl $0,(%%esp)" : : : 
"memory", "cc")
 #define        wmb()   __asm __volatile("lock; addl $0,(%%esp)" : : : 
"memory", "cc")
 #define        rmb()   __asm __volatile("lock; addl $0,(%%esp)" : : : 
"memory", "cc")
@@ -87,6 +92,9 @@ u_##TYPE      atomic_load_acq_##TYPE(volatile
 #define        ATOMIC_STORE(TYPE)                                      \
 void           atomic_store_rel_##TYPE(volatile u_##TYPE *p, u_##TYPE v)
 
+uint64_t       atomic_load_acq_64(volatile uint64_t *);
+void           atomic_store_rel_64(volatile uint64_t *, uint64_t);
+
 #else /* !KLD_MODULE && __GNUCLIKE_ASM */
 
 /*
@@ -124,83 +132,6 @@ atomic_##NAME##_barr_##TYPE(volatile u_#
 }                                                      \
 struct __hack
 
-#if defined(_KERNEL) && !defined(WANT_FUNCTIONS)
-
-/* I486 does not support SMP or CMPXCHG8B. */
-static __inline uint64_t
-atomic_load_acq_64_i386(volatile uint64_t *p)
-{
-       volatile uint32_t *high, *low;
-       uint64_t res;
-
-       low = (volatile uint32_t *)p;
-       high = (volatile uint32_t *)p + 1;
-       __asm __volatile(
-       "       pushfl ;                "
-       "       cli ;                   "
-       "       movl %1,%%eax ;         "
-       "       movl %2,%%edx ;         "
-       "       popfl"
-       : "=&A" (res)                   /* 0 */
-       : "m" (*low),                   /* 1 */
-         "m" (*high)                   /* 2 */
-       : "memory");
-       return (res);
-}
-
-static __inline void
-atomic_store_rel_64_i386(volatile uint64_t *p, uint64_t v)
-{
-       volatile uint32_t *high, *low;
-
-       low = (volatile uint32_t *)p;
-       high = (volatile uint32_t *)p + 1;
-       __asm __volatile(
-       "       pushfl ;                "
-       "       cli ;                   "
-       "       movl %%eax,%0 ;         "
-       "       movl %%edx,%1 ;         "
-       "       popfl"
-       : "=m" (*low),                  /* 0 */
-         "=m" (*high)                  /* 1 */
-       : "A" (v)                       /* 2 */
-       : "memory");
-}
-
-static __inline uint64_t
-atomic_load_acq_64_i586(volatile uint64_t *p)
-{
-       uint64_t res;
-
-       __asm __volatile(
-       "       movl %%ebx,%%eax ;      "
-       "       movl %%ecx,%%edx ;      "
-       "       " MPLOCKED "            "
-       "       cmpxchg8b %1"
-       : "=&A" (res),                  /* 0 */
-         "+m" (*p)                     /* 1 */
-       : : "memory", "cc");
-       return (res);
-}
-
-static __inline void
-atomic_store_rel_64_i586(volatile uint64_t *p, uint64_t v)
-{
-
-       __asm __volatile(
-       "       movl %%eax,%%ebx ;      "
-       "       movl %%edx,%%ecx ;      "
-       "1:                             "
-       "       " MPLOCKED "            "
-       "       cmpxchg8b %0 ;          "
-       "       jne 1b"
-       : "+m" (*p),                    /* 0 */
-         "+A" (v)                      /* 1 */
-       : : "ebx", "ecx", "memory", "cc");
-}
-
-#endif /* _KERNEL && !WANT_FUNCTIONS */
-
 /*
  * Atomic compare and set, used by the mutex functions
  *
@@ -343,6 +274,108 @@ struct __hack
 
 #endif /* _KERNEL && !SMP */
 
+#ifdef _KERNEL
+
+#ifdef WANT_FUNCTIONS
+uint64_t       atomic_load_acq_64_i386(volatile uint64_t *);
+uint64_t       atomic_load_acq_64_i586(volatile uint64_t *);
+void           atomic_store_rel_64_i386(volatile uint64_t *, uint64_t);
+void           atomic_store_rel_64_i586(volatile uint64_t *, uint64_t);
+#endif
+
+/* I486 does not support SMP or CMPXCHG8B. */
+static __inline uint64_t
+atomic_load_acq_64_i386(volatile uint64_t *p)
+{
+       volatile uint32_t *q;
+       uint64_t res;
+
+       q = (volatile uint32_t *)p;
+       __asm __volatile(
+       "       pushfl ;                "
+       "       cli ;                   "
+       "       movl    %1,%%eax ;      "
+       "       movl    %2,%%edx ;      "
+       "       popfl"
+       : "=&A" (res)                   /* 0 */
+       : "m" (*q),                     /* 1 */
+         "m" (*(q + 1))                /* 2 */
+       : "memory");
+       return (res);
+}
+
+static __inline void
+atomic_store_rel_64_i386(volatile uint64_t *p, uint64_t v)
+{
+       volatile uint32_t *q;
+
+       q = (volatile uint32_t *)p;
+       __asm __volatile(
+       "       pushfl ;                "
+       "       cli ;                   "
+       "       movl    %%eax,%0 ;      "
+       "       movl    %%edx,%1 ;      "
+       "       popfl"
+       : "=m" (*q),                    /* 0 */
+         "=m" (*(q + 1))               /* 1 */
+       : "A" (v)                       /* 2 */
+       : "memory");
+}
+
+static __inline uint64_t
+atomic_load_acq_64_i586(volatile uint64_t *p)
+{
+       uint64_t res;
+
+       __asm __volatile(
+       "       movl    %%ebx,%%eax ;   "
+       "       movl    %%ecx,%%edx ;   "
+       "       " MPLOCKED "            "
+       "       cmpxchg8b %1"
+       : "=&A" (res),                  /* 0 */
+         "+m" (*p)                     /* 1 */
+       : : "memory", "cc");
+       return (res);
+}
+
+static __inline void
+atomic_store_rel_64_i586(volatile uint64_t *p, uint64_t v)
+{
+
+       __asm __volatile(
+       "       movl    %%eax,%%ebx ;   "
+       "       movl    %%edx,%%ecx ;   "
+       "1:                             "
+       "       " MPLOCKED "            "
+       "       cmpxchg8b %0 ;          "
+       "       jne     1b"
+       : "+m" (*p),                    /* 0 */
+         "+A" (v)                      /* 1 */
+       : : "ebx", "ecx", "memory", "cc");
+}
+
+static __inline uint64_t
+atomic_load_acq_64(volatile uint64_t *p)
+{
+
+       if ((cpu_feature & CPUID_CX8) == 0)
+               return (atomic_load_acq_64_i386(p));
+       else
+               return (atomic_load_acq_64_i586(p));
+}
+
+static __inline void
+atomic_store_rel_64(volatile uint64_t *p, uint64_t v)
+{
+
+       if ((cpu_feature & CPUID_CX8) == 0)
+               atomic_store_rel_64_i386(p, v);
+       else
+               atomic_store_rel_64_i586(p, v);
+}
+
+#endif /* _KERNEL */
+
 #endif /* KLD_MODULE || !__GNUCLIKE_ASM */
 
 ATOMIC_ASM(set,             char,  "orb %b1,%0",  "iq",  v);
@@ -381,11 +414,6 @@ ATOMIC_STORE(long);
 
 #ifndef WANT_FUNCTIONS
 
-#ifdef _KERNEL
-extern uint64_t (*atomic_load_acq_64)(volatile uint64_t *);
-extern void (*atomic_store_rel_64)(volatile uint64_t *, uint64_t);
-#endif
-
 static __inline int
 atomic_cmpset_long(volatile u_long *dst, u_long expect, u_long src)
 {
_______________________________________________
[email protected] mailing list
http://lists.freebsd.org/mailman/listinfo/svn-src-head
To unsubscribe, send any mail to "[email protected]"

Reply via email to