rust-lang · gnzlbg · Jun 25, 2018 · Jun 23, 2018 · Jun 23, 2018 · Jun 23, 2018
diff --git a/coresimd/x86/cpuid.rs b/coresimd/x86/cpuid.rs
@@ -78,34 +78,53 @@ pub unsafe fn __cpuid(leaf: u32) -> CpuidResult {
 }
 
 /// Does the host support the `cpuid` instruction?
-#[inline]
+#[inline(never)]
 pub fn has_cpuid() -> bool {
     #[cfg(target_arch = "x86_64")]
     {
         true
     }
     #[cfg(target_arch = "x86")]
     {
-        use coresimd::x86::{__readeflags, __writeeflags};
-
-        // On `x86` the `cpuid` instruction is not always available.
-        // This follows the approach indicated in:
-        // http://wiki.osdev.org/CPUID#Checking_CPUID_availability
         unsafe {
-            // Read EFLAGS:
-            let eflags: u32 = __readeflags();
-
-            // Invert the ID bit in EFLAGS:
-            let eflags_mod: u32 = eflags | 0x0020_0000;
-
-            // Store the modified EFLAGS (ID bit may or may not be inverted)
-            __writeeflags(eflags_mod);
-
-            // Read EFLAGS again:
-            let eflags_after: u32 = __readeflags();
-
-            // Check if the ID bit changed:
-            eflags_after != eflags
+            // On `x86` the `cpuid` instruction is not always available.
+            // This follows the approach indicated in:
+            // http://wiki.osdev.org/CPUID#Checking_CPUID_availability
+            // https://software.intel.com/en-us/articles/using-cpuid-to-detect-the-presence-of-sse-41-and-sse-42-instruction-sets/
+            // which detects whether `cpuid` is available by checking whether
+            // bit 21 (the ID flag) of the EFLAGS register is modifiable.
+            // If it is, then `cpuid` is available.
+            // `_temp` keeps the original EFLAGS value; only `result` is read back.
+            let result: u32;
+            let _temp: u32;
+            asm!(r#"
+                # Read eflags into $0 and copy into $1:
+                pushfd
+                pop     $0
+                mov     $1, $0
+                # Flip bit 21 (the ID flag):
+                xor     $0, 0x200000
+                # Set eflags:
+                push    $0
+                popfd
+                # Read eflags again: if cpuid is available
+                # bit 21 will be flipped, otherwise it will
+                # have the same value as the original in $1:
+                pushfd
+                pop     $0
+                # Xor'ing with the original eflags leaves bit 21
+                # set if cpuid is available and clear otherwise.
+                # All other bits have not been modified and
+                # are zero:
+                xor     $0, $1
+                # Store in $0 the value of bit 21:
+                shr     $0, 21
+                "#
+                 : "=r"(result), "=r"(_temp)
+                 :
+                 : "cc", "memory"
+                 : "intel");
+            result != 0
         }
     }
 }
@@ -138,17 +157,8 @@ mod tests {
         assert!(cpuid::has_cpuid());
     }
 
-    #[cfg(target_arch = "x86")]
     #[test]
-    fn test_has_cpuid() {
-        unsafe {
-            let before = __readeflags();
-
-            if cpuid::has_cpuid() {
-                assert!(before != __readeflags());
-            } else {
-                assert!(before == __readeflags());
-            }
-        }
+    fn test_has_cpuid_idempotent() {
+        assert_eq!(cpuid::has_cpuid(), cpuid::has_cpuid()); // repeated probes must agree
     }
 }