Use the 64-bit inner::monotonize() implementation, not the 128-bit one, for aarch64

AGSaidi · AGSaidi · commit ce450f893d55 · 2021-09-04T15:11:26.000-05:00
aarch64 prior to v8.4 (FEAT_LSE2) doesn't have an instruction that guarantees
untorn 128-bit reads, except for successfully completing a 128-bit load/store
exclusive pair (ldxp/stxp) or a compare-and-swap (casp). The requirement to
complete a 128-bit read+write atomic is actually more expensive and more unfair
than the previous implementation of monotonize(), which used a Mutex on aarch64,
especially at large core counts. For aarch64, switch to the 64-bit atomic
implementation, which is about 13x faster for a benchmark that involves many
calls to Instant::now().
diff --git a/library/std/src/time/monotonic.rs b/library/std/src/time/monotonic.rs
@@ -5,7 +5,7 @@ pub(super) fn monotonize(raw: time::Instant) -> time::Instant {
     inner::monotonize(raw)
 }
 
-#[cfg(all(target_has_atomic = "64", not(target_has_atomic = "128")))]
+#[cfg(any(all(target_has_atomic = "64", not(target_has_atomic = "128")), target_arch = "aarch64"))]
 pub mod inner {
     use crate::sync::atomic::AtomicU64;
     use crate::sync::atomic::Ordering::*;
@@ -70,7 +70,7 @@ pub mod inner {
     }
 }
 
-#[cfg(target_has_atomic = "128")]
+#[cfg(all(target_has_atomic = "128", not(target_arch = "aarch64")))]
 pub mod inner {
     use crate::sync::atomic::AtomicU128;
     use crate::sync::atomic::Ordering::*;

Original file line number	Diff line number	Diff line change
`@@ -5,7 +5,7 @@ pub(super) fn monotonize(raw: time::Instant) -> time::Instant {`
`5`	`5`	`inner::monotonize(raw)`
`6`	`6`	`}`
`7`	`7`
`8`		`-#[cfg(all(target_has_atomic = "64", not(target_has_atomic = "128")))]`
	`8`	`+#[cfg(any(all(target_has_atomic = "64", not(target_has_atomic = "128")), target_arch = "aarch64"))]`
`9`	`9`	`pub mod inner {`
`10`	`10`	`use crate::sync::atomic::AtomicU64;`
`11`	`11`	`use crate::sync::atomic::Ordering::*;`
`@@ -70,7 +70,7 @@ pub mod inner {`
`70`	`70`	`}`
`71`	`71`	`}`
`72`	`72`
`73`		`-#[cfg(target_has_atomic = "128")]`
	`73`	`+#[cfg(all(target_has_atomic = "128", not(target_arch = "aarch64")))]`
`74`	`74`	`pub mod inner {`
`75`	`75`	`use crate::sync::atomic::AtomicU128;`
`76`	`76`	`use crate::sync::atomic::Ordering::*;`