Auto merge of #121956 - ChrisDenton:srwlock, r=joboet

Windows: Implement condvar, mutex and rwlock using futex

Well, the Windows equivalent: [`WaitOnAddress`,](https://learn.microsoft.com/en-us/windows/win32/api/synchapi/nf-synchapi-waitonaddress) [`WakeByAddressSingle`](https://learn.microsoft.com/en-us/windows/win32/api/synchapi/nf-synchapi-wakebyaddresssingle) and [`WakeByAddressAll`](https://learn.microsoft.com/en-us/windows/win32/api/synchapi/nf-synchapi-wakebyaddressall).

Note that Windows flavoured futexes can be different sizes (1, 2, 4 or 8 bytes). I took advantage of that in the `Mutex` implementation.

I also edited the Mutex implementation a bit more than necessary. I was having trouble keeping in my head what 0, 1 and 2 meant so I replaced them with consts.

I *think* we're maybe spinning a bit much. `WaitOnAddress` seems to be looping quite a bit too. But for now I've keep the implementations the same. I do wonder if it'd be worth reducing or removing our spinning on Windows.

This also adds a new shim to miri, because of course it does.

Fixes #121949
This commit is contained in:
bors 2024-03-06 12:19:40 +00:00
commit 3314d5ce4c
14 changed files with 160 additions and 33 deletions

View File

@ -1,5 +1,6 @@
cfg_if::cfg_if! { cfg_if::cfg_if! {
if #[cfg(any( if #[cfg(any(
all(target_os = "windows", not(target_vendor="win7")),
target_os = "linux", target_os = "linux",
target_os = "android", target_os = "android",
target_os = "freebsd", target_os = "freebsd",
@ -14,9 +15,9 @@ cfg_if::cfg_if! {
} else if #[cfg(target_family = "unix")] { } else if #[cfg(target_family = "unix")] {
mod pthread; mod pthread;
pub use pthread::Condvar; pub use pthread::Condvar;
} else if #[cfg(target_os = "windows")] { } else if #[cfg(all(target_os = "windows", target_vendor = "win7"))] {
mod windows; mod windows7;
pub use windows::Condvar; pub use windows7::Condvar;
} else if #[cfg(all(target_vendor = "fortanix", target_env = "sgx"))] { } else if #[cfg(all(target_vendor = "fortanix", target_env = "sgx"))] {
mod sgx; mod sgx;
pub use sgx::Condvar; pub use sgx::Condvar;

View File

@ -1,30 +1,42 @@
use crate::sync::atomic::{ use crate::sync::atomic::{
AtomicU32, self,
Ordering::{Acquire, Relaxed, Release}, Ordering::{Acquire, Relaxed, Release},
}; };
use crate::sys::futex::{futex_wait, futex_wake}; use crate::sys::futex::{futex_wait, futex_wake};
pub struct Mutex { cfg_if::cfg_if! {
/// 0: unlocked if #[cfg(windows)] {
/// 1: locked, no other threads waiting // On Windows we can have a smol futex
/// 2: locked, and other threads waiting (contended) type Atomic = atomic::AtomicU8;
futex: AtomicU32, type State = u8;
} else {
type Atomic = atomic::AtomicU32;
type State = u32;
} }
}
pub struct Mutex {
futex: Atomic,
}
const UNLOCKED: State = 0;
const LOCKED: State = 1; // locked, no other threads waiting
const CONTENDED: State = 2; // locked, and other threads waiting (contended)
impl Mutex { impl Mutex {
#[inline] #[inline]
pub const fn new() -> Self { pub const fn new() -> Self {
Self { futex: AtomicU32::new(0) } Self { futex: Atomic::new(UNLOCKED) }
} }
#[inline] #[inline]
pub fn try_lock(&self) -> bool { pub fn try_lock(&self) -> bool {
self.futex.compare_exchange(0, 1, Acquire, Relaxed).is_ok() self.futex.compare_exchange(UNLOCKED, LOCKED, Acquire, Relaxed).is_ok()
} }
#[inline] #[inline]
pub fn lock(&self) { pub fn lock(&self) {
if self.futex.compare_exchange(0, 1, Acquire, Relaxed).is_err() { if self.futex.compare_exchange(UNLOCKED, LOCKED, Acquire, Relaxed).is_err() {
self.lock_contended(); self.lock_contended();
} }
} }
@ -36,8 +48,8 @@ impl Mutex {
// If it's unlocked now, attempt to take the lock // If it's unlocked now, attempt to take the lock
// without marking it as contended. // without marking it as contended.
if state == 0 { if state == UNLOCKED {
match self.futex.compare_exchange(0, 1, Acquire, Relaxed) { match self.futex.compare_exchange(UNLOCKED, LOCKED, Acquire, Relaxed) {
Ok(_) => return, // Locked! Ok(_) => return, // Locked!
Err(s) => state = s, Err(s) => state = s,
} }
@ -45,31 +57,31 @@ impl Mutex {
loop { loop {
// Put the lock in contended state. // Put the lock in contended state.
// We avoid an unnecessary write if it as already set to 2, // We avoid an unnecessary write if it as already set to CONTENDED,
// to be friendlier for the caches. // to be friendlier for the caches.
if state != 2 && self.futex.swap(2, Acquire) == 0 { if state != CONTENDED && self.futex.swap(CONTENDED, Acquire) == UNLOCKED {
// We changed it from 0 to 2, so we just successfully locked it. // We changed it from UNLOCKED to CONTENDED, so we just successfully locked it.
return; return;
} }
// Wait for the futex to change state, assuming it is still 2. // Wait for the futex to change state, assuming it is still CONTENDED.
futex_wait(&self.futex, 2, None); futex_wait(&self.futex, CONTENDED, None);
// Spin again after waking up. // Spin again after waking up.
state = self.spin(); state = self.spin();
} }
} }
fn spin(&self) -> u32 { fn spin(&self) -> State {
let mut spin = 100; let mut spin = 100;
loop { loop {
// We only use `load` (and not `swap` or `compare_exchange`) // We only use `load` (and not `swap` or `compare_exchange`)
// while spinning, to be easier on the caches. // while spinning, to be easier on the caches.
let state = self.futex.load(Relaxed); let state = self.futex.load(Relaxed);
// We stop spinning when the mutex is unlocked (0), // We stop spinning when the mutex is UNLOCKED,
// but also when it's contended (2). // but also when it's CONTENDED.
if state != 1 || spin == 0 { if state != LOCKED || spin == 0 {
return state; return state;
} }
@ -80,9 +92,9 @@ impl Mutex {
#[inline] #[inline]
pub unsafe fn unlock(&self) { pub unsafe fn unlock(&self) {
if self.futex.swap(0, Release) == 2 { if self.futex.swap(UNLOCKED, Release) == CONTENDED {
// We only wake up one thread. When that thread locks the mutex, it // We only wake up one thread. When that thread locks the mutex, it
// will mark the mutex as contended (2) (see lock_contended above), // will mark the mutex as CONTENDED (see lock_contended above),
// which makes sure that any other waiting threads will also be // which makes sure that any other waiting threads will also be
// woken up eventually. // woken up eventually.
self.wake(); self.wake();

View File

@ -1,5 +1,6 @@
cfg_if::cfg_if! { cfg_if::cfg_if! {
if #[cfg(any( if #[cfg(any(
all(target_os = "windows", not(target_vendor = "win7")),
target_os = "linux", target_os = "linux",
target_os = "android", target_os = "android",
target_os = "freebsd", target_os = "freebsd",
@ -19,9 +20,9 @@ cfg_if::cfg_if! {
))] { ))] {
mod pthread; mod pthread;
pub use pthread::{Mutex, raw}; pub use pthread::{Mutex, raw};
} else if #[cfg(target_os = "windows")] { } else if #[cfg(all(target_os = "windows", target_vendor = "win7"))] {
mod windows; mod windows7;
pub use windows::{Mutex, raw}; pub use windows7::{Mutex, raw};
} else if #[cfg(all(target_vendor = "fortanix", target_env = "sgx"))] { } else if #[cfg(all(target_vendor = "fortanix", target_env = "sgx"))] {
mod sgx; mod sgx;
pub use sgx::Mutex; pub use sgx::Mutex;

View File

@ -1,5 +1,6 @@
cfg_if::cfg_if! { cfg_if::cfg_if! {
if #[cfg(any( if #[cfg(any(
all(target_os = "windows", not(target_vendor = "win7")),
target_os = "linux", target_os = "linux",
target_os = "android", target_os = "android",
target_os = "freebsd", target_os = "freebsd",
@ -14,9 +15,9 @@ cfg_if::cfg_if! {
} else if #[cfg(target_family = "unix")] { } else if #[cfg(target_family = "unix")] {
mod queue; mod queue;
pub use queue::RwLock; pub use queue::RwLock;
} else if #[cfg(target_os = "windows")] { } else if #[cfg(all(target_os = "windows", target_vendor = "win7"))] {
mod windows; mod windows7;
pub use windows::RwLock; pub use windows7::RwLock;
} else if #[cfg(all(target_vendor = "fortanix", target_env = "sgx"))] { } else if #[cfg(all(target_vendor = "fortanix", target_env = "sgx"))] {
mod sgx; mod sgx;
pub use sgx::RwLock; pub use sgx::RwLock;

View File

@ -36,6 +36,7 @@ pub type LPVOID = *mut c_void;
pub type LPWCH = *mut WCHAR; pub type LPWCH = *mut WCHAR;
pub type LPWSTR = *mut WCHAR; pub type LPWSTR = *mut WCHAR;
#[cfg(target_vendor = "win7")]
pub type PSRWLOCK = *mut SRWLOCK; pub type PSRWLOCK = *mut SRWLOCK;
pub type socklen_t = c_int; pub type socklen_t = c_int;
@ -50,7 +51,9 @@ pub const INVALID_HANDLE_VALUE: HANDLE = ::core::ptr::without_provenance_mut(-1i
pub const EXIT_SUCCESS: u32 = 0; pub const EXIT_SUCCESS: u32 = 0;
pub const EXIT_FAILURE: u32 = 1; pub const EXIT_FAILURE: u32 = 1;
#[cfg(target_vendor = "win7")]
pub const CONDITION_VARIABLE_INIT: CONDITION_VARIABLE = CONDITION_VARIABLE { Ptr: ptr::null_mut() }; pub const CONDITION_VARIABLE_INIT: CONDITION_VARIABLE = CONDITION_VARIABLE { Ptr: ptr::null_mut() };
#[cfg(target_vendor = "win7")]
pub const SRWLOCK_INIT: SRWLOCK = SRWLOCK { Ptr: ptr::null_mut() }; pub const SRWLOCK_INIT: SRWLOCK = SRWLOCK { Ptr: ptr::null_mut() };
pub const INIT_ONCE_STATIC_INIT: INIT_ONCE = INIT_ONCE { Ptr: ptr::null_mut() }; pub const INIT_ONCE_STATIC_INIT: INIT_ONCE = INIT_ONCE { Ptr: ptr::null_mut() };
@ -373,6 +376,7 @@ extern "system" {
dwmilliseconds: u32, dwmilliseconds: u32,
) -> BOOL; ) -> BOOL;
pub fn WakeByAddressSingle(address: *const c_void); pub fn WakeByAddressSingle(address: *const c_void);
pub fn WakeByAddressAll(address: *const c_void);
} }
#[cfg(target_vendor = "win7")] #[cfg(target_vendor = "win7")]

View File

@ -0,0 +1,85 @@
use super::api;
use crate::sys::c;
use crate::sys::dur2timeout;
use core::ffi::c_void;
use core::mem;
use core::ptr;
use core::sync::atomic::{
AtomicBool, AtomicI16, AtomicI32, AtomicI64, AtomicI8, AtomicIsize, AtomicPtr, AtomicU16,
AtomicU32, AtomicU64, AtomicU8, AtomicUsize,
};
use core::time::Duration;
pub unsafe trait Waitable {
type Atomic;
}
macro_rules! unsafe_waitable_int {
($(($int:ty, $atomic:ty)),*$(,)?) => {
$(
unsafe impl Waitable for $int {
type Atomic = $atomic;
}
)*
};
}
unsafe_waitable_int! {
(bool, AtomicBool),
(i8, AtomicI8),
(i16, AtomicI16),
(i32, AtomicI32),
(i64, AtomicI64),
(isize, AtomicIsize),
(u8, AtomicU8),
(u16, AtomicU16),
(u32, AtomicU32),
(u64, AtomicU64),
(usize, AtomicUsize),
}
unsafe impl<T> Waitable for *const T {
type Atomic = AtomicPtr<T>;
}
unsafe impl<T> Waitable for *mut T {
type Atomic = AtomicPtr<T>;
}
pub fn wait_on_address<W: Waitable>(
address: &W::Atomic,
compare: W,
timeout: Option<Duration>,
) -> bool {
unsafe {
let addr = ptr::from_ref(address).cast::<c_void>();
let size = mem::size_of::<W>();
let compare_addr = ptr::addr_of!(compare).cast::<c_void>();
let timeout = timeout.map(dur2timeout).unwrap_or(c::INFINITE);
c::WaitOnAddress(addr, compare_addr, size, timeout) == c::TRUE
}
}
pub fn wake_by_address_single<T>(address: &T) {
unsafe {
let addr = ptr::from_ref(address).cast::<c_void>();
c::WakeByAddressSingle(addr);
}
}
pub fn wake_by_address_all<T>(address: &T) {
unsafe {
let addr = ptr::from_ref(address).cast::<c_void>();
c::WakeByAddressAll(addr);
}
}
pub fn futex_wait<W: Waitable>(futex: &W::Atomic, expected: W, timeout: Option<Duration>) -> bool {
// return false only on timeout
wait_on_address(futex, expected, timeout) || api::get_last_error().code != c::ERROR_TIMEOUT
}
pub fn futex_wake<T>(futex: &T) -> bool {
wake_by_address_single(futex);
false
}
pub fn futex_wake_all<T>(futex: &T) {
wake_by_address_all(futex)
}

View File

@ -17,6 +17,8 @@ pub mod args;
pub mod c; pub mod c;
pub mod env; pub mod env;
pub mod fs; pub mod fs;
#[cfg(not(target_vendor = "win7"))]
pub mod futex;
pub mod handle; pub mod handle;
pub mod io; pub mod io;
pub mod net; pub mod net;

View File

@ -366,6 +366,12 @@ pub trait EvalContextExt<'mir, 'tcx: 'mir>: crate::MiriInterpCxExt<'mir, 'tcx> {
this.WakeByAddressSingle(ptr_op)?; this.WakeByAddressSingle(ptr_op)?;
} }
"WakeByAddressAll" => {
let [ptr_op] =
this.check_shim(abi, Abi::System { unwind: false }, link_name, args)?;
this.WakeByAddressAll(ptr_op)?;
}
// Dynamic symbol loading // Dynamic symbol loading
"GetProcAddress" => { "GetProcAddress" => {

View File

@ -384,6 +384,21 @@ pub trait EvalContextExt<'mir, 'tcx: 'mir>: crate::MiriInterpCxExt<'mir, 'tcx> {
Ok(()) Ok(())
} }
fn WakeByAddressAll(&mut self, ptr_op: &OpTy<'tcx, Provenance>) -> InterpResult<'tcx> {
let this = self.eval_context_mut();
let ptr = this.read_pointer(ptr_op)?;
// See the Linux futex implementation for why this fence exists.
this.atomic_fence(AtomicFenceOrd::SeqCst)?;
while let Some(thread) = this.futex_wake(ptr.addr().bytes(), u32::MAX) {
this.unblock_thread(thread);
this.unregister_timeout_callback_if_exists(thread);
}
Ok(())
}
fn SleepConditionVariableSRW( fn SleepConditionVariableSRW(
&mut self, &mut self,

View File

@ -10,7 +10,7 @@
// //
// cdb-command:dx m,d // cdb-command:dx m,d
// cdb-check:m,d [Type: std::sync::mutex::Mutex<i32>] // cdb-check:m,d [Type: std::sync::mutex::Mutex<i32>]
// cdb-check: [...] inner [Type: std::sys::locks::mutex::windows::Mutex] // cdb-check: [...] inner [Type: std::sys::locks::mutex::futex::Mutex]
// cdb-check: [...] poison [Type: std::sync::poison::Flag] // cdb-check: [...] poison [Type: std::sync::poison::Flag]
// cdb-check: [...] data : 0 [Type: core::cell::UnsafeCell<i32>] // cdb-check: [...] data : 0 [Type: core::cell::UnsafeCell<i32>]

View File

@ -16,7 +16,7 @@
// cdb-command:dx r // cdb-command:dx r
// cdb-check:r [Type: std::sync::rwlock::RwLockReadGuard<i32>] // cdb-check:r [Type: std::sync::rwlock::RwLockReadGuard<i32>]
// cdb-check: [...] data : NonNull([...]: 0) [Type: core::ptr::non_null::NonNull<i32>] // cdb-check: [...] data : NonNull([...]: 0) [Type: core::ptr::non_null::NonNull<i32>]
// cdb-check: [...] inner_lock : [...] [Type: std::sys::locks::rwlock::windows::RwLock *] // cdb-check: [...] inner_lock : [...] [Type: std::sys::locks::rwlock::futex::RwLock *]
#[allow(unused_variables)] #[allow(unused_variables)]