Line data Source code
1 : use std::panic::AssertUnwindSafe;
2 : use std::sync::atomic::{AtomicBool, AtomicU8, AtomicU32, Ordering};
3 : use std::sync::{Arc, OnceLock, mpsc};
4 : use std::thread::JoinHandle;
5 :
6 : use tracing::{debug, error, trace};
7 :
8 : use crate::time::Timing;
9 :
10 : /// Stores status of the running threads. Threads are registered in the runtime upon creation
11 : /// and deregistered upon termination.
12 : pub struct Runtime {
13 : // stores handles to all threads that are currently running
14 : threads: Vec<ThreadHandle>,
15 : // stores current time and pending wakeups
16 : clock: Arc<Timing>,
17 : // thread counter
18 : thread_counter: AtomicU32,
19 : // Thread step counter -- how many times all threads has been actually
20 : // stepped (note that all world/time/executor/thread have slightly different
21 : // meaning of steps). For observability.
22 : pub step_counter: u64,
23 : }
24 :
25 : impl Runtime {
26 : /// Init new runtime, no running threads.
27 528 : pub fn new(clock: Arc<Timing>) -> Self {
28 528 : Self {
29 528 : threads: Vec::new(),
30 528 : clock,
31 528 : thread_counter: AtomicU32::new(0),
32 528 : step_counter: 0,
33 528 : }
34 528 : }
35 :
36 : /// Spawn a new thread and register it in the runtime.
37 19364 : pub fn spawn<F>(&mut self, f: F) -> ExternalHandle
38 19364 : where
39 19364 : F: FnOnce() + Send + 'static,
40 19364 : {
41 19364 : let (tx, rx) = mpsc::channel();
42 19364 :
43 19364 : let clock = self.clock.clone();
44 19364 : let tid = self.thread_counter.fetch_add(1, Ordering::SeqCst);
45 19364 : debug!("spawning thread-{}", tid);
46 :
47 19364 : let join = std::thread::spawn(move || {
48 19364 : let _guard = tracing::info_span!("", tid).entered();
49 19364 :
50 19364 : let res = std::panic::catch_unwind(AssertUnwindSafe(|| {
51 19364 : with_thread_context(|ctx| {
52 19364 : assert!(ctx.clock.set(clock).is_ok());
53 19364 : ctx.id.store(tid, Ordering::SeqCst);
54 19364 : tx.send(ctx.clone()).expect("failed to send thread context");
55 19364 : // suspend thread to put it to `threads` in sleeping state
56 19364 : ctx.yield_me(0);
57 19364 : });
58 19364 :
59 19364 : // start user-provided function
60 19364 : f();
61 19364 : }));
62 19364 : debug!("thread finished");
63 :
64 19306 : if let Err(e) = res {
65 19286 : with_thread_context(|ctx| {
66 19286 : if !ctx.allow_panic.load(std::sync::atomic::Ordering::SeqCst) {
67 0 : error!("thread panicked, terminating the process: {:?}", e);
68 0 : std::process::exit(1);
69 19286 : }
70 19286 :
71 19286 : debug!("thread panicked: {:?}", e);
72 19286 : let mut result = ctx.result.lock();
73 19286 : if result.0 == -1 {
74 18844 : *result = (256, format!("thread panicked: {:?}", e));
75 18844 : }
76 19286 : });
77 19286 : }
78 :
79 19306 : with_thread_context(|ctx| {
80 19306 : ctx.finish_me();
81 19306 : });
82 19364 : });
83 19364 :
84 19364 : let ctx = rx.recv().expect("failed to receive thread context");
85 19364 : let handle = ThreadHandle::new(ctx.clone(), join);
86 19364 :
87 19364 : self.threads.push(handle);
88 19364 :
89 19364 : ExternalHandle { ctx }
90 19364 : }
91 :
92 : /// Returns true if there are any unfinished activity, such as running thread or pending events.
93 : /// Otherwise returns false, which means all threads are blocked forever.
94 422925 : pub fn step(&mut self) -> bool {
95 422925 : trace!("runtime step");
96 :
97 : // have we run any thread?
98 422925 : let mut ran = false;
99 422925 :
100 2110247 : self.threads.retain(|thread: &ThreadHandle| {
101 2110247 : let res = thread.ctx.wakeup.compare_exchange(
102 2110247 : PENDING_WAKEUP,
103 2110247 : NO_WAKEUP,
104 2110247 : Ordering::SeqCst,
105 2110247 : Ordering::SeqCst,
106 2110247 : );
107 2110247 : if res.is_err() {
108 : // thread has no pending wakeups, leaving as is
109 1819326 : return true;
110 290921 : }
111 290921 : ran = true;
112 290921 :
113 290921 : trace!("entering thread-{}", thread.ctx.tid());
114 290921 : let status = thread.step();
115 290921 : self.step_counter += 1;
116 290921 : trace!(
117 0 : "out of thread-{} with status {:?}",
118 0 : thread.ctx.tid(),
119 : status
120 : );
121 :
122 290921 : if status == Status::Sleep {
123 271615 : true
124 : } else {
125 19306 : trace!("thread has finished");
126 : // removing the thread from the list
127 19306 : false
128 : }
129 2110247 : });
130 422925 :
131 422925 : if !ran {
132 223203 : trace!("no threads were run, stepping clock");
133 223203 : if let Some(ctx_to_wake) = self.clock.step() {
134 222655 : trace!("waking up thread-{}", ctx_to_wake.tid());
135 222655 : ctx_to_wake.inc_wake();
136 : } else {
137 548 : return false;
138 : }
139 199722 : }
140 :
141 422377 : true
142 422925 : }
143 :
144 : /// Kill all threads. This is done by setting a flag in each thread context and waking it up.
145 1008 : pub fn crash_all_threads(&mut self) {
146 2850 : for thread in self.threads.iter() {
147 2850 : thread.ctx.crash_stop();
148 2850 : }
149 :
150 : // all threads should be finished after a few steps
151 1512 : while !self.threads.is_empty() {
152 504 : self.step();
153 504 : }
154 1008 : }
155 : }
156 :
157 : impl Drop for Runtime {
158 503 : fn drop(&mut self) {
159 503 : debug!("dropping the runtime");
160 503 : self.crash_all_threads();
161 503 : }
162 : }
163 :
164 : #[derive(Clone)]
165 : pub struct ExternalHandle {
166 : ctx: Arc<ThreadContext>,
167 : }
168 :
169 : impl ExternalHandle {
170 : /// Returns true if thread has finished execution.
171 436694 : pub fn is_finished(&self) -> bool {
172 436694 : let status = self.ctx.mutex.lock();
173 436694 : *status == Status::Finished
174 436694 : }
175 :
176 : /// Returns exitcode and message, which is available after thread has finished execution.
177 434 : pub fn result(&self) -> (i32, String) {
178 434 : let result = self.ctx.result.lock();
179 434 : result.clone()
180 434 : }
181 :
182 : /// Returns thread id.
183 16 : pub fn id(&self) -> u32 {
184 16 : self.ctx.id.load(Ordering::SeqCst)
185 16 : }
186 :
187 : /// Sets a flag to crash thread on the next wakeup.
188 16332 : pub fn crash_stop(&self) {
189 16332 : self.ctx.crash_stop();
190 16332 : }
191 : }
192 :
193 : struct ThreadHandle {
194 : ctx: Arc<ThreadContext>,
195 : _join: JoinHandle<()>,
196 : }
197 :
198 : impl ThreadHandle {
199 : /// Create a new [`ThreadHandle`] and wait until thread will enter [`Status::Sleep`] state.
200 19364 : fn new(ctx: Arc<ThreadContext>, join: JoinHandle<()>) -> Self {
201 19364 : let mut status = ctx.mutex.lock();
202 : // wait until thread will go into the first yield
203 19389 : while *status != Status::Sleep {
204 25 : ctx.condvar.wait(&mut status);
205 25 : }
206 19364 : drop(status);
207 19364 :
208 19364 : Self { ctx, _join: join }
209 19364 : }
210 :
211 : /// Allows thread to execute one step of its execution.
212 : /// Returns [`Status`] of the thread after the step.
213 290921 : fn step(&self) -> Status {
214 290921 : let mut status = self.ctx.mutex.lock();
215 290921 : assert!(matches!(*status, Status::Sleep));
216 :
217 290921 : *status = Status::Running;
218 290921 : self.ctx.condvar.notify_all();
219 :
220 581842 : while *status == Status::Running {
221 290921 : self.ctx.condvar.wait(&mut status);
222 290921 : }
223 :
224 290921 : *status
225 290921 : }
226 : }
227 :
/// Execution state of a simulated thread, guarded by the context mutex.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
enum Status {
    /// The thread currently has control and is executing.
    Running,
    /// The thread is parked waiting for an event; the executor resumes it in a
    /// step once its wakeup flag has been set.
    Sleep,
    /// The thread has completed and will not run again.
    Finished,
}
237 :
/// Value of the wakeup flag when nothing is pending for the thread.
const NO_WAKEUP: u8 = 0;
/// Value of the wakeup flag when the thread should be resumed on the next step.
const PENDING_WAKEUP: u8 = 1;
240 :
241 : pub struct ThreadContext {
242 : id: AtomicU32,
243 : // used to block thread until it is woken up
244 : mutex: parking_lot::Mutex<Status>,
245 : condvar: parking_lot::Condvar,
246 : // used as a flag to indicate runtime that thread is ready to be woken up
247 : wakeup: AtomicU8,
248 : clock: OnceLock<Arc<Timing>>,
249 : // execution result, set by exit() call
250 : result: parking_lot::Mutex<(i32, String)>,
251 : // determines if process should be killed on receiving panic
252 : allow_panic: AtomicBool,
253 : // acts as a signal that thread should crash itself on the next wakeup
254 : crash_request: AtomicBool,
255 : }
256 :
257 : impl ThreadContext {
258 19892 : pub(crate) fn new() -> Self {
259 19892 : Self {
260 19892 : id: AtomicU32::new(0),
261 19892 : mutex: parking_lot::Mutex::new(Status::Running),
262 19892 : condvar: parking_lot::Condvar::new(),
263 19892 : wakeup: AtomicU8::new(NO_WAKEUP),
264 19892 : clock: OnceLock::new(),
265 19892 : result: parking_lot::Mutex::new((-1, String::new())),
266 19892 : allow_panic: AtomicBool::new(false),
267 19892 : crash_request: AtomicBool::new(false),
268 19892 : }
269 19892 : }
270 : }
271 :
272 : // Functions for executor to control thread execution.
273 : impl ThreadContext {
274 : /// Set atomic flag to indicate that thread is ready to be woken up.
275 702586 : fn inc_wake(&self) {
276 702586 : self.wakeup.store(PENDING_WAKEUP, Ordering::SeqCst);
277 702586 : }
278 :
279 : /// Internal function used for event queues.
280 184014 : pub(crate) fn schedule_wakeup(self: &Arc<Self>, after_ms: u64) {
281 184014 : self.clock
282 184014 : .get()
283 184014 : .unwrap()
284 184014 : .schedule_wakeup(after_ms, self.clone());
285 184014 : }
286 :
287 1 : fn tid(&self) -> u32 {
288 1 : self.id.load(Ordering::SeqCst)
289 1 : }
290 :
291 19182 : fn crash_stop(&self) {
292 19182 : let status = self.mutex.lock();
293 19182 : if *status == Status::Finished {
294 7 : debug!(
295 0 : "trying to crash thread-{}, which is already finished",
296 0 : self.tid()
297 : );
298 7 : return;
299 19175 : }
300 19175 : assert!(matches!(*status, Status::Sleep));
301 19175 : drop(status);
302 19175 :
303 19175 : self.allow_panic.store(true, Ordering::SeqCst);
304 19175 : self.crash_request.store(true, Ordering::SeqCst);
305 19175 : // set a wakeup
306 19175 : self.inc_wake();
307 : // it will panic on the next wakeup
308 19182 : }
309 : }
310 :
311 : // Internal functions.
312 : impl ThreadContext {
313 : /// Blocks thread until it's woken up by the executor. If `after_ms` is 0, is will be
314 : /// woken on the next step. If `after_ms` > 0, wakeup is scheduled after that time.
315 : /// Otherwise wakeup is not scheduled inside `yield_me`, and should be arranged before
316 : /// calling this function.
317 290979 : fn yield_me(self: &Arc<Self>, after_ms: i64) {
318 290979 : let mut status = self.mutex.lock();
319 290979 : assert!(matches!(*status, Status::Running));
320 :
321 290979 : match after_ms.cmp(&0) {
322 241055 : std::cmp::Ordering::Less => {
323 241055 : // block until something wakes us up
324 241055 : }
325 20973 : std::cmp::Ordering::Equal => {
326 20973 : // tell executor that we are ready to be woken up
327 20973 : self.inc_wake();
328 20973 : }
329 28951 : std::cmp::Ordering::Greater => {
330 28951 : // schedule wakeup
331 28951 : self.clock
332 28951 : .get()
333 28951 : .unwrap()
334 28951 : .schedule_wakeup(after_ms as u64, self.clone());
335 28951 : }
336 : }
337 :
338 290979 : *status = Status::Sleep;
339 290979 : self.condvar.notify_all();
340 :
341 : // wait until executor wakes us up
342 581958 : while *status != Status::Running {
343 290979 : self.condvar.wait(&mut status);
344 290979 : }
345 :
346 290979 : if self.crash_request.load(Ordering::SeqCst) {
347 18844 : panic!("crashed by request");
348 272135 : }
349 272135 : }
350 :
351 : /// Called only once, exactly before thread finishes execution.
352 19306 : fn finish_me(&self) {
353 19306 : let mut status = self.mutex.lock();
354 19306 : assert!(matches!(*status, Status::Running));
355 :
356 19306 : *status = Status::Finished;
357 19306 : {
358 19306 : let mut result = self.result.lock();
359 19306 : if result.0 == -1 {
360 20 : *result = (0, "finished normally".to_owned());
361 19286 : }
362 : }
363 19306 : self.condvar.notify_all();
364 19306 : }
365 : }
366 :
367 : /// Invokes the given closure with a reference to the current thread [`ThreadContext`].
368 : #[inline(always)]
369 1908079 : fn with_thread_context<T>(f: impl FnOnce(&Arc<ThreadContext>) -> T) -> T {
370 1908079 : thread_local!(static THREAD_DATA: Arc<ThreadContext> = Arc::new(ThreadContext::new()));
371 1908079 : THREAD_DATA.with(f)
372 1908079 : }
373 :
374 : /// Waker is used to wake up threads that are blocked on condition.
375 : /// It keeps track of contexts [`Arc<ThreadContext>`] and can increment the counter
376 : /// of several contexts to send a notification.
377 : pub struct Waker {
378 : // contexts that are waiting for a notification
379 : contexts: parking_lot::Mutex<smallvec::SmallVec<[Arc<ThreadContext>; 8]>>,
380 : }
381 :
382 : impl Default for Waker {
383 0 : fn default() -> Self {
384 0 : Self::new()
385 0 : }
386 : }
387 :
388 : impl Waker {
389 80157 : pub fn new() -> Self {
390 80157 : Self {
391 80157 : contexts: parking_lot::Mutex::new(smallvec::SmallVec::new()),
392 80157 : }
393 80157 : }
394 :
395 : /// Subscribe current thread to receive a wake notification later.
396 850281 : pub fn wake_me_later(&self) {
397 850281 : with_thread_context(|ctx| {
398 850281 : self.contexts.lock().push(ctx.clone());
399 850281 : });
400 850281 : }
401 :
402 : /// Wake up all threads that are waiting for a notification and clear the list.
403 126919 : pub fn wake_all(&self) {
404 126919 : let mut v = self.contexts.lock();
405 439783 : for ctx in v.iter() {
406 439783 : ctx.inc_wake();
407 439783 : }
408 126919 : v.clear();
409 126919 : }
410 : }
411 :
412 : /// See [`ThreadContext::yield_me`].
413 271615 : pub fn yield_me(after_ms: i64) {
414 271615 : with_thread_context(|ctx| ctx.yield_me(after_ms))
415 271615 : }
416 :
417 : /// Get current time.
418 727257 : pub fn now() -> u64 {
419 727257 : with_thread_context(|ctx| ctx.clock.get().unwrap().now())
420 727257 : }
421 :
422 442 : pub fn exit(code: i32, msg: String) {
423 442 : with_thread_context(|ctx| {
424 442 : ctx.allow_panic.store(true, Ordering::SeqCst);
425 442 : let mut result = ctx.result.lock();
426 442 : *result = (code, msg);
427 442 : panic!("exit");
428 442 : });
429 : }
430 :
431 528 : pub(crate) fn get_thread_ctx() -> Arc<ThreadContext> {
432 528 : with_thread_context(|ctx| ctx.clone())
433 528 : }
434 :
/// Interface for channels that can be polled until they have something.
pub trait PollSome {
    /// Arranges for the caller to be woken up when a message arrives.
    fn wake_me(&self);

    /// Reports whether a message is ready on the channel right now.
    fn has_some(&self) -> bool;
}
443 :
444 : /// Blocks current thread until one of the channels has a ready message. Returns
445 : /// index of the channel that has a message. If timeout is reached, returns None.
446 : ///
447 : /// Negative timeout means block forever. Zero timeout means check channels and return
448 : /// immediately. Positive timeout means block until timeout is reached.
449 106997 : pub fn epoll_chans(chans: &[Box<dyn PollSome>], timeout: i64) -> Option<usize> {
450 106997 : let deadline = if timeout < 0 {
451 78085 : 0
452 : } else {
453 28912 : now() + timeout as u64
454 : };
455 :
456 : loop {
457 1050245 : for chan in chans {
458 847186 : chan.wake_me()
459 : }
460 :
461 683517 : for (i, chan) in chans.iter().enumerate() {
462 683517 : if chan.has_some() {
463 86359 : return Some(i);
464 597158 : }
465 : }
466 :
467 98756 : if timeout < 0 {
468 67111 : // block until wakeup
469 67111 : yield_me(-1);
470 67111 : } else {
471 31645 : let current_time = now();
472 31645 : if current_time >= deadline {
473 2694 : return None;
474 28951 : }
475 28951 :
476 28951 : yield_me((deadline - current_time) as i64);
477 : }
478 : }
479 89053 : }
|