Line data Source code
1 : use std::panic::AssertUnwindSafe;
2 : use std::sync::atomic::{AtomicBool, AtomicU8, AtomicU32, Ordering};
3 : use std::sync::{Arc, OnceLock, mpsc};
4 : use std::thread::JoinHandle;
5 :
6 : use tracing::{debug, error, trace};
7 :
8 : use crate::time::Timing;
9 :
10 : /// Stores status of the running threads. Threads are registered in the runtime upon creation
11 : /// and deregistered upon termination.
12 : pub struct Runtime {
13 : // stores handles to all threads that are currently running
14 : threads: Vec<ThreadHandle>,
15 : // stores current time and pending wakeups
16 : clock: Arc<Timing>,
17 : // thread counter
18 : thread_counter: AtomicU32,
19 : // Thread step counter -- how many times all threads has been actually
20 : // stepped (note that all world/time/executor/thread have slightly different
21 : // meaning of steps). For observability.
22 : pub step_counter: u64,
23 : }
24 :
25 : impl Runtime {
26 : /// Init new runtime, no running threads.
27 528 : pub fn new(clock: Arc<Timing>) -> Self {
28 528 : Self {
29 528 : threads: Vec::new(),
30 528 : clock,
31 528 : thread_counter: AtomicU32::new(0),
32 528 : step_counter: 0,
33 528 : }
34 528 : }
35 :
36 : /// Spawn a new thread and register it in the runtime.
37 20298 : pub fn spawn<F>(&mut self, f: F) -> ExternalHandle
38 20298 : where
39 20298 : F: FnOnce() + Send + 'static,
40 : {
41 20298 : let (tx, rx) = mpsc::channel();
42 :
43 20298 : let clock = self.clock.clone();
44 20298 : let tid = self.thread_counter.fetch_add(1, Ordering::SeqCst);
45 20298 : debug!("spawning thread-{}", tid);
46 :
47 20298 : let join = std::thread::spawn(move || {
48 20298 : let _guard = tracing::info_span!("", tid).entered();
49 :
50 20298 : let res = std::panic::catch_unwind(AssertUnwindSafe(|| {
51 20298 : with_thread_context(|ctx| {
52 20298 : assert!(ctx.clock.set(clock).is_ok());
53 20298 : ctx.id.store(tid, Ordering::SeqCst);
54 20298 : tx.send(ctx.clone()).expect("failed to send thread context");
55 : // suspend thread to put it to `threads` in sleeping state
56 20298 : ctx.yield_me(0);
57 528 : });
58 :
59 : // start user-provided function
60 20298 : f();
61 528 : }));
62 20298 : debug!("thread finished");
63 :
64 20298 : if let Err(e) = res {
65 20278 : with_thread_context(|ctx| {
66 20220 : if !ctx.allow_panic.load(std::sync::atomic::Ordering::SeqCst) {
67 0 : error!("thread panicked, terminating the process: {:?}", e);
68 0 : std::process::exit(1);
69 504 : }
70 :
71 20220 : debug!("thread panicked: {:?}", e);
72 20220 : let mut result = ctx.result.lock();
73 20220 : if result.0 == -1 {
74 19804 : *result = (256, format!("thread panicked: {e:?}"));
75 19804 : }
76 504 : });
77 0 : }
78 :
79 20298 : with_thread_context(|ctx| {
80 20240 : ctx.finish_me();
81 504 : });
82 528 : });
83 :
84 20298 : let ctx = rx.recv().expect("failed to receive thread context");
85 20298 : let handle = ThreadHandle::new(ctx.clone(), join);
86 :
87 20298 : self.threads.push(handle);
88 :
89 20298 : ExternalHandle { ctx }
90 528 : }
91 :
92 : /// Returns true if there are any unfinished activity, such as running thread or pending events.
93 : /// Otherwise returns false, which means all threads are blocked forever.
94 418835 : pub fn step(&mut self) -> bool {
95 418835 : trace!("runtime step");
96 :
97 : // have we run any thread?
98 418835 : let mut ran = false;
99 :
100 2089669 : self.threads.retain(|thread: &ThreadHandle| {
101 2089669 : let res = thread.ctx.wakeup.compare_exchange(
102 : PENDING_WAKEUP,
103 : NO_WAKEUP,
104 2089669 : Ordering::SeqCst,
105 2089669 : Ordering::SeqCst,
106 : );
107 2089669 : if res.is_err() {
108 : // thread has no pending wakeups, leaving as is
109 1799975 : return true;
110 289694 : }
111 289694 : ran = true;
112 :
113 289694 : trace!("entering thread-{}", thread.ctx.tid());
114 289694 : let status = thread.step();
115 289694 : self.step_counter += 1;
116 289694 : trace!(
117 0 : "out of thread-{} with status {:?}",
118 0 : thread.ctx.tid(),
119 : status
120 : );
121 :
122 289694 : if status == Status::Sleep {
123 269454 : true
124 : } else {
125 20240 : trace!("thread has finished");
126 : // removing the thread from the list
127 20240 : false
128 : }
129 2089669 : });
130 :
131 418835 : if !ran {
132 221348 : trace!("no threads were run, stepping clock");
133 221348 : if let Some(ctx_to_wake) = self.clock.step() {
134 220800 : trace!("waking up thread-{}", ctx_to_wake.tid());
135 220800 : ctx_to_wake.inc_wake();
136 : } else {
137 548 : return false;
138 : }
139 197487 : }
140 :
141 418287 : true
142 418835 : }
143 :
144 : /// Kill all threads. This is done by setting a flag in each thread context and waking it up.
145 1008 : pub fn crash_all_threads(&mut self) {
146 2852 : for thread in self.threads.iter() {
147 2852 : thread.ctx.crash_stop();
148 2852 : }
149 :
150 : // all threads should be finished after a few steps
151 1512 : while !self.threads.is_empty() {
152 504 : self.step();
153 504 : }
154 1008 : }
155 : }
156 :
157 : impl Drop for Runtime {
158 503 : fn drop(&mut self) {
159 503 : debug!("dropping the runtime");
160 503 : self.crash_all_threads();
161 503 : }
162 : }
163 :
164 : #[derive(Clone)]
165 : pub struct ExternalHandle {
166 : ctx: Arc<ThreadContext>,
167 : }
168 :
169 : impl ExternalHandle {
170 : /// Returns true if thread has finished execution.
171 432726 : pub fn is_finished(&self) -> bool {
172 432726 : let status = self.ctx.mutex.lock();
173 432726 : *status == Status::Finished
174 432726 : }
175 :
176 : /// Returns exitcode and message, which is available after thread has finished execution.
177 407 : pub fn result(&self) -> (i32, String) {
178 407 : let result = self.ctx.result.lock();
179 407 : result.clone()
180 407 : }
181 :
182 : /// Returns thread id.
183 4 : pub fn id(&self) -> u32 {
184 4 : self.ctx.id.load(Ordering::SeqCst)
185 4 : }
186 :
187 : /// Sets a flag to crash thread on the next wakeup.
188 17293 : pub fn crash_stop(&self) {
189 17293 : self.ctx.crash_stop();
190 17293 : }
191 : }
192 :
193 : struct ThreadHandle {
194 : ctx: Arc<ThreadContext>,
195 : _join: JoinHandle<()>,
196 : }
197 :
198 : impl ThreadHandle {
199 : /// Create a new [`ThreadHandle`] and wait until thread will enter [`Status::Sleep`] state.
200 20298 : fn new(ctx: Arc<ThreadContext>, join: JoinHandle<()>) -> Self {
201 20298 : let mut status = ctx.mutex.lock();
202 : // wait until thread will go into the first yield
203 20333 : while *status != Status::Sleep {
204 35 : ctx.condvar.wait(&mut status);
205 35 : }
206 20298 : drop(status);
207 :
208 20298 : Self { ctx, _join: join }
209 20298 : }
210 :
211 : /// Allows thread to execute one step of its execution.
212 : /// Returns [`Status`] of the thread after the step.
213 289694 : fn step(&self) -> Status {
214 289694 : let mut status = self.ctx.mutex.lock();
215 289694 : assert!(matches!(*status, Status::Sleep));
216 :
217 289694 : *status = Status::Running;
218 289694 : self.ctx.condvar.notify_all();
219 :
220 579388 : while *status == Status::Running {
221 289694 : self.ctx.condvar.wait(&mut status);
222 289694 : }
223 :
224 289694 : *status
225 289694 : }
226 : }
227 :
/// Execution state of a thread, guarded by the mutex in its context.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
enum Status {
    /// The thread is currently executing.
    Running,
    /// The thread waits for an event; the executor resumes it on a step once its
    /// wakeup flag is set.
    Sleep,
    /// The thread has finished execution.
    Finished,
}
237 :
/// Value of the wakeup flag when no wakeup is pending for the thread.
const NO_WAKEUP: u8 = 0;
/// Value of the wakeup flag when the thread should be resumed by the executor.
const PENDING_WAKEUP: u8 = 1;
240 :
241 : pub struct ThreadContext {
242 : id: AtomicU32,
243 : // used to block thread until it is woken up
244 : mutex: parking_lot::Mutex<Status>,
245 : condvar: parking_lot::Condvar,
246 : // used as a flag to indicate runtime that thread is ready to be woken up
247 : wakeup: AtomicU8,
248 : clock: OnceLock<Arc<Timing>>,
249 : // execution result, set by exit() call
250 : result: parking_lot::Mutex<(i32, String)>,
251 : // determines if process should be killed on receiving panic
252 : allow_panic: AtomicBool,
253 : // acts as a signal that thread should crash itself on the next wakeup
254 : crash_request: AtomicBool,
255 : }
256 :
257 : impl ThreadContext {
258 20826 : pub(crate) fn new() -> Self {
259 20826 : Self {
260 20826 : id: AtomicU32::new(0),
261 20826 : mutex: parking_lot::Mutex::new(Status::Running),
262 20826 : condvar: parking_lot::Condvar::new(),
263 20826 : wakeup: AtomicU8::new(NO_WAKEUP),
264 20826 : clock: OnceLock::new(),
265 20826 : result: parking_lot::Mutex::new((-1, String::new())),
266 20826 : allow_panic: AtomicBool::new(false),
267 20826 : crash_request: AtomicBool::new(false),
268 20826 : }
269 20826 : }
270 : }
271 :
272 : // Functions for executor to control thread execution.
273 : impl ThreadContext {
274 : /// Set atomic flag to indicate that thread is ready to be woken up.
275 691284 : fn inc_wake(&self) {
276 691284 : self.wakeup.store(PENDING_WAKEUP, Ordering::SeqCst);
277 691284 : }
278 :
279 : /// Internal function used for event queues.
280 182273 : pub(crate) fn schedule_wakeup(self: &Arc<Self>, after_ms: u64) {
281 182273 : self.clock
282 182273 : .get()
283 182273 : .unwrap()
284 182273 : .schedule_wakeup(after_ms, self.clone());
285 182273 : }
286 :
287 1 : fn tid(&self) -> u32 {
288 1 : self.id.load(Ordering::SeqCst)
289 1 : }
290 :
291 20145 : fn crash_stop(&self) {
292 20145 : let status = self.mutex.lock();
293 20145 : if *status == Status::Finished {
294 9 : debug!(
295 0 : "trying to crash thread-{}, which is already finished",
296 0 : self.tid()
297 : );
298 9 : return;
299 20136 : }
300 20136 : assert!(matches!(*status, Status::Sleep));
301 20136 : drop(status);
302 :
303 20136 : self.allow_panic.store(true, Ordering::SeqCst);
304 20136 : self.crash_request.store(true, Ordering::SeqCst);
305 : // set a wakeup
306 20136 : self.inc_wake();
307 : // it will panic on the next wakeup
308 20145 : }
309 : }
310 :
311 : // Internal functions.
312 : impl ThreadContext {
313 : /// Blocks thread until it's woken up by the executor. If `after_ms` is 0, is will be
314 : /// woken on the next step. If `after_ms` > 0, wakeup is scheduled after that time.
315 : /// Otherwise wakeup is not scheduled inside `yield_me`, and should be arranged before
316 : /// calling this function.
317 289752 : fn yield_me(self: &Arc<Self>, after_ms: i64) {
318 289752 : let mut status = self.mutex.lock();
319 289752 : assert!(matches!(*status, Status::Running));
320 :
321 289752 : match after_ms.cmp(&0) {
322 239521 : std::cmp::Ordering::Less => {
323 239521 : // block until something wakes us up
324 239521 : }
325 21914 : std::cmp::Ordering::Equal => {
326 21914 : // tell executor that we are ready to be woken up
327 21914 : self.inc_wake();
328 21914 : }
329 28317 : std::cmp::Ordering::Greater => {
330 28317 : // schedule wakeup
331 28317 : self.clock
332 28317 : .get()
333 28317 : .unwrap()
334 28317 : .schedule_wakeup(after_ms as u64, self.clone());
335 28317 : }
336 : }
337 :
338 289752 : *status = Status::Sleep;
339 289752 : self.condvar.notify_all();
340 :
341 : // wait until executor wakes us up
342 579446 : while *status != Status::Running {
343 289694 : self.condvar.wait(&mut status);
344 289694 : }
345 :
346 289752 : if self.crash_request.load(Ordering::SeqCst) {
347 19804 : panic!("crashed by request");
348 269948 : }
349 269948 : }
350 :
351 : /// Called only once, exactly before thread finishes execution.
352 20240 : fn finish_me(&self) {
353 20240 : let mut status = self.mutex.lock();
354 20240 : assert!(matches!(*status, Status::Running));
355 :
356 20240 : *status = Status::Finished;
357 : {
358 20240 : let mut result = self.result.lock();
359 20240 : if result.0 == -1 {
360 20 : *result = (0, "finished normally".to_owned());
361 20220 : }
362 : }
363 20240 : self.condvar.notify_all();
364 20240 : }
365 : }
366 :
367 : /// Invokes the given closure with a reference to the current thread [`ThreadContext`].
368 : #[inline(always)]
369 1924489 : fn with_thread_context<T>(f: impl FnOnce(&Arc<ThreadContext>) -> T) -> T {
370 : thread_local!(static THREAD_DATA: Arc<ThreadContext> = Arc::new(ThreadContext::new()));
371 1924489 : THREAD_DATA.with(f)
372 1865267 : }
373 :
374 : /// Waker is used to wake up threads that are blocked on condition.
375 : /// It keeps track of contexts [`Arc<ThreadContext>`] and can increment the counter
376 : /// of several contexts to send a notification.
377 : pub struct Waker {
378 : // contexts that are waiting for a notification
379 : contexts: parking_lot::Mutex<smallvec::SmallVec<[Arc<ThreadContext>; 8]>>,
380 : }
381 :
382 : impl Default for Waker {
383 0 : fn default() -> Self {
384 0 : Self::new()
385 0 : }
386 : }
387 :
388 : impl Waker {
389 84055 : pub fn new() -> Self {
390 84055 : Self {
391 84055 : contexts: parking_lot::Mutex::new(smallvec::SmallVec::new()),
392 84055 : }
393 84055 : }
394 :
395 : /// Subscribe current thread to receive a wake notification later.
396 870879 : pub fn wake_me_later(&self) {
397 870879 : with_thread_context(|ctx| {
398 870879 : self.contexts.lock().push(ctx.clone());
399 870879 : });
400 870879 : }
401 :
402 : /// Wake up all threads that are waiting for a notification and clear the list.
403 127404 : pub fn wake_all(&self) {
404 127404 : let mut v = self.contexts.lock();
405 428434 : for ctx in v.iter() {
406 428434 : ctx.inc_wake();
407 428434 : }
408 127404 : v.clear();
409 127404 : }
410 : }
411 :
412 : /// See [`ThreadContext::yield_me`].
413 269454 : pub fn yield_me(after_ms: i64) {
414 269454 : with_thread_context(|ctx| ctx.yield_me(after_ms))
415 269454 : }
416 :
417 : /// Get current time.
418 722454 : pub fn now() -> u64 {
419 722454 : with_thread_context(|ctx| ctx.clock.get().unwrap().now())
420 722454 : }
421 :
422 416 : pub fn exit(code: i32, msg: String) -> ! {
423 416 : with_thread_context(|ctx| {
424 416 : ctx.allow_panic.store(true, Ordering::SeqCst);
425 416 : let mut result = ctx.result.lock();
426 416 : *result = (code, msg);
427 416 : panic!("exit");
428 : })
429 : }
430 :
431 528 : pub(crate) fn get_thread_ctx() -> Arc<ThreadContext> {
432 528 : with_thread_context(|ctx| ctx.clone())
433 528 : }
434 :
/// Trait for channels that can be polled until they have something to deliver.
pub trait PollSome {
    /// Schedules a wakeup of the caller for when a message arrives.
    fn wake_me(&self);

    /// Returns true if the channel has a ready message.
    fn has_some(&self) -> bool;
}
443 :
444 : /// Blocks current thread until one of the channels has a ready message. Returns
445 : /// index of the channel that has a message. If timeout is reached, returns None.
446 : ///
447 : /// Negative timeout means block forever. Zero timeout means check channels and return
448 : /// immediately. Positive timeout means block until timeout is reached.
449 108326 : pub fn epoll_chans(chans: &[Box<dyn PollSome>], timeout: i64) -> Option<usize> {
450 108326 : let deadline = if timeout < 0 {
451 79197 : 0
452 : } else {
453 29129 : now() + timeout as u64
454 : };
455 :
456 : loop {
457 1053764 : for chan in chans {
458 867899 : chan.wake_me()
459 : }
460 :
461 696876 : for (i, chan) in chans.iter().enumerate() {
462 696876 : if chan.has_some() {
463 86614 : return Some(i);
464 610262 : }
465 : }
466 :
467 99251 : if timeout < 0 {
468 68139 : // block until wakeup
469 68139 : yield_me(-1);
470 68139 : } else {
471 31112 : let current_time = now();
472 31112 : if current_time >= deadline {
473 21712 : return None;
474 9400 : }
475 :
476 9400 : yield_me((deadline - current_time) as i64);
477 : }
478 : }
479 108326 : }
|