Line data Source code
//! A C-Rust shim: implements the C walproposer API, assuming that
//! `wp->config->callback_data` points to a `Box` holding some Rust implementation.
3 :
4 : #![allow(dead_code)]
5 :
6 : use std::ffi::{CStr, CString};
7 :
8 : use crate::bindings::{
9 : NeonWALReadResult, PGAsyncReadResult, PGAsyncWriteResult, Safekeeper, Size, StringInfoData,
10 : TimestampTz, WalProposer, WalProposerConnStatusType, WalProposerConnectPollStatusType,
11 : WalProposerExecStatusType, WalproposerShmemState, XLogRecPtr, uint32, walproposer_api,
12 : };
13 : use crate::walproposer::{ApiImpl, StreamingCallback, WaitResult};
14 :
15 1606 : extern "C" fn get_shmem_state(wp: *mut WalProposer) -> *mut WalproposerShmemState {
16 : unsafe {
17 1606 : let callback_data = (*(*wp).config).callback_data;
18 1606 : let api = callback_data as *mut Box<dyn ApiImpl>;
19 1606 : (*api).get_shmem_state()
20 : }
21 1606 : }
22 :
23 244 : extern "C-unwind" fn start_streaming(wp: *mut WalProposer, startpos: XLogRecPtr) {
24 244 : unsafe {
25 244 : let callback_data = (*(*wp).config).callback_data;
26 244 : let api = callback_data as *mut Box<dyn ApiImpl>;
27 244 : let callback = StreamingCallback::new(wp);
28 244 : (*api).start_streaming(startpos, &callback);
29 244 : }
30 244 : }
31 :
32 136 : extern "C" fn get_flush_rec_ptr(wp: *mut WalProposer) -> XLogRecPtr {
33 : unsafe {
34 136 : let callback_data = (*(*wp).config).callback_data;
35 136 : let api = callback_data as *mut Box<dyn ApiImpl>;
36 136 : (*api).get_flush_rec_ptr()
37 : }
38 136 : }
39 :
40 1393 : extern "C" fn update_donor(wp: *mut WalProposer, donor: *mut Safekeeper, donor_lsn: XLogRecPtr) {
41 : unsafe {
42 1393 : let callback_data = (*(*wp).config).callback_data;
43 1393 : let api = callback_data as *mut Box<dyn ApiImpl>;
44 1393 : (*api).update_donor(&mut (*donor), donor_lsn)
45 : }
46 1393 : }
47 :
48 341674 : extern "C" fn get_current_timestamp(wp: *mut WalProposer) -> TimestampTz {
49 : unsafe {
50 341674 : let callback_data = (*(*wp).config).callback_data;
51 341674 : let api = callback_data as *mut Box<dyn ApiImpl>;
52 341674 : (*api).get_current_timestamp()
53 : }
54 341674 : }
55 :
56 11554 : extern "C" fn conn_error_message(sk: *mut Safekeeper) -> *mut ::std::os::raw::c_char {
57 : unsafe {
58 11554 : let callback_data = (*(*(*sk).wp).config).callback_data;
59 11554 : let api = callback_data as *mut Box<dyn ApiImpl>;
60 11554 : let msg = (*api).conn_error_message(&mut (*sk));
61 11554 : let msg = CString::new(msg).unwrap();
62 : // TODO: fix leaking error message
63 11554 : msg.into_raw()
64 : }
65 11554 : }
66 :
67 35169 : extern "C" fn conn_status(sk: *mut Safekeeper) -> WalProposerConnStatusType {
68 : unsafe {
69 35169 : let callback_data = (*(*(*sk).wp).config).callback_data;
70 35169 : let api = callback_data as *mut Box<dyn ApiImpl>;
71 35169 : (*api).conn_status(&mut (*sk))
72 : }
73 35169 : }
74 :
75 35169 : extern "C" fn conn_connect_start(sk: *mut Safekeeper) {
76 : unsafe {
77 35169 : let callback_data = (*(*(*sk).wp).config).callback_data;
78 35169 : let api = callback_data as *mut Box<dyn ApiImpl>;
79 35169 : (*api).conn_connect_start(&mut (*sk))
80 : }
81 35169 : }
82 :
83 31614 : extern "C" fn conn_connect_poll(sk: *mut Safekeeper) -> WalProposerConnectPollStatusType {
84 : unsafe {
85 31614 : let callback_data = (*(*(*sk).wp).config).callback_data;
86 31614 : let api = callback_data as *mut Box<dyn ApiImpl>;
87 31614 : (*api).conn_connect_poll(&mut (*sk))
88 : }
89 31614 : }
90 :
91 31614 : extern "C" fn conn_send_query(sk: *mut Safekeeper, query: *mut ::std::os::raw::c_char) -> bool {
92 31614 : let query = unsafe { CStr::from_ptr(query) };
93 31614 : let query = query.to_str().unwrap();
94 :
95 : unsafe {
96 31614 : let callback_data = (*(*(*sk).wp).config).callback_data;
97 31614 : let api = callback_data as *mut Box<dyn ApiImpl>;
98 31614 : (*api).conn_send_query(&mut (*sk), query)
99 : }
100 31614 : }
101 :
102 31614 : extern "C" fn conn_get_query_result(sk: *mut Safekeeper) -> WalProposerExecStatusType {
103 : unsafe {
104 31614 : let callback_data = (*(*(*sk).wp).config).callback_data;
105 31614 : let api = callback_data as *mut Box<dyn ApiImpl>;
106 31614 : (*api).conn_get_query_result(&mut (*sk))
107 : }
108 31614 : }
109 :
110 0 : extern "C" fn conn_flush(sk: *mut Safekeeper) -> ::std::os::raw::c_int {
111 : unsafe {
112 0 : let callback_data = (*(*(*sk).wp).config).callback_data;
113 0 : let api = callback_data as *mut Box<dyn ApiImpl>;
114 0 : (*api).conn_flush(&mut (*sk))
115 : }
116 0 : }
117 :
118 11788 : extern "C" fn conn_finish(sk: *mut Safekeeper) {
119 : unsafe {
120 11788 : let callback_data = (*(*(*sk).wp).config).callback_data;
121 11788 : let api = callback_data as *mut Box<dyn ApiImpl>;
122 11788 : (*api).conn_finish(&mut (*sk))
123 : }
124 11788 : }
125 :
126 22505 : extern "C" fn conn_async_read(
127 22505 : sk: *mut Safekeeper,
128 22505 : buf: *mut *mut ::std::os::raw::c_char,
129 22505 : amount: *mut ::std::os::raw::c_int,
130 22505 : ) -> PGAsyncReadResult {
131 : unsafe {
132 22505 : let callback_data = (*(*(*sk).wp).config).callback_data;
133 22505 : let api = callback_data as *mut Box<dyn ApiImpl>;
134 :
135 : // This function has guarantee that returned buf will be valid until
136 : // the next call. So we can store a Vec in each Safekeeper and reuse
137 : // it on the next call.
138 22505 : let mut inbuf = take_vec_u8(&mut (*sk).inbuf).unwrap_or_default();
139 22505 : inbuf.clear();
140 :
141 22505 : let result = (*api).conn_async_read(&mut (*sk), &mut inbuf);
142 :
143 : // Put a Vec back to sk->inbuf and return data ptr.
144 22505 : *amount = inbuf.len() as i32;
145 22505 : *buf = store_vec_u8(&mut (*sk).inbuf, inbuf);
146 :
147 22505 : result
148 : }
149 22505 : }
150 :
151 7263 : extern "C" fn conn_async_write(
152 7263 : sk: *mut Safekeeper,
153 7263 : buf: *const ::std::os::raw::c_void,
154 7263 : size: usize,
155 7263 : ) -> PGAsyncWriteResult {
156 : unsafe {
157 7263 : let buf = std::slice::from_raw_parts(buf as *const u8, size);
158 7263 : let callback_data = (*(*(*sk).wp).config).callback_data;
159 7263 : let api = callback_data as *mut Box<dyn ApiImpl>;
160 7263 : (*api).conn_async_write(&mut (*sk), buf)
161 : }
162 7263 : }
163 :
164 36290 : extern "C" fn conn_blocking_write(
165 36290 : sk: *mut Safekeeper,
166 36290 : buf: *const ::std::os::raw::c_void,
167 36290 : size: usize,
168 36290 : ) -> bool {
169 : unsafe {
170 36290 : let buf = std::slice::from_raw_parts(buf as *const u8, size);
171 36290 : let callback_data = (*(*(*sk).wp).config).callback_data;
172 36290 : let api = callback_data as *mut Box<dyn ApiImpl>;
173 36290 : (*api).conn_blocking_write(&mut (*sk), buf)
174 : }
175 36290 : }
176 :
177 799 : extern "C-unwind" fn recovery_download(wp: *mut WalProposer, sk: *mut Safekeeper) -> bool {
178 : unsafe {
179 799 : let callback_data = (*(*(*sk).wp).config).callback_data;
180 799 : let api = callback_data as *mut Box<dyn ApiImpl>;
181 :
182 : // currently `recovery_download` is always called right after election
183 799 : (*api).after_election(&mut (*wp));
184 :
185 799 : (*api).recovery_download(&mut (*wp), &mut (*sk))
186 : }
187 799 : }
188 :
189 1416 : extern "C" fn wal_reader_allocate(sk: *mut Safekeeper) {
190 1416 : unsafe {
191 1416 : let callback_data = (*(*(*sk).wp).config).callback_data;
192 1416 : let api = callback_data as *mut Box<dyn ApiImpl>;
193 1416 : (*api).wal_reader_allocate(&mut (*sk));
194 1416 : }
195 1416 : }
196 :
197 : #[allow(clippy::unnecessary_cast)]
198 1333 : extern "C" fn wal_read(
199 1333 : sk: *mut Safekeeper,
200 1333 : buf: *mut ::std::os::raw::c_char,
201 1333 : startptr: XLogRecPtr,
202 1333 : count: Size,
203 1333 : _errmsg: *mut *mut ::std::os::raw::c_char,
204 1333 : ) -> NeonWALReadResult {
205 : unsafe {
206 1333 : let buf = std::slice::from_raw_parts_mut(buf as *mut u8, count);
207 1333 : let callback_data = (*(*(*sk).wp).config).callback_data;
208 1333 : let api = callback_data as *mut Box<dyn ApiImpl>;
209 : // TODO: errmsg is not forwarded
210 1333 : (*api).wal_read(&mut (*sk), buf, startptr)
211 : }
212 1333 : }
213 :
214 26979 : extern "C" fn wal_reader_events(sk: *mut Safekeeper) -> uint32 {
215 : unsafe {
216 26979 : let callback_data = (*(*(*sk).wp).config).callback_data;
217 26979 : let api = callback_data as *mut Box<dyn ApiImpl>;
218 26979 : (*api).wal_reader_events(&mut (*sk))
219 : }
220 26979 : }
221 :
222 9554 : extern "C" fn init_event_set(wp: *mut WalProposer) {
223 9554 : unsafe {
224 9554 : let callback_data = (*(*wp).config).callback_data;
225 9554 : let api = callback_data as *mut Box<dyn ApiImpl>;
226 9554 : (*api).init_event_set(&mut (*wp));
227 9554 : }
228 9554 : }
229 :
230 70211 : extern "C" fn update_event_set(sk: *mut Safekeeper, events: uint32) {
231 70211 : unsafe {
232 70211 : let callback_data = (*(*(*sk).wp).config).callback_data;
233 70211 : let api = callback_data as *mut Box<dyn ApiImpl>;
234 70211 : (*api).update_event_set(&mut (*sk), events);
235 70211 : }
236 70211 : }
237 :
238 8935 : extern "C" fn active_state_update_event_set(sk: *mut Safekeeper) {
239 8935 : unsafe {
240 8935 : let callback_data = (*(*(*sk).wp).config).callback_data;
241 8935 : let api = callback_data as *mut Box<dyn ApiImpl>;
242 8935 : (*api).active_state_update_event_set(&mut (*sk));
243 8935 : }
244 8935 : }
245 :
246 63228 : extern "C" fn add_safekeeper_event_set(sk: *mut Safekeeper, events: uint32) {
247 63228 : unsafe {
248 63228 : let callback_data = (*(*(*sk).wp).config).callback_data;
249 63228 : let api = callback_data as *mut Box<dyn ApiImpl>;
250 63228 : (*api).add_safekeeper_event_set(&mut (*sk), events);
251 63228 : }
252 63228 : }
253 :
254 39847 : extern "C" fn rm_safekeeper_event_set(sk: *mut Safekeeper) {
255 39847 : unsafe {
256 39847 : let callback_data = (*(*(*sk).wp).config).callback_data;
257 39847 : let api = callback_data as *mut Box<dyn ApiImpl>;
258 39847 : (*api).rm_safekeeper_event_set(&mut (*sk));
259 39847 : }
260 39847 : }
261 :
262 95053 : extern "C-unwind" fn wait_event_set(
263 95053 : wp: *mut WalProposer,
264 95053 : timeout: ::std::os::raw::c_long,
265 95053 : event_sk: *mut *mut Safekeeper,
266 95053 : events: *mut uint32,
267 95053 : ) -> ::std::os::raw::c_int {
268 : unsafe {
269 95053 : let callback_data = (*(*wp).config).callback_data;
270 95053 : let api = callback_data as *mut Box<dyn ApiImpl>;
271 95053 : let result = (*api).wait_event_set(&mut (*wp), timeout);
272 95053 : match result {
273 : WaitResult::Latch => {
274 9550 : *event_sk = std::ptr::null_mut();
275 9550 : *events = crate::bindings::WL_LATCH_SET;
276 9550 : 1
277 : }
278 : WaitResult::Timeout => {
279 2815 : *event_sk = std::ptr::null_mut();
280 : // WaitEventSetWait returns 0 for timeout.
281 2815 : *events = 0;
282 2815 : 0
283 : }
284 82688 : WaitResult::Network(sk, event_mask) => {
285 82688 : *event_sk = sk;
286 82688 : *events = event_mask;
287 82688 : 1
288 : }
289 : }
290 : }
291 95053 : }
292 :
293 0 : extern "C" fn strong_random(
294 0 : wp: *mut WalProposer,
295 0 : buf: *mut ::std::os::raw::c_void,
296 0 : len: usize,
297 0 : ) -> bool {
298 : unsafe {
299 0 : let buf = std::slice::from_raw_parts_mut(buf as *mut u8, len);
300 0 : let callback_data = (*(*wp).config).callback_data;
301 0 : let api = callback_data as *mut Box<dyn ApiImpl>;
302 0 : (*api).strong_random(buf)
303 : }
304 0 : }
305 :
306 335 : extern "C" fn get_redo_start_lsn(wp: *mut WalProposer) -> XLogRecPtr {
307 : unsafe {
308 335 : let callback_data = (*(*wp).config).callback_data;
309 335 : let api = callback_data as *mut Box<dyn ApiImpl>;
310 335 : (*api).get_redo_start_lsn()
311 : }
312 335 : }
313 :
314 469 : unsafe extern "C-unwind" fn finish_sync_safekeepers(wp: *mut WalProposer, lsn: XLogRecPtr) -> ! {
315 : unsafe {
316 469 : let callback_data = (*(*wp).config).callback_data;
317 469 : let api = callback_data as *mut Box<dyn ApiImpl>;
318 469 : (*api).finish_sync_safekeepers(lsn)
319 : }
320 : }
321 :
322 3362 : extern "C" fn process_safekeeper_feedback(wp: *mut WalProposer, sk: *mut Safekeeper) {
323 3362 : unsafe {
324 3362 : let callback_data = (*(*wp).config).callback_data;
325 3362 : let api = callback_data as *mut Box<dyn ApiImpl>;
326 3362 : (*api).process_safekeeper_feedback(&mut (*wp), &mut (*sk));
327 3362 : }
328 3362 : }
329 :
330 164576 : extern "C-unwind" fn log_internal(
331 164576 : wp: *mut WalProposer,
332 164576 : level: ::std::os::raw::c_int,
333 164576 : line: *const ::std::os::raw::c_char,
334 164576 : ) {
335 : unsafe {
336 164576 : let callback_data = (*(*wp).config).callback_data;
337 164576 : let api = callback_data as *mut Box<dyn ApiImpl>;
338 164576 : let line = CStr::from_ptr(line);
339 164576 : let line = line.to_str().unwrap();
340 164576 : (*api).log_internal(&mut (*wp), Level::from(level as u32), line)
341 : }
342 164576 : }
343 :
/// Rust-side log level, one variant per level constant accepted by [`Level::from`]
/// (`DEBUG5` … `PANIC`, plus `WPEVENT`).
///
/// The type is a plain fieldless enum, so it is cheap to copy and compare.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum Level {
    Debug5,
    Debug4,
    Debug3,
    Debug2,
    Debug1,
    Log,
    Info,
    Notice,
    Warning,
    Error,
    Fatal,
    Panic,
    WPEvent,
}
360 :
361 : impl Level {
362 164576 : pub fn from(elevel: u32) -> Level {
363 : use crate::bindings::*;
364 :
365 164576 : match elevel {
366 5847 : DEBUG5 => Level::Debug5,
367 0 : DEBUG4 => Level::Debug4,
368 0 : DEBUG3 => Level::Debug3,
369 3362 : DEBUG2 => Level::Debug2,
370 0 : DEBUG1 => Level::Debug1,
371 141738 : LOG => Level::Log,
372 0 : INFO => Level::Info,
373 0 : NOTICE => Level::Notice,
374 13565 : WARNING => Level::Warning,
375 0 : ERROR => Level::Error,
376 60 : FATAL => Level::Fatal,
377 4 : PANIC => Level::Panic,
378 0 : WPEVENT => Level::WPEvent,
379 0 : _ => panic!("unknown log level {elevel}"),
380 : }
381 164576 : }
382 : }
383 :
384 9554 : pub(crate) fn create_api() -> walproposer_api {
385 9554 : walproposer_api {
386 9554 : get_shmem_state: Some(get_shmem_state),
387 9554 : start_streaming: Some(start_streaming),
388 9554 : get_flush_rec_ptr: Some(get_flush_rec_ptr),
389 9554 : update_donor: Some(update_donor),
390 9554 : get_current_timestamp: Some(get_current_timestamp),
391 9554 : conn_error_message: Some(conn_error_message),
392 9554 : conn_status: Some(conn_status),
393 9554 : conn_connect_start: Some(conn_connect_start),
394 9554 : conn_connect_poll: Some(conn_connect_poll),
395 9554 : conn_send_query: Some(conn_send_query),
396 9554 : conn_get_query_result: Some(conn_get_query_result),
397 9554 : conn_flush: Some(conn_flush),
398 9554 : conn_finish: Some(conn_finish),
399 9554 : conn_async_read: Some(conn_async_read),
400 9554 : conn_async_write: Some(conn_async_write),
401 9554 : conn_blocking_write: Some(conn_blocking_write),
402 9554 : recovery_download: Some(recovery_download),
403 9554 : wal_reader_allocate: Some(wal_reader_allocate),
404 9554 : wal_read: Some(wal_read),
405 9554 : wal_reader_events: Some(wal_reader_events),
406 9554 : init_event_set: Some(init_event_set),
407 9554 : update_event_set: Some(update_event_set),
408 9554 : active_state_update_event_set: Some(active_state_update_event_set),
409 9554 : add_safekeeper_event_set: Some(add_safekeeper_event_set),
410 9554 : rm_safekeeper_event_set: Some(rm_safekeeper_event_set),
411 9554 : wait_event_set: Some(wait_event_set),
412 9554 : strong_random: Some(strong_random),
413 9554 : get_redo_start_lsn: Some(get_redo_start_lsn),
414 9554 : finish_sync_safekeepers: Some(finish_sync_safekeepers),
415 9554 : process_safekeeper_feedback: Some(process_safekeeper_feedback),
416 9554 : log_internal: Some(log_internal),
417 9554 : }
418 9554 : }
419 :
420 9554 : pub fn empty_shmem() -> crate::bindings::WalproposerShmemState {
421 9554 : let empty_feedback = crate::bindings::PageserverFeedback {
422 9554 : present: false,
423 9554 : currentClusterSize: 0,
424 9554 : last_received_lsn: 0,
425 9554 : disk_consistent_lsn: 0,
426 9554 : remote_consistent_lsn: 0,
427 9554 : replytime: 0,
428 9554 : shard_number: 0,
429 9554 : corruption_detected: false,
430 9554 : };
431 :
432 9554 : let empty_wal_rate_limiter = crate::bindings::WalRateLimiter {
433 9554 : effective_max_wal_bytes_per_second: crate::bindings::pg_atomic_uint32 { value: 0 },
434 9554 : should_limit: crate::bindings::pg_atomic_uint32 { value: 0 },
435 9554 : sent_bytes: 0,
436 9554 : batch_start_time_us: crate::bindings::pg_atomic_uint64 { value: 0 },
437 9554 : batch_end_time_us: crate::bindings::pg_atomic_uint64 { value: 0 },
438 9554 : };
439 :
440 9554 : crate::bindings::WalproposerShmemState {
441 9554 : propEpochStartLsn: crate::bindings::pg_atomic_uint64 { value: 0 },
442 9554 : donor_name: [0; 64],
443 9554 : donor_conninfo: [0; 1024],
444 9554 : donor_lsn: 0,
445 9554 : mutex: 0,
446 9554 : mineLastElectedTerm: crate::bindings::pg_atomic_uint64 { value: 0 },
447 9554 : backpressureThrottlingTime: crate::bindings::pg_atomic_uint64 { value: 0 },
448 9554 : currentClusterSize: crate::bindings::pg_atomic_uint64 { value: 0 },
449 9554 : shard_ps_feedback: [empty_feedback; 128],
450 9554 : num_shards: 0,
451 9554 : replica_promote: false,
452 9554 : min_ps_feedback: empty_feedback,
453 9554 : wal_rate_limiter: empty_wal_rate_limiter,
454 9554 : }
455 9554 : }
456 :
457 : impl std::fmt::Display for Level {
458 693 : fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
459 693 : write!(f, "{self:?}")
460 693 : }
461 : }
462 :
463 : /// Take ownership of `Vec<u8>` from StringInfoData.
464 : #[allow(clippy::unnecessary_cast)]
465 51159 : pub(crate) fn take_vec_u8(pg: &mut StringInfoData) -> Option<Vec<u8>> {
466 51159 : if pg.data.is_null() {
467 28660 : return None;
468 22499 : }
469 :
470 22499 : let ptr = pg.data as *mut u8;
471 22499 : let length = pg.len as usize;
472 22499 : let capacity = pg.maxlen as usize;
473 :
474 22499 : pg.data = std::ptr::null_mut();
475 22499 : pg.len = 0;
476 22499 : pg.maxlen = 0;
477 :
478 22499 : unsafe { Some(Vec::from_raw_parts(ptr, length, capacity)) }
479 51159 : }
480 :
481 : /// Store `Vec<u8>` in StringInfoData.
482 22505 : fn store_vec_u8(pg: &mut StringInfoData, vec: Vec<u8>) -> *mut ::std::os::raw::c_char {
483 22505 : let ptr = vec.as_ptr() as *mut ::std::os::raw::c_char;
484 22505 : let length = vec.len();
485 22505 : let capacity = vec.capacity();
486 :
487 22505 : assert!(pg.data.is_null());
488 :
489 22505 : pg.data = ptr;
490 22505 : pg.len = length as i32;
491 22505 : pg.maxlen = capacity as i32;
492 :
493 22505 : std::mem::forget(vec);
494 :
495 22505 : ptr
496 22505 : }
|