artichoke_backend/extn/core/string/
ffi.rs

1use core::char;
2use core::convert::TryFrom;
3use core::hash::BuildHasher;
4use core::num::Wrapping;
5use core::ptr;
6use core::slice;
7use core::str;
8use std::collections::TryReserveError;
9use std::ffi::{CStr, c_char, c_double, c_int, c_void};
10use std::io::Write as _;
11use std::ptr::NonNull;
12
13use artichoke_core::convert::Convert;
14use artichoke_core::hash::Hash as _;
15use bstr::ByteSlice;
16use spinoso_exception::ArgumentError;
17use spinoso_exception::NoMemoryError;
18use spinoso_string::{RawParts, String};
19
20use super::trampoline;
21use crate::convert::BoxUnboxVmValue;
22use crate::error;
23use crate::sys;
24use crate::value::Value;
25
26// ```c
27// MRB_API mrb_value mrb_str_new_capa(mrb_state *mrb, size_t capa)
28// ```
29#[unsafe(no_mangle)]
30unsafe extern "C-unwind" fn mrb_str_new_capa(mrb: *mut sys::mrb_state, capa: sys::mrb_int) -> sys::mrb_value {
31    let capa = if let Ok(capa) = usize::try_from(capa) {
32        capa
33    } else {
34        return sys::mrb_sys_nil_value();
35    };
36    unwrap_interpreter!(mrb, to => guard);
37    let result = String::with_capacity(capa);
38    let result = String::alloc_value(result, &mut guard);
39    match result {
40        Ok(value) => value.inner(),
41        Err(exception) => {
42            // SAFETY: only Copy objects remain on the stack
43            unsafe { error::raise(guard, exception) }
44        }
45    }
46}
47
48// ```c
49// MRB_API mrb_value mrb_str_new(mrb_state *mrb, const char *p, size_t len)
50// ```
51#[unsafe(no_mangle)]
52unsafe extern "C-unwind" fn mrb_str_new(
53    mrb: *mut sys::mrb_state,
54    p: *const c_char,
55    len: sys::mrb_int,
56) -> sys::mrb_value {
57    let len = if let Ok(len) = usize::try_from(len) {
58        len
59    } else {
60        return sys::mrb_sys_nil_value();
61    };
62    unwrap_interpreter!(mrb, to => guard);
63    let s = if p.is_null() {
64        String::utf8(vec![0; len])
65    } else {
66        let bytes = slice::from_raw_parts(p.cast::<u8>(), len);
67        let bytes = bytes.to_vec();
68        String::utf8(bytes)
69    };
70    let result = String::alloc_value(s, &mut guard);
71    match result {
72        Ok(value) => value.inner(),
73        Err(exception) => {
74            // SAFETY: only Copy objects remain on the stack
75            unsafe { error::raise(guard, exception) }
76        }
77    }
78}
79
80// ```c
81// MRB_API mrb_value mrb_str_new_cstr(mrb_state *mrb, const char *p)
82// ```
83#[unsafe(no_mangle)]
84unsafe extern "C-unwind" fn mrb_str_new_cstr(mrb: *mut sys::mrb_state, p: *const c_char) -> sys::mrb_value {
85    unwrap_interpreter!(mrb, to => guard);
86    let cstr = CStr::from_ptr(p);
87    let bytes = cstr.to_bytes().to_vec();
88    let result = String::utf8(bytes);
89    let result = String::alloc_value(result, &mut guard);
90    match result {
91        Ok(value) => value.inner(),
92        Err(exception) => {
93            // SAFETY: only Copy objects remain on the stack
94            unsafe { error::raise(guard, exception) }
95        }
96    }
97}
98
99// ```c
100// MRB_API mrb_value mrb_str_new_static(mrb_state *mrb, const char *p, size_t len)
101// ```
102#[unsafe(no_mangle)]
103unsafe extern "C-unwind" fn mrb_str_new_static(
104    mrb: *mut sys::mrb_state,
105    p: *const c_char,
106    len: sys::mrb_int,
107) -> sys::mrb_value {
108    // Artichoke doesn't have a static string optimization.
109    mrb_str_new(mrb, p, len)
110}
111
112// ```c
113// MRB_API mrb_int mrb_str_index(mrb_state *mrb, mrb_value str, const char *sptr, mrb_int slen, mrb_int offset)
114// ```
115#[unsafe(no_mangle)]
116#[expect(
117    clippy::cast_possible_wrap,
118    reason = "mruby stores sizes as int64_t instead of size_t"
119)]
120unsafe extern "C-unwind" fn mrb_str_index(
121    mrb: *mut sys::mrb_state,
122    s: sys::mrb_value,
123    sptr: *const c_char,
124    slen: sys::mrb_int,
125    offset: sys::mrb_int,
126) -> sys::mrb_int {
127    unwrap_interpreter!(mrb, to => guard, or_else = -1);
128    let mut value = s.into();
129    let Ok(string) = String::unbox_from_value(&mut value, &mut guard) else {
130        return -1;
131    };
132
133    /*
134    len = RSTRING_LEN(str);
135    if (offset < 0) {
136      offset += len;
137      if (offset < 0) return -1;
138    }
139    if (len - offset < slen) return -1;
140    s = RSTRING_PTR(str);
141    if (offset) {
142      s += offset;
143    }
144    if (slen == 0) return offset;
145    /* need proceed one character at a time */
146    len = RSTRING_LEN(str) - offset;
147    */
148    let mut offset = isize::try_from(offset).unwrap_or(0);
149    let length = isize::try_from(string.len()).unwrap_or(0);
150    if offset < 0 {
151        offset += length;
152    }
153    let Ok(offset) = usize::try_from(offset) else {
154        return -1;
155    };
156    let Some(haystack) = string.get(offset..) else {
157        return -1;
158    };
159    let needle = slice::from_raw_parts(sptr.cast::<u8>(), usize::try_from(slen).unwrap_or(0));
160    if needle.is_empty() {
161        return offset as sys::mrb_int;
162    }
163    haystack.find(needle).map_or(-1, |pos| pos as sys::mrb_int)
164}
165
166// ```c
167// mrb_value mrb_str_aref(mrb_state *mrb, mrb_value str, mrb_value indx, mrb_value alen)
168// ```
169#[unsafe(no_mangle)]
170unsafe extern "C-unwind" fn mrb_str_aref(
171    mrb: *mut sys::mrb_state,
172    s: sys::mrb_value,
173    indx: sys::mrb_value,
174    alen: sys::mrb_value,
175) -> sys::mrb_value {
176    unwrap_interpreter!(mrb, to => guard);
177    let value = Value::from(s);
178    let indx = Value::from(indx);
179    let alen = Value::from(alen);
180
181    let alen = if alen.is_unreachable() { None } else { Some(alen) };
182
183    let result = trampoline::aref(&mut guard, value, indx, alen);
184    match result {
185        Ok(value) => value.into(),
186        Err(_) => Value::nil().into(),
187    }
188}
189
190// ```c
191// MRB_API mrb_int mrb_str_strlen(mrb_state *mrb, struct RString *s)
192// ```
193//
194// NOTE: Implemented in C in `mruby-sys/src/mruby-sys/ext.c`.
195
196// ```c
197// MRB_API void mrb_str_modify_keep_ascii(mrb_state *mrb, struct RString *s)
198// MRB_API void mrb_str_modify(mrb_state *mrb, struct RString *s)
199// ```
200//
201// NOTE: Implemented in C in `mruby-sys/src/mruby-sys/ext.c`.
202
203// ```c
204// MRB_API mrb_value mrb_str_resize(mrb_state *mrb, mrb_value str, mrb_int len)
205// ```
206#[unsafe(no_mangle)]
207unsafe extern "C-unwind" fn mrb_str_resize(
208    mrb: *mut sys::mrb_state,
209    s: sys::mrb_value,
210    len: sys::mrb_int,
211) -> sys::mrb_value {
212    fn try_resize(s: &mut String, len: usize) -> Result<(), TryReserveError> {
213        match len.checked_sub(s.len()) {
214            Some(0) => {}
215            Some(additional) => s.try_reserve(additional)?,
216            // If the given length is less than the length of the `String`, truncate.
217            None => s.truncate(len),
218        }
219        Ok(())
220    }
221
222    unwrap_interpreter!(mrb, to => guard, or_else = s);
223    let mut value = s.into();
224    let Ok(mut string) = String::unbox_from_value(&mut value, &mut guard) else {
225        return s;
226    };
227    let Ok(len) = usize::try_from(len) else {
228        return s;
229    };
230    // SAFETY: The string is repacked before any intervening uses of `interp`
231    // which means no mruby heap allocations can occur.
232    let string_mut = string.as_inner_mut();
233
234    let result = try_resize(string_mut, len);
235
236    let inner = string.take();
237    let value = String::box_into_value(inner, value, &mut guard).expect("String reboxing should not fail");
238
239    match result {
240        Ok(()) => value.inner(),
241        // NOTE: Ideally this code would distinguish between a capacity overflow
242        // (string too large) vs an out of memory condition (allocation failure).
243        // This is not possible on stable Rust since `TryReserveErrorKind` is
244        // unstable.
245        Err(_) => {
246            // NOTE: This code can't use an `Error` unified exception trait object.
247            // Since we're in memory error territory, we're not sure if we can
248            // allocate the `Box` it requires.
249            let err = NoMemoryError::with_message("out of memory");
250            error::raise(guard, err);
251        }
252    }
253}
254
255// ```c
256// MRB_API char* mrb_str_to_cstr(mrb_state *mrb, mrb_value str0)
257// ```
258//
259// NOTE: Not implemented.
260
261// ```c
262// MRB_API void mrb_str_concat(mrb_state *mrb, mrb_value self, mrb_value other)
263// ```
264//
265// NOTE: Implemented in C in `mruby-sys/src/mruby-sys/ext.c`.
266//
267// ```
268// #[unsafe(no_mangle)]
269// unsafe extern "C-unwind" mrb_str_concat(mrb: *mut sys::mrb_state, this: sys::mrb_value, other: sys::mrb_value) {
270//     unwrap_interpreter!(mrb, to => guard, or_else = ());
271// }
272// ```
273
274// ```c
275// MRB_API mrb_value mrb_str_plus(mrb_state *mrb, mrb_value a, mrb_value b)
276// ```
277#[unsafe(no_mangle)]
278unsafe extern "C-unwind" fn mrb_str_plus(
279    mrb: *mut sys::mrb_state,
280    a: sys::mrb_value,
281    b: sys::mrb_value,
282) -> sys::mrb_value {
283    unwrap_interpreter!(mrb, to => guard);
284    let mut a = Value::from(a);
285    let mut b = Value::from(b);
286
287    let Ok(a) = String::unbox_from_value(&mut a, &mut guard) else {
288        return Value::nil().into();
289    };
290    let Ok(b) = String::unbox_from_value(&mut b, &mut guard) else {
291        return Value::nil().into();
292    };
293
294    let mut s = String::with_capacity_and_encoding(a.len() + b.len(), a.encoding());
295
296    s.extend_from_slice(a.as_slice());
297    s.extend_from_slice(b.as_slice());
298
299    let s = String::alloc_value(s, &mut guard).unwrap_or_default();
300    s.into()
301}
302
303// ```c
304// MRB_API int mrb_str_cmp(mrb_state *mrb, mrb_value str1, mrb_value str2)
305// ```
306#[unsafe(no_mangle)]
307unsafe extern "C-unwind" fn mrb_str_cmp(
308    mrb: *mut sys::mrb_state,
309    str1: sys::mrb_value,
310    str2: sys::mrb_value,
311) -> c_int {
312    unwrap_interpreter!(mrb, to => guard, or_else = -1);
313    let mut a = Value::from(str1);
314    let mut b = Value::from(str2);
315
316    let Ok(a) = String::unbox_from_value(&mut a, &mut guard) else {
317        return -1;
318    };
319    let Ok(b) = String::unbox_from_value(&mut b, &mut guard) else {
320        return -1;
321    };
322
323    a.cmp(&*b) as c_int
324}
325
326// ```c
327// MRB_API mrb_bool mrb_str_equal(mrb_state *mrb, mrb_value str1, mrb_value str2)
328// ```
329#[unsafe(no_mangle)]
330unsafe extern "C-unwind" fn mrb_str_equal(
331    mrb: *mut sys::mrb_state,
332    str1: sys::mrb_value,
333    str2: sys::mrb_value,
334) -> sys::mrb_bool {
335    unwrap_interpreter!(mrb, to => guard, or_else = false);
336    let mut a = Value::from(str1);
337    let mut b = Value::from(str2);
338
339    let Ok(a) = String::unbox_from_value(&mut a, &mut guard) else {
340        return false;
341    };
342    let Ok(b) = String::unbox_from_value(&mut b, &mut guard) else {
343        return false;
344    };
345
346    *a == *b
347}
348
349// ```c
350// MRB_API const char* mrb_string_value_ptr(mrb_state *mrb, mrb_value str)
351// ```
352//
353// obsolete: use `RSTRING_PTR()`
354//
355// NOTE: not implemented
356
357// ```c
358// MRB_API mrb_int mrb_string_value_len(mrb_state *mrb, mrb_value ptr)
359// ```
360//
361// obsolete: use `RSTRING_LEN()`
362//
363// NOTE: not implemented
364
365// ```c
366// MRB_API mrb_value mrb_str_dup(mrb_state *mrb, mrb_value str)
367// ```
368#[unsafe(no_mangle)]
369unsafe extern "C-unwind" fn mrb_str_dup(mrb: *mut sys::mrb_state, s: sys::mrb_value) -> sys::mrb_value {
370    unwrap_interpreter!(mrb, to => guard);
371    let mut string = Value::from(s);
372    let basic = sys::mrb_sys_basic_ptr(s).cast::<sys::RString>();
373    let class = (*basic).c;
374
375    let Ok(string) = String::unbox_from_value(&mut string, &mut guard) else {
376        return Value::nil().into();
377    };
378    let dup = string.clone();
379    let Ok(value) = String::alloc_value(dup, &mut guard) else {
380        return Value::nil().into();
381    };
382    let value = value.inner();
383
384    // dup'd strings keep the class of the source `String`.
385    let dup_basic = sys::mrb_sys_basic_ptr(value).cast::<sys::RString>();
386    (*dup_basic).c = class;
387
388    value
389}
390
391// ```c
392// MRB_API mrb_value mrb_str_substr(mrb_state *mrb, mrb_value str, mrb_int beg, mrb_int len)
393// ```
394#[unsafe(no_mangle)]
395unsafe extern "C-unwind" fn mrb_str_substr(
396    mrb: *mut sys::mrb_state,
397    s: sys::mrb_value,
398    beg: sys::mrb_int,
399    len: sys::mrb_int,
400) -> sys::mrb_value {
401    if len < 0 {
402        return Value::nil().into();
403    }
404    unwrap_interpreter!(mrb, to => guard);
405
406    let mut string = Value::from(s);
407    let Ok(string) = String::unbox_from_value(&mut string, &mut guard) else {
408        return Value::nil().into();
409    };
410
411    let offset = if let Ok(offset) = usize::try_from(beg) {
412        offset
413    } else {
414        let offset = beg
415            .checked_neg()
416            .and_then(|offset| usize::try_from(offset).ok())
417            .and_then(|offset| offset.checked_sub(string.len()));
418        let Some(offset) = offset else {
419            return Value::nil().into();
420        };
421        offset
422    };
423
424    // FIXME: mruby treats this as a character offset, not a byte offset.
425    let Some(slice) = string.get(offset..) else {
426        return Value::nil().into();
427    };
428    let substr = String::with_bytes_and_encoding(slice.to_vec(), string.encoding());
429    String::alloc_value(substr, &mut guard).unwrap_or_default().into()
430}
431
432// ```c
433// MRB_API mrb_value mrb_ptr_to_str(mrb_state *mrb, void *p)
434// ```
435#[unsafe(no_mangle)]
436unsafe extern "C-unwind" fn mrb_ptr_to_str(mrb: *mut sys::mrb_state, p: *mut c_void) -> sys::mrb_value {
437    unwrap_interpreter!(mrb, to => guard);
438    let mut s = String::with_capacity(16 + 2);
439    let _ignore = write!(s, "{p:p}");
440    String::alloc_value(s, &mut guard).unwrap_or_default().into()
441}
442
443// ```c
444// MRB_API mrb_value mrb_cstr_to_inum(mrb_state *mrb, const char *str, mrb_int base, mrb_bool badcheck)
445// ```
446//
447// NOTE: not implemented.
448
449// ```c
450// MRB_API const char* mrb_string_value_cstr(mrb_state *mrb, mrb_value *ptr)
451// ```
452//
453// obsolete: use `RSTRING_CSTR()` or `mrb_string_cstr()`
454#[unsafe(no_mangle)]
455unsafe extern "C-unwind" fn mrb_string_value_cstr(
456    mrb: *mut sys::mrb_state,
457    ptr: *mut sys::mrb_value,
458) -> *const c_char {
459    unwrap_interpreter!(mrb, to => guard, or_else = ptr::null());
460    let mut s = Value::from(*ptr);
461    let Ok(mut string) = String::unbox_from_value(&mut s, &mut guard) else {
462        return ptr::null();
463    };
464    if let Some(b'\0') = string.last() {
465        return string.as_ptr().cast();
466    }
467    // SAFETY: The string is repacked before any intervening uses of `interp`
468    // which means no mruby heap allocations can occur.
469    let string_mut = string.as_inner_mut();
470    string_mut.push_byte(b'\0');
471    // SAFETY: This raw pointer will not be invalidated since we rebox this
472    // `String` into the mruby heap where the GC will keep it alive.
473    let cstr = string.as_ptr().cast::<c_char>();
474
475    let inner = string.take();
476    String::box_into_value(inner, s, &mut guard).expect("String reboxing should not fail");
477
478    cstr
479}
480
481// ```c
482// MRB_API const char* mrb_string_cstr(mrb_state *mrb, mrb_value str)
483// ```
484#[unsafe(no_mangle)]
485unsafe extern "C-unwind" fn mrb_string_cstr(mrb: *mut sys::mrb_state, s: sys::mrb_value) -> *const c_char {
486    unwrap_interpreter!(mrb, to => guard, or_else = ptr::null());
487    let mut s = Value::from(s);
488    let Ok(mut string) = String::unbox_from_value(&mut s, &mut guard) else {
489        return ptr::null();
490    };
491    if let Some(b'\0') = string.last() {
492        return string.as_ptr().cast();
493    }
494    // SAFETY: The string is repacked before any intervening uses of `interp`
495    // which means no mruby heap allocations can occur.
496    let string_mut = string.as_inner_mut();
497    string_mut.push_byte(b'\0');
498    // SAFETY: This raw pointer will not be invalidated since we rebox this
499    // `String` into the mruby heap where the GC will keep it alive.
500    let cstr = string.as_ptr().cast::<c_char>();
501
502    let inner = string.take();
503    String::box_into_value(inner, s, &mut guard).expect("String reboxing should not fail");
504
505    cstr
506}
507
508// ```c
509// MRB_API mrb_value mrb_str_to_integer(mrb_state *mrb, mrb_value str, mrb_int base, mrb_bool badcheck);
510// /* obsolete: use mrb_str_to_integer() */
511// #define mrb_str_to_inum(mrb, str, base, badcheck) mrb_str_to_integer(mrb, str, base, badcheck)
512// ```
513//
514// This function converts a numeric string to numeric `mrb_value` with the given base.
515#[unsafe(no_mangle)]
516unsafe extern "C-unwind" fn mrb_str_to_integer(
517    mrb: *mut sys::mrb_state,
518    s: sys::mrb_value,
519    base: sys::mrb_int,
520    badcheck: sys::mrb_bool,
521) -> sys::mrb_value {
522    unwrap_interpreter!(mrb, to => guard);
523    let mut s = Value::from(s);
524    let Ok(s) = String::unbox_from_value(&mut s, &mut guard) else {
525        if badcheck {
526            let err = ArgumentError::with_message("not a string");
527            error::raise(guard, err);
528        }
529        return guard.convert(0_i64).into();
530    };
531    let Ok(s) = str::from_utf8(s.as_slice()) else {
532        if badcheck {
533            let err = ArgumentError::with_message("invalid number");
534            error::raise(guard, err);
535        }
536        return guard.convert(-1_i64).into();
537    };
538    let Ok(num) = s.parse::<i64>() else {
539        if badcheck {
540            let err = ArgumentError::with_message("invalid number");
541            error::raise(guard, err);
542        }
543        return guard.convert(0_i64).into();
544    };
545
546    let radix = match u32::try_from(base) {
547        Ok(base) if (2..=36).contains(&base) => base,
548        Ok(_) | Err(_) => {
549            let err = ArgumentError::with_message("illegal radix");
550            error::raise(guard, err);
551        }
552    };
553
554    let mut result = vec![];
555    let mut x = num;
556
557    loop {
558        let m = u32::try_from(x % base).expect("base must be <= 36, which guarantees the result is in range for u32");
559        x /= base;
560
561        // will panic if you use a bad radix (< 2 or > 36).
562        result.push(char::from_digit(m, radix).unwrap());
563        if x == 0 {
564            break;
565        }
566    }
567    let int = result.into_iter().rev().collect::<String>();
568    String::alloc_value(int, &mut guard).unwrap_or_default().into()
569}
570
571// ```c
572// MRB_API double mrb_cstr_to_dbl(mrb_state *mrb, const char *s, mrb_bool badcheck)
573// ```
574//
575// NOTE: not implemented
576
577// ```c
578// MRB_API double mrb_str_to_dbl(mrb_state *mrb, mrb_value str, mrb_bool badcheck)
579// ```
580#[unsafe(no_mangle)]
581unsafe extern "C-unwind" fn mrb_str_to_dbl(
582    mrb: *mut sys::mrb_state,
583    s: sys::mrb_value,
584    badcheck: sys::mrb_bool,
585) -> c_double {
586    unwrap_interpreter!(mrb, to => guard, or_else = 0.0);
587    let mut s = Value::from(s);
588    let Ok(s) = String::unbox_from_value(&mut s, &mut guard) else {
589        if badcheck {
590            let err = ArgumentError::with_message("not a string");
591            error::raise(guard, err);
592        }
593        return 0.0;
594    };
595    let Ok(s) = str::from_utf8(s.as_slice()) else {
596        if badcheck {
597            let err = ArgumentError::with_message("invalid number");
598            error::raise(guard, err);
599        }
600        return 0.0;
601    };
602    let Ok(num) = s.parse::<c_double>() else {
603        if badcheck {
604            let err = ArgumentError::with_message("invalid number");
605            error::raise(guard, err);
606        }
607        return 0.0;
608    };
609    num
610}
611
612// ```c
613// MRB_API mrb_value mrb_str_cat(mrb_state *mrb, mrb_value str, const char *ptr, size_t len)
614// ```
615#[unsafe(no_mangle)]
616unsafe extern "C-unwind" fn mrb_str_cat(
617    mrb: *mut sys::mrb_state,
618    s: sys::mrb_value,
619    ptr: *const c_char,
620    len: usize,
621) -> sys::mrb_value {
622    unwrap_interpreter!(mrb, to => guard, or_else = s);
623    let mut s = Value::from(s);
624    let Ok(mut string) = String::unbox_from_value(&mut s, &mut guard) else {
625        return s.inner();
626    };
627    let slice = slice::from_raw_parts(ptr.cast::<u8>(), len);
628
629    // SAFETY: The string is repacked before any intervening uses of
630    // `interp` which means no mruby heap allocations can occur.
631    let string_mut = string.as_inner_mut();
632    string_mut.extend_from_slice(slice);
633    let inner = string.take();
634    let value = String::box_into_value(inner, s, &mut guard).expect("String reboxing should not fail");
635
636    value.inner()
637}
638
639// ```c
640// MRB_API mrb_value mrb_str_cat_cstr(mrb_state *mrb, mrb_value str, const char *ptr)
641// MRB_API mrb_value mrb_str_cat_str(mrb_state *mrb, mrb_value str, mrb_value str2)
642// MRB_API mrb_value mrb_str_append(mrb_state *mrb, mrb_value str1, mrb_value str2)
643// ```
644//
645// NOTE: Implemented in C in `mruby-sys/src/mruby-sys/ext.c`.
646
647// ```c
648// MRB_API double mrb_float_read(const char *string, char **endPtr)
649// ```
650//
651// NOTE: impl kept in C.
652
653// ```c
654// uint32_t mrb_str_hash(mrb_state *mrb, mrb_value str);
655// ```
656#[unsafe(no_mangle)]
657unsafe extern "C-unwind" fn mrb_str_hash(mrb: *mut sys::mrb_state, s: sys::mrb_value) -> u32 {
658    unwrap_interpreter!(mrb, to => guard, or_else = 0);
659    let mut s = Value::from(s);
660
661    let Ok(s) = String::unbox_from_value(&mut s, &mut guard) else {
662        return 0;
663    };
664
665    // NOTE: it is necessary to retrieve the interpreter `BuildHasher` second to
666    // avoid a duplicate borrow error. `Artichoke::global_build_hasher` requires
667    // a shared reference which the previous mutable borrow will coerce to, but
668    // the other ordering will not compile.
669    let Ok(global_build_hasher) = guard.global_build_hasher() else {
670        return 0;
671    };
672
673    let hash = global_build_hasher.hash_one(s.as_slice());
674    // Grab some bytes from the `u64` to construct a `u32` hash.
675    let [one, two, three, four, ..] = hash.to_ne_bytes();
676    u32::from_ne_bytes([one, two, three, four])
677}
678
679// ```c
680// #define FNV_32_PRIME ((uint32_t)0x01000193)
681// #define FNV1_32_INIT ((uint32_t)0x811c9dc5)
682//
683// uint32_t mrb_byte_hash(const uint8_t*, mrb_int);
684// uint32_t mrb_byte_hash_step(const uint8_t*, mrb_int, uint32_t);
685// ```
686
687const FNV_32_PRIME: Wrapping<u32> = Wrapping(0x0100_0193);
688const FNV1_32_INIT: Wrapping<u32> = Wrapping(0x811c_9dc5);
689
690#[unsafe(no_mangle)]
691unsafe extern "C-unwind" fn mrb_byte_hash(s: *const u8, len: sys::mrb_int) -> u32 {
692    mrb_byte_hash_step(s, len, FNV1_32_INIT)
693}
694
695#[unsafe(no_mangle)]
696#[expect(
697    clippy::cast_possible_truncation,
698    clippy::cast_sign_loss,
699    reason = "mruby stores sizes as int64_t instead of size_t"
700)]
701unsafe extern "C-unwind" fn mrb_byte_hash_step(s: *const u8, len: sys::mrb_int, mut hval: Wrapping<u32>) -> u32 {
702    let slice = slice::from_raw_parts(s, len as usize);
703    // FNV-1 hash each octet in the buffer
704    for &byte in slice {
705        // multiply by the 32 bit FNV magic prime mod `2^32`
706        hval *= FNV_32_PRIME;
707        // xor the bottom with the current octet
708        hval ^= u32::from(byte);
709    }
710    // return our new hash value
711    hval.0
712}
713
714#[unsafe(no_mangle)]
715#[expect(
716    clippy::cast_possible_truncation,
717    clippy::cast_sign_loss,
718    reason = "mruby stores sizes as int64_t instead of size_t"
719)]
720unsafe extern "C-unwind" fn mrb_gc_free_str(mrb: *mut sys::mrb_state, string: *mut sys::RString) {
721    let _ = mrb;
722
723    let Some(ptr) = NonNull::<c_char>::new((*string).as_.heap.ptr) else {
724        // An allocated but uninitialized string has no backing byte buffer, so
725        // there is nothing to free.
726        return;
727    };
728    let length = (*string).as_.heap.len as usize;
729    let capacity = (*string).as_.heap.aux.capa as usize;
730
731    // we don't need to free the encoding since `Encoding` is `Copy` and we pack
732    // it into the `RString` flags as a `u32`.
733
734    let raw_parts = RawParts {
735        ptr: ptr.cast::<u8>().as_mut(),
736        length,
737        capacity,
738    };
739    drop(String::from_raw_parts(raw_parts));
740}