2020-04-14 14:47:12 +08:00
|
|
|
use smallvec::{smallvec, SmallVec};
|
|
|
|
use std::ffi::{CStr, CString, NulError};
|
|
|
|
|
2022-01-06 02:19:13 +08:00
|
|
|
/// Similar to `std::ffi::CString`, but avoids heap allocating if the string is
|
2020-04-14 17:35:37 +08:00
|
|
|
/// small enough. Also guarantees it's input is UTF-8 -- used for cases where we
|
|
|
|
/// need to pass a NUL-terminated string to SQLite, and we have a `&str`.
|
2020-04-14 14:47:12 +08:00
|
|
|
#[derive(Clone, PartialEq, Eq, PartialOrd, Ord)]
|
2022-05-29 19:33:51 +08:00
|
|
|
pub(crate) struct SmallCString(SmallVec<[u8; 16]>);
|
2020-04-14 14:47:12 +08:00
|
|
|
|
|
|
|
impl SmallCString {
|
|
|
|
#[inline]
|
|
|
|
pub fn new(s: &str) -> Result<Self, NulError> {
|
2022-01-06 03:03:30 +08:00
|
|
|
if s.as_bytes().contains(&0_u8) {
|
2020-04-14 14:47:12 +08:00
|
|
|
return Err(Self::fabricate_nul_error(s));
|
|
|
|
}
|
|
|
|
let mut buf = SmallVec::with_capacity(s.len() + 1);
|
|
|
|
buf.extend_from_slice(s.as_bytes());
|
|
|
|
buf.push(0);
|
2020-04-14 17:35:37 +08:00
|
|
|
let res = Self(buf);
|
|
|
|
res.debug_checks();
|
|
|
|
Ok(res)
|
2020-04-14 14:47:12 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
pub fn as_str(&self) -> &str {
|
2020-04-14 17:35:37 +08:00
|
|
|
self.debug_checks();
|
2020-04-14 14:47:12 +08:00
|
|
|
// Constructor takes a &str so this is safe.
|
2020-04-14 17:35:37 +08:00
|
|
|
unsafe { std::str::from_utf8_unchecked(self.as_bytes_without_nul()) }
|
2020-04-14 14:47:12 +08:00
|
|
|
}
|
|
|
|
|
2020-04-14 17:35:37 +08:00
|
|
|
/// Get the bytes not including the NUL terminator. E.g. the bytes which
|
|
|
|
/// make up our `str`:
|
|
|
|
/// - `SmallCString::new("foo").as_bytes_without_nul() == b"foo"`
|
2022-01-06 02:19:13 +08:00
|
|
|
/// - `SmallCString::new("foo").as_bytes_with_nul() == b"foo\0"`
|
2020-04-14 14:47:12 +08:00
|
|
|
#[inline]
|
|
|
|
pub fn as_bytes_without_nul(&self) -> &[u8] {
|
2020-04-14 17:35:37 +08:00
|
|
|
self.debug_checks();
|
|
|
|
&self.0[..self.len()]
|
2020-04-14 14:47:12 +08:00
|
|
|
}
|
|
|
|
|
2020-04-14 17:35:37 +08:00
|
|
|
/// Get the bytes behind this str *including* the NUL terminator. This
|
|
|
|
/// should never return an empty slice.
|
|
|
|
#[inline]
|
|
|
|
pub fn as_bytes_with_nul(&self) -> &[u8] {
|
|
|
|
self.debug_checks();
|
|
|
|
&self.0
|
|
|
|
}
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
#[cfg(debug_assertions)]
|
|
|
|
fn debug_checks(&self) {
|
|
|
|
debug_assert_ne!(self.0.len(), 0);
|
|
|
|
debug_assert_eq!(self.0[self.0.len() - 1], 0);
|
|
|
|
let strbytes = &self.0[..(self.0.len() - 1)];
|
|
|
|
debug_assert!(!strbytes.contains(&0));
|
|
|
|
debug_assert!(std::str::from_utf8(strbytes).is_ok());
|
|
|
|
}
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
#[cfg(not(debug_assertions))]
|
|
|
|
fn debug_checks(&self) {}
|
|
|
|
|
2020-04-14 14:47:12 +08:00
|
|
|
#[inline]
|
|
|
|
pub fn len(&self) -> usize {
|
|
|
|
debug_assert_ne!(self.0.len(), 0);
|
|
|
|
self.0.len() - 1
|
|
|
|
}
|
|
|
|
|
|
|
|
#[inline]
|
2020-04-14 17:35:37 +08:00
|
|
|
#[allow(unused)] // clippy wants this function.
|
2020-04-14 14:47:12 +08:00
|
|
|
pub fn is_empty(&self) -> bool {
|
|
|
|
self.len() == 0
|
|
|
|
}
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
pub fn as_cstr(&self) -> &CStr {
|
2020-04-14 17:35:37 +08:00
|
|
|
let bytes = self.as_bytes_with_nul();
|
|
|
|
debug_assert!(CStr::from_bytes_with_nul(bytes).is_ok());
|
|
|
|
unsafe { CStr::from_bytes_with_nul_unchecked(bytes) }
|
2020-04-14 14:47:12 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
#[cold]
|
|
|
|
fn fabricate_nul_error(b: &str) -> NulError {
|
|
|
|
CString::new(b).unwrap_err()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Default for SmallCString {
|
|
|
|
#[inline]
|
|
|
|
fn default() -> Self {
|
|
|
|
Self(smallvec![0])
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl std::fmt::Debug for SmallCString {
|
|
|
|
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
|
|
f.debug_tuple("SmallCString").field(&self.as_str()).finish()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl std::ops::Deref for SmallCString {
|
|
|
|
type Target = CStr;
|
2020-10-29 04:12:29 +08:00
|
|
|
|
2020-04-14 14:47:12 +08:00
|
|
|
#[inline]
|
|
|
|
fn deref(&self) -> &CStr {
|
|
|
|
self.as_cstr()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl PartialEq<SmallCString> for str {
    /// A `str` equals a `SmallCString` when its bytes match the latter's
    /// bytes with the NUL terminator left out.
    #[inline]
    fn eq(&self, s: &SmallCString) -> bool {
        let theirs = s.as_bytes_without_nul();
        let ours = self.as_bytes();
        theirs == ours
    }
}
|
|
|
|
|
|
|
|
impl PartialEq<str> for SmallCString {
|
|
|
|
#[inline]
|
|
|
|
fn eq(&self, s: &str) -> bool {
|
|
|
|
self.as_bytes_without_nul() == s.as_bytes()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl std::borrow::Borrow<str> for SmallCString {
|
|
|
|
#[inline]
|
|
|
|
fn borrow(&self) -> &str {
|
|
|
|
self.as_str()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(test)]
mod test {
    use super::*;

    #[test]
    fn test_small_cstring() {
        // `Default` builds its buffer directly instead of going through
        // `new`, so confirm both paths agree on the empty string.
        assert_eq!(SmallCString::default().0, SmallCString::new("").unwrap().0);

        // Plain ASCII.
        let foo = SmallCString::new("foo").unwrap();
        assert_eq!(foo.len(), 3);
        assert_eq!(foo.as_bytes_with_nul(), b"foo\0");
        assert_eq!(foo.as_bytes_without_nul(), b"foo");

        // Multi-byte UTF-8: lengths are counted in bytes.
        let grin = SmallCString::new("😀").unwrap();
        assert_eq!(grin.len(), 4);
        assert_eq!(grin.0.as_slice(), b"\xf0\x9f\x98\x80\0");
        assert_eq!(grin.as_bytes_without_nul(), b"\xf0\x9f\x98\x80");

        // Empty input still carries the terminator.
        let empty = SmallCString::new("").unwrap();
        assert_eq!(empty.len(), 0);
        assert!(empty.is_empty());
        assert_eq!(empty.0.as_slice(), b"\0");
        assert_eq!(empty.as_bytes_without_nul(), b"");

        // A NUL byte anywhere in the input is rejected.
        SmallCString::new("\0").unwrap_err();
        SmallCString::new("\0abc").unwrap_err();
        SmallCString::new("abc\0").unwrap_err();
    }
}
|