From abbab7216a8b47108a0e1b7a26e429d6a990d7a6 Mon Sep 17 00:00:00 2001 From: Thom Chiovoloni Date: Tue, 14 Apr 2020 02:35:37 -0700 Subject: [PATCH] Better docs and cleaner SmallCString --- src/util/small_cstr.rs | 55 +++++++++++++++++++++++++++++++++++------- 1 file changed, 46 insertions(+), 9 deletions(-) diff --git a/src/util/small_cstr.rs b/src/util/small_cstr.rs index fae52f0..bc4d9cb 100644 --- a/src/util/small_cstr.rs +++ b/src/util/small_cstr.rs @@ -1,8 +1,11 @@ use smallvec::{smallvec, SmallVec}; use std::ffi::{CStr, CString, NulError}; +/// Similar to std::ffi::CString, but avoids heap allocating if the string is +/// small enough. Also guarantees it's input is UTF-8 -- used for cases where we +/// need to pass a NUL-terminated string to SQLite, and we have a `&str`. #[derive(Clone, PartialEq, Eq, PartialOrd, Ord)] -pub struct SmallCString(smallvec::SmallVec<[u8; 16]>); +pub(crate) struct SmallCString(smallvec::SmallVec<[u8; 16]>); impl SmallCString { #[inline] @@ -13,21 +16,50 @@ impl SmallCString { let mut buf = SmallVec::with_capacity(s.len() + 1); buf.extend_from_slice(s.as_bytes()); buf.push(0); - Ok(Self(buf)) + let res = Self(buf); + res.debug_checks(); + Ok(res) } #[inline] pub fn as_str(&self) -> &str { - debug_assert!(std::str::from_utf8(&self.as_bytes_without_nul()).is_ok()); + self.debug_checks(); // Constructor takes a &str so this is safe. - unsafe { std::str::from_utf8_unchecked(&self.as_bytes_without_nul()) } + unsafe { std::str::from_utf8_unchecked(self.as_bytes_without_nul()) } + } + + /// Get the bytes not including the NUL terminator. E.g. the bytes which + /// make up our `str`: + /// - `SmallCString::new("foo").as_bytes_without_nul() == b"foo"` + /// - `SmallCString::new("foo").as_bytes_with_nul() == b"foo\0" + #[inline] + pub fn as_bytes_without_nul(&self) -> &[u8] { + self.debug_checks(); + &self.0[..self.len()] + } + + /// Get the bytes behind this str *including* the NUL terminator. This + /// should never return an empty slice. + #[inline] + pub fn as_bytes_with_nul(&self) -> &[u8] { + self.debug_checks(); + &self.0 } #[inline] - pub fn as_bytes_without_nul(&self) -> &[u8] { - &self.0[..self.0.len() - 1] + #[cfg(debug_assertions)] + fn debug_checks(&self) { + debug_assert_ne!(self.0.len(), 0); + debug_assert_eq!(self.0[self.0.len() - 1], 0); + let strbytes = &self.0[..(self.0.len() - 1)]; + debug_assert!(!strbytes.contains(&0)); + debug_assert!(std::str::from_utf8(strbytes).is_ok()); } + #[inline] + #[cfg(not(debug_assertions))] + fn debug_checks(&self) {} + #[inline] pub fn len(&self) -> usize { debug_assert_ne!(self.0.len(), 0); @@ -35,14 +67,16 @@ impl SmallCString { } #[inline] + #[allow(unused)] // clippy wants this function. pub fn is_empty(&self) -> bool { self.len() == 0 } #[inline] pub fn as_cstr(&self) -> &CStr { - debug_assert!(CStr::from_bytes_with_nul(&self.0).is_ok()); - unsafe { CStr::from_bytes_with_nul_unchecked(&self.0) } + let bytes = self.as_bytes_with_nul(); + debug_assert!(CStr::from_bytes_with_nul(bytes).is_ok()); + unsafe { CStr::from_bytes_with_nul_unchecked(bytes) } } #[cold] @@ -103,7 +137,10 @@ mod test { // things work. assert_eq!(SmallCString::default().0, SmallCString::new("").unwrap().0); assert_eq!(SmallCString::new("foo").unwrap().len(), 3); - assert_eq!(SmallCString::new("foo").unwrap().0.as_slice(), b"foo\0"); + assert_eq!( + SmallCString::new("foo").unwrap().as_bytes_with_nul(), + b"foo\0" + ); assert_eq!( SmallCString::new("foo").unwrap().as_bytes_without_nul(), b"foo",