cxx/
cxx_string.rs

1use crate::actually_private::Private;
2use crate::lossy;
3#[cfg(feature = "alloc")]
4use alloc::borrow::Cow;
5#[cfg(feature = "alloc")]
6use alloc::string::String;
7use core::cmp::Ordering;
8use core::fmt::{self, Debug, Display};
9use core::hash::{Hash, Hasher};
10use core::marker::{PhantomData, PhantomPinned};
11use core::mem::MaybeUninit;
12use core::pin::Pin;
13use core::slice;
14use core::str::{self, Utf8Error};
15
16extern "C" {
17    #[link_name = "cxxbridge1$cxx_string$init"]
18    fn string_init(this: &mut MaybeUninit<CxxString>, ptr: *const u8, len: usize);
19    #[link_name = "cxxbridge1$cxx_string$destroy"]
20    fn string_destroy(this: &mut MaybeUninit<CxxString>);
21    #[link_name = "cxxbridge1$cxx_string$data"]
22    fn string_data(this: &CxxString) -> *const u8;
23    #[link_name = "cxxbridge1$cxx_string$length"]
24    fn string_length(this: &CxxString) -> usize;
25    #[link_name = "cxxbridge1$cxx_string$clear"]
26    fn string_clear(this: Pin<&mut CxxString>);
27    #[link_name = "cxxbridge1$cxx_string$reserve_total"]
28    fn string_reserve_total(this: Pin<&mut CxxString>, new_cap: usize);
29    #[link_name = "cxxbridge1$cxx_string$push"]
30    fn string_push(this: Pin<&mut CxxString>, ptr: *const u8, len: usize);
31}
32
33/// Binding to C++ `std::string`.
34///
35/// # Invariants
36///
37/// As an invariant of this API and the static analysis of the cxx::bridge
38/// macro, in Rust code we can never obtain a `CxxString` by value. C++'s string
39/// requires a move constructor and may hold internal pointers, which is not
40/// compatible with Rust's move behavior. Instead in Rust code we will only ever
41/// look at a CxxString through a reference or smart pointer, as in `&CxxString`
42/// or `UniquePtr<CxxString>`.
43#[repr(C)]
44pub struct CxxString {
45    _private: [u8; 0],
46    _pinned: PhantomData<PhantomPinned>,
47}
48
49/// Construct a C++ std::string on the Rust stack.
50///
51/// # Syntax
52///
53/// In statement position:
54///
55/// ```
56/// # use cxx::let_cxx_string;
57/// # let expression = "";
58/// let_cxx_string!(var = expression);
59/// ```
60///
61/// The `expression` may have any type that implements `AsRef<[u8]>`. Commonly
62/// it will be a string literal, but for example `&[u8]` and `String` would work
63/// as well.
64///
65/// The macro expands to something resembling `let $var: Pin<&mut CxxString> =
66/// /*???*/;`. The resulting [`Pin`] can be deref'd to `&CxxString` as needed.
67///
68/// # Example
69///
70/// ```
71/// use cxx::{let_cxx_string, CxxString};
72///
73/// fn f(s: &CxxString) {/* ... */}
74///
75/// fn main() {
76///     let_cxx_string!(s = "example");
77///     f(&s);
78/// }
79/// ```
80#[macro_export]
81macro_rules! let_cxx_string {
82    ($var:ident = $value:expr $(,)?) => {
83        let mut cxx_stack_string = $crate::private::StackString::new();
84        #[allow(unused_mut, unused_unsafe)]
85        let mut $var = match $value {
86            let_cxx_string => unsafe { cxx_stack_string.init(let_cxx_string) },
87        };
88    };
89}
90
91impl CxxString {
92    /// `CxxString` is not constructible via `new`. Instead, use the
93    /// [`let_cxx_string!`] macro.
94    pub fn new<T: Private>() -> Self {
95        unreachable!()
96    }
97
98    /// Returns the length of the string in bytes.
99    ///
100    /// Matches the behavior of C++ [std::string::size][size].
101    ///
102    /// [size]: https://en.cppreference.com/w/cpp/string/basic_string/size
103    pub fn len(&self) -> usize {
104        unsafe { string_length(self) }
105    }
106
107    /// Returns true if `self` has a length of zero bytes.
108    ///
109    /// Matches the behavior of C++ [std::string::empty][empty].
110    ///
111    /// [empty]: https://en.cppreference.com/w/cpp/string/basic_string/empty
112    pub fn is_empty(&self) -> bool {
113        self.len() == 0
114    }
115
116    /// Returns a byte slice of this string's contents.
117    pub fn as_bytes(&self) -> &[u8] {
118        let data = self.as_ptr();
119        let len = self.len();
120        unsafe { slice::from_raw_parts(data, len) }
121    }
122
123    /// Produces a pointer to the first character of the string.
124    ///
125    /// Matches the behavior of C++ [std::string::data][data].
126    ///
127    /// Note that the return type may look like `const char *` but is not a
128    /// `const char *` in the typical C sense, as C++ strings may contain
129    /// internal null bytes. As such, the returned pointer only makes sense as a
130    /// string in combination with the length returned by [`len()`][len].
131    ///
132    /// [data]: https://en.cppreference.com/w/cpp/string/basic_string/data
133    /// [len]: #method.len
134    pub fn as_ptr(&self) -> *const u8 {
135        unsafe { string_data(self) }
136    }
137
138    /// Validates that the C++ string contains UTF-8 data and produces a view of
139    /// it as a Rust &amp;str, otherwise an error.
140    pub fn to_str(&self) -> Result<&str, Utf8Error> {
141        str::from_utf8(self.as_bytes())
142    }
143
144    /// If the contents of the C++ string are valid UTF-8, this function returns
145    /// a view as a Cow::Borrowed &amp;str. Otherwise replaces any invalid UTF-8
146    /// sequences with the U+FFFD [replacement character] and returns a
147    /// Cow::Owned String.
148    ///
149    /// [replacement character]: https://doc.rust-lang.org/std/char/constant.REPLACEMENT_CHARACTER.html
150    #[cfg(feature = "alloc")]
151    #[cfg_attr(doc_cfg, doc(cfg(feature = "alloc")))]
152    pub fn to_string_lossy(&self) -> Cow<str> {
153        String::from_utf8_lossy(self.as_bytes())
154    }
155
156    /// Removes all characters from the string.
157    ///
158    /// Matches the behavior of C++ [std::string::clear][clear].
159    ///
160    /// Note: **unlike** the guarantee of Rust's `std::string::String::clear`,
161    /// the C++ standard does not require that capacity is unchanged by this
162    /// operation. In practice existing implementations do not change the
163    /// capacity but all pointers, references, and iterators into the string
164    /// contents are nevertheless invalidated.
165    ///
166    /// [clear]: https://en.cppreference.com/w/cpp/string/basic_string/clear
167    pub fn clear(self: Pin<&mut Self>) {
168        unsafe { string_clear(self) }
169    }
170
171    /// Ensures that this string's capacity is at least `additional` bytes
172    /// larger than its length.
173    ///
174    /// The capacity may be increased by more than `additional` bytes if it
175    /// chooses, to amortize the cost of frequent reallocations.
176    ///
177    /// **The meaning of the argument is not the same as
178    /// [std::string::reserve][reserve] in C++.** The C++ standard library and
179    /// Rust standard library both have a `reserve` method on strings, but in
180    /// C++ code the argument always refers to total capacity, whereas in Rust
181    /// code it always refers to additional capacity. This API on `CxxString`
182    /// follows the Rust convention, the same way that for the length accessor
183    /// we use the Rust conventional `len()` naming and not C++ `size()` or
184    /// `length()`.
185    ///
186    /// # Panics
187    ///
188    /// Panics if the new capacity overflows usize.
189    ///
190    /// [reserve]: https://en.cppreference.com/w/cpp/string/basic_string/reserve
191    pub fn reserve(self: Pin<&mut Self>, additional: usize) {
192        let new_cap = self
193            .len()
194            .checked_add(additional)
195            .expect("CxxString capacity overflow");
196        unsafe { string_reserve_total(self, new_cap) }
197    }
198
199    /// Appends a given string slice onto the end of this C++ string.
200    pub fn push_str(self: Pin<&mut Self>, s: &str) {
201        self.push_bytes(s.as_bytes());
202    }
203
204    /// Appends arbitrary bytes onto the end of this C++ string.
205    pub fn push_bytes(self: Pin<&mut Self>, bytes: &[u8]) {
206        unsafe { string_push(self, bytes.as_ptr(), bytes.len()) }
207    }
208}
209
210impl Display for CxxString {
211    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
212        lossy::display(self.as_bytes(), f)
213    }
214}
215
216impl Debug for CxxString {
217    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
218        lossy::debug(self.as_bytes(), f)
219    }
220}
221
222impl PartialEq for CxxString {
223    fn eq(&self, other: &Self) -> bool {
224        self.as_bytes() == other.as_bytes()
225    }
226}
227
228impl PartialEq<CxxString> for str {
229    fn eq(&self, other: &CxxString) -> bool {
230        self.as_bytes() == other.as_bytes()
231    }
232}
233
234impl PartialEq<str> for CxxString {
235    fn eq(&self, other: &str) -> bool {
236        self.as_bytes() == other.as_bytes()
237    }
238}
239
240impl Eq for CxxString {}
241
242impl PartialOrd for CxxString {
243    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
244        Some(self.cmp(other))
245    }
246}
247
248impl Ord for CxxString {
249    fn cmp(&self, other: &Self) -> Ordering {
250        self.as_bytes().cmp(other.as_bytes())
251    }
252}
253
254impl Hash for CxxString {
255    fn hash<H: Hasher>(&self, state: &mut H) {
256        self.as_bytes().hash(state);
257    }
258}
259
260impl fmt::Write for Pin<&mut CxxString> {
261    fn write_str(&mut self, s: &str) -> fmt::Result {
262        self.as_mut().push_str(s);
263        Ok(())
264    }
265}
266
267#[cfg(feature = "std")]
268impl std::io::Write for Pin<&mut CxxString> {
269    fn write(&mut self, buf: &[u8]) -> std::io::Result<usize> {
270        self.as_mut().push_bytes(buf);
271        Ok(buf.len())
272    }
273
274    fn flush(&mut self) -> std::io::Result<()> {
275        Ok(())
276    }
277}
278
279#[doc(hidden)]
280#[repr(C)]
281pub struct StackString {
282    // Static assertions in cxx.cc validate that this is large enough and
283    // aligned enough.
284    space: MaybeUninit<[usize; 8]>,
285}
286
287#[allow(missing_docs)]
288impl StackString {
289    pub fn new() -> Self {
290        StackString {
291            space: MaybeUninit::uninit(),
292        }
293    }
294
295    pub unsafe fn init(&mut self, value: impl AsRef<[u8]>) -> Pin<&mut CxxString> {
296        let value = value.as_ref();
297        unsafe {
298            let this = &mut *self.space.as_mut_ptr().cast::<MaybeUninit<CxxString>>();
299            string_init(this, value.as_ptr(), value.len());
300            Pin::new_unchecked(&mut *this.as_mut_ptr())
301        }
302    }
303}
304
305impl Drop for StackString {
306    fn drop(&mut self) {
307        unsafe {
308            let this = &mut *self.space.as_mut_ptr().cast::<MaybeUninit<CxxString>>();
309            string_destroy(this);
310        }
311    }
312}