alloc/ffi/c_str.rs
1//! [`CString`] and its related types.
2
3use core::borrow::Borrow;
4use core::ffi::{CStr, c_char};
5use core::num::NonZero;
6use core::slice::memchr;
7use core::str::{self, FromStr, Utf8Error};
8use core::{fmt, mem, ops, ptr, slice};
9
10use crate::borrow::{Cow, ToOwned};
11use crate::boxed::Box;
12use crate::rc::Rc;
13use crate::string::String;
14#[cfg(target_has_atomic = "ptr")]
15use crate::sync::Arc;
16use crate::vec::Vec;
17
/// A type representing an owned, C-compatible, nul-terminated string with no nul bytes in the
/// middle.
///
/// This type serves the purpose of being able to safely generate a
/// C-compatible string from a Rust byte slice or vector. An instance of this
/// type is a static guarantee that the underlying bytes contain no interior 0
/// bytes ("nul characters") and that the final byte is 0 ("nul terminator").
///
/// `CString` is to <code>&[CStr]</code> as [`String`] is to <code>&[str]</code>: the former
/// in each pair are owned strings; the latter are borrowed
/// references.
///
/// # Creating a `CString`
///
/// A `CString` is created from either a byte slice or a byte vector,
/// or anything that implements <code>[Into]<[Vec]<[u8]>></code> (for
/// example, you can build a `CString` straight out of a [`String`] or
/// a <code>&[str]</code>, since both implement that trait).
/// You can create a `CString` from a literal with `CString::from(c"Text")`.
///
/// The [`CString::new`] method will actually check that the provided <code>&[[u8]]</code>
/// does not have 0 bytes in the middle, and return an error if it
/// finds one.
///
/// # Extracting a raw pointer to the whole C string
///
/// `CString` implements an [`as_ptr`][`CStr::as_ptr`] method through the [`Deref`]
/// trait. This method will give you a `*const c_char` which you can
/// feed directly to extern functions that expect a nul-terminated
/// string, like C's `strdup()`. Notice that [`as_ptr`][`CStr::as_ptr`] returns a
/// read-only pointer; if the C code writes to it, that causes
/// undefined behavior.
///
/// # Extracting a slice of the whole C string
///
/// Alternatively, you can obtain a <code>&[[u8]]</code> slice from a
/// `CString` with the [`CString::as_bytes`] method. Slices produced in this
/// way do *not* contain the trailing nul terminator. This is useful
/// when you will be calling an extern function that takes a
/// `*const u8` argument which is not necessarily nul-terminated, plus another
/// argument with the length of the string — like C's `strndup()`.
/// You can of course get the slice's length with its
/// [`len`][slice::len] method.
///
/// If you need a <code>&[[u8]]</code> slice *with* the nul terminator, you
/// can use [`CString::as_bytes_with_nul`] instead.
///
/// Once you have the kind of slice you need (with or without a nul
/// terminator), you can call the slice's own
/// [`as_ptr`][slice::as_ptr] method to get a read-only raw pointer to pass to
/// extern functions. See the documentation for that function for a
/// discussion on ensuring the lifetime of the raw pointer.
///
/// [str]: prim@str "str"
/// [`Deref`]: ops::Deref
///
/// # Examples
///
/// ```ignore (extern-declaration)
/// # fn main() {
/// use std::ffi::CString;
/// use std::os::raw::c_char;
///
/// extern "C" {
///     fn my_printer(s: *const c_char);
/// }
///
/// // We are certain that our string doesn't have 0 bytes in the middle,
/// // so we can .expect()
/// let c_to_print = CString::new("Hello, world!").expect("CString::new failed");
/// unsafe {
///     my_printer(c_to_print.as_ptr());
/// }
/// # }
/// ```
///
/// # Safety
///
/// `CString` is intended for working with traditional C-style strings
/// (a sequence of non-nul bytes terminated by a single nul byte); the
/// primary use case for these kinds of strings is interoperating with C-like
/// code. Often you will need to transfer ownership to/from that external
/// code. It is strongly recommended that you thoroughly read through the
/// documentation of `CString` before use, as improper ownership management
/// of `CString` instances can lead to invalid memory accesses, memory leaks,
/// and other memory errors.
#[derive(PartialEq, PartialOrd, Eq, Ord, Hash, Clone)]
#[rustc_diagnostic_item = "cstring_type"]
#[stable(feature = "alloc_c_string", since = "1.64.0")]
pub struct CString {
    // The owned bytes of the string, *including* the trailing nul terminator.
    //
    // Invariant 1: the slice ends with a zero byte and has a length of at least one.
    // Invariant 2: the slice contains only one zero byte.
    // Improper usage of the unsafe functions can break Invariant 2, but not Invariant 1.
    inner: Box<[u8]>,
}
113
/// An error indicating that an interior nul byte was found.
///
/// While Rust strings may contain nul bytes in the middle, C strings
/// can't, as that byte would effectively truncate the string.
///
/// This error is created by the [`new`][`CString::new`] method on
/// [`CString`]. See its documentation for more.
///
/// # Examples
///
/// ```
/// use std::ffi::{CString, NulError};
///
/// let _: NulError = CString::new(b"f\0oo".to_vec()).unwrap_err();
/// ```
// Field 0 is the index of the first nul byte found in the input; field 1 holds
// the bytes that were handed to `CString::new` (see how `new` builds this value).
#[derive(Clone, PartialEq, Eq, Debug)]
#[stable(feature = "alloc_c_string", since = "1.64.0")]
pub struct NulError(usize, Vec<u8>);
132
// The reason a byte vector was rejected by `CString::from_vec_with_nul`.
// Stored inside `FromVecWithNulError`.
#[derive(Clone, PartialEq, Eq, Debug)]
enum FromBytesWithNulErrorKind {
    // The first nul byte was found at the given index, which is not the last position.
    InteriorNul(usize),
    // The input contains no nul byte at all.
    NotNulTerminated,
}
138
/// An error indicating that a nul byte was not in the expected position.
///
/// The vector used to create a [`CString`] must have one and only one nul byte,
/// positioned at the end.
///
/// This error is created by the [`CString::from_vec_with_nul`] method.
/// See its documentation for more.
///
/// # Examples
///
/// ```
/// use std::ffi::{CString, FromVecWithNulError};
///
/// let _: FromVecWithNulError = CString::from_vec_with_nul(b"f\0oo".to_vec()).unwrap_err();
/// ```
#[derive(Clone, PartialEq, Eq, Debug)]
#[stable(feature = "alloc_c_string", since = "1.64.0")]
pub struct FromVecWithNulError {
    // Why the conversion was rejected (interior nul vs. missing terminator).
    error_kind: FromBytesWithNulErrorKind,
    // The rejected input, handed back to the caller unchanged.
    bytes: Vec<u8>,
}
160
161#[stable(feature = "cstring_from_vec_with_nul", since = "1.58.0")]
162impl FromVecWithNulError {
163 /// Returns a slice of [`u8`]s bytes that were attempted to convert to a [`CString`].
164 ///
165 /// # Examples
166 ///
167 /// Basic usage:
168 ///
169 /// ```
170 /// use std::ffi::CString;
171 ///
172 /// // Some invalid bytes in a vector
173 /// let bytes = b"f\0oo".to_vec();
174 ///
175 /// let value = CString::from_vec_with_nul(bytes.clone());
176 ///
177 /// assert_eq!(&bytes[..], value.unwrap_err().as_bytes());
178 /// ```
179 #[must_use]
180 #[stable(feature = "cstring_from_vec_with_nul", since = "1.58.0")]
181 pub fn as_bytes(&self) -> &[u8] {
182 &self.bytes[..]
183 }
184
185 /// Returns the bytes that were attempted to convert to a [`CString`].
186 ///
187 /// This method is carefully constructed to avoid allocation. It will
188 /// consume the error, moving out the bytes, so that a copy of the bytes
189 /// does not need to be made.
190 ///
191 /// # Examples
192 ///
193 /// Basic usage:
194 ///
195 /// ```
196 /// use std::ffi::CString;
197 ///
198 /// // Some invalid bytes in a vector
199 /// let bytes = b"f\0oo".to_vec();
200 ///
201 /// let value = CString::from_vec_with_nul(bytes.clone());
202 ///
203 /// assert_eq!(bytes, value.unwrap_err().into_bytes());
204 /// ```
205 #[must_use = "`self` will be dropped if the result is not used"]
206 #[stable(feature = "cstring_from_vec_with_nul", since = "1.58.0")]
207 pub fn into_bytes(self) -> Vec<u8> {
208 self.bytes
209 }
210}
211
/// An error indicating invalid UTF-8 when converting a [`CString`] into a [`String`].
///
/// `CString` is just a wrapper over a buffer of bytes with a nul terminator;
/// [`CString::into_string`] performs UTF-8 validation on those bytes and may
/// return this error.
///
/// This `struct` is created by [`CString::into_string()`]. See
/// its documentation for more.
#[derive(Clone, PartialEq, Eq, Debug)]
#[stable(feature = "alloc_c_string", since = "1.64.0")]
pub struct IntoStringError {
    // The original string, rebuilt so the caller gets ownership back on failure.
    inner: CString,
    // The UTF-8 validation error reported by `String::from_utf8`.
    error: Utf8Error,
}
226
227impl CString {
    /// Creates a new C-compatible string from a container of bytes.
    ///
    /// This function will consume the provided data and use the
    /// underlying bytes to construct a new string, ensuring that
    /// there is a trailing 0 byte. This trailing 0 byte will be
    /// appended by this function; the provided data should *not*
    /// contain any 0 bytes in it.
    ///
    /// # Examples
    ///
    /// ```ignore (extern-declaration)
    /// use std::ffi::CString;
    /// use std::os::raw::c_char;
    ///
    /// extern "C" { fn puts(s: *const c_char); }
    ///
    /// let to_print = CString::new("Hello!").expect("CString::new failed");
    /// unsafe {
    ///     puts(to_print.as_ptr());
    /// }
    /// ```
    ///
    /// # Errors
    ///
    /// This function will return an error if the supplied bytes contain an
    /// internal 0 byte. The [`NulError`] returned will contain the bytes as well as
    /// the position of the nul byte.
    #[stable(feature = "rust1", since = "1.0.0")]
    pub fn new<T: Into<Vec<u8>>>(t: T) -> Result<CString, NulError> {
        // Local dispatch trait: the blanket impl below is the general path, and the
        // impls for `&[u8]`, `&str` and `&mut [u8]` specialize it.
        trait SpecNewImpl {
            fn spec_new_impl(self) -> Result<CString, NulError>;
        }

        // General path: convert into a `Vec<u8>` first, then scan it for a nul byte.
        impl<T: Into<Vec<u8>>> SpecNewImpl for T {
            default fn spec_new_impl(self) -> Result<CString, NulError> {
                let bytes: Vec<u8> = self.into();
                match memchr::memchr(0, &bytes) {
                    Some(i) => Err(NulError(i, bytes)),
                    // SAFETY: `memchr` found no 0 byte in `bytes`.
                    None => Ok(unsafe { CString::_from_vec_unchecked(bytes) }),
                }
            }
        }

        // Specialization for avoiding reallocation
        #[inline(always)] // Without that it is not inlined into specializations
        fn spec_new_impl_bytes(bytes: &[u8]) -> Result<CString, NulError> {
            // We cannot have such large slice that we would overflow here
            // but using `checked_add` allows LLVM to assume that capacity never overflows
            // and generate twice shorter code.
            // `saturating_add` doesn't help for some reason.
            let capacity = bytes.len().checked_add(1).unwrap();

            // Allocate before validation to avoid duplication of allocation code.
            // We still need to allocate and copy memory even if we get an error.
            let mut buffer = Vec::with_capacity(capacity);
            buffer.extend(bytes);

            // Check memory of self instead of new buffer.
            // This allows better optimizations if lto enabled.
            match memchr::memchr(0, bytes) {
                Some(i) => Err(NulError(i, buffer)),
                // SAFETY: `buffer` is a copy of `bytes`, in which `memchr` found no 0 byte.
                None => Ok(unsafe { CString::_from_vec_unchecked(buffer) }),
            }
        }

        // Borrowed inputs go through `spec_new_impl_bytes`, which allocates the
        // buffer with room for the terminator up front.
        impl SpecNewImpl for &'_ [u8] {
            fn spec_new_impl(self) -> Result<CString, NulError> {
                spec_new_impl_bytes(self)
            }
        }

        impl SpecNewImpl for &'_ str {
            fn spec_new_impl(self) -> Result<CString, NulError> {
                spec_new_impl_bytes(self.as_bytes())
            }
        }

        impl SpecNewImpl for &'_ mut [u8] {
            fn spec_new_impl(self) -> Result<CString, NulError> {
                spec_new_impl_bytes(self)
            }
        }

        t.spec_new_impl()
    }
313
314 /// Creates a C-compatible string by consuming a byte vector,
315 /// without checking for interior 0 bytes.
316 ///
317 /// Trailing 0 byte will be appended by this function.
318 ///
319 /// This method is equivalent to [`CString::new`] except that no runtime
320 /// assertion is made that `v` contains no 0 bytes, and it requires an
321 /// actual byte vector, not anything that can be converted to one with Into.
322 ///
323 /// # Examples
324 ///
325 /// ```
326 /// use std::ffi::CString;
327 ///
328 /// let raw = b"foo".to_vec();
329 /// unsafe {
330 /// let c_string = CString::from_vec_unchecked(raw);
331 /// }
332 /// ```
333 #[must_use]
334 #[stable(feature = "rust1", since = "1.0.0")]
335 pub unsafe fn from_vec_unchecked(v: Vec<u8>) -> Self {
336 debug_assert!(memchr::memchr(0, &v).is_none());
337 unsafe { Self::_from_vec_unchecked(v) }
338 }
339
340 unsafe fn _from_vec_unchecked(mut v: Vec<u8>) -> Self {
341 v.reserve_exact(1);
342 v.push(0);
343 Self { inner: v.into_boxed_slice() }
344 }
345
346 /// Retakes ownership of a `CString` that was transferred to C via
347 /// [`CString::into_raw`].
348 ///
349 /// Additionally, the length of the string will be recalculated from the pointer.
350 ///
351 /// # Safety
352 ///
353 /// This should only ever be called with a pointer that was earlier
354 /// obtained by calling [`CString::into_raw`]. Other usage (e.g., trying to take
355 /// ownership of a string that was allocated by foreign code) is likely to lead
356 /// to undefined behavior or allocator corruption.
357 ///
358 /// It should be noted that the length isn't just "recomputed," but that
359 /// the recomputed length must match the original length from the
360 /// [`CString::into_raw`] call. This means the [`CString::into_raw`]/`from_raw`
361 /// methods should not be used when passing the string to C functions that can
362 /// modify the string's length.
363 ///
364 /// > **Note:** If you need to borrow a string that was allocated by
365 /// > foreign code, use [`CStr`]. If you need to take ownership of
366 /// > a string that was allocated by foreign code, you will need to
367 /// > make your own provisions for freeing it appropriately, likely
368 /// > with the foreign code's API to do that.
369 ///
370 /// # Examples
371 ///
372 /// Creates a `CString`, pass ownership to an `extern` function (via raw pointer), then retake
373 /// ownership with `from_raw`:
374 ///
375 /// ```ignore (extern-declaration)
376 /// use std::ffi::CString;
377 /// use std::os::raw::c_char;
378 ///
379 /// extern "C" {
380 /// fn some_extern_function(s: *mut c_char);
381 /// }
382 ///
383 /// let c_string = CString::from(c"Hello!");
384 /// let raw = c_string.into_raw();
385 /// unsafe {
386 /// some_extern_function(raw);
387 /// let c_string = CString::from_raw(raw);
388 /// }
389 /// ```
390 #[must_use = "call `drop(from_raw(ptr))` if you intend to drop the `CString`"]
391 #[stable(feature = "cstr_memory", since = "1.4.0")]
392 pub unsafe fn from_raw(ptr: *mut c_char) -> CString {
393 // SAFETY: This is called with a pointer that was obtained from a call
394 // to `CString::into_raw` and the length has not been modified. As such,
395 // we know there is a NUL byte (and only one) at the end and that the
396 // information about the size of the allocation is correct on Rust's
397 // side.
398 unsafe {
399 unsafe extern "C" {
400 /// Provided by libc or compiler_builtins.
401 fn strlen(s: *const c_char) -> usize;
402 }
403 let len = strlen(ptr) + 1; // Including the NUL byte
404 let slice = slice::from_raw_parts_mut(ptr, len);
405 CString { inner: Box::from_raw(slice as *mut [c_char] as *mut [u8]) }
406 }
407 }
408
409 /// Consumes the `CString` and transfers ownership of the string to a C caller.
410 ///
411 /// The pointer which this function returns must be returned to Rust and reconstituted using
412 /// [`CString::from_raw`] to be properly deallocated. Specifically, one
413 /// should *not* use the standard C `free()` function to deallocate
414 /// this string.
415 ///
416 /// Failure to call [`CString::from_raw`] will lead to a memory leak.
417 ///
418 /// The C side must **not** modify the length of the string (by writing a
419 /// nul byte somewhere inside the string or removing the final one) before
420 /// it makes it back into Rust using [`CString::from_raw`]. See the safety section
421 /// in [`CString::from_raw`].
422 ///
423 /// # Examples
424 ///
425 /// ```
426 /// use std::ffi::CString;
427 ///
428 /// let c_string = CString::from(c"foo");
429 ///
430 /// let ptr = c_string.into_raw();
431 ///
432 /// unsafe {
433 /// assert_eq!(b'f', *ptr as u8);
434 /// assert_eq!(b'o', *ptr.add(1) as u8);
435 /// assert_eq!(b'o', *ptr.add(2) as u8);
436 /// assert_eq!(b'\0', *ptr.add(3) as u8);
437 ///
438 /// // retake pointer to free memory
439 /// let _ = CString::from_raw(ptr);
440 /// }
441 /// ```
442 #[inline]
443 #[must_use = "`self` will be dropped if the result is not used"]
444 #[stable(feature = "cstr_memory", since = "1.4.0")]
445 pub fn into_raw(self) -> *mut c_char {
446 Box::into_raw(self.into_inner()) as *mut c_char
447 }
448
449 /// Converts the `CString` into a [`String`] if it contains valid UTF-8 data.
450 ///
451 /// On failure, ownership of the original `CString` is returned.
452 ///
453 /// # Examples
454 ///
455 /// ```
456 /// use std::ffi::CString;
457 ///
458 /// let valid_utf8 = vec![b'f', b'o', b'o'];
459 /// let cstring = CString::new(valid_utf8).expect("CString::new failed");
460 /// assert_eq!(cstring.into_string().expect("into_string() call failed"), "foo");
461 ///
462 /// let invalid_utf8 = vec![b'f', 0xff, b'o', b'o'];
463 /// let cstring = CString::new(invalid_utf8).expect("CString::new failed");
464 /// let err = cstring.into_string().err().expect("into_string().err() failed");
465 /// assert_eq!(err.utf8_error().valid_up_to(), 1);
466 /// ```
467 #[stable(feature = "cstring_into", since = "1.7.0")]
468 pub fn into_string(self) -> Result<String, IntoStringError> {
469 String::from_utf8(self.into_bytes()).map_err(|e| IntoStringError {
470 error: e.utf8_error(),
471 inner: unsafe { Self::_from_vec_unchecked(e.into_bytes()) },
472 })
473 }
474
475 /// Consumes the `CString` and returns the underlying byte buffer.
476 ///
477 /// The returned buffer does **not** contain the trailing nul
478 /// terminator, and it is guaranteed to not have any interior nul
479 /// bytes.
480 ///
481 /// # Examples
482 ///
483 /// ```
484 /// use std::ffi::CString;
485 ///
486 /// let c_string = CString::from(c"foo");
487 /// let bytes = c_string.into_bytes();
488 /// assert_eq!(bytes, vec![b'f', b'o', b'o']);
489 /// ```
490 #[must_use = "`self` will be dropped if the result is not used"]
491 #[stable(feature = "cstring_into", since = "1.7.0")]
492 pub fn into_bytes(self) -> Vec<u8> {
493 let mut vec = self.into_inner().into_vec();
494 let _nul = vec.pop();
495 debug_assert_eq!(_nul, Some(0u8));
496 vec
497 }
498
499 /// Equivalent to [`CString::into_bytes()`] except that the
500 /// returned vector includes the trailing nul terminator.
501 ///
502 /// # Examples
503 ///
504 /// ```
505 /// use std::ffi::CString;
506 ///
507 /// let c_string = CString::from(c"foo");
508 /// let bytes = c_string.into_bytes_with_nul();
509 /// assert_eq!(bytes, vec![b'f', b'o', b'o', b'\0']);
510 /// ```
511 #[must_use = "`self` will be dropped if the result is not used"]
512 #[stable(feature = "cstring_into", since = "1.7.0")]
513 pub fn into_bytes_with_nul(self) -> Vec<u8> {
514 self.into_inner().into_vec()
515 }
516
517 /// Returns the contents of this `CString` as a slice of bytes.
518 ///
519 /// The returned slice does **not** contain the trailing nul
520 /// terminator, and it is guaranteed to not have any interior nul
521 /// bytes. If you need the nul terminator, use
522 /// [`CString::as_bytes_with_nul`] instead.
523 ///
524 /// # Examples
525 ///
526 /// ```
527 /// use std::ffi::CString;
528 ///
529 /// let c_string = CString::from(c"foo");
530 /// let bytes = c_string.as_bytes();
531 /// assert_eq!(bytes, &[b'f', b'o', b'o']);
532 /// ```
533 #[inline]
534 #[must_use]
535 #[stable(feature = "rust1", since = "1.0.0")]
536 pub fn as_bytes(&self) -> &[u8] {
537 // SAFETY: CString has a length at least 1
538 unsafe { self.inner.get_unchecked(..self.inner.len() - 1) }
539 }
540
541 /// Equivalent to [`CString::as_bytes()`] except that the
542 /// returned slice includes the trailing nul terminator.
543 ///
544 /// # Examples
545 ///
546 /// ```
547 /// use std::ffi::CString;
548 ///
549 /// let c_string = CString::from(c"foo");
550 /// let bytes = c_string.as_bytes_with_nul();
551 /// assert_eq!(bytes, &[b'f', b'o', b'o', b'\0']);
552 /// ```
553 #[inline]
554 #[must_use]
555 #[stable(feature = "rust1", since = "1.0.0")]
556 pub fn as_bytes_with_nul(&self) -> &[u8] {
557 &self.inner
558 }
559
560 /// Extracts a [`CStr`] slice containing the entire string.
561 ///
562 /// # Examples
563 ///
564 /// ```
565 /// use std::ffi::{CString, CStr};
566 ///
567 /// let c_string = CString::from(c"foo");
568 /// let cstr = c_string.as_c_str();
569 /// assert_eq!(cstr,
570 /// CStr::from_bytes_with_nul(b"foo\0").expect("CStr::from_bytes_with_nul failed"));
571 /// ```
572 #[inline]
573 #[must_use]
574 #[stable(feature = "as_c_str", since = "1.20.0")]
575 #[rustc_diagnostic_item = "cstring_as_c_str"]
576 pub fn as_c_str(&self) -> &CStr {
577 &*self
578 }
579
580 /// Converts this `CString` into a boxed [`CStr`].
581 ///
582 /// # Examples
583 ///
584 /// ```
585 /// let c_string = c"foo".to_owned();
586 /// let boxed = c_string.into_boxed_c_str();
587 /// assert_eq!(boxed.to_bytes_with_nul(), b"foo\0");
588 /// ```
589 #[must_use = "`self` will be dropped if the result is not used"]
590 #[stable(feature = "into_boxed_c_str", since = "1.20.0")]
591 pub fn into_boxed_c_str(self) -> Box<CStr> {
592 unsafe { Box::from_raw(Box::into_raw(self.into_inner()) as *mut CStr) }
593 }
594
595 /// Bypass "move out of struct which implements [`Drop`] trait" restriction.
596 #[inline]
597 fn into_inner(self) -> Box<[u8]> {
598 // Rationale: `mem::forget(self)` invalidates the previous call to `ptr::read(&self.inner)`
599 // so we use `ManuallyDrop` to ensure `self` is not dropped.
600 // Then we can return the box directly without invalidating it.
601 // See https://github.com/rust-lang/rust/issues/62553.
602 let this = mem::ManuallyDrop::new(self);
603 unsafe { ptr::read(&this.inner) }
604 }
605
606 /// Converts a <code>[Vec]<[u8]></code> to a [`CString`] without checking the
607 /// invariants on the given [`Vec`].
608 ///
609 /// # Safety
610 ///
611 /// The given [`Vec`] **must** have one nul byte as its last element.
612 /// This means it cannot be empty nor have any other nul byte anywhere else.
613 ///
614 /// # Example
615 ///
616 /// ```
617 /// use std::ffi::CString;
618 /// assert_eq!(
619 /// unsafe { CString::from_vec_with_nul_unchecked(b"abc\0".to_vec()) },
620 /// unsafe { CString::from_vec_unchecked(b"abc".to_vec()) }
621 /// );
622 /// ```
623 #[must_use]
624 #[stable(feature = "cstring_from_vec_with_nul", since = "1.58.0")]
625 pub unsafe fn from_vec_with_nul_unchecked(v: Vec<u8>) -> Self {
626 debug_assert!(memchr::memchr(0, &v).unwrap() + 1 == v.len());
627 unsafe { Self::_from_vec_with_nul_unchecked(v) }
628 }
629
630 unsafe fn _from_vec_with_nul_unchecked(v: Vec<u8>) -> Self {
631 Self { inner: v.into_boxed_slice() }
632 }
633
634 /// Attempts to converts a <code>[Vec]<[u8]></code> to a [`CString`].
635 ///
636 /// Runtime checks are present to ensure there is only one nul byte in the
637 /// [`Vec`], its last element.
638 ///
639 /// # Errors
640 ///
641 /// If a nul byte is present and not the last element or no nul bytes
642 /// is present, an error will be returned.
643 ///
644 /// # Examples
645 ///
646 /// A successful conversion will produce the same result as [`CString::new`]
647 /// when called without the ending nul byte.
648 ///
649 /// ```
650 /// use std::ffi::CString;
651 /// assert_eq!(
652 /// CString::from_vec_with_nul(b"abc\0".to_vec())
653 /// .expect("CString::from_vec_with_nul failed"),
654 /// c"abc".to_owned()
655 /// );
656 /// ```
657 ///
658 /// An incorrectly formatted [`Vec`] will produce an error.
659 ///
660 /// ```
661 /// use std::ffi::{CString, FromVecWithNulError};
662 /// // Interior nul byte
663 /// let _: FromVecWithNulError = CString::from_vec_with_nul(b"a\0bc".to_vec()).unwrap_err();
664 /// // No nul byte
665 /// let _: FromVecWithNulError = CString::from_vec_with_nul(b"abc".to_vec()).unwrap_err();
666 /// ```
667 #[stable(feature = "cstring_from_vec_with_nul", since = "1.58.0")]
668 pub fn from_vec_with_nul(v: Vec<u8>) -> Result<Self, FromVecWithNulError> {
669 let nul_pos = memchr::memchr(0, &v);
670 match nul_pos {
671 Some(nul_pos) if nul_pos + 1 == v.len() => {
672 // SAFETY: We know there is only one nul byte, at the end
673 // of the vec.
674 Ok(unsafe { Self::_from_vec_with_nul_unchecked(v) })
675 }
676 Some(nul_pos) => Err(FromVecWithNulError {
677 error_kind: FromBytesWithNulErrorKind::InteriorNul(nul_pos),
678 bytes: v,
679 }),
680 None => Err(FromVecWithNulError {
681 error_kind: FromBytesWithNulErrorKind::NotNulTerminated,
682 bytes: v,
683 }),
684 }
685 }
686}
687
// Turns this `CString` into an empty string to prevent
// memory-unsafe code from working by accident. Inline
// to prevent LLVM from optimizing it away in debug builds.
#[stable(feature = "cstring_drop", since = "1.13.0")]
#[rustc_insignificant_dtor]
impl Drop for CString {
    #[inline]
    fn drop(&mut self) {
        // SAFETY: Invariant 1 on `CString` says `inner` has a length of at least
        // one, so index 0 is in bounds.
        unsafe {
            // Overwrite the first byte with the terminator.
            *self.inner.get_unchecked_mut(0) = 0;
        }
    }
}
701
702#[stable(feature = "rust1", since = "1.0.0")]
703impl ops::Deref for CString {
704 type Target = CStr;
705
706 #[inline]
707 fn deref(&self) -> &CStr {
708 unsafe { CStr::from_bytes_with_nul_unchecked(self.as_bytes_with_nul()) }
709 }
710}
711
712#[stable(feature = "rust1", since = "1.0.0")]
713impl fmt::Debug for CString {
714 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
715 fmt::Debug::fmt(&**self, f)
716 }
717}
718
719#[stable(feature = "cstring_into", since = "1.7.0")]
720impl From<CString> for Vec<u8> {
721 /// Converts a [`CString`] into a <code>[Vec]<[u8]></code>.
722 ///
723 /// The conversion consumes the [`CString`], and removes the terminating NUL byte.
724 #[inline]
725 fn from(s: CString) -> Vec<u8> {
726 s.into_bytes()
727 }
728}
729
730#[stable(feature = "cstr_default", since = "1.10.0")]
731impl Default for CString {
732 /// Creates an empty `CString`.
733 fn default() -> CString {
734 let a: &CStr = Default::default();
735 a.to_owned()
736 }
737}
738
739#[stable(feature = "cstr_borrow", since = "1.3.0")]
740impl Borrow<CStr> for CString {
741 #[inline]
742 fn borrow(&self) -> &CStr {
743 self
744 }
745}
746
747#[stable(feature = "cstring_from_cow_cstr", since = "1.28.0")]
748impl<'a> From<Cow<'a, CStr>> for CString {
749 /// Converts a `Cow<'a, CStr>` into a `CString`, by copying the contents if they are
750 /// borrowed.
751 #[inline]
752 fn from(s: Cow<'a, CStr>) -> Self {
753 s.into_owned()
754 }
755}
756
757#[stable(feature = "box_from_c_str", since = "1.17.0")]
758impl From<&CStr> for Box<CStr> {
759 /// Converts a `&CStr` into a `Box<CStr>`,
760 /// by copying the contents into a newly allocated [`Box`].
761 fn from(s: &CStr) -> Box<CStr> {
762 let boxed: Box<[u8]> = Box::from(s.to_bytes_with_nul());
763 unsafe { Box::from_raw(Box::into_raw(boxed) as *mut CStr) }
764 }
765}
766
767#[stable(feature = "box_from_mut_slice", since = "1.84.0")]
768impl From<&mut CStr> for Box<CStr> {
769 /// Converts a `&mut CStr` into a `Box<CStr>`,
770 /// by copying the contents into a newly allocated [`Box`].
771 fn from(s: &mut CStr) -> Box<CStr> {
772 Self::from(&*s)
773 }
774}
775
776#[stable(feature = "box_from_cow", since = "1.45.0")]
777impl From<Cow<'_, CStr>> for Box<CStr> {
778 /// Converts a `Cow<'a, CStr>` into a `Box<CStr>`,
779 /// by copying the contents if they are borrowed.
780 #[inline]
781 fn from(cow: Cow<'_, CStr>) -> Box<CStr> {
782 match cow {
783 Cow::Borrowed(s) => Box::from(s),
784 Cow::Owned(s) => Box::from(s),
785 }
786 }
787}
788
789#[stable(feature = "c_string_from_box", since = "1.18.0")]
790impl From<Box<CStr>> for CString {
791 /// Converts a <code>[Box]<[CStr]></code> into a [`CString`] without copying or allocating.
792 #[inline]
793 fn from(s: Box<CStr>) -> CString {
794 let raw = Box::into_raw(s) as *mut [u8];
795 CString { inner: unsafe { Box::from_raw(raw) } }
796 }
797}
798
799#[stable(feature = "cstring_from_vec_of_nonzerou8", since = "1.43.0")]
800impl From<Vec<NonZero<u8>>> for CString {
801 /// Converts a <code>[Vec]<[NonZero]<[u8]>></code> into a [`CString`] without
802 /// copying nor checking for inner nul bytes.
803 #[inline]
804 fn from(v: Vec<NonZero<u8>>) -> CString {
805 unsafe {
806 // Transmute `Vec<NonZero<u8>>` to `Vec<u8>`.
807 let v: Vec<u8> = {
808 // SAFETY:
809 // - transmuting between `NonZero<u8>` and `u8` is sound;
810 // - `alloc::Layout<NonZero<u8>> == alloc::Layout<u8>`.
811 let (ptr, len, cap): (*mut NonZero<u8>, _, _) = Vec::into_raw_parts(v);
812 Vec::from_raw_parts(ptr.cast::<u8>(), len, cap)
813 };
814 // SAFETY: `v` cannot contain nul bytes, given the type-level
815 // invariant of `NonZero<u8>`.
816 Self::_from_vec_unchecked(v)
817 }
818 }
819}
820
821impl FromStr for CString {
822 type Err = NulError;
823
824 /// Converts a string `s` into a [`CString`].
825 ///
826 /// This method is equivalent to [`CString::new`].
827 #[inline]
828 fn from_str(s: &str) -> Result<Self, Self::Err> {
829 Self::new(s)
830 }
831}
832
833impl TryFrom<CString> for String {
834 type Error = IntoStringError;
835
836 /// Converts a [`CString`] into a [`String`] if it contains valid UTF-8 data.
837 ///
838 /// This method is equivalent to [`CString::into_string`].
839 #[inline]
840 fn try_from(value: CString) -> Result<Self, Self::Error> {
841 value.into_string()
842 }
843}
844
845#[stable(feature = "more_box_slice_clone", since = "1.29.0")]
846impl Clone for Box<CStr> {
847 #[inline]
848 fn clone(&self) -> Self {
849 (**self).into()
850 }
851}
852
853#[stable(feature = "box_from_c_string", since = "1.20.0")]
854impl From<CString> for Box<CStr> {
855 /// Converts a [`CString`] into a <code>[Box]<[CStr]></code> without copying or allocating.
856 #[inline]
857 fn from(s: CString) -> Box<CStr> {
858 s.into_boxed_c_str()
859 }
860}
861
862#[stable(feature = "cow_from_cstr", since = "1.28.0")]
863impl<'a> From<CString> for Cow<'a, CStr> {
864 /// Converts a [`CString`] into an owned [`Cow`] without copying or allocating.
865 #[inline]
866 fn from(s: CString) -> Cow<'a, CStr> {
867 Cow::Owned(s)
868 }
869}
870
871#[stable(feature = "cow_from_cstr", since = "1.28.0")]
872impl<'a> From<&'a CStr> for Cow<'a, CStr> {
873 /// Converts a [`CStr`] into a borrowed [`Cow`] without copying or allocating.
874 #[inline]
875 fn from(s: &'a CStr) -> Cow<'a, CStr> {
876 Cow::Borrowed(s)
877 }
878}
879
880#[stable(feature = "cow_from_cstr", since = "1.28.0")]
881impl<'a> From<&'a CString> for Cow<'a, CStr> {
882 /// Converts a `&`[`CString`] into a borrowed [`Cow`] without copying or allocating.
883 #[inline]
884 fn from(s: &'a CString) -> Cow<'a, CStr> {
885 Cow::Borrowed(s.as_c_str())
886 }
887}
888
889#[cfg(target_has_atomic = "ptr")]
890#[stable(feature = "shared_from_slice2", since = "1.24.0")]
891impl From<CString> for Arc<CStr> {
892 /// Converts a [`CString`] into an <code>[Arc]<[CStr]></code> by moving the [`CString`]
893 /// data into a new [`Arc`] buffer.
894 #[inline]
895 fn from(s: CString) -> Arc<CStr> {
896 let arc: Arc<[u8]> = Arc::from(s.into_inner());
897 unsafe { Arc::from_raw(Arc::into_raw(arc) as *const CStr) }
898 }
899}
900
901#[cfg(target_has_atomic = "ptr")]
902#[stable(feature = "shared_from_slice2", since = "1.24.0")]
903impl From<&CStr> for Arc<CStr> {
904 /// Converts a `&CStr` into a `Arc<CStr>`,
905 /// by copying the contents into a newly allocated [`Arc`].
906 #[inline]
907 fn from(s: &CStr) -> Arc<CStr> {
908 let arc: Arc<[u8]> = Arc::from(s.to_bytes_with_nul());
909 unsafe { Arc::from_raw(Arc::into_raw(arc) as *const CStr) }
910 }
911}
912
913#[cfg(target_has_atomic = "ptr")]
914#[stable(feature = "shared_from_mut_slice", since = "1.84.0")]
915impl From<&mut CStr> for Arc<CStr> {
916 /// Converts a `&mut CStr` into a `Arc<CStr>`,
917 /// by copying the contents into a newly allocated [`Arc`].
918 #[inline]
919 fn from(s: &mut CStr) -> Arc<CStr> {
920 Arc::from(&*s)
921 }
922}
923
924#[stable(feature = "shared_from_slice2", since = "1.24.0")]
925impl From<CString> for Rc<CStr> {
926 /// Converts a [`CString`] into an <code>[Rc]<[CStr]></code> by moving the [`CString`]
927 /// data into a new [`Rc`] buffer.
928 #[inline]
929 fn from(s: CString) -> Rc<CStr> {
930 let rc: Rc<[u8]> = Rc::from(s.into_inner());
931 unsafe { Rc::from_raw(Rc::into_raw(rc) as *const CStr) }
932 }
933}
934
935#[stable(feature = "shared_from_slice2", since = "1.24.0")]
936impl From<&CStr> for Rc<CStr> {
937 /// Converts a `&CStr` into a `Rc<CStr>`,
938 /// by copying the contents into a newly allocated [`Rc`].
939 #[inline]
940 fn from(s: &CStr) -> Rc<CStr> {
941 let rc: Rc<[u8]> = Rc::from(s.to_bytes_with_nul());
942 unsafe { Rc::from_raw(Rc::into_raw(rc) as *const CStr) }
943 }
944}
945
946#[stable(feature = "shared_from_mut_slice", since = "1.84.0")]
947impl From<&mut CStr> for Rc<CStr> {
948 /// Converts a `&mut CStr` into a `Rc<CStr>`,
949 /// by copying the contents into a newly allocated [`Rc`].
950 #[inline]
951 fn from(s: &mut CStr) -> Rc<CStr> {
952 Rc::from(&*s)
953 }
954}
955
956#[cfg(not(no_global_oom_handling))]
957#[stable(feature = "more_rc_default_impls", since = "1.80.0")]
958impl Default for Rc<CStr> {
959 /// Creates an empty CStr inside an Rc
960 ///
961 /// This may or may not share an allocation with other Rcs on the same thread.
962 #[inline]
963 fn default() -> Self {
964 let rc = Rc::<[u8]>::from(*b"\0");
965 // `[u8]` has the same layout as `CStr`, and it is `NUL` terminated.
966 unsafe { Rc::from_raw(Rc::into_raw(rc) as *const CStr) }
967 }
968}
969
970#[stable(feature = "default_box_extra", since = "1.17.0")]
971impl Default for Box<CStr> {
972 fn default() -> Box<CStr> {
973 let boxed: Box<[u8]> = Box::from([0]);
974 unsafe { Box::from_raw(Box::into_raw(boxed) as *mut CStr) }
975 }
976}
977
978impl NulError {
979 /// Returns the position of the nul byte in the slice that caused
980 /// [`CString::new`] to fail.
981 ///
982 /// # Examples
983 ///
984 /// ```
985 /// use std::ffi::CString;
986 ///
987 /// let nul_error = CString::new("foo\0bar").unwrap_err();
988 /// assert_eq!(nul_error.nul_position(), 3);
989 ///
990 /// let nul_error = CString::new("foo bar\0").unwrap_err();
991 /// assert_eq!(nul_error.nul_position(), 7);
992 /// ```
993 #[must_use]
994 #[stable(feature = "rust1", since = "1.0.0")]
995 pub fn nul_position(&self) -> usize {
996 self.0
997 }
998
999 /// Consumes this error, returning the underlying vector of bytes which
1000 /// generated the error in the first place.
1001 ///
1002 /// # Examples
1003 ///
1004 /// ```
1005 /// use std::ffi::CString;
1006 ///
1007 /// let nul_error = CString::new("foo\0bar").unwrap_err();
1008 /// assert_eq!(nul_error.into_vec(), b"foo\0bar");
1009 /// ```
1010 #[must_use = "`self` will be dropped if the result is not used"]
1011 #[stable(feature = "rust1", since = "1.0.0")]
1012 pub fn into_vec(self) -> Vec<u8> {
1013 self.1
1014 }
1015}
1016
1017#[stable(feature = "rust1", since = "1.0.0")]
1018impl fmt::Display for NulError {
1019 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1020 write!(f, "nul byte found in provided data at position: {}", self.0)
1021 }
1022}
1023
1024#[stable(feature = "cstring_from_vec_with_nul", since = "1.58.0")]
1025impl fmt::Display for FromVecWithNulError {
1026 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1027 match self.error_kind {
1028 FromBytesWithNulErrorKind::InteriorNul(pos) => {
1029 write!(f, "data provided contains an interior nul byte at pos {pos}")
1030 }
1031 FromBytesWithNulErrorKind::NotNulTerminated => {
1032 write!(f, "data provided is not nul terminated")
1033 }
1034 }
1035 }
1036}
1037
1038impl IntoStringError {
1039 /// Consumes this error, returning original [`CString`] which generated the
1040 /// error.
1041 #[must_use = "`self` will be dropped if the result is not used"]
1042 #[stable(feature = "cstring_into", since = "1.7.0")]
1043 pub fn into_cstring(self) -> CString {
1044 self.inner
1045 }
1046
1047 /// Access the underlying UTF-8 error that was the cause of this error.
1048 #[must_use]
1049 #[stable(feature = "cstring_into", since = "1.7.0")]
1050 pub fn utf8_error(&self) -> Utf8Error {
1051 self.error
1052 }
1053}
1054
1055impl IntoStringError {
1056 fn description(&self) -> &str {
1057 "C string contained non-utf8 bytes"
1058 }
1059}
1060
1061#[stable(feature = "cstring_into", since = "1.7.0")]
1062impl fmt::Display for IntoStringError {
1063 #[allow(deprecated, deprecated_in_future)]
1064 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1065 self.description().fmt(f)
1066 }
1067}
1068
1069#[stable(feature = "cstr_borrow", since = "1.3.0")]
1070impl ToOwned for CStr {
1071 type Owned = CString;
1072
1073 fn to_owned(&self) -> CString {
1074 CString { inner: self.to_bytes_with_nul().into() }
1075 }
1076
1077 fn clone_into(&self, target: &mut CString) {
1078 let mut b = mem::take(&mut target.inner).into_vec();
1079 self.to_bytes_with_nul().clone_into(&mut b);
1080 target.inner = b.into_boxed_slice();
1081 }
1082}
1083
1084#[stable(feature = "cstring_asref", since = "1.7.0")]
1085impl From<&CStr> for CString {
1086 /// Converts a <code>&[CStr]</code> into a [`CString`]
1087 /// by copying the contents into a new allocation.
1088 fn from(s: &CStr) -> CString {
1089 s.to_owned()
1090 }
1091}
1092
1093#[stable(feature = "cstring_asref", since = "1.7.0")]
1094impl ops::Index<ops::RangeFull> for CString {
1095 type Output = CStr;
1096
1097 #[inline]
1098 fn index(&self, _index: ops::RangeFull) -> &CStr {
1099 self
1100 }
1101}
1102
1103#[stable(feature = "cstring_asref", since = "1.7.0")]
1104impl AsRef<CStr> for CString {
1105 #[inline]
1106 fn as_ref(&self) -> &CStr {
1107 self
1108 }
1109}
1110
1111impl CStr {
1112 /// Converts a `CStr` into a <code>[Cow]<[str]></code>.
1113 ///
1114 /// If the contents of the `CStr` are valid UTF-8 data, this
1115 /// function will return a <code>[Cow]::[Borrowed]\(&[str])</code>
1116 /// with the corresponding <code>&[str]</code> slice. Otherwise, it will
1117 /// replace any invalid UTF-8 sequences with
1118 /// [`U+FFFD REPLACEMENT CHARACTER`][U+FFFD] and return a
1119 /// <code>[Cow]::[Owned]\(&[str])</code> with the result.
1120 ///
1121 /// [str]: prim@str "str"
1122 /// [Borrowed]: Cow::Borrowed
1123 /// [Owned]: Cow::Owned
1124 /// [U+FFFD]: core::char::REPLACEMENT_CHARACTER "std::char::REPLACEMENT_CHARACTER"
1125 ///
1126 /// # Examples
1127 ///
1128 /// Calling `to_string_lossy` on a `CStr` containing valid UTF-8. The leading
1129 /// `c` on the string literal denotes a `CStr`.
1130 ///
1131 /// ```
1132 /// use std::borrow::Cow;
1133 ///
1134 /// assert_eq!(c"Hello World".to_string_lossy(), Cow::Borrowed("Hello World"));
1135 /// ```
1136 ///
1137 /// Calling `to_string_lossy` on a `CStr` containing invalid UTF-8:
1138 ///
1139 /// ```
1140 /// use std::borrow::Cow;
1141 ///
1142 /// assert_eq!(
1143 /// c"Hello \xF0\x90\x80World".to_string_lossy(),
1144 /// Cow::Owned(String::from("Hello �World")) as Cow<'_, str>
1145 /// );
1146 /// ```
1147 #[rustc_allow_incoherent_impl]
1148 #[must_use = "this returns the result of the operation, \
1149 without modifying the original"]
1150 #[stable(feature = "cstr_to_str", since = "1.4.0")]
1151 pub fn to_string_lossy(&self) -> Cow<'_, str> {
1152 String::from_utf8_lossy(self.to_bytes())
1153 }
1154
1155 /// Converts a <code>[Box]<[CStr]></code> into a [`CString`] without copying or allocating.
1156 ///
1157 /// # Examples
1158 ///
1159 /// ```
1160 /// use std::ffi::{CStr, CString};
1161 ///
1162 /// let boxed: Box<CStr> = Box::from(c"foo");
1163 /// let c_string: CString = c"foo".to_owned();
1164 ///
1165 /// assert_eq!(boxed.into_c_string(), c_string);
1166 /// ```
1167 #[rustc_allow_incoherent_impl]
1168 #[must_use = "`self` will be dropped if the result is not used"]
1169 #[stable(feature = "into_boxed_c_str", since = "1.20.0")]
1170 pub fn into_c_string(self: Box<Self>) -> CString {
1171 CString::from(self)
1172 }
1173}
1174
1175#[stable(feature = "rust1", since = "1.0.0")]
1176impl core::error::Error for NulError {
1177 #[allow(deprecated)]
1178 fn description(&self) -> &str {
1179 "nul byte found in data"
1180 }
1181}
1182
// Marks `FromVecWithNulError` as an error type. The impl body is empty, so every
// `core::error::Error` method keeps its default implementation.
#[stable(feature = "cstring_from_vec_with_nul", since = "1.58.0")]
impl core::error::Error for FromVecWithNulError {}
1185
1186#[stable(feature = "cstring_into", since = "1.7.0")]
1187impl core::error::Error for IntoStringError {
1188 #[allow(deprecated)]
1189 fn description(&self) -> &str {
1190 "C string contained non-utf8 bytes"
1191 }
1192
1193 fn source(&self) -> Option<&(dyn core::error::Error + 'static)> {
1194 Some(&self.error)
1195 }
1196}