Skip to main content

core/bstr/
mod.rs

1//! The `ByteStr` type and trait implementations.
2
3mod traits;
4
5#[unstable(feature = "bstr_internals", issue = "none")]
6pub use traits::{impl_partial_eq, impl_partial_eq_n, impl_partial_eq_ord};
7
8use crate::borrow::{Borrow, BorrowMut};
9use crate::fmt;
10use crate::ops::{Deref, DerefMut, DerefPure};
11
12/// A wrapper for `&[u8]` representing a human-readable string that's conventionally, but not
13/// always, UTF-8.
14///
15/// Unlike `&str`, this type permits non-UTF-8 contents, making it suitable for user input,
16/// non-native filenames (as `Path` only supports native filenames), and other applications that
17/// need to round-trip whatever data the user provides.
18///
19/// For an owned, growable byte string buffer, use
20/// [`ByteString`](../../std/bstr/struct.ByteString.html).
21///
22/// `ByteStr` implements `Deref` to `[u8]`, so all methods available on `[u8]` are available on
23/// `ByteStr`.
24///
25/// # Representation
26///
27/// A `&ByteStr` has the same representation as a `&str`. That is, a `&ByteStr` is a wide pointer
28/// which includes a pointer to some bytes and a length.
29///
30/// # Trait implementations
31///
32/// The `ByteStr` type has a number of trait implementations, and in particular, defines equality
33/// and comparisons between `&ByteStr`, `&str`, and `&[u8]`, for convenience.
34///
35/// The `Debug` implementation for `ByteStr` shows its bytes as a normal string, with invalid UTF-8
36/// presented as hex escape sequences.
37///
38/// The `Display` implementation behaves as if the `ByteStr` were first lossily converted to a
39/// `str`, with invalid UTF-8 presented as the Unicode replacement character (�).
40#[unstable(feature = "bstr", issue = "134915")]
41#[repr(transparent)]
42#[doc(alias = "BStr")]
43pub struct ByteStr(pub [u8]);
44
45impl ByteStr {
46    /// Creates a `ByteStr` slice from anything that can be converted to a byte slice.
47    ///
48    /// This is a zero-cost conversion.
49    ///
50    /// # Example
51    ///
52    /// You can create a `ByteStr` from a byte array, a byte slice or a string slice:
53    ///
54    /// ```
55    /// # #![feature(bstr)]
56    /// # use std::bstr::ByteStr;
57    /// let a = ByteStr::new(b"abc");
58    /// let b = ByteStr::new(&b"abc"[..]);
59    /// let c = ByteStr::new("abc");
60    ///
61    /// assert_eq!(a, b);
62    /// assert_eq!(a, c);
63    /// ```
64    #[inline]
65    #[unstable(feature = "bstr", issue = "134915")]
66    #[rustc_const_unstable(feature = "const_convert", issue = "143773")]
67    pub const fn new<B: ?Sized + [const] AsRef<[u8]>>(bytes: &B) -> &Self {
68        ByteStr::from_bytes(bytes.as_ref())
69    }
70
71    /// Returns the same string as `&ByteStr`.
72    ///
73    /// This method is redundant when used directly on `&ByteStr`, but
74    /// it helps dereferencing other "container" types,
75    /// for example `Box<ByteStr>` or `Arc<ByteStr>`.
76    #[inline]
77    #[unstable(feature = "bstr", issue = "134915")]
78    pub const fn as_byte_str(&self) -> &ByteStr {
79        self
80    }
81
82    /// Returns the same string as `&mut ByteStr`.
83    ///
84    /// This method is redundant when used directly on `&mut ByteStr`, but
85    /// it helps dereferencing other "container" types,
86    /// for example `Box<ByteStr>` or `MutexGuard<ByteStr>`.
87    #[inline]
88    #[unstable(feature = "bstr", issue = "134915")]
89    pub const fn as_mut_byte_str(&mut self) -> &mut ByteStr {
90        self
91    }
92
93    #[doc(hidden)]
94    #[unstable(feature = "bstr_internals", issue = "none")]
95    #[inline]
96    #[rustc_const_unstable(feature = "bstr_internals", issue = "none")]
97    pub const fn from_bytes(slice: &[u8]) -> &Self {
98        // SAFETY: `ByteStr` is a transparent wrapper around `[u8]`, so we can turn a reference to
99        // the wrapped type into a reference to the wrapper type.
100        unsafe { &*(slice as *const [u8] as *const Self) }
101    }
102
103    #[doc(hidden)]
104    #[unstable(feature = "bstr_internals", issue = "none")]
105    #[inline]
106    #[rustc_const_unstable(feature = "bstr_internals", issue = "none")]
107    pub const fn from_bytes_mut(slice: &mut [u8]) -> &mut Self {
108        // SAFETY: `ByteStr` is a transparent wrapper around `[u8]`, so we can turn a reference to
109        // the wrapped type into a reference to the wrapper type.
110        unsafe { &mut *(slice as *mut [u8] as *mut Self) }
111    }
112
113    #[doc(hidden)]
114    #[unstable(feature = "bstr_internals", issue = "none")]
115    #[inline]
116    #[rustc_const_unstable(feature = "bstr_internals", issue = "none")]
117    pub const fn as_bytes(&self) -> &[u8] {
118        &self.0
119    }
120
121    #[doc(hidden)]
122    #[unstable(feature = "bstr_internals", issue = "none")]
123    #[inline]
124    #[rustc_const_unstable(feature = "bstr_internals", issue = "none")]
125    pub const fn as_bytes_mut(&mut self) -> &mut [u8] {
126        &mut self.0
127    }
128}
129
130#[unstable(feature = "bstr", issue = "134915")]
131#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
132impl const Deref for ByteStr {
133    type Target = [u8];
134
135    #[inline]
136    fn deref(&self) -> &[u8] {
137        &self.0
138    }
139}
140
141#[unstable(feature = "bstr", issue = "134915")]
142#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
143impl const DerefMut for ByteStr {
144    #[inline]
145    fn deref_mut(&mut self) -> &mut [u8] {
146        &mut self.0
147    }
148}
149
150#[unstable(feature = "deref_pure_trait", issue = "87121")]
151unsafe impl DerefPure for ByteStr {}
152
153#[unstable(feature = "bstr", issue = "134915")]
154impl fmt::Debug for ByteStr {
155    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
156        write!(f, "\"")?;
157        for chunk in self.utf8_chunks() {
158            for c in chunk.valid().chars() {
159                match c {
160                    '\0' => write!(f, "\\0")?,
161                    '\x01'..='\x7f' => write!(f, "{}", (c as u8).escape_ascii())?,
162                    _ => write!(f, "{}", c.escape_debug())?,
163                }
164            }
165            write!(f, "{}", chunk.invalid().escape_ascii())?;
166        }
167        write!(f, "\"")?;
168        Ok(())
169    }
170}
171
172#[unstable(feature = "bstr", issue = "134915")]
173impl fmt::Display for ByteStr {
174    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
175        let nchars: usize = self
176            .utf8_chunks()
177            .map(|chunk| {
178                chunk.valid().chars().count() + if chunk.invalid().is_empty() { 0 } else { 1 }
179            })
180            .sum();
181
182        let padding = f.width().unwrap_or(0).saturating_sub(nchars);
183        let fill = f.fill();
184
185        let (lpad, rpad) = match f.align() {
186            Some(fmt::Alignment::Right) => (padding, 0),
187            Some(fmt::Alignment::Center) => {
188                let half = padding / 2;
189                (half, half + padding % 2)
190            }
191            // Either alignment is not specified or it's left aligned
192            // which behaves the same with padding
193            _ => (0, padding),
194        };
195
196        for _ in 0..lpad {
197            write!(f, "{fill}")?;
198        }
199
200        for chunk in self.utf8_chunks() {
201            f.write_str(chunk.valid())?;
202            if !chunk.invalid().is_empty() {
203                f.write_str("\u{FFFD}")?;
204            }
205        }
206
207        for _ in 0..rpad {
208            write!(f, "{fill}")?;
209        }
210
211        Ok(())
212    }
213}
214
215#[unstable(feature = "bstr", issue = "134915")]
216#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
217impl const AsRef<[u8]> for ByteStr {
218    #[inline]
219    fn as_ref(&self) -> &[u8] {
220        &self.0
221    }
222}
223
224#[unstable(feature = "bstr", issue = "134915")]
225#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
226impl const AsRef<ByteStr> for ByteStr {
227    #[inline]
228    fn as_ref(&self) -> &ByteStr {
229        self
230    }
231}
232
233// `impl AsRef<ByteStr> for [u8]` omitted to avoid widespread inference failures
234
235#[unstable(feature = "bstr", issue = "134915")]
236#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
237impl const AsRef<ByteStr> for str {
238    #[inline]
239    fn as_ref(&self) -> &ByteStr {
240        ByteStr::new(self)
241    }
242}
243
244#[unstable(feature = "bstr", issue = "134915")]
245#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
246impl const AsMut<[u8]> for ByteStr {
247    #[inline]
248    fn as_mut(&mut self) -> &mut [u8] {
249        &mut self.0
250    }
251}
252
253// `impl AsMut<ByteStr> for [u8]` omitted to avoid widespread inference failures
254
255// `impl Borrow<ByteStr> for [u8]` omitted to avoid widespread inference failures
256
257// `impl Borrow<ByteStr> for str` omitted to avoid widespread inference failures
258
259#[unstable(feature = "bstr", issue = "134915")]
260#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
261impl const Borrow<[u8]> for ByteStr {
262    #[inline]
263    fn borrow(&self) -> &[u8] {
264        &self.0
265    }
266}
267
268// `impl BorrowMut<ByteStr> for [u8]` omitted to avoid widespread inference failures
269
270#[unstable(feature = "bstr", issue = "134915")]
271#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
272impl const BorrowMut<[u8]> for ByteStr {
273    #[inline]
274    fn borrow_mut(&mut self) -> &mut [u8] {
275        &mut self.0
276    }
277}
278
279#[unstable(feature = "bstr", issue = "134915")]
280impl<'a> Default for &'a ByteStr {
281    fn default() -> Self {
282        ByteStr::from_bytes(b"")
283    }
284}
285
286#[unstable(feature = "bstr", issue = "134915")]
287impl<'a> Default for &'a mut ByteStr {
288    fn default() -> Self {
289        ByteStr::from_bytes_mut(&mut [])
290    }
291}
292
293// Omitted due to inference failures
294//
295// #[unstable(feature = "bstr", issue = "134915")]
296// impl<'a, const N: usize> From<&'a [u8; N]> for &'a ByteStr {
297//     #[inline]
298//     fn from(s: &'a [u8; N]) -> Self {
299//         ByteStr::from_bytes(s)
300//     }
301// }
302//
303// #[unstable(feature = "bstr", issue = "134915")]
304// impl<'a> From<&'a [u8]> for &'a ByteStr {
305//     #[inline]
306//     fn from(s: &'a [u8]) -> Self {
307//         ByteStr::from_bytes(s)
308//     }
309// }
310
311// Omitted due to slice-from-array-issue-113238:
312//
313// #[unstable(feature = "bstr", issue = "134915")]
314// impl<'a> From<&'a ByteStr> for &'a [u8] {
315//     #[inline]
316//     fn from(s: &'a ByteStr) -> Self {
317//         &s.0
318//     }
319// }
320//
321// #[unstable(feature = "bstr", issue = "134915")]
322// impl<'a> From<&'a mut ByteStr> for &'a mut [u8] {
323//     #[inline]
324//     fn from(s: &'a mut ByteStr) -> Self {
325//         &mut s.0
326//     }
327// }
328
329// Omitted due to inference failures
330//
331// #[unstable(feature = "bstr", issue = "134915")]
332// impl<'a> From<&'a str> for &'a ByteStr {
333//     #[inline]
334//     fn from(s: &'a str) -> Self {
335//         ByteStr::from_bytes(s.as_bytes())
336//     }
337// }
338
339#[unstable(feature = "bstr", issue = "134915")]
340#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
341impl<'a> const TryFrom<&'a ByteStr> for &'a str {
342    type Error = crate::str::Utf8Error;
343
344    #[inline]
345    fn try_from(s: &'a ByteStr) -> Result<Self, Self::Error> {
346        crate::str::from_utf8(&s.0)
347    }
348}
349
350#[unstable(feature = "bstr", issue = "134915")]
351#[rustc_const_unstable(feature = "const_convert", issue = "143773")]
352impl<'a> const TryFrom<&'a mut ByteStr> for &'a mut str {
353    type Error = crate::str::Utf8Error;
354
355    #[inline]
356    fn try_from(s: &'a mut ByteStr) -> Result<Self, Self::Error> {
357        crate::str::from_utf8_mut(&mut s.0)
358    }
359}