alloc/string.rs
1//! A UTF-8โencoded, growable string.
2//!
3//! This module contains the [`String`] type, the [`ToString`] trait for
4//! converting to strings, and several error types that may result from
5//! working with [`String`]s.
6//!
7//! # Examples
8//!
9//! There are multiple ways to create a new [`String`] from a string literal:
10//!
11//! ```
12//! let s = "Hello".to_string();
13//!
14//! let s = String::from("world");
15//! let s: String = "also this".into();
16//! ```
17//!
18//! You can create a new [`String`] from an existing one by concatenating with
19//! `+`:
20//!
21//! ```
22//! let s = "Hello".to_string();
23//!
24//! let message = s + " world!";
25//! ```
26//!
27//! If you have a vector of valid UTF-8 bytes, you can make a [`String`] out of
28//! it. You can do the reverse too.
29//!
30//! ```
31//! let sparkle_heart = vec![240, 159, 146, 150];
32//!
33//! // We know these bytes are valid, so we'll use `unwrap()`.
34//! let sparkle_heart = String::from_utf8(sparkle_heart).unwrap();
35//!
36//! assert_eq!("๐", sparkle_heart);
37//!
38//! let bytes = sparkle_heart.into_bytes();
39//!
40//! assert_eq!(bytes, [240, 159, 146, 150]);
41//! ```
42
43#![stable(feature = "rust1", since = "1.0.0")]
44
45use core::error::Error;
46use core::iter::FusedIterator;
47#[cfg(not(no_global_oom_handling))]
48use core::iter::from_fn;
49#[cfg(not(no_global_oom_handling))]
50use core::num::Saturating;
51#[cfg(not(no_global_oom_handling))]
52use core::ops::Add;
53#[cfg(not(no_global_oom_handling))]
54use core::ops::AddAssign;
55use core::ops::{self, Range, RangeBounds};
56use core::str::pattern::{Pattern, Utf8Pattern};
57use core::{fmt, hash, ptr, slice};
58
59#[cfg(not(no_global_oom_handling))]
60use crate::alloc::Allocator;
61#[cfg(not(no_global_oom_handling))]
62use crate::borrow::{Cow, ToOwned};
63use crate::boxed::Box;
64use crate::collections::TryReserveError;
65use crate::str::{self, CharIndices, Chars, Utf8Error, from_utf8_unchecked_mut};
66#[cfg(not(no_global_oom_handling))]
67use crate::str::{FromStr, from_boxed_utf8_unchecked};
68use crate::vec::{self, Vec};
69
70/// A UTF-8โencoded, growable string.
71///
72/// `String` is the most common string type. It has ownership over the contents
73/// of the string, stored in a heap-allocated buffer (see [Representation](#representation)).
74/// It is closely related to its borrowed counterpart, the primitive [`str`].
75///
76/// # Examples
77///
78/// You can create a `String` from [a literal string][`&str`] with [`String::from`]:
79///
80/// [`String::from`]: From::from
81///
82/// ```
83/// let hello = String::from("Hello, world!");
84/// ```
85///
86/// You can append a [`char`] to a `String` with the [`push`] method, and
87/// append a [`&str`] with the [`push_str`] method:
88///
89/// ```
90/// let mut hello = String::from("Hello, ");
91///
92/// hello.push('w');
93/// hello.push_str("orld!");
94/// ```
95///
96/// [`push`]: String::push
97/// [`push_str`]: String::push_str
98///
99/// If you have a vector of UTF-8 bytes, you can create a `String` from it with
100/// the [`from_utf8`] method:
101///
102/// ```
103/// // some bytes, in a vector
104/// let sparkle_heart = vec![240, 159, 146, 150];
105///
106/// // We know these bytes are valid, so we'll use `unwrap()`.
107/// let sparkle_heart = String::from_utf8(sparkle_heart).unwrap();
108///
109/// assert_eq!("๐", sparkle_heart);
110/// ```
111///
112/// [`from_utf8`]: String::from_utf8
113///
114/// # UTF-8
115///
116/// `String`s are always valid UTF-8. If you need a non-UTF-8 string, consider
117/// [`OsString`]. It is similar, but without the UTF-8 constraint. Because UTF-8
118/// is a variable width encoding, `String`s are typically smaller than an array of
119/// the same `char`s:
120///
121/// ```
122/// // `s` is ASCII which represents each `char` as one byte
123/// let s = "hello";
124/// assert_eq!(s.len(), 5);
125///
126/// // A `char` array with the same contents would be longer because
127/// // every `char` is four bytes
128/// let s = ['h', 'e', 'l', 'l', 'o'];
129/// let size: usize = s.into_iter().map(|c| size_of_val(&c)).sum();
130/// assert_eq!(size, 20);
131///
132/// // However, for non-ASCII strings, the difference will be smaller
133/// // and sometimes they are the same
134/// let s = "๐๐๐๐๐";
135/// assert_eq!(s.len(), 20);
136///
137/// let s = ['๐', '๐', '๐', '๐', '๐'];
138/// let size: usize = s.into_iter().map(|c| size_of_val(&c)).sum();
139/// assert_eq!(size, 20);
140/// ```
141///
142/// This raises interesting questions as to how `s[i]` should work.
143/// What should `i` be here? Several options include byte indices and
144/// `char` indices but, because of UTF-8 encoding, only byte indices
145/// would provide constant time indexing. Getting the `i`th `char`, for
146/// example, is available using [`chars`]:
147///
148/// ```
149/// let s = "hello";
150/// let third_character = s.chars().nth(2);
151/// assert_eq!(third_character, Some('l'));
152///
153/// let s = "๐๐๐๐๐";
154/// let third_character = s.chars().nth(2);
155/// assert_eq!(third_character, Some('๐'));
156/// ```
157///
158/// Next, what should `s[i]` return? Because indexing returns a reference
159/// to underlying data it could be `&u8`, `&[u8]`, or something similar.
160/// Since we're only providing one index, `&u8` makes the most sense but that
161/// might not be what the user expects and can be explicitly achieved with
162/// [`as_bytes()`]:
163///
164/// ```
165/// // The first byte is 104 - the byte value of `'h'`
166/// let s = "hello";
167/// assert_eq!(s.as_bytes()[0], 104);
168/// // or
169/// assert_eq!(s.as_bytes()[0], b'h');
170///
171/// // The first byte is 240 which isn't obviously useful
172/// let s = "๐๐๐๐๐";
173/// assert_eq!(s.as_bytes()[0], 240);
174/// ```
175///
176/// Due to these ambiguities/restrictions, indexing with a `usize` is simply
177/// forbidden:
178///
179/// ```compile_fail,E0277
180/// let s = "hello";
181///
182/// // The following will not compile!
183/// println!("The first letter of s is {}", s[0]);
184/// ```
185///
186/// It is more clear, however, how `&s[i..j]` should work (that is,
187/// indexing with a range). It should accept byte indices (to be constant-time)
188/// and return a `&str` which is UTF-8 encoded. This is also called "string slicing".
189/// Note this will panic if the byte indices provided are not character
190/// boundaries - see [`is_char_boundary`] for more details. See the implementations
191/// for [`SliceIndex<str>`] for more details on string slicing. For a non-panicking
192/// version of string slicing, see [`get`].
193///
194/// [`OsString`]: ../../std/ffi/struct.OsString.html "ffi::OsString"
195/// [`SliceIndex<str>`]: core::slice::SliceIndex
196/// [`as_bytes()`]: str::as_bytes
197/// [`get`]: str::get
198/// [`is_char_boundary`]: str::is_char_boundary
199///
200/// The [`bytes`] and [`chars`] methods return iterators over the bytes and
201/// codepoints of the string, respectively. To iterate over codepoints along
202/// with byte indices, use [`char_indices`].
203///
204/// [`bytes`]: str::bytes
205/// [`chars`]: str::chars
206/// [`char_indices`]: str::char_indices
207///
208/// # Deref
209///
210/// `String` implements <code>[Deref]<Target = [str]></code>, and so inherits all of [`str`]'s
211/// methods. In addition, this means that you can pass a `String` to a
212/// function which takes a [`&str`] by using an ampersand (`&`):
213///
214/// ```
215/// fn takes_str(s: &str) { }
216///
217/// let s = String::from("Hello");
218///
219/// takes_str(&s);
220/// ```
221///
222/// This will create a [`&str`] from the `String` and pass it in. This
223/// conversion is very inexpensive, and so generally, functions will accept
224/// [`&str`]s as arguments unless they need a `String` for some specific
225/// reason.
226///
227/// In certain cases Rust doesn't have enough information to make this
228/// conversion, known as [`Deref`] coercion. In the following example a string
229/// slice [`&'a str`][`&str`] implements the trait `TraitExample`, and the function
230/// `example_func` takes anything that implements the trait. In this case Rust
231/// would need to make two implicit conversions, which Rust doesn't have the
232/// means to do. For that reason, the following example will not compile.
233///
234/// ```compile_fail,E0277
235/// trait TraitExample {}
236///
237/// impl<'a> TraitExample for &'a str {}
238///
239/// fn example_func<A: TraitExample>(example_arg: A) {}
240///
241/// let example_string = String::from("example_string");
242/// example_func(&example_string);
243/// ```
244///
245/// There are two options that would work instead. The first would be to
246/// change the line `example_func(&example_string);` to
247/// `example_func(example_string.as_str());`, using the method [`as_str()`]
248/// to explicitly extract the string slice containing the string. The second
249/// way changes `example_func(&example_string);` to
250/// `example_func(&*example_string);`. In this case we are dereferencing a
251/// `String` to a [`str`], then referencing the [`str`] back to
252/// [`&str`]. The second way is more idiomatic, however both work to do the
253/// conversion explicitly rather than relying on the implicit conversion.
254///
255/// # Representation
256///
257/// A `String` is made up of three components: a pointer to some bytes, a
258/// length, and a capacity. The pointer points to the internal buffer which `String`
259/// uses to store its data. The length is the number of bytes currently stored
260/// in the buffer, and the capacity is the size of the buffer in bytes. As such,
261/// the length will always be less than or equal to the capacity.
262///
263/// This buffer is always stored on the heap.
264///
265/// You can look at these with the [`as_ptr`], [`len`], and [`capacity`]
266/// methods:
267///
268/// ```
269/// let story = String::from("Once upon a time...");
270///
271/// // Deconstruct the String into parts.
272/// let (ptr, len, capacity) = story.into_raw_parts();
273///
274/// // story has nineteen bytes
275/// assert_eq!(19, len);
276///
277/// // We can re-build a String out of ptr, len, and capacity. This is all
278/// // unsafe because we are responsible for making sure the components are
279/// // valid:
280/// let s = unsafe { String::from_raw_parts(ptr, len, capacity) } ;
281///
282/// assert_eq!(String::from("Once upon a time..."), s);
283/// ```
284///
285/// [`as_ptr`]: str::as_ptr
286/// [`len`]: String::len
287/// [`capacity`]: String::capacity
288///
289/// If a `String` has enough capacity, adding elements to it will not
290/// re-allocate. For example, consider this program:
291///
292/// ```
293/// let mut s = String::new();
294///
295/// println!("{}", s.capacity());
296///
297/// for _ in 0..5 {
298/// s.push_str("hello");
299/// println!("{}", s.capacity());
300/// }
301/// ```
302///
303/// This will output the following:
304///
305/// ```text
306/// 0
307/// 8
308/// 16
309/// 16
310/// 32
311/// 32
312/// ```
313///
314/// At first, we have no memory allocated at all, but as we append to the
315/// string, it increases its capacity appropriately. If we instead use the
316/// [`with_capacity`] method to allocate the correct capacity initially:
317///
318/// ```
319/// let mut s = String::with_capacity(25);
320///
321/// println!("{}", s.capacity());
322///
323/// for _ in 0..5 {
324/// s.push_str("hello");
325/// println!("{}", s.capacity());
326/// }
327/// ```
328///
329/// [`with_capacity`]: String::with_capacity
330///
331/// We end up with a different output:
332///
333/// ```text
334/// 25
335/// 25
336/// 25
337/// 25
338/// 25
339/// 25
340/// ```
341///
342/// Here, there's no need to allocate more memory inside the loop.
343///
344/// [str]: prim@str "str"
345/// [`str`]: prim@str "str"
346/// [`&str`]: prim@str "&str"
347/// [Deref]: core::ops::Deref "ops::Deref"
348/// [`Deref`]: core::ops::Deref "ops::Deref"
349/// [`as_str()`]: String::as_str
350#[derive(PartialEq, PartialOrd, Eq, Ord)]
351#[stable(feature = "rust1", since = "1.0.0")]
352#[lang = "String"]
353pub struct String {
354 vec: Vec<u8>,
355}
356
357/// A possible error value when converting a `String` from a UTF-8 byte vector.
358///
359/// This type is the error type for the [`from_utf8`] method on [`String`]. It
360/// is designed in such a way to carefully avoid reallocations: the
361/// [`into_bytes`] method will give back the byte vector that was used in the
362/// conversion attempt.
363///
364/// [`from_utf8`]: String::from_utf8
365/// [`into_bytes`]: FromUtf8Error::into_bytes
366///
367/// The [`Utf8Error`] type provided by [`std::str`] represents an error that may
368/// occur when converting a slice of [`u8`]s to a [`&str`]. In this sense, it's
369/// an analogue to `FromUtf8Error`, and you can get one from a `FromUtf8Error`
370/// through the [`utf8_error`] method.
371///
372/// [`Utf8Error`]: str::Utf8Error "std::str::Utf8Error"
373/// [`std::str`]: core::str "std::str"
374/// [`&str`]: prim@str "&str"
375/// [`utf8_error`]: FromUtf8Error::utf8_error
376///
377/// # Examples
378///
379/// ```
380/// // some invalid bytes, in a vector
381/// let bytes = vec![0, 159];
382///
383/// let value = String::from_utf8(bytes);
384///
385/// assert!(value.is_err());
386/// assert_eq!(vec![0, 159], value.unwrap_err().into_bytes());
387/// ```
388#[stable(feature = "rust1", since = "1.0.0")]
389#[cfg_attr(not(no_global_oom_handling), derive(Clone))]
390#[derive(Debug, PartialEq, Eq)]
391pub struct FromUtf8Error {
392 bytes: Vec<u8>,
393 error: Utf8Error,
394}
395
396/// A possible error value when converting a `String` from a UTF-16 byte slice.
397///
398/// This type is the error type for the [`from_utf16`] method on [`String`].
399///
400/// [`from_utf16`]: String::from_utf16
401///
402/// # Examples
403///
404/// ```
405/// // ๐mu<invalid>ic
406/// let v = &[0xD834, 0xDD1E, 0x006d, 0x0075,
407/// 0xD800, 0x0069, 0x0063];
408///
409/// assert!(String::from_utf16(v).is_err());
410/// ```
411#[stable(feature = "rust1", since = "1.0.0")]
412#[derive(Debug)]
413pub struct FromUtf16Error {
414 kind: FromUtf16ErrorKind,
415}
416
417#[cfg_attr(no_global_oom_handling, expect(dead_code))]
418#[derive(Clone, PartialEq, Eq, Debug)]
419enum FromUtf16ErrorKind {
420 LoneSurrogate,
421 OddBytes,
422}
423
424impl String {
425 /// Creates a new empty `String`.
426 ///
427 /// Given that the `String` is empty, this will not allocate any initial
428 /// buffer. While that means that this initial operation is very
429 /// inexpensive, it may cause excessive allocation later when you add
430 /// data. If you have an idea of how much data the `String` will hold,
431 /// consider the [`with_capacity`] method to prevent excessive
432 /// re-allocation.
433 ///
434 /// [`with_capacity`]: String::with_capacity
435 ///
436 /// # Examples
437 ///
438 /// ```
439 /// let s = String::new();
440 /// ```
441 #[inline]
442 #[rustc_const_stable(feature = "const_string_new", since = "1.39.0")]
443 #[rustc_diagnostic_item = "string_new"]
444 #[stable(feature = "rust1", since = "1.0.0")]
445 #[must_use]
446 pub const fn new() -> String {
447 String { vec: Vec::new() }
448 }
449
450 /// Creates a new empty `String` with at least the specified capacity.
451 ///
452 /// `String`s have an internal buffer to hold their data. The capacity is
453 /// the length of that buffer, and can be queried with the [`capacity`]
454 /// method. This method creates an empty `String`, but one with an initial
455 /// buffer that can hold at least `capacity` bytes. This is useful when you
456 /// may be appending a bunch of data to the `String`, reducing the number of
457 /// reallocations it needs to do.
458 ///
459 /// [`capacity`]: String::capacity
460 ///
461 /// If the given capacity is `0`, no allocation will occur, and this method
462 /// is identical to the [`new`] method.
463 ///
464 /// [`new`]: String::new
465 ///
466 /// # Panics
467 ///
468 /// Panics if the capacity exceeds `isize::MAX` _bytes_.
469 ///
470 /// # Examples
471 ///
472 /// ```
473 /// let mut s = String::with_capacity(10);
474 ///
475 /// // The String contains no chars, even though it has capacity for more
476 /// assert_eq!(s.len(), 0);
477 ///
478 /// // These are all done without reallocating...
479 /// let cap = s.capacity();
480 /// for _ in 0..10 {
481 /// s.push('a');
482 /// }
483 ///
484 /// assert_eq!(s.capacity(), cap);
485 ///
486 /// // ...but this may make the string reallocate
487 /// s.push('a');
488 /// ```
489 #[cfg(not(no_global_oom_handling))]
490 #[inline]
491 #[stable(feature = "rust1", since = "1.0.0")]
492 #[must_use]
493 pub fn with_capacity(capacity: usize) -> String {
494 String { vec: Vec::with_capacity(capacity) }
495 }
496
497 /// Creates a new empty `String` with at least the specified capacity.
498 ///
499 /// # Errors
500 ///
501 /// Returns [`Err`] if the capacity exceeds `isize::MAX` bytes,
502 /// or if the memory allocator reports failure.
503 ///
504 #[inline]
505 #[unstable(feature = "try_with_capacity", issue = "91913")]
506 pub fn try_with_capacity(capacity: usize) -> Result<String, TryReserveError> {
507 Ok(String { vec: Vec::try_with_capacity(capacity)? })
508 }
509
510 /// Converts a vector of bytes to a `String`.
511 ///
512 /// A string ([`String`]) is made of bytes ([`u8`]), and a vector of bytes
513 /// ([`Vec<u8>`]) is made of bytes, so this function converts between the
514 /// two. Not all byte slices are valid `String`s, however: `String`
515 /// requires that it is valid UTF-8. `from_utf8()` checks to ensure that
516 /// the bytes are valid UTF-8, and then does the conversion.
517 ///
518 /// If you are sure that the byte slice is valid UTF-8, and you don't want
519 /// to incur the overhead of the validity check, there is an unsafe version
520 /// of this function, [`from_utf8_unchecked`], which has the same behavior
521 /// but skips the check.
522 ///
523 /// This method will take care to not copy the vector, for efficiency's
524 /// sake.
525 ///
526 /// If you need a [`&str`] instead of a `String`, consider
527 /// [`str::from_utf8`].
528 ///
529 /// The inverse of this method is [`into_bytes`].
530 ///
531 /// # Errors
532 ///
533 /// Returns [`Err`] if the slice is not UTF-8 with a description as to why the
534 /// provided bytes are not UTF-8. The vector you moved in is also included.
535 ///
536 /// # Examples
537 ///
538 /// Basic usage:
539 ///
540 /// ```
541 /// // some bytes, in a vector
542 /// let sparkle_heart = vec![240, 159, 146, 150];
543 ///
544 /// // We know these bytes are valid, so we'll use `unwrap()`.
545 /// let sparkle_heart = String::from_utf8(sparkle_heart).unwrap();
546 ///
547 /// assert_eq!("๐", sparkle_heart);
548 /// ```
549 ///
550 /// Incorrect bytes:
551 ///
552 /// ```
553 /// // some invalid bytes, in a vector
554 /// let sparkle_heart = vec![0, 159, 146, 150];
555 ///
556 /// assert!(String::from_utf8(sparkle_heart).is_err());
557 /// ```
558 ///
559 /// See the docs for [`FromUtf8Error`] for more details on what you can do
560 /// with this error.
561 ///
562 /// [`from_utf8_unchecked`]: String::from_utf8_unchecked
563 /// [`Vec<u8>`]: crate::vec::Vec "Vec"
564 /// [`&str`]: prim@str "&str"
565 /// [`into_bytes`]: String::into_bytes
566 #[inline]
567 #[stable(feature = "rust1", since = "1.0.0")]
568 #[rustc_diagnostic_item = "string_from_utf8"]
569 pub fn from_utf8(vec: Vec<u8>) -> Result<String, FromUtf8Error> {
570 match str::from_utf8(&vec) {
571 Ok(..) => Ok(String { vec }),
572 Err(e) => Err(FromUtf8Error { bytes: vec, error: e }),
573 }
574 }
575
576 /// Converts a slice of bytes to a string, including invalid characters.
577 ///
578 /// Strings are made of bytes ([`u8`]), and a slice of bytes
579 /// ([`&[u8]`][byteslice]) is made of bytes, so this function converts
580 /// between the two. Not all byte slices are valid strings, however: strings
581 /// are required to be valid UTF-8. During this conversion,
582 /// `from_utf8_lossy()` will replace any invalid UTF-8 sequences with
583 /// [`U+FFFD REPLACEMENT CHARACTER`][U+FFFD], which looks like this: ๏ฟฝ
584 ///
585 /// [byteslice]: prim@slice
586 /// [U+FFFD]: core::char::REPLACEMENT_CHARACTER
587 ///
588 /// If you are sure that the byte slice is valid UTF-8, and you don't want
589 /// to incur the overhead of the conversion, there is an unsafe version
590 /// of this function, [`from_utf8_unchecked`], which has the same behavior
591 /// but skips the checks.
592 ///
593 /// [`from_utf8_unchecked`]: String::from_utf8_unchecked
594 ///
595 /// This function returns a [`Cow<'a, str>`]. If our byte slice is invalid
596 /// UTF-8, then we need to insert the replacement characters, which will
597 /// change the size of the string, and hence, require a `String`. But if
598 /// it's already valid UTF-8, we don't need a new allocation. This return
599 /// type allows us to handle both cases.
600 ///
601 /// [`Cow<'a, str>`]: crate::borrow::Cow "borrow::Cow"
602 ///
603 /// # Examples
604 ///
605 /// Basic usage:
606 ///
607 /// ```
608 /// // some bytes, in a vector
609 /// let sparkle_heart = vec![240, 159, 146, 150];
610 ///
611 /// let sparkle_heart = String::from_utf8_lossy(&sparkle_heart);
612 ///
613 /// assert_eq!("๐", sparkle_heart);
614 /// ```
615 ///
616 /// Incorrect bytes:
617 ///
618 /// ```
619 /// // some invalid bytes
620 /// let input = b"Hello \xF0\x90\x80World";
621 /// let output = String::from_utf8_lossy(input);
622 ///
623 /// assert_eq!("Hello ๏ฟฝWorld", output);
624 /// ```
625 #[must_use]
626 #[cfg(not(no_global_oom_handling))]
627 #[stable(feature = "rust1", since = "1.0.0")]
628 pub fn from_utf8_lossy(v: &[u8]) -> Cow<'_, str> {
629 let mut iter = v.utf8_chunks();
630
631 let Some(chunk) = iter.next() else {
632 return Cow::Borrowed("");
633 };
634 let first_valid = chunk.valid();
635 if chunk.invalid().is_empty() {
636 debug_assert_eq!(first_valid.len(), v.len());
637 return Cow::Borrowed(first_valid);
638 }
639
640 const REPLACEMENT: &str = "\u{FFFD}";
641
642 let mut res = String::with_capacity(v.len());
643 res.push_str(first_valid);
644 res.push_str(REPLACEMENT);
645
646 for chunk in iter {
647 res.push_str(chunk.valid());
648 if !chunk.invalid().is_empty() {
649 res.push_str(REPLACEMENT);
650 }
651 }
652
653 Cow::Owned(res)
654 }
655
656 /// Converts a [`Vec<u8>`] to a `String`, substituting invalid UTF-8
657 /// sequences with replacement characters.
658 ///
659 /// See [`from_utf8_lossy`] for more details.
660 ///
661 /// [`from_utf8_lossy`]: String::from_utf8_lossy
662 ///
663 /// Note that this function does not guarantee reuse of the original `Vec`
664 /// allocation.
665 ///
666 /// # Examples
667 ///
668 /// Basic usage:
669 ///
670 /// ```
671 /// #![feature(string_from_utf8_lossy_owned)]
672 /// // some bytes, in a vector
673 /// let sparkle_heart = vec![240, 159, 146, 150];
674 ///
675 /// let sparkle_heart = String::from_utf8_lossy_owned(sparkle_heart);
676 ///
677 /// assert_eq!(String::from("๐"), sparkle_heart);
678 /// ```
679 ///
680 /// Incorrect bytes:
681 ///
682 /// ```
683 /// #![feature(string_from_utf8_lossy_owned)]
684 /// // some invalid bytes
685 /// let input: Vec<u8> = b"Hello \xF0\x90\x80World".into();
686 /// let output = String::from_utf8_lossy_owned(input);
687 ///
688 /// assert_eq!(String::from("Hello ๏ฟฝWorld"), output);
689 /// ```
690 #[must_use]
691 #[cfg(not(no_global_oom_handling))]
692 #[unstable(feature = "string_from_utf8_lossy_owned", issue = "129436")]
693 pub fn from_utf8_lossy_owned(v: Vec<u8>) -> String {
694 if let Cow::Owned(string) = String::from_utf8_lossy(&v) {
695 string
696 } else {
697 // SAFETY: `String::from_utf8_lossy`'s contract ensures that if
698 // it returns a `Cow::Borrowed`, it is a valid UTF-8 string.
699 // Otherwise, it returns a new allocation of an owned `String`, with
700 // replacement characters for invalid sequences, which is returned
701 // above.
702 unsafe { String::from_utf8_unchecked(v) }
703 }
704 }
705
706 /// Decode a native endian UTF-16โencoded vector `v` into a `String`,
707 /// returning [`Err`] if `v` contains any invalid data.
708 ///
709 /// # Examples
710 ///
711 /// ```
712 /// // ๐music
713 /// let v = &[0xD834, 0xDD1E, 0x006d, 0x0075,
714 /// 0x0073, 0x0069, 0x0063];
715 /// assert_eq!(String::from("๐music"),
716 /// String::from_utf16(v).unwrap());
717 ///
718 /// // ๐mu<invalid>ic
719 /// let v = &[0xD834, 0xDD1E, 0x006d, 0x0075,
720 /// 0xD800, 0x0069, 0x0063];
721 /// assert!(String::from_utf16(v).is_err());
722 /// ```
723 #[cfg(not(no_global_oom_handling))]
724 #[stable(feature = "rust1", since = "1.0.0")]
725 pub fn from_utf16(v: &[u16]) -> Result<String, FromUtf16Error> {
726 // This isn't done via collect::<Result<_, _>>() for performance reasons.
727 // FIXME: the function can be simplified again when #48994 is closed.
728 let mut ret = String::with_capacity(v.len());
729 for c in char::decode_utf16(v.iter().cloned()) {
730 let Ok(c) = c else {
731 return Err(FromUtf16Error { kind: FromUtf16ErrorKind::LoneSurrogate });
732 };
733 ret.push(c);
734 }
735 Ok(ret)
736 }
737
738 /// Decode a native endian UTF-16โencoded slice `v` into a `String`,
739 /// replacing invalid data with [the replacement character (`U+FFFD`)][U+FFFD].
740 ///
741 /// Unlike [`from_utf8_lossy`] which returns a [`Cow<'a, str>`],
742 /// `from_utf16_lossy` returns a `String` since the UTF-16 to UTF-8
743 /// conversion requires a memory allocation.
744 ///
745 /// [`from_utf8_lossy`]: String::from_utf8_lossy
746 /// [`Cow<'a, str>`]: crate::borrow::Cow "borrow::Cow"
747 /// [U+FFFD]: core::char::REPLACEMENT_CHARACTER
748 ///
749 /// # Examples
750 ///
751 /// ```
752 /// // ๐mus<invalid>ic<invalid>
753 /// let v = &[0xD834, 0xDD1E, 0x006d, 0x0075,
754 /// 0x0073, 0xDD1E, 0x0069, 0x0063,
755 /// 0xD834];
756 ///
757 /// assert_eq!(String::from("๐mus\u{FFFD}ic\u{FFFD}"),
758 /// String::from_utf16_lossy(v));
759 /// ```
760 #[cfg(not(no_global_oom_handling))]
761 #[must_use]
762 #[inline]
763 #[stable(feature = "rust1", since = "1.0.0")]
764 pub fn from_utf16_lossy(v: &[u16]) -> String {
765 char::decode_utf16(v.iter().cloned())
766 .map(|r| r.unwrap_or(char::REPLACEMENT_CHARACTER))
767 .collect()
768 }
769
770 /// Decode a UTF-16LEโencoded vector `v` into a `String`,
771 /// returning [`Err`] if `v` contains any invalid data.
772 ///
773 /// # Examples
774 ///
775 /// Basic usage:
776 ///
777 /// ```
778 /// // ๐music
779 /// let v = &[0x34, 0xD8, 0x1E, 0xDD, 0x6d, 0x00, 0x75, 0x00,
780 /// 0x73, 0x00, 0x69, 0x00, 0x63, 0x00];
781 /// assert_eq!(String::from("๐music"),
782 /// String::from_utf16le(v).unwrap());
783 ///
784 /// // ๐mu<invalid>ic
785 /// let v = &[0x34, 0xD8, 0x1E, 0xDD, 0x6d, 0x00, 0x75, 0x00,
786 /// 0x00, 0xD8, 0x69, 0x00, 0x63, 0x00];
787 /// assert!(String::from_utf16le(v).is_err());
788 /// ```
789 #[cfg(not(no_global_oom_handling))]
790 #[stable(feature = "str_from_utf16_endian", since = "CURRENT_RUSTC_VERSION")]
791 pub fn from_utf16le(v: &[u8]) -> Result<String, FromUtf16Error> {
792 let (chunks, []) = v.as_chunks::<2>() else {
793 return Err(FromUtf16Error { kind: FromUtf16ErrorKind::OddBytes });
794 };
795 match (cfg!(target_endian = "little"), unsafe { v.align_to::<u16>() }) {
796 (true, ([], v, [])) => Self::from_utf16(v),
797 _ => char::decode_utf16(chunks.iter().copied().map(u16::from_le_bytes))
798 .collect::<Result<_, _>>()
799 .map_err(|_| FromUtf16Error { kind: FromUtf16ErrorKind::LoneSurrogate }),
800 }
801 }
802
803 /// Decode a UTF-16LEโencoded slice `v` into a `String`, replacing
804 /// invalid data with [the replacement character (`U+FFFD`)][U+FFFD].
805 ///
806 /// Unlike [`from_utf8_lossy`] which returns a [`Cow<'a, str>`],
807 /// `from_utf16le_lossy` returns a `String` since the UTF-16 to UTF-8
808 /// conversion requires a memory allocation.
809 ///
810 /// [`from_utf8_lossy`]: String::from_utf8_lossy
811 /// [`Cow<'a, str>`]: crate::borrow::Cow "borrow::Cow"
812 /// [U+FFFD]: core::char::REPLACEMENT_CHARACTER
813 ///
814 /// # Examples
815 ///
816 /// Basic usage:
817 ///
818 /// ```
819 /// // ๐mus<invalid>ic<invalid>
820 /// let v = &[0x34, 0xD8, 0x1E, 0xDD, 0x6d, 0x00, 0x75, 0x00,
821 /// 0x73, 0x00, 0x1E, 0xDD, 0x69, 0x00, 0x63, 0x00,
822 /// 0x34, 0xD8];
823 ///
824 /// assert_eq!(String::from("๐mus\u{FFFD}ic\u{FFFD}"),
825 /// String::from_utf16le_lossy(v));
826 /// ```
827 #[cfg(not(no_global_oom_handling))]
828 #[stable(feature = "str_from_utf16_endian", since = "CURRENT_RUSTC_VERSION")]
829 pub fn from_utf16le_lossy(v: &[u8]) -> String {
830 match (cfg!(target_endian = "little"), unsafe { v.align_to::<u16>() }) {
831 (true, ([], v, [])) => Self::from_utf16_lossy(v),
832 (true, ([], v, [_remainder])) => Self::from_utf16_lossy(v) + "\u{FFFD}",
833 _ => {
834 let (chunks, remainder) = v.as_chunks::<2>();
835 let string = char::decode_utf16(chunks.iter().copied().map(u16::from_le_bytes))
836 .map(|r| r.unwrap_or(char::REPLACEMENT_CHARACTER))
837 .collect();
838 if remainder.is_empty() { string } else { string + "\u{FFFD}" }
839 }
840 }
841 }
842
843 /// Decode a UTF-16BEโencoded vector `v` into a `String`,
844 /// returning [`Err`] if `v` contains any invalid data.
845 ///
846 /// # Examples
847 ///
848 /// Basic usage:
849 ///
850 /// ```
851 /// // ๐music
852 /// let v = &[0xD8, 0x34, 0xDD, 0x1E, 0x00, 0x6d, 0x00, 0x75,
853 /// 0x00, 0x73, 0x00, 0x69, 0x00, 0x63];
854 /// assert_eq!(String::from("๐music"),
855 /// String::from_utf16be(v).unwrap());
856 ///
857 /// // ๐mu<invalid>ic
858 /// let v = &[0xD8, 0x34, 0xDD, 0x1E, 0x00, 0x6d, 0x00, 0x75,
859 /// 0xD8, 0x00, 0x00, 0x69, 0x00, 0x63];
860 /// assert!(String::from_utf16be(v).is_err());
861 /// ```
862 #[cfg(not(no_global_oom_handling))]
863 #[stable(feature = "str_from_utf16_endian", since = "CURRENT_RUSTC_VERSION")]
864 pub fn from_utf16be(v: &[u8]) -> Result<String, FromUtf16Error> {
865 let (chunks, []) = v.as_chunks::<2>() else {
866 return Err(FromUtf16Error { kind: FromUtf16ErrorKind::OddBytes });
867 };
868 match (cfg!(target_endian = "big"), unsafe { v.align_to::<u16>() }) {
869 (true, ([], v, [])) => Self::from_utf16(v),
870 _ => char::decode_utf16(chunks.iter().copied().map(u16::from_be_bytes))
871 .collect::<Result<_, _>>()
872 .map_err(|_| FromUtf16Error { kind: FromUtf16ErrorKind::LoneSurrogate }),
873 }
874 }
875
876 /// Decode a UTF-16BEโencoded slice `v` into a `String`, replacing
877 /// invalid data with [the replacement character (`U+FFFD`)][U+FFFD].
878 ///
879 /// Unlike [`from_utf8_lossy`] which returns a [`Cow<'a, str>`],
880 /// `from_utf16le_lossy` returns a `String` since the UTF-16 to UTF-8
881 /// conversion requires a memory allocation.
882 ///
883 /// [`from_utf8_lossy`]: String::from_utf8_lossy
884 /// [`Cow<'a, str>`]: crate::borrow::Cow "borrow::Cow"
885 /// [U+FFFD]: core::char::REPLACEMENT_CHARACTER
886 ///
887 /// # Examples
888 ///
889 /// Basic usage:
890 ///
891 /// ```
892 /// // ๐mus<invalid>ic<invalid>
893 /// let v = &[0xD8, 0x34, 0xDD, 0x1E, 0x00, 0x6d, 0x00, 0x75,
894 /// 0x00, 0x73, 0xDD, 0x1E, 0x00, 0x69, 0x00, 0x63,
895 /// 0xD8, 0x34];
896 ///
897 /// assert_eq!(String::from("๐mus\u{FFFD}ic\u{FFFD}"),
898 /// String::from_utf16be_lossy(v));
899 /// ```
900 #[cfg(not(no_global_oom_handling))]
901 #[stable(feature = "str_from_utf16_endian", since = "CURRENT_RUSTC_VERSION")]
902 pub fn from_utf16be_lossy(v: &[u8]) -> String {
903 match (cfg!(target_endian = "big"), unsafe { v.align_to::<u16>() }) {
904 (true, ([], v, [])) => Self::from_utf16_lossy(v),
905 (true, ([], v, [_remainder])) => Self::from_utf16_lossy(v) + "\u{FFFD}",
906 _ => {
907 let (chunks, remainder) = v.as_chunks::<2>();
908 let string = char::decode_utf16(chunks.iter().copied().map(u16::from_be_bytes))
909 .map(|r| r.unwrap_or(char::REPLACEMENT_CHARACTER))
910 .collect();
911 if remainder.is_empty() { string } else { string + "\u{FFFD}" }
912 }
913 }
914 }
915
916 /// Decomposes a `String` into its raw components: `(pointer, length, capacity)`.
917 ///
918 /// Returns the raw pointer to the underlying data, the length of
919 /// the string (in bytes), and the allocated capacity of the data
920 /// (in bytes). These are the same arguments in the same order as
921 /// the arguments to [`from_raw_parts`].
922 ///
923 /// After calling this function, the caller is responsible for the
924 /// memory previously managed by the `String`. The only way to do
925 /// this is to convert the raw pointer, length, and capacity back
926 /// into a `String` with the [`from_raw_parts`] function, allowing
927 /// the destructor to perform the cleanup.
928 ///
929 /// [`from_raw_parts`]: String::from_raw_parts
930 ///
931 /// # Examples
932 ///
933 /// ```
934 /// let s = String::from("hello");
935 ///
936 /// let (ptr, len, cap) = s.into_raw_parts();
937 ///
938 /// let rebuilt = unsafe { String::from_raw_parts(ptr, len, cap) };
939 /// assert_eq!(rebuilt, "hello");
940 /// ```
941 #[must_use = "losing the pointer will leak memory"]
942 #[stable(feature = "vec_into_raw_parts", since = "1.93.0")]
943 pub fn into_raw_parts(self) -> (*mut u8, usize, usize) {
944 self.vec.into_raw_parts()
945 }
946
947 /// Creates a new `String` from a pointer, a length and a capacity.
948 ///
949 /// # Safety
950 ///
951 /// This is highly unsafe, due to the number of invariants that aren't
952 /// checked:
953 ///
954 /// * all safety requirements for [`Vec::<u8>::from_raw_parts`].
955 /// * all safety requirements for [`String::from_utf8_unchecked`].
956 ///
957 /// Violating these may cause problems like corrupting the allocator's
958 /// internal data structures. For example, it is normally **not** safe to
959 /// build a `String` from a pointer to a C `char` array containing UTF-8
960 /// _unless_ you are certain that array was originally allocated by the
961 /// Rust standard library's allocator.
962 ///
963 /// The ownership of `buf` is effectively transferred to the
964 /// `String` which may then deallocate, reallocate or change the
965 /// contents of memory pointed to by the pointer at will. Ensure
966 /// that nothing else uses the pointer after calling this
967 /// function.
968 ///
969 /// # Examples
970 ///
971 /// ```
972 /// unsafe {
973 /// let s = String::from("hello");
974 ///
975 /// // Deconstruct the String into parts.
976 /// let (ptr, len, capacity) = s.into_raw_parts();
977 ///
978 /// let s = String::from_raw_parts(ptr, len, capacity);
979 ///
980 /// assert_eq!(String::from("hello"), s);
981 /// }
982 /// ```
983 #[inline]
984 #[stable(feature = "rust1", since = "1.0.0")]
985 pub unsafe fn from_raw_parts(buf: *mut u8, length: usize, capacity: usize) -> String {
986 unsafe { String { vec: Vec::from_raw_parts(buf, length, capacity) } }
987 }
988
989 /// Converts a vector of bytes to a `String` without checking that the
990 /// string contains valid UTF-8.
991 ///
992 /// See the safe version, [`from_utf8`], for more details.
993 ///
994 /// [`from_utf8`]: String::from_utf8
995 ///
996 /// # Safety
997 ///
998 /// This function is unsafe because it does not check that the bytes passed
999 /// to it are valid UTF-8. If this constraint is violated, it may cause
1000 /// memory unsafety issues with future users of the `String`, as the rest of
1001 /// the standard library assumes that `String`s are valid UTF-8.
1002 ///
1003 /// # Examples
1004 ///
1005 /// ```
1006 /// // some bytes, in a vector
1007 /// let sparkle_heart = vec![240, 159, 146, 150];
1008 ///
1009 /// let sparkle_heart = unsafe {
1010 /// String::from_utf8_unchecked(sparkle_heart)
1011 /// };
1012 ///
1013 /// assert_eq!("๐", sparkle_heart);
1014 /// ```
1015 #[inline]
1016 #[must_use]
1017 #[stable(feature = "rust1", since = "1.0.0")]
1018 pub unsafe fn from_utf8_unchecked(bytes: Vec<u8>) -> String {
1019 String { vec: bytes }
1020 }
1021
1022 /// Converts a `String` into a byte vector.
1023 ///
1024 /// This consumes the `String`, so we do not need to copy its contents.
1025 ///
1026 /// # Examples
1027 ///
1028 /// ```
1029 /// let s = String::from("hello");
1030 /// let bytes = s.into_bytes();
1031 ///
1032 /// assert_eq!(&[104, 101, 108, 108, 111][..], &bytes[..]);
1033 /// ```
1034 #[inline]
1035 #[must_use = "`self` will be dropped if the result is not used"]
1036 #[stable(feature = "rust1", since = "1.0.0")]
1037 #[rustc_const_stable(feature = "const_vec_string_slice", since = "1.87.0")]
1038 #[rustc_allow_const_fn_unstable(const_precise_live_drops)]
1039 pub const fn into_bytes(self) -> Vec<u8> {
1040 self.vec
1041 }
1042
1043 /// Extracts a string slice containing the entire `String`.
1044 ///
1045 /// # Examples
1046 ///
1047 /// ```
1048 /// let s = String::from("foo");
1049 ///
1050 /// assert_eq!("foo", s.as_str());
1051 /// ```
1052 #[inline]
1053 #[must_use]
1054 #[stable(feature = "string_as_str", since = "1.7.0")]
1055 #[rustc_diagnostic_item = "string_as_str"]
1056 #[rustc_const_stable(feature = "const_vec_string_slice", since = "1.87.0")]
1057 pub const fn as_str(&self) -> &str {
1058 // SAFETY: String contents are stipulated to be valid UTF-8, invalid contents are an error
1059 // at construction.
1060 unsafe { str::from_utf8_unchecked(self.vec.as_slice()) }
1061 }
1062
1063 /// Converts a `String` into a mutable string slice.
1064 ///
1065 /// # Examples
1066 ///
1067 /// ```
1068 /// let mut s = String::from("foobar");
1069 /// let s_mut_str = s.as_mut_str();
1070 ///
1071 /// s_mut_str.make_ascii_uppercase();
1072 ///
1073 /// assert_eq!("FOOBAR", s_mut_str);
1074 /// ```
1075 #[inline]
1076 #[must_use]
1077 #[stable(feature = "string_as_str", since = "1.7.0")]
1078 #[rustc_diagnostic_item = "string_as_mut_str"]
1079 #[rustc_const_stable(feature = "const_vec_string_slice", since = "1.87.0")]
1080 pub const fn as_mut_str(&mut self) -> &mut str {
1081 // SAFETY: String contents are stipulated to be valid UTF-8, invalid contents are an error
1082 // at construction.
1083 unsafe { str::from_utf8_unchecked_mut(self.vec.as_mut_slice()) }
1084 }
1085
1086 /// Appends a given string slice onto the end of this `String`.
1087 ///
1088 /// # Panics
1089 ///
1090 /// Panics if the new capacity exceeds `isize::MAX` _bytes_.
1091 ///
1092 /// # Examples
1093 ///
1094 /// ```
1095 /// let mut s = String::from("foo");
1096 ///
1097 /// s.push_str("bar");
1098 ///
1099 /// assert_eq!("foobar", s);
1100 /// ```
1101 #[cfg(not(no_global_oom_handling))]
1102 #[inline]
1103 #[stable(feature = "rust1", since = "1.0.0")]
1104 #[rustc_confusables("append", "push")]
1105 #[rustc_diagnostic_item = "string_push_str"]
1106 pub fn push_str(&mut self, string: &str) {
1107 self.vec.extend_from_slice(string.as_bytes())
1108 }
1109
1110 #[cfg(not(no_global_oom_handling))]
1111 #[inline]
1112 fn push_str_slice(&mut self, slice: &[&str]) {
1113 // use saturating arithmetic to ensure that in the case of an overflow, reserve() throws OOM
1114 let additional: Saturating<usize> = slice.iter().map(|x| Saturating(x.len())).sum();
1115 self.reserve(additional.0);
1116 let (ptr, len, cap) = core::mem::take(self).into_raw_parts();
1117 unsafe {
1118 let mut dst = ptr.add(len);
1119 for new in slice {
1120 core::ptr::copy_nonoverlapping(new.as_ptr(), dst, new.len());
1121 dst = dst.add(new.len());
1122 }
1123 *self = String::from_raw_parts(ptr, len + additional.0, cap);
1124 }
1125 }
1126
1127 /// Copies elements from `src` range to the end of the string.
1128 ///
1129 /// # Panics
1130 ///
1131 /// Panics if the range has `start_bound > end_bound`, if the range is
1132 /// bounded on either end and does not lie on a [`char`] boundary, or if the
1133 /// new capacity exceeds `isize::MAX` bytes.
1134 ///
1135 /// # Examples
1136 ///
1137 /// ```
1138 /// let mut string = String::from("abcde");
1139 ///
1140 /// string.extend_from_within(2..);
1141 /// assert_eq!(string, "abcdecde");
1142 ///
1143 /// string.extend_from_within(..2);
1144 /// assert_eq!(string, "abcdecdeab");
1145 ///
1146 /// string.extend_from_within(4..8);
1147 /// assert_eq!(string, "abcdecdeabecde");
1148 /// ```
1149 #[cfg(not(no_global_oom_handling))]
1150 #[stable(feature = "string_extend_from_within", since = "1.87.0")]
1151 #[track_caller]
1152 pub fn extend_from_within<R>(&mut self, src: R)
1153 where
1154 R: RangeBounds<usize>,
1155 {
1156 let src @ Range { start, end } = slice::range(src, ..self.len());
1157
1158 assert!(self.is_char_boundary(start));
1159 assert!(self.is_char_boundary(end));
1160
1161 self.vec.extend_from_within(src);
1162 }
1163
1164 /// Returns this `String`'s capacity, in bytes.
1165 ///
1166 /// # Examples
1167 ///
1168 /// ```
1169 /// let s = String::with_capacity(10);
1170 ///
1171 /// assert!(s.capacity() >= 10);
1172 /// ```
1173 #[inline]
1174 #[must_use]
1175 #[stable(feature = "rust1", since = "1.0.0")]
1176 #[rustc_const_stable(feature = "const_vec_string_slice", since = "1.87.0")]
1177 pub const fn capacity(&self) -> usize {
1178 self.vec.capacity()
1179 }
1180
1181 /// Reserves capacity for at least `additional` bytes more than the
1182 /// current length. The allocator may reserve more space to speculatively
1183 /// avoid frequent allocations. After calling `reserve`,
1184 /// capacity will be greater than or equal to `self.len() + additional`.
1185 /// Does nothing if capacity is already sufficient.
1186 ///
1187 /// # Panics
1188 ///
1189 /// Panics if the new capacity exceeds `isize::MAX` _bytes_.
1190 ///
1191 /// # Examples
1192 ///
1193 /// Basic usage:
1194 ///
1195 /// ```
1196 /// let mut s = String::new();
1197 ///
1198 /// s.reserve(10);
1199 ///
1200 /// assert!(s.capacity() >= 10);
1201 /// ```
1202 ///
1203 /// This might not actually increase the capacity:
1204 ///
1205 /// ```
1206 /// let mut s = String::with_capacity(10);
1207 /// s.push('a');
1208 /// s.push('b');
1209 ///
1210 /// // s now has a length of 2 and a capacity of at least 10
1211 /// let capacity = s.capacity();
1212 /// assert_eq!(2, s.len());
1213 /// assert!(capacity >= 10);
1214 ///
1215 /// // Since we already have at least an extra 8 capacity, calling this...
1216 /// s.reserve(8);
1217 ///
1218 /// // ... doesn't actually increase.
1219 /// assert_eq!(capacity, s.capacity());
1220 /// ```
1221 #[cfg(not(no_global_oom_handling))]
1222 #[inline]
1223 #[stable(feature = "rust1", since = "1.0.0")]
1224 pub fn reserve(&mut self, additional: usize) {
1225 self.vec.reserve(additional)
1226 }
1227
1228 /// Reserves the minimum capacity for at least `additional` bytes more than
1229 /// the current length. Unlike [`reserve`], this will not
1230 /// deliberately over-allocate to speculatively avoid frequent allocations.
1231 /// After calling `reserve_exact`, capacity will be greater than or equal to
1232 /// `self.len() + additional`. Does nothing if the capacity is already
1233 /// sufficient.
1234 ///
1235 /// [`reserve`]: String::reserve
1236 ///
1237 /// # Panics
1238 ///
1239 /// Panics if the new capacity exceeds `isize::MAX` _bytes_.
1240 ///
1241 /// # Examples
1242 ///
1243 /// Basic usage:
1244 ///
1245 /// ```
1246 /// let mut s = String::new();
1247 ///
1248 /// s.reserve_exact(10);
1249 ///
1250 /// assert!(s.capacity() >= 10);
1251 /// ```
1252 ///
1253 /// This might not actually increase the capacity:
1254 ///
1255 /// ```
1256 /// let mut s = String::with_capacity(10);
1257 /// s.push('a');
1258 /// s.push('b');
1259 ///
1260 /// // s now has a length of 2 and a capacity of at least 10
1261 /// let capacity = s.capacity();
1262 /// assert_eq!(2, s.len());
1263 /// assert!(capacity >= 10);
1264 ///
1265 /// // Since we already have at least an extra 8 capacity, calling this...
1266 /// s.reserve_exact(8);
1267 ///
1268 /// // ... doesn't actually increase.
1269 /// assert_eq!(capacity, s.capacity());
1270 /// ```
1271 #[cfg(not(no_global_oom_handling))]
1272 #[inline]
1273 #[stable(feature = "rust1", since = "1.0.0")]
1274 pub fn reserve_exact(&mut self, additional: usize) {
1275 self.vec.reserve_exact(additional)
1276 }
1277
1278 /// Tries to reserve capacity for at least `additional` bytes more than the
1279 /// current length. The allocator may reserve more space to speculatively
1280 /// avoid frequent allocations. After calling `try_reserve`, capacity will be
1281 /// greater than or equal to `self.len() + additional` if it returns
1282 /// `Ok(())`. Does nothing if capacity is already sufficient. This method
1283 /// preserves the contents even if an error occurs.
1284 ///
1285 /// # Errors
1286 ///
1287 /// If the capacity overflows, or the allocator reports a failure, then an error
1288 /// is returned.
1289 ///
1290 /// # Examples
1291 ///
1292 /// ```
1293 /// use std::collections::TryReserveError;
1294 ///
1295 /// fn process_data(data: &str) -> Result<String, TryReserveError> {
1296 /// let mut output = String::new();
1297 ///
1298 /// // Pre-reserve the memory, exiting if we can't
1299 /// output.try_reserve(data.len())?;
1300 ///
1301 /// // Now we know this can't OOM in the middle of our complex work
1302 /// output.push_str(data);
1303 ///
1304 /// Ok(output)
1305 /// }
1306 /// # process_data("rust").expect("why is the test harness OOMing on 4 bytes?");
1307 /// ```
1308 #[stable(feature = "try_reserve", since = "1.57.0")]
1309 pub fn try_reserve(&mut self, additional: usize) -> Result<(), TryReserveError> {
1310 self.vec.try_reserve(additional)
1311 }
1312
1313 /// Tries to reserve the minimum capacity for at least `additional` bytes
1314 /// more than the current length. Unlike [`try_reserve`], this will not
1315 /// deliberately over-allocate to speculatively avoid frequent allocations.
1316 /// After calling `try_reserve_exact`, capacity will be greater than or
1317 /// equal to `self.len() + additional` if it returns `Ok(())`.
1318 /// Does nothing if the capacity is already sufficient.
1319 ///
1320 /// Note that the allocator may give the collection more space than it
1321 /// requests. Therefore, capacity can not be relied upon to be precisely
1322 /// minimal. Prefer [`try_reserve`] if future insertions are expected.
1323 ///
1324 /// [`try_reserve`]: String::try_reserve
1325 ///
1326 /// # Errors
1327 ///
1328 /// If the capacity overflows, or the allocator reports a failure, then an error
1329 /// is returned.
1330 ///
1331 /// # Examples
1332 ///
1333 /// ```
1334 /// use std::collections::TryReserveError;
1335 ///
1336 /// fn process_data(data: &str) -> Result<String, TryReserveError> {
1337 /// let mut output = String::new();
1338 ///
1339 /// // Pre-reserve the memory, exiting if we can't
1340 /// output.try_reserve_exact(data.len())?;
1341 ///
1342 /// // Now we know this can't OOM in the middle of our complex work
1343 /// output.push_str(data);
1344 ///
1345 /// Ok(output)
1346 /// }
1347 /// # process_data("rust").expect("why is the test harness OOMing on 4 bytes?");
1348 /// ```
1349 #[stable(feature = "try_reserve", since = "1.57.0")]
1350 pub fn try_reserve_exact(&mut self, additional: usize) -> Result<(), TryReserveError> {
1351 self.vec.try_reserve_exact(additional)
1352 }
1353
1354 /// Shrinks the capacity of this `String` to match its length.
1355 ///
1356 /// # Examples
1357 ///
1358 /// ```
1359 /// let mut s = String::from("foo");
1360 ///
1361 /// s.reserve(100);
1362 /// assert!(s.capacity() >= 100);
1363 ///
1364 /// s.shrink_to_fit();
1365 /// assert_eq!(3, s.capacity());
1366 /// ```
1367 #[cfg(not(no_global_oom_handling))]
1368 #[inline]
1369 #[stable(feature = "rust1", since = "1.0.0")]
1370 pub fn shrink_to_fit(&mut self) {
1371 self.vec.shrink_to_fit()
1372 }
1373
1374 /// Shrinks the capacity of this `String` with a lower bound.
1375 ///
1376 /// The capacity will remain at least as large as both the length
1377 /// and the supplied value.
1378 ///
1379 /// If the current capacity is less than the lower limit, this is a no-op.
1380 ///
1381 /// # Examples
1382 ///
1383 /// ```
1384 /// let mut s = String::from("foo");
1385 ///
1386 /// s.reserve(100);
1387 /// assert!(s.capacity() >= 100);
1388 ///
1389 /// s.shrink_to(10);
1390 /// assert!(s.capacity() >= 10);
1391 /// s.shrink_to(0);
1392 /// assert!(s.capacity() >= 3);
1393 /// ```
1394 #[cfg(not(no_global_oom_handling))]
1395 #[inline]
1396 #[stable(feature = "shrink_to", since = "1.56.0")]
1397 pub fn shrink_to(&mut self, min_capacity: usize) {
1398 self.vec.shrink_to(min_capacity)
1399 }
1400
1401 /// Appends the given [`char`] to the end of this `String`.
1402 ///
1403 /// # Panics
1404 ///
1405 /// Panics if the new capacity exceeds `isize::MAX` _bytes_.
1406 ///
1407 /// # Examples
1408 ///
1409 /// ```
1410 /// let mut s = String::from("abc");
1411 ///
1412 /// s.push('1');
1413 /// s.push('2');
1414 /// s.push('3');
1415 ///
1416 /// assert_eq!("abc123", s);
1417 /// ```
1418 #[cfg(not(no_global_oom_handling))]
1419 #[inline]
1420 #[stable(feature = "rust1", since = "1.0.0")]
1421 pub fn push(&mut self, ch: char) {
1422 let len = self.len();
1423 let ch_len = ch.len_utf8();
1424 self.reserve(ch_len);
1425
1426 // SAFETY: Just reserved capacity for at least the length needed to encode `ch`.
1427 unsafe {
1428 core::char::encode_utf8_raw_unchecked(ch as u32, self.vec.as_mut_ptr().add(len));
1429 self.vec.set_len(len + ch_len);
1430 }
1431 }
1432
1433 /// Returns a byte slice of this `String`'s contents.
1434 ///
1435 /// The inverse of this method is [`from_utf8`].
1436 ///
1437 /// [`from_utf8`]: String::from_utf8
1438 ///
1439 /// # Examples
1440 ///
1441 /// ```
1442 /// let s = String::from("hello");
1443 ///
1444 /// assert_eq!(&[104, 101, 108, 108, 111], s.as_bytes());
1445 /// ```
1446 #[inline]
1447 #[must_use]
1448 #[stable(feature = "rust1", since = "1.0.0")]
1449 #[rustc_const_stable(feature = "const_vec_string_slice", since = "1.87.0")]
1450 pub const fn as_bytes(&self) -> &[u8] {
1451 self.vec.as_slice()
1452 }
1453
1454 /// Shortens this `String` to the specified length.
1455 ///
1456 /// If `new_len` is greater than or equal to the string's current length, this has no
1457 /// effect.
1458 ///
1459 /// Note that this method has no effect on the allocated capacity
1460 /// of the string
1461 ///
1462 /// # Panics
1463 ///
1464 /// Panics if `new_len` does not lie on a [`char`] boundary.
1465 ///
1466 /// # Examples
1467 ///
1468 /// ```
1469 /// let mut s = String::from("hello");
1470 ///
1471 /// s.truncate(2);
1472 ///
1473 /// assert_eq!("he", s);
1474 /// ```
1475 #[inline]
1476 #[stable(feature = "rust1", since = "1.0.0")]
1477 #[track_caller]
1478 pub fn truncate(&mut self, new_len: usize) {
1479 if new_len <= self.len() {
1480 assert!(self.is_char_boundary(new_len));
1481 self.vec.truncate(new_len)
1482 }
1483 }
1484
1485 /// Removes the last character from the string buffer and returns it.
1486 ///
1487 /// Returns [`None`] if this `String` is empty.
1488 ///
1489 /// # Examples
1490 ///
1491 /// ```
1492 /// let mut s = String::from("abฤ");
1493 ///
1494 /// assert_eq!(s.pop(), Some('ฤ'));
1495 /// assert_eq!(s.pop(), Some('b'));
1496 /// assert_eq!(s.pop(), Some('a'));
1497 ///
1498 /// assert_eq!(s.pop(), None);
1499 /// ```
1500 #[inline]
1501 #[stable(feature = "rust1", since = "1.0.0")]
1502 pub fn pop(&mut self) -> Option<char> {
1503 let ch = self.chars().rev().next()?;
1504 let newlen = self.len() - ch.len_utf8();
1505 unsafe {
1506 self.vec.set_len(newlen);
1507 }
1508 Some(ch)
1509 }
1510
1511 /// Removes a [`char`] from this `String` at byte position `idx` and returns it.
1512 ///
1513 /// Copies all bytes after the removed char to new positions.
1514 ///
1515 /// Note that calling this in a loop can result in quadratic behavior.
1516 ///
1517 /// # Panics
1518 ///
1519 /// Panics if `idx` is larger than or equal to the `String`'s length,
1520 /// or if it does not lie on a [`char`] boundary.
1521 ///
1522 /// # Examples
1523 ///
1524 /// ```
1525 /// let mut s = String::from("abรง");
1526 ///
1527 /// assert_eq!(s.remove(0), 'a');
1528 /// assert_eq!(s.remove(1), 'รง');
1529 /// assert_eq!(s.remove(0), 'b');
1530 /// ```
1531 #[inline]
1532 #[stable(feature = "rust1", since = "1.0.0")]
1533 #[track_caller]
1534 #[rustc_confusables("delete", "take")]
1535 pub fn remove(&mut self, idx: usize) -> char {
1536 let ch = match self[idx..].chars().next() {
1537 Some(ch) => ch,
1538 None => panic!("cannot remove a char from the end of a string"),
1539 };
1540
1541 let next = idx + ch.len_utf8();
1542 let len = self.len();
1543 unsafe {
1544 ptr::copy(self.vec.as_ptr().add(next), self.vec.as_mut_ptr().add(idx), len - next);
1545 self.vec.set_len(len - (next - idx));
1546 }
1547 ch
1548 }
1549
1550 /// Remove all matches of pattern `pat` in the `String`.
1551 ///
1552 /// # Examples
1553 ///
1554 /// ```
1555 /// #![feature(string_remove_matches)]
1556 /// let mut s = String::from("Trees are not green, the sky is not blue.");
1557 /// s.remove_matches("not ");
1558 /// assert_eq!("Trees are green, the sky is blue.", s);
1559 /// ```
1560 ///
1561 /// Matches will be detected and removed iteratively, so in cases where
1562 /// patterns overlap, only the first pattern will be removed:
1563 ///
1564 /// ```
1565 /// #![feature(string_remove_matches)]
1566 /// let mut s = String::from("banana");
1567 /// s.remove_matches("ana");
1568 /// assert_eq!("bna", s);
1569 /// ```
1570 #[cfg(not(no_global_oom_handling))]
1571 #[unstable(feature = "string_remove_matches", issue = "72826")]
1572 pub fn remove_matches<P: Pattern>(&mut self, pat: P) {
1573 use core::str::pattern::Searcher;
1574
1575 let rejections = {
1576 let mut searcher = pat.into_searcher(self);
1577 // Per Searcher::next:
1578 //
1579 // A Match result needs to contain the whole matched pattern,
1580 // however Reject results may be split up into arbitrary many
1581 // adjacent fragments. Both ranges may have zero length.
1582 //
1583 // In practice the implementation of Searcher::next_match tends to
1584 // be more efficient, so we use it here and do some work to invert
1585 // matches into rejections since that's what we want to copy below.
1586 let mut front = 0;
1587 let rejections: Vec<_> = from_fn(|| {
1588 let (start, end) = searcher.next_match()?;
1589 let prev_front = front;
1590 front = end;
1591 Some((prev_front, start))
1592 })
1593 .collect();
1594 rejections.into_iter().chain(core::iter::once((front, self.len())))
1595 };
1596
1597 let mut len = 0;
1598 let ptr = self.vec.as_mut_ptr();
1599
1600 for (start, end) in rejections {
1601 let count = end - start;
1602 if start != len {
1603 // SAFETY: per Searcher::next:
1604 //
1605 // The stream of Match and Reject values up to a Done will
1606 // contain index ranges that are adjacent, non-overlapping,
1607 // covering the whole haystack, and laying on utf8
1608 // boundaries.
1609 unsafe {
1610 ptr::copy(ptr.add(start), ptr.add(len), count);
1611 }
1612 }
1613 len += count;
1614 }
1615
1616 unsafe {
1617 self.vec.set_len(len);
1618 }
1619 }
1620
1621 /// Retains only the characters specified by the predicate.
1622 ///
1623 /// In other words, remove all characters `c` such that `f(c)` returns `false`.
1624 /// This method operates in place, visiting each character exactly once in the
1625 /// original order, and preserves the order of the retained characters.
1626 ///
1627 /// # Examples
1628 ///
1629 /// ```
1630 /// let mut s = String::from("f_o_ob_ar");
1631 ///
1632 /// s.retain(|c| c != '_');
1633 ///
1634 /// assert_eq!(s, "foobar");
1635 /// ```
1636 ///
1637 /// Because the elements are visited exactly once in the original order,
1638 /// external state may be used to decide which elements to keep.
1639 ///
1640 /// ```
1641 /// let mut s = String::from("abcde");
1642 /// let keep = [false, true, true, false, true];
1643 /// let mut iter = keep.iter();
1644 /// s.retain(|_| *iter.next().unwrap());
1645 /// assert_eq!(s, "bce");
1646 /// ```
1647 #[inline]
1648 #[stable(feature = "string_retain", since = "1.26.0")]
1649 pub fn retain<F>(&mut self, mut f: F)
1650 where
1651 F: FnMut(char) -> bool,
1652 {
1653 struct SetLenOnDrop<'a> {
1654 s: &'a mut String,
1655 idx: usize,
1656 del_bytes: usize,
1657 }
1658
1659 impl<'a> Drop for SetLenOnDrop<'a> {
1660 fn drop(&mut self) {
1661 let new_len = self.idx - self.del_bytes;
1662 debug_assert!(new_len <= self.s.len());
1663 unsafe { self.s.vec.set_len(new_len) };
1664 }
1665 }
1666
1667 let len = self.len();
1668 let mut guard = SetLenOnDrop { s: self, idx: 0, del_bytes: 0 };
1669
1670 while guard.idx < len {
1671 let ch =
1672 // SAFETY: `guard.idx` is positive-or-zero and less that len so the `get_unchecked`
1673 // is in bound. `self` is valid UTF-8 like string and the returned slice starts at
1674 // a unicode code point so the `Chars` always return one character.
1675 unsafe { guard.s.get_unchecked(guard.idx..len).chars().next().unwrap_unchecked() };
1676 let ch_len = ch.len_utf8();
1677
1678 if !f(ch) {
1679 guard.del_bytes += ch_len;
1680 } else if guard.del_bytes > 0 {
1681 // SAFETY: `guard.idx` is in bound and `guard.del_bytes` represent the number of
1682 // bytes that are erased from the string so the resulting `guard.idx -
1683 // guard.del_bytes` always represent a valid unicode code point.
1684 //
1685 // `guard.del_bytes` >= `ch.len_utf8()`, so taking a slice with `ch.len_utf8()` len
1686 // is safe.
1687 ch.encode_utf8(unsafe {
1688 crate::slice::from_raw_parts_mut(
1689 guard.s.as_mut_ptr().add(guard.idx - guard.del_bytes),
1690 ch.len_utf8(),
1691 )
1692 });
1693 }
1694
1695 // Point idx to the next char
1696 guard.idx += ch_len;
1697 }
1698
1699 drop(guard);
1700 }
1701
1702 /// Inserts a character into this `String` at byte position `idx`.
1703 ///
1704 /// Reallocates if `self.capacity()` is insufficient, which may involve copying all
1705 /// `self.capacity()` bytes. Makes space for the insertion by copying all bytes of
1706 /// `&self[idx..]` to new positions.
1707 ///
1708 /// Note that calling this in a loop can result in quadratic behavior.
1709 ///
1710 /// # Panics
1711 ///
1712 /// Panics if `idx` is larger than the `String`'s length, or if it does not
1713 /// lie on a [`char`] boundary.
1714 ///
1715 /// # Examples
1716 ///
1717 /// ```
1718 /// let mut s = String::with_capacity(3);
1719 ///
1720 /// s.insert(0, 'f');
1721 /// s.insert(1, 'o');
1722 /// s.insert(2, 'o');
1723 ///
1724 /// assert_eq!("foo", s);
1725 /// ```
1726 #[cfg(not(no_global_oom_handling))]
1727 #[inline]
1728 #[track_caller]
1729 #[stable(feature = "rust1", since = "1.0.0")]
1730 #[rustc_confusables("set")]
1731 pub fn insert(&mut self, idx: usize, ch: char) {
1732 assert!(self.is_char_boundary(idx));
1733
1734 let len = self.len();
1735 let ch_len = ch.len_utf8();
1736 self.reserve(ch_len);
1737
1738 // SAFETY: Move the bytes starting from `idx` to their new location `ch_len`
1739 // bytes ahead. This is safe because sufficient capacity was reserved, and `idx`
1740 // is a char boundary.
1741 unsafe {
1742 ptr::copy(
1743 self.vec.as_ptr().add(idx),
1744 self.vec.as_mut_ptr().add(idx + ch_len),
1745 len - idx,
1746 );
1747 }
1748
1749 // SAFETY: Encode the character into the vacated region if `idx != len`,
1750 // or into the uninitialized spare capacity otherwise.
1751 unsafe {
1752 core::char::encode_utf8_raw_unchecked(ch as u32, self.vec.as_mut_ptr().add(idx));
1753 }
1754
1755 // SAFETY: Update the length to include the newly added bytes.
1756 unsafe {
1757 self.vec.set_len(len + ch_len);
1758 }
1759 }
1760
1761 /// Inserts a string slice into this `String` at byte position `idx`.
1762 ///
1763 /// Reallocates if `self.capacity()` is insufficient, which may involve copying all
1764 /// `self.capacity()` bytes. Makes space for the insertion by copying all bytes of
1765 /// `&self[idx..]` to new positions.
1766 ///
1767 /// Note that calling this in a loop can result in quadratic behavior.
1768 ///
1769 /// # Panics
1770 ///
1771 /// Panics if `idx` is larger than the `String`'s length, or if it does not
1772 /// lie on a [`char`] boundary.
1773 ///
1774 /// # Examples
1775 ///
1776 /// ```
1777 /// let mut s = String::from("bar");
1778 ///
1779 /// s.insert_str(0, "foo");
1780 ///
1781 /// assert_eq!("foobar", s);
1782 /// ```
1783 #[cfg(not(no_global_oom_handling))]
1784 #[inline]
1785 #[track_caller]
1786 #[stable(feature = "insert_str", since = "1.16.0")]
1787 #[rustc_diagnostic_item = "string_insert_str"]
1788 pub fn insert_str(&mut self, idx: usize, string: &str) {
1789 assert!(self.is_char_boundary(idx));
1790
1791 let len = self.len();
1792 let amt = string.len();
1793 self.reserve(amt);
1794
1795 // SAFETY: Move the bytes starting from `idx` to their new location `amt` bytes
1796 // ahead. This is safe because sufficient capacity was just reserved, and `idx`
1797 // is a char boundary.
1798 unsafe {
1799 ptr::copy(self.vec.as_ptr().add(idx), self.vec.as_mut_ptr().add(idx + amt), len - idx);
1800 }
1801
1802 // SAFETY: Copy the new string slice into the vacated region if `idx != len`,
1803 // or into the uninitialized spare capacity otherwise. The borrow checker
1804 // ensures that the source and destination do not overlap.
1805 unsafe {
1806 ptr::copy_nonoverlapping(string.as_ptr(), self.vec.as_mut_ptr().add(idx), amt);
1807 }
1808
1809 // SAFETY: Update the length to include the newly added bytes.
1810 unsafe {
1811 self.vec.set_len(len + amt);
1812 }
1813 }
1814
1815 /// Returns a mutable reference to the contents of this `String`.
1816 ///
1817 /// # Safety
1818 ///
1819 /// This function is unsafe because the returned `&mut Vec` allows writing
1820 /// bytes which are not valid UTF-8. If this constraint is violated, using
1821 /// the original `String` after dropping the `&mut Vec` may violate memory
1822 /// safety, as the rest of the standard library assumes that `String`s are
1823 /// valid UTF-8.
1824 ///
1825 /// # Examples
1826 ///
1827 /// ```
1828 /// let mut s = String::from("hello");
1829 ///
1830 /// unsafe {
1831 /// let vec = s.as_mut_vec();
1832 /// assert_eq!(&[104, 101, 108, 108, 111][..], &vec[..]);
1833 ///
1834 /// vec.reverse();
1835 /// }
1836 /// assert_eq!(s, "olleh");
1837 /// ```
1838 #[inline]
1839 #[stable(feature = "rust1", since = "1.0.0")]
1840 #[rustc_const_stable(feature = "const_vec_string_slice", since = "1.87.0")]
1841 pub const unsafe fn as_mut_vec(&mut self) -> &mut Vec<u8> {
1842 &mut self.vec
1843 }
1844
1845 /// Returns the length of this `String`, in bytes, not [`char`]s or
1846 /// graphemes. In other words, it might not be what a human considers the
1847 /// length of the string.
1848 ///
1849 /// # Examples
1850 ///
1851 /// ```
1852 /// let a = String::from("foo");
1853 /// assert_eq!(a.len(), 3);
1854 ///
1855 /// let fancy_f = String::from("ฦoo");
1856 /// assert_eq!(fancy_f.len(), 4);
1857 /// assert_eq!(fancy_f.chars().count(), 3);
1858 /// ```
1859 #[inline]
1860 #[must_use]
1861 #[stable(feature = "rust1", since = "1.0.0")]
1862 #[rustc_const_stable(feature = "const_vec_string_slice", since = "1.87.0")]
1863 #[rustc_confusables("length", "size")]
1864 #[rustc_no_implicit_autorefs]
1865 pub const fn len(&self) -> usize {
1866 self.vec.len()
1867 }
1868
1869 /// Returns `true` if this `String` has a length of zero, and `false` otherwise.
1870 ///
1871 /// # Examples
1872 ///
1873 /// ```
1874 /// let mut v = String::new();
1875 /// assert!(v.is_empty());
1876 ///
1877 /// v.push('a');
1878 /// assert!(!v.is_empty());
1879 /// ```
1880 #[inline]
1881 #[must_use]
1882 #[stable(feature = "rust1", since = "1.0.0")]
1883 #[rustc_const_stable(feature = "const_vec_string_slice", since = "1.87.0")]
1884 #[rustc_no_implicit_autorefs]
1885 pub const fn is_empty(&self) -> bool {
1886 self.len() == 0
1887 }
1888
1889 /// Splits the string into two at the given byte index.
1890 ///
1891 /// Returns a newly allocated `String`. `self` contains bytes `[0, at)`, and
1892 /// the returned `String` contains bytes `[at, len)`. `at` must be on the
1893 /// boundary of a UTF-8 code point.
1894 ///
1895 /// Note that the capacity of `self` does not change.
1896 ///
1897 /// # Panics
1898 ///
1899 /// Panics if `at` is not on a `UTF-8` code point boundary, or if it is beyond the last
1900 /// code point of the string.
1901 ///
1902 /// # Examples
1903 ///
1904 /// ```
1905 /// # fn main() {
1906 /// let mut hello = String::from("Hello, World!");
1907 /// let world = hello.split_off(7);
1908 /// assert_eq!(hello, "Hello, ");
1909 /// assert_eq!(world, "World!");
1910 /// # }
1911 /// ```
1912 #[cfg(not(no_global_oom_handling))]
1913 #[inline]
1914 #[track_caller]
1915 #[stable(feature = "string_split_off", since = "1.16.0")]
1916 #[must_use = "use `.truncate()` if you don't need the other half"]
1917 pub fn split_off(&mut self, at: usize) -> String {
1918 assert!(self.is_char_boundary(at));
1919 let other = self.vec.split_off(at);
1920 unsafe { String::from_utf8_unchecked(other) }
1921 }
1922
1923 /// Truncates this `String`, removing all contents.
1924 ///
1925 /// While this means the `String` will have a length of zero, it does not
1926 /// touch its capacity.
1927 ///
1928 /// # Examples
1929 ///
1930 /// ```
1931 /// let mut s = String::from("foo");
1932 ///
1933 /// s.clear();
1934 ///
1935 /// assert!(s.is_empty());
1936 /// assert_eq!(0, s.len());
1937 /// assert_eq!(3, s.capacity());
1938 /// ```
1939 #[inline]
1940 #[stable(feature = "rust1", since = "1.0.0")]
1941 pub fn clear(&mut self) {
1942 self.vec.clear()
1943 }
1944
1945 /// Removes the specified range from the string in bulk, returning all
1946 /// removed characters as an iterator.
1947 ///
1948 /// The returned iterator keeps a mutable borrow on the string to optimize
1949 /// its implementation.
1950 ///
1951 /// # Panics
1952 ///
1953 /// Panics if the range has `start_bound > end_bound`, or, if the range is
1954 /// bounded on either end and does not lie on a [`char`] boundary.
1955 ///
1956 /// # Leaking
1957 ///
1958 /// If the returned iterator goes out of scope without being dropped (due to
1959 /// [`core::mem::forget`], for example), the string may still contain a copy
1960 /// of any drained characters, or may have lost characters arbitrarily,
1961 /// including characters outside the range.
1962 ///
1963 /// # Examples
1964 ///
1965 /// ```
1966 /// let mut s = String::from("ฮฑ is alpha, ฮฒ is beta");
1967 /// let beta_offset = s.find('ฮฒ').unwrap_or(s.len());
1968 ///
1969 /// // Remove the range up until the ฮฒ from the string
1970 /// let t: String = s.drain(..beta_offset).collect();
1971 /// assert_eq!(t, "ฮฑ is alpha, ");
1972 /// assert_eq!(s, "ฮฒ is beta");
1973 ///
1974 /// // A full range clears the string, like `clear()` does
1975 /// s.drain(..);
1976 /// assert_eq!(s, "");
1977 /// ```
1978 #[stable(feature = "drain", since = "1.6.0")]
1979 #[track_caller]
1980 pub fn drain<R>(&mut self, range: R) -> Drain<'_>
1981 where
1982 R: RangeBounds<usize>,
1983 {
1984 // Memory safety
1985 //
1986 // The String version of Drain does not have the memory safety issues
1987 // of the vector version. The data is just plain bytes.
1988 // Because the range removal happens in Drop, if the Drain iterator is leaked,
1989 // the removal will not happen.
1990 let Range { start, end } = slice::range(range, ..self.len());
1991 assert!(self.is_char_boundary(start));
1992 assert!(self.is_char_boundary(end));
1993
1994 // Take out two simultaneous borrows. The &mut String won't be accessed
1995 // until iteration is over, in Drop.
1996 let self_ptr = self as *mut _;
1997 // SAFETY: `slice::range` and `is_char_boundary` do the appropriate bounds checks.
1998 let chars_iter = unsafe { self.get_unchecked(start..end) }.chars();
1999
2000 Drain { start, end, iter: chars_iter, string: self_ptr }
2001 }
2002
2003 /// Converts a `String` into an iterator over the [`char`]s of the string.
2004 ///
2005 /// As a string consists of valid UTF-8, we can iterate through a string
2006 /// by [`char`]. This method returns such an iterator.
2007 ///
2008 /// It's important to remember that [`char`] represents a Unicode Scalar
2009 /// Value, and might not match your idea of what a 'character' is. Iteration
2010 /// over grapheme clusters may be what you actually want. That functionality
2011 /// is not provided by Rust's standard library, check crates.io instead.
2012 ///
2013 /// # Examples
2014 ///
2015 /// Basic usage:
2016 ///
2017 /// ```
2018 /// #![feature(string_into_chars)]
2019 ///
2020 /// let word = String::from("goodbye");
2021 ///
2022 /// let mut chars = word.into_chars();
2023 ///
2024 /// assert_eq!(Some('g'), chars.next());
2025 /// assert_eq!(Some('o'), chars.next());
2026 /// assert_eq!(Some('o'), chars.next());
2027 /// assert_eq!(Some('d'), chars.next());
2028 /// assert_eq!(Some('b'), chars.next());
2029 /// assert_eq!(Some('y'), chars.next());
2030 /// assert_eq!(Some('e'), chars.next());
2031 ///
2032 /// assert_eq!(None, chars.next());
2033 /// ```
2034 ///
2035 /// Remember, [`char`]s might not match your intuition about characters:
2036 ///
2037 /// ```
2038 /// #![feature(string_into_chars)]
2039 ///
2040 /// let y = String::from("yฬ");
2041 ///
2042 /// let mut chars = y.into_chars();
2043 ///
2044 /// assert_eq!(Some('y'), chars.next()); // not 'yฬ'
2045 /// assert_eq!(Some('\u{0306}'), chars.next());
2046 ///
2047 /// assert_eq!(None, chars.next());
2048 /// ```
2049 ///
2050 /// [`char`]: prim@char
2051 #[inline]
2052 #[must_use = "`self` will be dropped if the result is not used"]
2053 #[unstable(feature = "string_into_chars", issue = "133125")]
2054 pub fn into_chars(self) -> IntoChars {
2055 IntoChars { bytes: self.into_bytes().into_iter() }
2056 }
2057
2058 /// Removes the specified range in the string,
2059 /// and replaces it with the given string.
2060 /// The given string doesn't need to be the same length as the range.
2061 ///
2062 /// # Panics
2063 ///
2064 /// Panics if the range has `start_bound > end_bound`, or, if the range is
2065 /// bounded on either end and does not lie on a [`char`] boundary.
2066 ///
2067 /// # Examples
2068 ///
2069 /// ```
2070 /// let mut s = String::from("ฮฑ is alpha, ฮฒ is beta");
2071 /// let beta_offset = s.find('ฮฒ').unwrap_or(s.len());
2072 ///
2073 /// // Replace the range up until the ฮฒ from the string
2074 /// s.replace_range(..beta_offset, "ฮ is capital alpha; ");
2075 /// assert_eq!(s, "ฮ is capital alpha; ฮฒ is beta");
2076 /// ```
2077 #[cfg(not(no_global_oom_handling))]
2078 #[stable(feature = "splice", since = "1.27.0")]
2079 #[track_caller]
2080 pub fn replace_range<R>(&mut self, range: R, replace_with: &str)
2081 where
2082 R: RangeBounds<usize>,
2083 {
2084 // We avoid #81138 (nondeterministic RangeBounds impls) because we only use `range` once, here.
2085 let checked_range = slice::range(range, ..self.len());
2086
2087 assert!(
2088 self.is_char_boundary(checked_range.start),
2089 "start of range should be a character boundary"
2090 );
2091 assert!(
2092 self.is_char_boundary(checked_range.end),
2093 "end of range should be a character boundary"
2094 );
2095
2096 unsafe { self.as_mut_vec() }.splice(checked_range, replace_with.bytes());
2097 }
2098
2099 /// Replaces the leftmost occurrence of a pattern with another string, in-place.
2100 ///
2101 /// This method can be preferred over [`string = string.replacen(..., 1);`][replacen],
2102 /// as it can use the `String`'s existing capacity to prevent a reallocation if
2103 /// sufficient space is available.
2104 ///
2105 /// # Examples
2106 ///
2107 /// Basic usage:
2108 ///
2109 /// ```
2110 /// #![feature(string_replace_in_place)]
2111 ///
2112 /// let mut s = String::from("Test Results: โโโ");
2113 ///
2114 /// // Replace the leftmost โ with a โ
2115 /// s.replace_first('โ', "โ
");
2116 /// assert_eq!(s, "Test Results: โ
โโ");
2117 /// ```
2118 ///
2119 /// [replacen]: ../../std/primitive.str.html#method.replacen
2120 #[cfg(not(no_global_oom_handling))]
2121 #[unstable(feature = "string_replace_in_place", issue = "147949")]
2122 pub fn replace_first<P: Pattern>(&mut self, from: P, to: &str) {
2123 let range = match self.match_indices(from).next() {
2124 Some((start, match_str)) => start..start + match_str.len(),
2125 None => return,
2126 };
2127
2128 self.replace_range(range, to);
2129 }
2130
2131 /// Replaces the rightmost occurrence of a pattern with another string, in-place.
2132 ///
2133 /// # Examples
2134 ///
2135 /// Basic usage:
2136 ///
2137 /// ```
2138 /// #![feature(string_replace_in_place)]
2139 ///
2140 /// let mut s = String::from("Test Results: โโโ");
2141 ///
2142 /// // Replace the rightmost โ with a โ
2143 /// s.replace_last('โ', "โ
");
2144 /// assert_eq!(s, "Test Results: โโโ
");
2145 /// ```
2146 #[cfg(not(no_global_oom_handling))]
2147 #[unstable(feature = "string_replace_in_place", issue = "147949")]
2148 pub fn replace_last<P: Pattern>(&mut self, from: P, to: &str)
2149 where
2150 for<'a> P::Searcher<'a>: core::str::pattern::ReverseSearcher<'a>,
2151 {
2152 let range = match self.rmatch_indices(from).next() {
2153 Some((start, match_str)) => start..start + match_str.len(),
2154 None => return,
2155 };
2156
2157 self.replace_range(range, to);
2158 }
2159
2160 /// Converts this `String` into a <code>[Box]<[str]></code>.
2161 ///
2162 /// Before doing the conversion, this method discards excess capacity like [`shrink_to_fit`].
2163 /// Note that this call may reallocate and copy the bytes of the string.
2164 ///
2165 /// [`shrink_to_fit`]: String::shrink_to_fit
2166 /// [str]: prim@str "str"
2167 ///
2168 /// # Examples
2169 ///
2170 /// ```
2171 /// let s = String::from("hello");
2172 ///
2173 /// let b = s.into_boxed_str();
2174 /// ```
2175 #[cfg(not(no_global_oom_handling))]
2176 #[stable(feature = "box_str", since = "1.4.0")]
2177 #[must_use = "`self` will be dropped if the result is not used"]
2178 #[inline]
2179 pub fn into_boxed_str(self) -> Box<str> {
2180 let slice = self.vec.into_boxed_slice();
2181 unsafe { from_boxed_utf8_unchecked(slice) }
2182 }
2183
2184 /// Consumes and leaks the `String`, returning a mutable reference to the contents,
2185 /// `&'a mut str`.
2186 ///
2187 /// The caller has free choice over the returned lifetime, including `'static`. Indeed,
2188 /// this function is ideally used for data that lives for the remainder of the program's life,
2189 /// as dropping the returned reference will cause a memory leak.
2190 ///
2191 /// It does not reallocate or shrink the `String`, so the leaked allocation may include unused
2192 /// capacity that is not part of the returned slice. If you want to discard excess capacity,
2193 /// call [`into_boxed_str`], and then [`Box::leak`] instead. However, keep in mind that
2194 /// trimming the capacity may result in a reallocation and copy.
2195 ///
2196 /// [`into_boxed_str`]: Self::into_boxed_str
2197 ///
2198 /// # Examples
2199 ///
2200 /// ```
2201 /// let x = String::from("bucket");
2202 /// let static_ref: &'static mut str = x.leak();
2203 /// assert_eq!(static_ref, "bucket");
2204 /// # // FIXME(https://github.com/rust-lang/miri/issues/3670):
2205 /// # // use -Zmiri-disable-leak-check instead of unleaking in tests meant to leak.
2206 /// # drop(unsafe { Box::from_raw(static_ref) });
2207 /// ```
2208 #[stable(feature = "string_leak", since = "1.72.0")]
2209 #[inline]
2210 pub fn leak<'a>(self) -> &'a mut str {
2211 let slice = self.vec.leak();
2212 unsafe { from_utf8_unchecked_mut(slice) }
2213 }
2214}
2215
2216impl FromUtf8Error {
2217 /// Returns a slice of [`u8`]s bytes that were attempted to convert to a `String`.
2218 ///
2219 /// # Examples
2220 ///
2221 /// ```
2222 /// // some invalid bytes, in a vector
2223 /// let bytes = vec![0, 159];
2224 ///
2225 /// let value = String::from_utf8(bytes);
2226 ///
2227 /// assert_eq!(&[0, 159], value.unwrap_err().as_bytes());
2228 /// ```
2229 #[must_use]
2230 #[stable(feature = "from_utf8_error_as_bytes", since = "1.26.0")]
2231 pub fn as_bytes(&self) -> &[u8] {
2232 &self.bytes[..]
2233 }
2234
2235 /// Converts the bytes into a `String` lossily, substituting invalid UTF-8
2236 /// sequences with replacement characters.
2237 ///
2238 /// See [`String::from_utf8_lossy`] for more details on replacement of
2239 /// invalid sequences, and [`String::from_utf8_lossy_owned`] for the
2240 /// `String` function which corresponds to this function.
2241 ///
2242 /// This is useful in conjunction with [`String::from_utf8`] when you need
2243 /// to branch on whether the bytes are valid UTF-8, but still want to
2244 /// recover a lossily converted `String` in the error case. Use
2245 /// [`String::from_utf8_lossy_owned`] if you always need a lossily converted
2246 /// `String`.
2247 ///
2248 /// Since the original [`String::from_utf8`] error records where validation
2249 /// stopped, this method does not need to re-check the already valid prefix
2250 /// of the byte sequence.
2251 ///
2252 /// # Examples
2253 ///
2254 /// ```
2255 /// #![feature(string_from_utf8_lossy_owned)]
2256 /// // some invalid bytes
2257 /// let input: Vec<u8> = b"Hello \xF0\x90\x80World".into();
2258 ///
2259 /// let (output, had_invalid_utf8) = match String::from_utf8(input) {
2260 /// Ok(output) => (output, false),
2261 /// Err(error) => {
2262 /// // The bytes were not valid UTF-8, but we can still recover a string.
2263 /// (error.into_utf8_lossy(), true)
2264 /// }
2265 /// };
2266 ///
2267 /// assert_eq!(String::from("Hello ๏ฟฝWorld"), output);
2268 /// assert!(had_invalid_utf8);
2269 /// ```
2270 #[must_use]
2271 #[cfg(not(no_global_oom_handling))]
2272 #[unstable(feature = "string_from_utf8_lossy_owned", issue = "129436")]
2273 pub fn into_utf8_lossy(self) -> String {
2274 const REPLACEMENT: &str = "\u{FFFD}";
2275
2276 let mut res = {
2277 let mut v = Vec::with_capacity(self.bytes.len());
2278
2279 // `Utf8Error::valid_up_to` returns the maximum index of validated
2280 // UTF-8 bytes. Copy the valid bytes into the output buffer.
2281 v.extend_from_slice(&self.bytes[..self.error.valid_up_to()]);
2282
2283 // SAFETY: This is safe because the only bytes present in the buffer
2284 // were validated as UTF-8 by the call to `String::from_utf8` which
2285 // produced this `FromUtf8Error`.
2286 unsafe { String::from_utf8_unchecked(v) }
2287 };
2288
2289 let iter = self.bytes[self.error.valid_up_to()..].utf8_chunks();
2290
2291 for chunk in iter {
2292 res.push_str(chunk.valid());
2293 if !chunk.invalid().is_empty() {
2294 res.push_str(REPLACEMENT);
2295 }
2296 }
2297
2298 res
2299 }
2300
2301 /// Returns the bytes that were attempted to convert to a `String`.
2302 ///
2303 /// This method is carefully constructed to avoid allocation. It will
2304 /// consume the error, moving out the bytes, so that a copy of the bytes
2305 /// does not need to be made.
2306 ///
2307 /// # Examples
2308 ///
2309 /// ```
2310 /// // some invalid bytes, in a vector
2311 /// let bytes = vec![0, 159];
2312 ///
2313 /// let value = String::from_utf8(bytes);
2314 ///
2315 /// assert_eq!(vec![0, 159], value.unwrap_err().into_bytes());
2316 /// ```
2317 #[must_use = "`self` will be dropped if the result is not used"]
2318 #[stable(feature = "rust1", since = "1.0.0")]
2319 pub fn into_bytes(self) -> Vec<u8> {
2320 self.bytes
2321 }
2322
2323 /// Fetch a `Utf8Error` to get more details about the conversion failure.
2324 ///
2325 /// The [`Utf8Error`] type provided by [`std::str`] represents an error that may
2326 /// occur when converting a slice of [`u8`]s to a [`&str`]. In this sense, it's
2327 /// an analogue to `FromUtf8Error`. See its documentation for more details
2328 /// on using it.
2329 ///
2330 /// [`std::str`]: core::str "std::str"
2331 /// [`&str`]: prim@str "&str"
2332 ///
2333 /// # Examples
2334 ///
2335 /// ```
2336 /// // some invalid bytes, in a vector
2337 /// let bytes = vec![0, 159];
2338 ///
2339 /// let error = String::from_utf8(bytes).unwrap_err().utf8_error();
2340 ///
2341 /// // the first byte is invalid here
2342 /// assert_eq!(1, error.valid_up_to());
2343 /// ```
2344 #[must_use]
2345 #[stable(feature = "rust1", since = "1.0.0")]
2346 pub fn utf8_error(&self) -> Utf8Error {
2347 self.error
2348 }
2349}
2350
2351#[stable(feature = "rust1", since = "1.0.0")]
2352impl fmt::Display for FromUtf8Error {
2353 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
2354 fmt::Display::fmt(&self.error, f)
2355 }
2356}
2357
2358#[stable(feature = "rust1", since = "1.0.0")]
2359impl fmt::Display for FromUtf16Error {
2360 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
2361 match self.kind {
2362 FromUtf16ErrorKind::LoneSurrogate => "invalid utf-16: lone surrogate found",
2363 FromUtf16ErrorKind::OddBytes => "invalid utf-16: odd number of bytes",
2364 }
2365 .fmt(f)
2366 }
2367}
2368
2369#[stable(feature = "rust1", since = "1.0.0")]
2370impl Error for FromUtf8Error {}
2371
2372#[stable(feature = "rust1", since = "1.0.0")]
2373impl Error for FromUtf16Error {}
2374
2375#[cfg(not(no_global_oom_handling))]
2376#[stable(feature = "rust1", since = "1.0.0")]
2377impl Clone for String {
2378 fn clone(&self) -> Self {
2379 String { vec: self.vec.clone() }
2380 }
2381
2382 /// Clones the contents of `source` into `self`.
2383 ///
2384 /// This method is preferred over simply assigning `source.clone()` to `self`,
2385 /// as it avoids reallocation if possible.
2386 fn clone_from(&mut self, source: &Self) {
2387 self.vec.clone_from(&source.vec);
2388 }
2389}
2390
2391#[cfg(not(no_global_oom_handling))]
2392#[stable(feature = "rust1", since = "1.0.0")]
2393impl FromIterator<char> for String {
2394 fn from_iter<I: IntoIterator<Item = char>>(iter: I) -> String {
2395 let mut buf = String::new();
2396 buf.extend(iter);
2397 buf
2398 }
2399}
2400
2401#[cfg(not(no_global_oom_handling))]
2402#[stable(feature = "string_from_iter_by_ref", since = "1.17.0")]
2403impl<'a> FromIterator<&'a char> for String {
2404 fn from_iter<I: IntoIterator<Item = &'a char>>(iter: I) -> String {
2405 let mut buf = String::new();
2406 buf.extend(iter);
2407 buf
2408 }
2409}
2410
2411#[cfg(not(no_global_oom_handling))]
2412#[stable(feature = "rust1", since = "1.0.0")]
2413impl<'a> FromIterator<&'a str> for String {
2414 fn from_iter<I: IntoIterator<Item = &'a str>>(iter: I) -> String {
2415 let mut buf = String::new();
2416 buf.extend(iter);
2417 buf
2418 }
2419}
2420
2421#[cfg(not(no_global_oom_handling))]
2422#[stable(feature = "extend_string", since = "1.4.0")]
2423impl FromIterator<String> for String {
2424 fn from_iter<I: IntoIterator<Item = String>>(iter: I) -> String {
2425 let mut iterator = iter.into_iter();
2426
2427 // Because we're iterating over `String`s, we can avoid at least
2428 // one allocation by getting the first string from the iterator
2429 // and appending to it all the subsequent strings.
2430 match iterator.next() {
2431 None => String::new(),
2432 Some(mut buf) => {
2433 buf.extend(iterator);
2434 buf
2435 }
2436 }
2437 }
2438}
2439
2440#[cfg(not(no_global_oom_handling))]
2441#[stable(feature = "box_str2", since = "1.45.0")]
2442impl<A: Allocator> FromIterator<Box<str, A>> for String {
2443 fn from_iter<I: IntoIterator<Item = Box<str, A>>>(iter: I) -> String {
2444 let mut buf = String::new();
2445 buf.extend(iter);
2446 buf
2447 }
2448}
2449
2450#[cfg(not(no_global_oom_handling))]
2451#[stable(feature = "herd_cows", since = "1.19.0")]
2452impl<'a> FromIterator<Cow<'a, str>> for String {
2453 fn from_iter<I: IntoIterator<Item = Cow<'a, str>>>(iter: I) -> String {
2454 let mut iterator = iter.into_iter();
2455
2456 // Because we're iterating over CoWs, we can (potentially) avoid at least
2457 // one allocation by getting the first item and appending to it all the
2458 // subsequent items.
2459 match iterator.next() {
2460 None => String::new(),
2461 Some(cow) => {
2462 let mut buf = cow.into_owned();
2463 buf.extend(iterator);
2464 buf
2465 }
2466 }
2467 }
2468}
2469
2470#[cfg(not(no_global_oom_handling))]
2471#[unstable(feature = "ascii_char", issue = "110998")]
2472impl FromIterator<core::ascii::Char> for String {
2473 fn from_iter<T: IntoIterator<Item = core::ascii::Char>>(iter: T) -> Self {
2474 let buf = iter.into_iter().map(core::ascii::Char::to_u8).collect();
2475 // SAFETY: `buf` is guaranteed to be valid UTF-8 because the `core::ascii::Char` type
2476 // only contains ASCII values (0x00-0x7F), which are valid UTF-8.
2477 unsafe { String::from_utf8_unchecked(buf) }
2478 }
2479}
2480
2481#[cfg(not(no_global_oom_handling))]
2482#[unstable(feature = "ascii_char", issue = "110998")]
2483impl<'a> FromIterator<&'a core::ascii::Char> for String {
2484 fn from_iter<T: IntoIterator<Item = &'a core::ascii::Char>>(iter: T) -> Self {
2485 let buf = iter.into_iter().copied().map(core::ascii::Char::to_u8).collect();
2486 // SAFETY: `buf` is guaranteed to be valid UTF-8 because the `core::ascii::Char` type
2487 // only contains ASCII values (0x00-0x7F), which are valid UTF-8.
2488 unsafe { String::from_utf8_unchecked(buf) }
2489 }
2490}
2491
2492#[cfg(not(no_global_oom_handling))]
2493#[stable(feature = "rust1", since = "1.0.0")]
2494impl Extend<char> for String {
2495 fn extend<I: IntoIterator<Item = char>>(&mut self, iter: I) {
2496 let iterator = iter.into_iter();
2497 let (lower_bound, _) = iterator.size_hint();
2498 self.reserve(lower_bound);
2499 iterator.for_each(move |c| self.push(c));
2500 }
2501
2502 #[inline]
2503 fn extend_one(&mut self, c: char) {
2504 self.push(c);
2505 }
2506
2507 #[inline]
2508 fn extend_reserve(&mut self, additional: usize) {
2509 self.reserve(additional);
2510 }
2511}
2512
2513#[cfg(not(no_global_oom_handling))]
2514#[stable(feature = "extend_ref", since = "1.2.0")]
2515impl<'a> Extend<&'a char> for String {
2516 fn extend<I: IntoIterator<Item = &'a char>>(&mut self, iter: I) {
2517 self.extend(iter.into_iter().cloned());
2518 }
2519
2520 #[inline]
2521 fn extend_one(&mut self, &c: &'a char) {
2522 self.push(c);
2523 }
2524
2525 #[inline]
2526 fn extend_reserve(&mut self, additional: usize) {
2527 self.reserve(additional);
2528 }
2529}
2530
2531#[cfg(not(no_global_oom_handling))]
2532#[stable(feature = "rust1", since = "1.0.0")]
2533impl<'a> Extend<&'a str> for String {
2534 fn extend<I: IntoIterator<Item = &'a str>>(&mut self, iter: I) {
2535 <I as SpecExtendStr>::spec_extend_into(iter, self)
2536 }
2537
2538 #[inline]
2539 fn extend_one(&mut self, s: &'a str) {
2540 self.push_str(s);
2541 }
2542}
2543
2544#[cfg(not(no_global_oom_handling))]
2545trait SpecExtendStr {
2546 fn spec_extend_into(self, s: &mut String);
2547}
2548
2549#[cfg(not(no_global_oom_handling))]
2550impl<'a, T: IntoIterator<Item = &'a str>> SpecExtendStr for T {
2551 default fn spec_extend_into(self, target: &mut String) {
2552 self.into_iter().for_each(move |s| target.push_str(s));
2553 }
2554}
2555
2556#[cfg(not(no_global_oom_handling))]
2557impl SpecExtendStr for [&str] {
2558 fn spec_extend_into(self, target: &mut String) {
2559 target.push_str_slice(&self);
2560 }
2561}
2562
2563#[cfg(not(no_global_oom_handling))]
2564impl<const N: usize> SpecExtendStr for [&str; N] {
2565 fn spec_extend_into(self, target: &mut String) {
2566 target.push_str_slice(&self[..]);
2567 }
2568}
2569
2570#[cfg(not(no_global_oom_handling))]
2571#[stable(feature = "box_str2", since = "1.45.0")]
2572impl<A: Allocator> Extend<Box<str, A>> for String {
2573 fn extend<I: IntoIterator<Item = Box<str, A>>>(&mut self, iter: I) {
2574 iter.into_iter().for_each(move |s| self.push_str(&s));
2575 }
2576}
2577
2578#[cfg(not(no_global_oom_handling))]
2579#[stable(feature = "extend_string", since = "1.4.0")]
2580impl Extend<String> for String {
2581 fn extend<I: IntoIterator<Item = String>>(&mut self, iter: I) {
2582 iter.into_iter().for_each(move |s| self.push_str(&s));
2583 }
2584
2585 #[inline]
2586 fn extend_one(&mut self, s: String) {
2587 self.push_str(&s);
2588 }
2589}
2590
2591#[cfg(not(no_global_oom_handling))]
2592#[stable(feature = "herd_cows", since = "1.19.0")]
2593impl<'a> Extend<Cow<'a, str>> for String {
2594 fn extend<I: IntoIterator<Item = Cow<'a, str>>>(&mut self, iter: I) {
2595 iter.into_iter().for_each(move |s| self.push_str(&s));
2596 }
2597
2598 #[inline]
2599 fn extend_one(&mut self, s: Cow<'a, str>) {
2600 self.push_str(&s);
2601 }
2602}
2603
2604#[cfg(not(no_global_oom_handling))]
2605#[unstable(feature = "ascii_char", issue = "110998")]
2606impl Extend<core::ascii::Char> for String {
2607 #[inline]
2608 fn extend<I: IntoIterator<Item = core::ascii::Char>>(&mut self, iter: I) {
2609 self.vec.extend(iter.into_iter().map(|c| c.to_u8()));
2610 }
2611
2612 #[inline]
2613 fn extend_one(&mut self, c: core::ascii::Char) {
2614 self.vec.push(c.to_u8());
2615 }
2616}
2617
2618#[cfg(not(no_global_oom_handling))]
2619#[unstable(feature = "ascii_char", issue = "110998")]
2620impl<'a> Extend<&'a core::ascii::Char> for String {
2621 #[inline]
2622 fn extend<I: IntoIterator<Item = &'a core::ascii::Char>>(&mut self, iter: I) {
2623 self.extend(iter.into_iter().cloned());
2624 }
2625
2626 #[inline]
2627 fn extend_one(&mut self, c: &'a core::ascii::Char) {
2628 self.vec.push(c.to_u8());
2629 }
2630}
2631
2632/// A convenience impl that delegates to the impl for `&str`.
2633///
2634/// # Examples
2635///
2636/// ```
2637/// assert_eq!(String::from("Hello world").find("world"), Some(6));
2638/// ```
2639#[unstable(
2640 feature = "pattern",
2641 reason = "API not fully fleshed out and ready to be stabilized",
2642 issue = "27721"
2643)]
2644impl<'b> Pattern for &'b String {
2645 type Searcher<'a> = <&'b str as Pattern>::Searcher<'a>;
2646
2647 fn into_searcher(self, haystack: &str) -> <&'b str as Pattern>::Searcher<'_> {
2648 self[..].into_searcher(haystack)
2649 }
2650
2651 #[inline]
2652 fn is_contained_in(self, haystack: &str) -> bool {
2653 self[..].is_contained_in(haystack)
2654 }
2655
2656 #[inline]
2657 fn is_prefix_of(self, haystack: &str) -> bool {
2658 self[..].is_prefix_of(haystack)
2659 }
2660
2661 #[inline]
2662 fn strip_prefix_of(self, haystack: &str) -> Option<&str> {
2663 self[..].strip_prefix_of(haystack)
2664 }
2665
2666 #[inline]
2667 fn is_suffix_of<'a>(self, haystack: &'a str) -> bool
2668 where
2669 Self::Searcher<'a>: core::str::pattern::ReverseSearcher<'a>,
2670 {
2671 self[..].is_suffix_of(haystack)
2672 }
2673
2674 #[inline]
2675 fn strip_suffix_of<'a>(self, haystack: &'a str) -> Option<&'a str>
2676 where
2677 Self::Searcher<'a>: core::str::pattern::ReverseSearcher<'a>,
2678 {
2679 self[..].strip_suffix_of(haystack)
2680 }
2681
2682 #[inline]
2683 fn as_utf8_pattern(&self) -> Option<Utf8Pattern<'_>> {
2684 Some(Utf8Pattern::StringPattern(self.as_str()))
2685 }
2686}
2687
2688macro_rules! impl_eq {
2689 ($lhs:ty, $rhs: ty) => {
2690 #[stable(feature = "rust1", since = "1.0.0")]
2691 impl PartialEq<$rhs> for $lhs {
2692 #[inline]
2693 fn eq(&self, other: &$rhs) -> bool {
2694 PartialEq::eq(&self[..], &other[..])
2695 }
2696 #[inline]
2697 fn ne(&self, other: &$rhs) -> bool {
2698 PartialEq::ne(&self[..], &other[..])
2699 }
2700 }
2701
2702 #[stable(feature = "rust1", since = "1.0.0")]
2703 impl PartialEq<$lhs> for $rhs {
2704 #[inline]
2705 fn eq(&self, other: &$lhs) -> bool {
2706 PartialEq::eq(&self[..], &other[..])
2707 }
2708 #[inline]
2709 fn ne(&self, other: &$lhs) -> bool {
2710 PartialEq::ne(&self[..], &other[..])
2711 }
2712 }
2713 };
2714}
2715
2716impl_eq! { String, str }
2717impl_eq! { String, &str }
2718#[cfg(not(no_global_oom_handling))]
2719impl_eq! { Cow<'_, str>, str }
2720#[cfg(not(no_global_oom_handling))]
2721impl_eq! { Cow<'_, str>, &'_ str }
2722#[cfg(not(no_global_oom_handling))]
2723impl_eq! { Cow<'_, str>, String }
2724
2725#[stable(feature = "rust1", since = "1.0.0")]
2726#[rustc_const_unstable(feature = "const_default", issue = "143894")]
2727const impl Default for String {
2728 /// Creates an empty `String`.
2729 #[inline]
2730 fn default() -> String {
2731 String::new()
2732 }
2733}
2734
2735#[stable(feature = "rust1", since = "1.0.0")]
2736impl fmt::Display for String {
2737 #[inline]
2738 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
2739 fmt::Display::fmt(&**self, f)
2740 }
2741}
2742
2743#[stable(feature = "rust1", since = "1.0.0")]
2744impl fmt::Debug for String {
2745 #[inline]
2746 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
2747 fmt::Debug::fmt(&**self, f)
2748 }
2749}
2750
2751#[stable(feature = "rust1", since = "1.0.0")]
2752impl hash::Hash for String {
2753 #[inline]
2754 fn hash<H: hash::Hasher>(&self, hasher: &mut H) {
2755 (**self).hash(hasher)
2756 }
2757}
2758
2759/// Implements the `+` operator for concatenating two strings.
2760///
2761/// This consumes the `String` on the left-hand side and re-uses its buffer (growing it if
2762/// necessary). This is done to avoid allocating a new `String` and copying the entire contents on
2763/// every operation, which would lead to *O*(*n*^2) running time when building an *n*-byte string by
2764/// repeated concatenation.
2765///
2766/// The string on the right-hand side is only borrowed; its contents are copied into the returned
2767/// `String`.
2768///
2769/// # Examples
2770///
2771/// Concatenating two `String`s takes the first by value and borrows the second:
2772///
2773/// ```
2774/// let a = String::from("hello");
2775/// let b = String::from(" world");
2776/// let c = a + &b;
2777/// // `a` is moved and can no longer be used here.
2778/// ```
2779///
2780/// If you want to keep using the first `String`, you can clone it and append to the clone instead:
2781///
2782/// ```
2783/// let a = String::from("hello");
2784/// let b = String::from(" world");
2785/// let c = a.clone() + &b;
2786/// // `a` is still valid here.
2787/// ```
2788///
2789/// Concatenating `&str` slices can be done by converting the first to a `String`:
2790///
2791/// ```
2792/// let a = "hello";
2793/// let b = " world";
2794/// let c = a.to_string() + b;
2795/// ```
2796#[cfg(not(no_global_oom_handling))]
2797#[stable(feature = "rust1", since = "1.0.0")]
2798impl Add<&str> for String {
2799 type Output = String;
2800
2801 #[inline]
2802 fn add(mut self, other: &str) -> String {
2803 self.push_str(other);
2804 self
2805 }
2806}
2807
2808/// Implements the `+=` operator for appending to a `String`.
2809///
2810/// This has the same behavior as the [`push_str`][String::push_str] method.
2811#[cfg(not(no_global_oom_handling))]
2812#[stable(feature = "stringaddassign", since = "1.12.0")]
2813impl AddAssign<&str> for String {
2814 #[inline]
2815 fn add_assign(&mut self, other: &str) {
2816 self.push_str(other);
2817 }
2818}
2819
2820#[stable(feature = "rust1", since = "1.0.0")]
2821impl<I> ops::Index<I> for String
2822where
2823 I: slice::SliceIndex<str>,
2824{
2825 type Output = I::Output;
2826
2827 #[inline]
2828 fn index(&self, index: I) -> &I::Output {
2829 index.index(self.as_str())
2830 }
2831}
2832
2833#[stable(feature = "rust1", since = "1.0.0")]
2834impl<I> ops::IndexMut<I> for String
2835where
2836 I: slice::SliceIndex<str>,
2837{
2838 #[inline]
2839 fn index_mut(&mut self, index: I) -> &mut I::Output {
2840 index.index_mut(self.as_mut_str())
2841 }
2842}
2843
2844#[stable(feature = "rust1", since = "1.0.0")]
2845impl ops::Deref for String {
2846 type Target = str;
2847
2848 #[inline]
2849 fn deref(&self) -> &str {
2850 self.as_str()
2851 }
2852}
2853
2854#[unstable(feature = "deref_pure_trait", issue = "87121")]
2855unsafe impl ops::DerefPure for String {}
2856
2857#[stable(feature = "derefmut_for_string", since = "1.3.0")]
2858impl ops::DerefMut for String {
2859 #[inline]
2860 fn deref_mut(&mut self) -> &mut str {
2861 self.as_mut_str()
2862 }
2863}
2864
2865/// A type alias for [`Infallible`].
2866///
2867/// This alias exists for backwards compatibility, and may be eventually deprecated.
2868///
2869/// [`Infallible`]: core::convert::Infallible "convert::Infallible"
2870#[stable(feature = "str_parse_error", since = "1.5.0")]
2871pub type ParseError = core::convert::Infallible;
2872
2873#[cfg(not(no_global_oom_handling))]
2874#[stable(feature = "rust1", since = "1.0.0")]
2875impl FromStr for String {
2876 type Err = core::convert::Infallible;
2877 #[inline]
2878 fn from_str(s: &str) -> Result<String, Self::Err> {
2879 Ok(String::from(s))
2880 }
2881}
2882
2883/// A trait for converting a value to a `String`.
2884///
2885/// This trait is automatically implemented for any type which implements the
2886/// [`Display`] trait. As such, `ToString` shouldn't be implemented directly:
2887/// [`Display`] should be implemented instead, and you get the `ToString`
2888/// implementation for free.
2889///
2890/// [`Display`]: fmt::Display
2891#[rustc_diagnostic_item = "ToString"]
2892#[stable(feature = "rust1", since = "1.0.0")]
2893pub trait ToString {
2894 /// Converts the given value to a `String`.
2895 ///
2896 /// # Examples
2897 ///
2898 /// ```
2899 /// let i = 5;
2900 /// let five = String::from("5");
2901 ///
2902 /// assert_eq!(five, i.to_string());
2903 /// ```
2904 #[rustc_conversion_suggestion]
2905 #[stable(feature = "rust1", since = "1.0.0")]
2906 #[rustc_diagnostic_item = "to_string_method"]
2907 fn to_string(&self) -> String;
2908}
2909
2910/// # Panics
2911///
2912/// In this implementation, the `to_string` method panics
2913/// if the `Display` implementation returns an error.
2914/// This indicates an incorrect `Display` implementation
2915/// since `fmt::Write for String` never returns an error itself.
2916#[cfg(not(no_global_oom_handling))]
2917#[stable(feature = "rust1", since = "1.0.0")]
2918impl<T: fmt::Display + ?Sized> ToString for T {
2919 #[inline]
2920 fn to_string(&self) -> String {
2921 <Self as SpecToString>::spec_to_string(self)
2922 }
2923}
2924
2925#[cfg(not(no_global_oom_handling))]
2926trait SpecToString {
2927 fn spec_to_string(&self) -> String;
2928}
2929
2930#[cfg(not(no_global_oom_handling))]
2931impl<T: fmt::Display + ?Sized> SpecToString for T {
2932 // A common guideline is to not inline generic functions. However,
2933 // removing `#[inline]` from this method causes non-negligible regressions.
2934 // See <https://github.com/rust-lang/rust/pull/74852>, the last attempt
2935 // to try to remove it.
2936 #[inline]
2937 default fn spec_to_string(&self) -> String {
2938 let mut buf = String::new();
2939 let mut formatter =
2940 core::fmt::Formatter::new(&mut buf, core::fmt::FormattingOptions::new());
2941 // Bypass format_args!() to avoid write_str with zero-length strs
2942 fmt::Display::fmt(self, &mut formatter)
2943 .expect("a Display implementation returned an error unexpectedly");
2944 buf
2945 }
2946}
2947
2948#[cfg(not(no_global_oom_handling))]
2949impl SpecToString for core::ascii::Char {
2950 #[inline]
2951 fn spec_to_string(&self) -> String {
2952 self.as_str().to_owned()
2953 }
2954}
2955
2956#[cfg(not(no_global_oom_handling))]
2957impl SpecToString for char {
2958 #[inline]
2959 fn spec_to_string(&self) -> String {
2960 String::from(self.encode_utf8(&mut [0; char::MAX_LEN_UTF8]))
2961 }
2962}
2963
2964#[cfg(not(no_global_oom_handling))]
2965impl SpecToString for bool {
2966 #[inline]
2967 fn spec_to_string(&self) -> String {
2968 String::from(if *self { "true" } else { "false" })
2969 }
2970}
2971
2972macro_rules! impl_to_string {
2973 ($($signed:ident, $unsigned:ident,)*) => {
2974 $(
2975 #[cfg(not(no_global_oom_handling))]
2976 #[cfg(not(feature = "optimize_for_size"))]
2977 impl SpecToString for $signed {
2978 #[inline]
2979 fn spec_to_string(&self) -> String {
2980 const SIZE: usize = $signed::MAX.ilog10() as usize + 1;
2981 let mut buf = [core::mem::MaybeUninit::<u8>::uninit(); SIZE];
2982 // Only difference between signed and unsigned are these 8 lines.
2983 let mut out;
2984 if *self < 0 {
2985 out = String::with_capacity(SIZE + 1);
2986 out.push('-');
2987 } else {
2988 out = String::with_capacity(SIZE);
2989 }
2990
2991 // SAFETY: `buf` is always big enough to contain all the digits.
2992 unsafe { out.push_str(self.unsigned_abs()._fmt(&mut buf)); }
2993 out
2994 }
2995 }
2996 #[cfg(not(no_global_oom_handling))]
2997 #[cfg(not(feature = "optimize_for_size"))]
2998 impl SpecToString for $unsigned {
2999 #[inline]
3000 fn spec_to_string(&self) -> String {
3001 const SIZE: usize = $unsigned::MAX.ilog10() as usize + 1;
3002 let mut buf = [core::mem::MaybeUninit::<u8>::uninit(); SIZE];
3003
3004 // SAFETY: `buf` is always big enough to contain all the digits.
3005 unsafe { self._fmt(&mut buf).to_string() }
3006 }
3007 }
3008 )*
3009 }
3010}
3011
3012impl_to_string! {
3013 i8, u8,
3014 i16, u16,
3015 i32, u32,
3016 i64, u64,
3017 isize, usize,
3018 i128, u128,
3019}
3020
3021#[cfg(not(no_global_oom_handling))]
3022#[cfg(feature = "optimize_for_size")]
3023impl SpecToString for u8 {
3024 #[inline]
3025 fn spec_to_string(&self) -> String {
3026 let mut buf = String::with_capacity(3);
3027 let mut n = *self;
3028 if n >= 10 {
3029 if n >= 100 {
3030 buf.push((b'0' + n / 100) as char);
3031 n %= 100;
3032 }
3033 buf.push((b'0' + n / 10) as char);
3034 n %= 10;
3035 }
3036 buf.push((b'0' + n) as char);
3037 buf
3038 }
3039}
3040
3041#[cfg(not(no_global_oom_handling))]
3042#[cfg(feature = "optimize_for_size")]
3043impl SpecToString for i8 {
3044 #[inline]
3045 fn spec_to_string(&self) -> String {
3046 let mut buf = String::with_capacity(4);
3047 if self.is_negative() {
3048 buf.push('-');
3049 }
3050 let mut n = self.unsigned_abs();
3051 if n >= 10 {
3052 if n >= 100 {
3053 buf.push('1');
3054 n -= 100;
3055 }
3056 buf.push((b'0' + n / 10) as char);
3057 n %= 10;
3058 }
3059 buf.push((b'0' + n) as char);
3060 buf
3061 }
3062}
3063
3064#[cfg(not(no_global_oom_handling))]
3065macro_rules! to_string_str {
3066 {$($type:ty,)*} => {
3067 $(
3068 impl SpecToString for $type {
3069 #[inline]
3070 fn spec_to_string(&self) -> String {
3071 let s: &str = self;
3072 String::from(s)
3073 }
3074 }
3075 )*
3076 };
3077}
3078
3079#[cfg(not(no_global_oom_handling))]
3080to_string_str! {
3081 Cow<'_, str>,
3082 String,
3083 // Generic/generated code can sometimes have multiple, nested references
3084 // for strings, including `&&&str`s that would never be written
3085 // by hand.
3086 &&&&&&&&&&&&str,
3087 &&&&&&&&&&&str,
3088 &&&&&&&&&&str,
3089 &&&&&&&&&str,
3090 &&&&&&&&str,
3091 &&&&&&&str,
3092 &&&&&&str,
3093 &&&&&str,
3094 &&&&str,
3095 &&&str,
3096 &&str,
3097 &str,
3098 str,
3099}
3100
3101#[cfg(not(no_global_oom_handling))]
3102impl SpecToString for fmt::Arguments<'_> {
3103 #[inline]
3104 fn spec_to_string(&self) -> String {
3105 crate::fmt::format(*self)
3106 }
3107}
3108
3109#[stable(feature = "rust1", since = "1.0.0")]
3110impl AsRef<str> for String {
3111 #[inline]
3112 fn as_ref(&self) -> &str {
3113 self
3114 }
3115}
3116
3117#[stable(feature = "string_as_mut", since = "1.43.0")]
3118impl AsMut<str> for String {
3119 #[inline]
3120 fn as_mut(&mut self) -> &mut str {
3121 self
3122 }
3123}
3124
3125#[stable(feature = "rust1", since = "1.0.0")]
3126impl AsRef<[u8]> for String {
3127 #[inline]
3128 fn as_ref(&self) -> &[u8] {
3129 self.as_bytes()
3130 }
3131}
3132
3133#[cfg(not(no_global_oom_handling))]
3134#[stable(feature = "rust1", since = "1.0.0")]
3135impl From<&str> for String {
3136 /// Converts a `&str` into a [`String`].
3137 ///
3138 /// The result is allocated on the heap.
3139 #[inline]
3140 fn from(s: &str) -> String {
3141 s.to_owned()
3142 }
3143}
3144
3145#[cfg(not(no_global_oom_handling))]
3146#[stable(feature = "from_mut_str_for_string", since = "1.44.0")]
3147impl From<&mut str> for String {
3148 /// Converts a `&mut str` into a [`String`].
3149 ///
3150 /// The result is allocated on the heap.
3151 #[inline]
3152 fn from(s: &mut str) -> String {
3153 s.to_owned()
3154 }
3155}
3156
3157#[cfg(not(no_global_oom_handling))]
3158#[stable(feature = "from_ref_string", since = "1.35.0")]
3159impl From<&String> for String {
3160 /// Converts a `&String` into a [`String`].
3161 ///
3162 /// This clones `s` and returns the clone.
3163 #[inline]
3164 fn from(s: &String) -> String {
3165 s.clone()
3166 }
3167}
3168
3169// note: test pulls in std, which causes errors here
3170#[stable(feature = "string_from_box", since = "1.18.0")]
3171impl From<Box<str>> for String {
3172 /// Converts the given boxed `str` slice to a [`String`].
3173 /// It is notable that the `str` slice is owned.
3174 ///
3175 /// # Examples
3176 ///
3177 /// ```
3178 /// let s1: String = String::from("hello world");
3179 /// let s2: Box<str> = s1.into_boxed_str();
3180 /// let s3: String = String::from(s2);
3181 ///
3182 /// assert_eq!("hello world", s3)
3183 /// ```
3184 fn from(s: Box<str>) -> String {
3185 s.into_string()
3186 }
3187}
3188
3189#[cfg(not(no_global_oom_handling))]
3190#[stable(feature = "box_from_str", since = "1.20.0")]
3191impl From<String> for Box<str> {
3192 /// Converts the given [`String`] to a boxed `str` slice that is owned.
3193 ///
3194 /// # Examples
3195 ///
3196 /// ```
3197 /// let s1: String = String::from("hello world");
3198 /// let s2: Box<str> = Box::from(s1);
3199 /// let s3: String = String::from(s2);
3200 ///
3201 /// assert_eq!("hello world", s3)
3202 /// ```
3203 fn from(s: String) -> Box<str> {
3204 s.into_boxed_str()
3205 }
3206}
3207
3208#[cfg(not(no_global_oom_handling))]
3209#[stable(feature = "string_from_cow_str", since = "1.14.0")]
3210impl<'a> From<Cow<'a, str>> for String {
3211 /// Converts a clone-on-write string to an owned
3212 /// instance of [`String`].
3213 ///
3214 /// This extracts the owned string,
3215 /// clones the string if it is not already owned.
3216 ///
3217 /// # Example
3218 ///
3219 /// ```
3220 /// # use std::borrow::Cow;
3221 /// // If the string is not owned...
3222 /// let cow: Cow<'_, str> = Cow::Borrowed("eggplant");
3223 /// // It will allocate on the heap and copy the string.
3224 /// let owned: String = String::from(cow);
3225 /// assert_eq!(&owned[..], "eggplant");
3226 /// ```
3227 fn from(s: Cow<'a, str>) -> String {
3228 s.into_owned()
3229 }
3230}
3231
3232#[cfg(not(no_global_oom_handling))]
3233#[stable(feature = "rust1", since = "1.0.0")]
3234impl<'a> From<&'a str> for Cow<'a, str> {
3235 /// Converts a string slice into a [`Borrowed`] variant.
3236 /// No heap allocation is performed, and the string
3237 /// is not copied.
3238 ///
3239 /// # Example
3240 ///
3241 /// ```
3242 /// # use std::borrow::Cow;
3243 /// assert_eq!(Cow::from("eggplant"), Cow::Borrowed("eggplant"));
3244 /// ```
3245 ///
3246 /// [`Borrowed`]: crate::borrow::Cow::Borrowed "borrow::Cow::Borrowed"
3247 #[inline]
3248 fn from(s: &'a str) -> Cow<'a, str> {
3249 Cow::Borrowed(s)
3250 }
3251}
3252
3253#[cfg(not(no_global_oom_handling))]
3254#[stable(feature = "rust1", since = "1.0.0")]
3255impl<'a> From<String> for Cow<'a, str> {
3256 /// Converts a [`String`] into an [`Owned`] variant.
3257 /// No heap allocation is performed, and the string
3258 /// is not copied.
3259 ///
3260 /// # Example
3261 ///
3262 /// ```
3263 /// # use std::borrow::Cow;
3264 /// let s = "eggplant".to_string();
3265 /// let s2 = "eggplant".to_string();
3266 /// assert_eq!(Cow::from(s), Cow::<'static, str>::Owned(s2));
3267 /// ```
3268 ///
3269 /// [`Owned`]: crate::borrow::Cow::Owned "borrow::Cow::Owned"
3270 #[inline]
3271 fn from(s: String) -> Cow<'a, str> {
3272 Cow::Owned(s)
3273 }
3274}
3275
3276#[cfg(not(no_global_oom_handling))]
3277#[stable(feature = "cow_from_string_ref", since = "1.28.0")]
3278impl<'a> From<&'a String> for Cow<'a, str> {
3279 /// Converts a [`String`] reference into a [`Borrowed`] variant.
3280 /// No heap allocation is performed, and the string
3281 /// is not copied.
3282 ///
3283 /// # Example
3284 ///
3285 /// ```
3286 /// # use std::borrow::Cow;
3287 /// let s = "eggplant".to_string();
3288 /// assert_eq!(Cow::from(&s), Cow::Borrowed("eggplant"));
3289 /// ```
3290 ///
3291 /// [`Borrowed`]: crate::borrow::Cow::Borrowed "borrow::Cow::Borrowed"
3292 #[inline]
3293 fn from(s: &'a String) -> Cow<'a, str> {
3294 Cow::Borrowed(s.as_str())
3295 }
3296}
3297
3298#[cfg(not(no_global_oom_handling))]
3299#[stable(feature = "cow_str_from_iter", since = "1.12.0")]
3300impl<'a> FromIterator<char> for Cow<'a, str> {
3301 fn from_iter<I: IntoIterator<Item = char>>(it: I) -> Cow<'a, str> {
3302 Cow::Owned(FromIterator::from_iter(it))
3303 }
3304}
3305
3306#[cfg(not(no_global_oom_handling))]
3307#[stable(feature = "cow_str_from_iter", since = "1.12.0")]
3308impl<'a, 'b> FromIterator<&'b str> for Cow<'a, str> {
3309 fn from_iter<I: IntoIterator<Item = &'b str>>(it: I) -> Cow<'a, str> {
3310 Cow::Owned(FromIterator::from_iter(it))
3311 }
3312}
3313
3314#[cfg(not(no_global_oom_handling))]
3315#[stable(feature = "cow_str_from_iter", since = "1.12.0")]
3316impl<'a> FromIterator<String> for Cow<'a, str> {
3317 fn from_iter<I: IntoIterator<Item = String>>(it: I) -> Cow<'a, str> {
3318 Cow::Owned(FromIterator::from_iter(it))
3319 }
3320}
3321
3322#[cfg(not(no_global_oom_handling))]
3323#[unstable(feature = "ascii_char", issue = "110998")]
3324impl<'a> FromIterator<core::ascii::Char> for Cow<'a, str> {
3325 fn from_iter<T: IntoIterator<Item = core::ascii::Char>>(it: T) -> Self {
3326 Cow::Owned(FromIterator::from_iter(it))
3327 }
3328}
3329
3330#[stable(feature = "from_string_for_vec_u8", since = "1.14.0")]
3331impl From<String> for Vec<u8> {
3332 /// Converts the given [`String`] to a vector [`Vec`] that holds values of type [`u8`].
3333 ///
3334 /// # Examples
3335 ///
3336 /// ```
3337 /// let s1 = String::from("hello world");
3338 /// let v1 = Vec::from(s1);
3339 ///
3340 /// for b in v1 {
3341 /// println!("{b}");
3342 /// }
3343 /// ```
3344 fn from(string: String) -> Vec<u8> {
3345 string.into_bytes()
3346 }
3347}
3348
3349#[stable(feature = "try_from_vec_u8_for_string", since = "1.87.0")]
3350impl TryFrom<Vec<u8>> for String {
3351 type Error = FromUtf8Error;
3352 /// Converts the given [`Vec<u8>`] into a [`String`] if it contains valid UTF-8 data.
3353 ///
3354 /// # Examples
3355 ///
3356 /// ```
3357 /// let s1 = b"hello world".to_vec();
3358 /// let v1 = String::try_from(s1).unwrap();
3359 /// assert_eq!(v1, "hello world");
3360 ///
3361 /// ```
3362 fn try_from(bytes: Vec<u8>) -> Result<Self, Self::Error> {
3363 Self::from_utf8(bytes)
3364 }
3365}
3366
3367#[cfg(not(no_global_oom_handling))]
3368#[stable(feature = "rust1", since = "1.0.0")]
3369impl fmt::Write for String {
3370 #[inline]
3371 fn write_str(&mut self, s: &str) -> fmt::Result {
3372 self.push_str(s);
3373 Ok(())
3374 }
3375
3376 #[inline]
3377 fn write_char(&mut self, c: char) -> fmt::Result {
3378 self.push(c);
3379 Ok(())
3380 }
3381}
3382
3383/// An iterator over the [`char`]s of a string.
3384///
3385/// This struct is created by the [`into_chars`] method on [`String`].
3386/// See its documentation for more.
3387///
3388/// [`char`]: prim@char
3389/// [`into_chars`]: String::into_chars
3390#[cfg_attr(not(no_global_oom_handling), derive(Clone))]
3391#[must_use = "iterators are lazy and do nothing unless consumed"]
3392#[unstable(feature = "string_into_chars", issue = "133125")]
3393pub struct IntoChars {
3394 bytes: vec::IntoIter<u8>,
3395}
3396
3397#[unstable(feature = "string_into_chars", issue = "133125")]
3398impl fmt::Debug for IntoChars {
3399 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
3400 f.debug_tuple("IntoChars").field(&self.as_str()).finish()
3401 }
3402}
3403
3404impl IntoChars {
3405 /// Views the underlying data as a subslice of the original data.
3406 ///
3407 /// # Examples
3408 ///
3409 /// ```
3410 /// #![feature(string_into_chars)]
3411 ///
3412 /// let mut chars = String::from("abc").into_chars();
3413 ///
3414 /// assert_eq!(chars.as_str(), "abc");
3415 /// chars.next();
3416 /// assert_eq!(chars.as_str(), "bc");
3417 /// chars.next();
3418 /// chars.next();
3419 /// assert_eq!(chars.as_str(), "");
3420 /// ```
3421 #[unstable(feature = "string_into_chars", issue = "133125")]
3422 #[must_use]
3423 #[inline]
3424 pub fn as_str(&self) -> &str {
3425 // SAFETY: `bytes` is a valid UTF-8 string.
3426 unsafe { str::from_utf8_unchecked(self.bytes.as_slice()) }
3427 }
3428
3429 /// Consumes the `IntoChars`, returning the remaining string.
3430 ///
3431 /// # Examples
3432 ///
3433 /// ```
3434 /// #![feature(string_into_chars)]
3435 ///
3436 /// let chars = String::from("abc").into_chars();
3437 /// assert_eq!(chars.into_string(), "abc");
3438 ///
3439 /// let mut chars = String::from("def").into_chars();
3440 /// chars.next();
3441 /// assert_eq!(chars.into_string(), "ef");
3442 /// ```
3443 #[cfg(not(no_global_oom_handling))]
3444 #[unstable(feature = "string_into_chars", issue = "133125")]
3445 #[inline]
3446 pub fn into_string(self) -> String {
3447 // Safety: `bytes` are kept in UTF-8 form, only removing whole `char`s at a time.
3448 unsafe { String::from_utf8_unchecked(self.bytes.collect()) }
3449 }
3450
3451 #[inline]
3452 fn iter(&self) -> CharIndices<'_> {
3453 self.as_str().char_indices()
3454 }
3455}
3456
3457#[unstable(feature = "string_into_chars", issue = "133125")]
3458impl Iterator for IntoChars {
3459 type Item = char;
3460
3461 #[inline]
3462 fn next(&mut self) -> Option<char> {
3463 let mut iter = self.iter();
3464 match iter.next() {
3465 None => None,
3466 Some((_, ch)) => {
3467 let offset = iter.offset();
3468 // `offset` is a valid index.
3469 let _ = self.bytes.advance_by(offset);
3470 Some(ch)
3471 }
3472 }
3473 }
3474
3475 #[inline]
3476 fn count(self) -> usize {
3477 self.iter().count()
3478 }
3479
3480 #[inline]
3481 fn size_hint(&self) -> (usize, Option<usize>) {
3482 self.iter().size_hint()
3483 }
3484
3485 #[inline]
3486 fn last(mut self) -> Option<char> {
3487 self.next_back()
3488 }
3489}
3490
3491#[unstable(feature = "string_into_chars", issue = "133125")]
3492impl DoubleEndedIterator for IntoChars {
3493 #[inline]
3494 fn next_back(&mut self) -> Option<char> {
3495 let len = self.as_str().len();
3496 let mut iter = self.iter();
3497 match iter.next_back() {
3498 None => None,
3499 Some((idx, ch)) => {
3500 // `idx` is a valid index.
3501 let _ = self.bytes.advance_back_by(len - idx);
3502 Some(ch)
3503 }
3504 }
3505 }
3506}
3507
3508#[unstable(feature = "string_into_chars", issue = "133125")]
3509impl FusedIterator for IntoChars {}
3510
3511/// A draining iterator for `String`.
3512///
3513/// This struct is created by the [`drain`] method on [`String`]. See its
3514/// documentation for more.
3515///
3516/// [`drain`]: String::drain
3517#[stable(feature = "drain", since = "1.6.0")]
3518pub struct Drain<'a> {
3519 /// Will be used as &'a mut String in the destructor
3520 string: *mut String,
3521 /// Start of part to remove
3522 start: usize,
3523 /// End of part to remove
3524 end: usize,
3525 /// Current remaining range to remove
3526 iter: Chars<'a>,
3527}
3528
3529#[stable(feature = "collection_debug", since = "1.17.0")]
3530impl fmt::Debug for Drain<'_> {
3531 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
3532 f.debug_tuple("Drain").field(&self.as_str()).finish()
3533 }
3534}
3535
3536#[stable(feature = "drain", since = "1.6.0")]
3537unsafe impl Sync for Drain<'_> {}
3538#[stable(feature = "drain", since = "1.6.0")]
3539unsafe impl Send for Drain<'_> {}
3540
3541#[stable(feature = "drain", since = "1.6.0")]
3542impl Drop for Drain<'_> {
3543 fn drop(&mut self) {
3544 unsafe {
3545 // Use Vec::drain. "Reaffirm" the bounds checks to avoid
3546 // panic code being inserted again.
3547 let self_vec = (*self.string).as_mut_vec();
3548 if self.start <= self.end && self.end <= self_vec.len() {
3549 self_vec.drain(self.start..self.end);
3550 }
3551 }
3552 }
3553}
3554
3555impl<'a> Drain<'a> {
3556 /// Returns the remaining (sub)string of this iterator as a slice.
3557 ///
3558 /// # Examples
3559 ///
3560 /// ```
3561 /// let mut s = String::from("abc");
3562 /// let mut drain = s.drain(..);
3563 /// assert_eq!(drain.as_str(), "abc");
3564 /// let _ = drain.next().unwrap();
3565 /// assert_eq!(drain.as_str(), "bc");
3566 /// ```
3567 #[must_use]
3568 #[stable(feature = "string_drain_as_str", since = "1.55.0")]
3569 pub fn as_str(&self) -> &str {
3570 self.iter.as_str()
3571 }
3572}
3573
3574#[stable(feature = "string_drain_as_str", since = "1.55.0")]
3575impl<'a> AsRef<str> for Drain<'a> {
3576 fn as_ref(&self) -> &str {
3577 self.as_str()
3578 }
3579}
3580
3581#[stable(feature = "string_drain_as_str", since = "1.55.0")]
3582impl<'a> AsRef<[u8]> for Drain<'a> {
3583 fn as_ref(&self) -> &[u8] {
3584 self.as_str().as_bytes()
3585 }
3586}
3587
3588#[stable(feature = "drain", since = "1.6.0")]
3589impl Iterator for Drain<'_> {
3590 type Item = char;
3591
3592 #[inline]
3593 fn next(&mut self) -> Option<char> {
3594 self.iter.next()
3595 }
3596
3597 fn size_hint(&self) -> (usize, Option<usize>) {
3598 self.iter.size_hint()
3599 }
3600
3601 #[inline]
3602 fn last(mut self) -> Option<char> {
3603 self.next_back()
3604 }
3605}
3606
3607#[stable(feature = "drain", since = "1.6.0")]
3608impl DoubleEndedIterator for Drain<'_> {
3609 #[inline]
3610 fn next_back(&mut self) -> Option<char> {
3611 self.iter.next_back()
3612 }
3613}
3614
3615#[stable(feature = "fused", since = "1.26.0")]
3616impl FusedIterator for Drain<'_> {}
3617
3618#[cfg(not(no_global_oom_handling))]
3619#[stable(feature = "from_char_for_string", since = "1.46.0")]
3620impl From<char> for String {
3621 /// Allocates an owned [`String`] from a single character.
3622 ///
3623 /// # Example
3624 /// ```rust
3625 /// let c: char = 'a';
3626 /// let s: String = String::from(c);
3627 /// assert_eq!("a", &s[..]);
3628 /// ```
3629 #[inline]
3630 fn from(c: char) -> Self {
3631 c.to_string()
3632 }
3633}