rune_alloc/string/mod.rs
1//! A UTF-8–encoded, growable string.
2//!
3//! This module contains the [`String`] type, the [`TryToString`] trait for
4//! converting to strings, and several error types that may result from working
5//! with [`String`]s.
6//!
7//! # Examples
8//!
9//! There are multiple ways to create a new [`String`] from a string literal:
10//!
11//! ```
12//! use rune::alloc::prelude::*;
13//!
14//! let s = "Hello".try_to_string()?;
15//!
16//! let s = String::try_from("world")?;
17//! let s: String = "also this".try_into()?;
18//! # Ok::<_, rune::alloc::Error>(())
19//! ```
20//!
21//! If you have a vector of valid UTF-8 bytes, you can make a [`String`] out of
22//! it. You can do the reverse too.
23//!
24//! ```
25//! use rune::alloc::prelude::*;
26//!
27//! let sparkle_heart = try_vec![240, 159, 146, 150];
28//! let sparkle_heart = String::from_utf8(sparkle_heart)?;
29//!
30//! assert_eq!("💖", sparkle_heart);
31//!
32//! let bytes = sparkle_heart.into_bytes();
33//!
34//! assert_eq!(bytes, [240, 159, 146, 150]);
35//! # Ok::<_, std::boxed::Box<dyn core::error::Error>>(())
36//! ```
37
38#[cfg(feature = "serde")]
39mod serde;
40
41pub use self::try_to_string::TryToString;
42pub(crate) mod try_to_string;
43
44#[cfg(feature = "alloc")]
45use core::alloc::Layout;
46use core::borrow::Borrow;
47use core::cmp::Ordering;
48use core::fmt;
49use core::hash;
50use core::iter::FusedIterator;
51#[cfg(feature = "alloc")]
52use core::mem::ManuallyDrop;
53use core::ops::Bound::{Excluded, Included, Unbounded};
54use core::ops::{self, Index, IndexMut, Range, RangeBounds};
55use core::ptr;
56use core::slice;
57use core::str::{from_utf8, from_utf8_unchecked, from_utf8_unchecked_mut};
58use core::str::{Chars, Utf8Error};
59
60use crate::alloc::{Allocator, Global};
61use crate::borrow::Cow;
62use crate::boxed::Box;
63use crate::clone::TryClone;
64use crate::error::Error;
65use crate::fmt::TryWrite;
66use crate::iter::{TryExtend, TryFromIteratorIn, TryJoin};
67use crate::slice::range as slice_range;
68#[cfg(test)]
69use crate::testing::*;
70use crate::vec::Vec;
71
72/// A UTF-8–encoded, growable string.
73///
74/// The `String` type is the most common string type that has ownership over the
75/// contents of the string. It has a close relationship with its borrowed
76/// counterpart, the primitive [`str`].
77///
78/// # Examples
79///
80/// You can create a `String` from [a literal string][`&str`] with
81/// [`String::try_from`]:
82///
83/// [`String::try_from`]: TryFrom::try_from
84///
85/// ```
86/// use rune::alloc::String;
87///
88/// let hello = String::try_from("Hello, world!")?;
89/// # Ok::<_, rune::alloc::Error>(())
90/// ```
91///
92/// You can append a [`char`] to a `String` with the [`try_push`] method, and
93/// append a [`&str`] with the [`try_push_str`] method:
94///
95/// ```
96/// use rune::alloc::String;
97///
98/// let mut hello = String::try_from("Hello, ")?;
99///
100/// hello.try_push('w')?;
101/// hello.try_push_str("orld!")?;
102/// # Ok::<_, rune::alloc::Error>(())
103/// ```
104///
105/// [`try_push`]: String::try_push
106/// [`try_push_str`]: String::try_push_str
107///
108/// If you have a vector of UTF-8 bytes, you can create a `String` from it with
109/// the [`from_utf8`] method:
110///
111/// ```
112/// use rune::alloc::{try_vec, String};
113///
114/// // some bytes, in a vector
115/// let sparkle_heart = try_vec![240, 159, 146, 150];
116/// let sparkle_heart = String::from_utf8(sparkle_heart)?;
117///
118/// assert_eq!("💖", sparkle_heart);
119/// # Ok::<_, Box<dyn core::error::Error>>(())
120/// ```
121///
122/// [`from_utf8`]: String::from_utf8
123///
124/// # UTF-8
125///
126/// `String`s are always valid UTF-8. If you need a non-UTF-8 string, consider
127/// [`OsString`]. It is similar, but without the UTF-8 constraint. Because UTF-8
128/// is a variable width encoding, `String`s are typically smaller than an array of
129/// the same `chars`:
130///
131/// ```
132/// use core::mem;
133///
134/// // `s` is ASCII which represents each `char` as one byte
135/// let s = "hello";
136/// assert_eq!(s.len(), 5);
137///
138/// // A `char` array with the same contents would be longer because
139/// // every `char` is four bytes
140/// let s = ['h', 'e', 'l', 'l', 'o'];
141/// let size: usize = s.into_iter().map(|c| mem::size_of_val(&c)).sum();
142/// assert_eq!(size, 20);
143///
144/// // However, for non-ASCII strings, the difference will be smaller
145/// // and sometimes they are the same
146/// let s = "💖💖💖💖💖";
147/// assert_eq!(s.len(), 20);
148///
149/// let s = ['💖', '💖', '💖', '💖', '💖'];
150/// let size: usize = s.into_iter().map(|c| mem::size_of_val(&c)).sum();
151/// assert_eq!(size, 20);
152/// ```
153///
154/// This raises interesting questions as to how `s[i]` should work.
155/// What should `i` be here? Several options include byte indices and
156/// `char` indices but, because of UTF-8 encoding, only byte indices
157/// would provide constant time indexing. Getting the `i`th `char`, for
158/// example, is available using [`chars`]:
159///
160/// ```
161/// let s = "hello";
162/// let third_character = s.chars().nth(2);
163/// assert_eq!(third_character, Some('l'));
164///
165/// let s = "💖💖💖💖💖";
166/// let third_character = s.chars().nth(2);
167/// assert_eq!(third_character, Some('💖'));
168/// ```
169///
170/// Next, what should `s[i]` return? Because indexing returns a reference
171/// to underlying data it could be `&u8`, `&[u8]`, or something else similar.
172/// Since we're only providing one index, `&u8` makes the most sense but that
173/// might not be what the user expects and can be explicitly achieved with
174/// [`as_bytes()`]:
175///
176/// ```
177/// // The first byte is 104 - the byte value of `'h'`
178/// let s = "hello";
179/// assert_eq!(s.as_bytes()[0], 104);
180/// // or
181/// assert_eq!(s.as_bytes()[0], b'h');
182///
183/// // The first byte is 240 which isn't obviously useful
184/// let s = "💖💖💖💖💖";
185/// assert_eq!(s.as_bytes()[0], 240);
186/// ```
187///
188/// Due to these ambiguities/restrictions, indexing with a `usize` is simply
189/// forbidden:
190///
191/// ```compile_fail,E0277
192/// let s = "hello";
193///
194/// // The following will not compile!
195/// println!("The first letter of s is {}", s[0]);
196/// ```
197///
198/// It is more clear, however, how `&s[i..j]` should work (that is,
199/// indexing with a range). It should accept byte indices (to be constant-time)
200/// and return a `&str` which is UTF-8 encoded. This is also called "string slicing".
201/// Note this will panic if the byte indices provided are not character
202/// boundaries - see [`is_char_boundary`] for more details. See the implementations
203/// for [`SliceIndex<str>`] for more details on string slicing. For a non-panicking
204/// version of string slicing, see [`get`].
205///
206/// [`OsString`]: ../../std/ffi/struct.OsString.html "ffi::OsString"
207/// [`SliceIndex<str>`]: core::slice::SliceIndex
208/// [`as_bytes()`]: str::as_bytes
209/// [`get`]: str::get
210/// [`is_char_boundary`]: str::is_char_boundary
211///
212/// The [`bytes`] and [`chars`] methods return iterators over the bytes and
213/// codepoints of the string, respectively. To iterate over codepoints along
214/// with byte indices, use [`char_indices`].
215///
216/// [`bytes`]: str::bytes
217/// [`chars`]: str::chars
218/// [`char_indices`]: str::char_indices
219///
220/// # Deref
221///
222/// `String` implements <code>[Deref]<Target = [str]></code>, and so inherits all of [`str`]'s
223/// methods. In addition, this means that you can pass a `String` to a
224/// function which takes a [`&str`] by using an ampersand (`&`):
225///
226/// ```
227/// use rune::alloc::String;
228///
229/// fn takes_str(s: &str) { }
230///
231/// let s = String::try_from("Hello")?;
232///
233/// takes_str(&s);
234/// # Ok::<_, rune::alloc::Error>(())
235/// ```
236///
237/// This will create a [`&str`] from the `String` and pass it in. This
238/// conversion is very inexpensive, and so generally, functions will accept
239/// [`&str`]s as arguments unless they need a `String` for some specific
240/// reason.
241///
242/// In certain cases Rust doesn't have enough information to make this
243/// conversion, known as [`Deref`] coercion. In the following example a string
244/// slice [`&'a str`][`&str`] implements the trait `TraitExample`, and the function
245/// `example_func` takes anything that implements the trait. In this case Rust
246/// would need to make two implicit conversions, which Rust doesn't have the
247/// means to do. For that reason, the following example will not compile.
248///
249/// ```compile_fail,E0277
250/// use rune::alloc::String;
251///
252/// trait TraitExample {}
253///
254/// impl<'a> TraitExample for &'a str {}
255///
256/// fn example_func<A: TraitExample>(example_arg: A) {}
257///
258/// let example_string = String::try_from("example_string")?;
259/// example_func(&example_string);
260/// # Ok::<_, rune::alloc::Error>(())
261/// ```
262///
263/// There are two options that would work instead. The first would be to
264/// change the line `example_func(&example_string);` to
265/// `example_func(example_string.as_str());`, using the method [`as_str()`]
266/// to explicitly extract the string slice containing the string. The second
267/// way changes `example_func(&example_string);` to
268/// `example_func(&*example_string);`. In this case we are dereferencing a
269/// `String` to a [`str`], then referencing the [`str`] back to
270/// [`&str`]. The second way is more idiomatic, however both work to do the
271/// conversion explicitly rather than relying on the implicit conversion.
272///
273/// # Representation
274///
275/// A `String` is made up of three components: a pointer to some bytes, a
276/// length, and a capacity. The pointer points to an internal buffer `String`
277/// uses to store its data. The length is the number of bytes currently stored
278/// in the buffer, and the capacity is the size of the buffer in bytes. As such,
279/// the length will always be less than or equal to the capacity.
280///
281/// This buffer is always stored on the heap.
282///
283/// You can look at these with the [`as_ptr`], [`len`], and [`capacity`]
284/// methods:
285///
286/// ```
287/// use core::mem;
288/// use rune::alloc::String;
289///
290/// let story = String::try_from("Once upon a time...")?;
291///
292/// // Prevent automatically dropping the String's data
293/// let mut story = mem::ManuallyDrop::new(story);
294///
295/// let ptr = story.as_mut_ptr();
296/// let len = story.len();
297/// let capacity = story.capacity();
298/// let allocator = story.allocator().clone();
299///
300/// // story has nineteen bytes
301/// assert_eq!(19, len);
302///
303/// // We can re-build a String out of ptr, len, and capacity. This is all
304/// // unsafe because we are responsible for making sure the components are
305/// // valid:
306/// let s = unsafe { String::from_raw_parts_in(ptr, len, capacity, allocator) } ;
307///
308/// assert_eq!("Once upon a time...", s);
309/// # Ok::<_, rune::alloc::Error>(())
310/// ```
311///
312/// [`as_ptr`]: str::as_ptr
313/// [`len`]: String::len
314/// [`capacity`]: String::capacity
315///
316/// If a `String` has enough capacity, adding elements to it will not
317/// re-allocate. For example, consider this program:
318///
319/// ```
320/// use rune::alloc::String;
321///
322/// let mut s = String::new();
323///
324/// println!("{}", s.capacity());
325///
326/// for _ in 0..5 {
327/// s.try_push_str("hello")?;
328/// println!("{}", s.capacity());
329/// }
330/// # Ok::<_, rune::alloc::Error>(())
331/// ```
332///
333/// This will output the following:
334///
335/// ```text
336/// 0
337/// 8
338/// 16
339/// 16
340/// 32
341/// 32
342/// ```
343///
344/// At first, we have no memory allocated at all, but as we append to the
345/// string, it increases its capacity appropriately. If we instead use the
346/// [`try_with_capacity_in`] method to allocate the correct capacity initially:
347///
348/// ```
349/// use rune::alloc::String;
350/// use rune::alloc::alloc::Global;
351///
352/// let mut s = String::try_with_capacity_in(25, Global)?;
353///
354/// println!("{}", s.capacity());
355///
356/// for _ in 0..5 {
357/// s.try_push_str("hello")?;
358/// println!("{}", s.capacity());
359/// }
360/// # Ok::<_, rune::alloc::Error>(())
361/// ```
362///
363/// [`try_with_capacity_in`]: String::try_with_capacity_in
364///
365/// We end up with a different output:
366///
367/// ```text
368/// 25
369/// 25
370/// 25
371/// 25
372/// 25
373/// 25
374/// ```
375///
376/// Here, there's no need to allocate more memory inside the loop.
377///
378/// [str]: prim@str "str"
379/// [`str`]: prim@str "str"
380/// [`&str`]: prim@str "&str"
381/// [Deref]: core::ops::Deref "ops::Deref"
382/// [`Deref`]: core::ops::Deref "ops::Deref"
383/// [`as_str()`]: String::as_str
384pub struct String<A: Allocator = Global> {
385 vec: Vec<u8, A>,
386}
387
388impl String {
389 /// Creates a new empty `String`.
390 ///
391 /// Given that the `String` is empty, this will not allocate any initial
392 /// buffer. While that means that this initial operation is very
393 /// inexpensive, it may cause excessive allocation later when you add data.
394 /// If you have an idea of how much data the `String` will hold, consider
395 /// the [`try_with_capacity`] method to prevent excessive re-allocation.
396 ///
397 /// [`try_with_capacity`]: String::try_with_capacity
398 ///
399 /// # Examples
400 ///
401 /// Basic usage:
402 ///
403 /// ```
404 /// use rune::alloc::String;
405 ///
406 /// let s = String::new();
407 /// ```
408 #[inline]
409 #[must_use]
410 pub const fn new() -> Self {
411 String { vec: Vec::new() }
412 }
413
414 /// Creates a new empty `String` with at least the specified capacity.
415 ///
416 /// `String`s have an internal buffer to hold their data. The capacity is
417 /// the length of that buffer, and can be queried with the [`capacity`]
418 /// method. This method creates an empty `String`, but one with an initial
419 /// buffer that can hold at least `capacity` bytes. This is useful when you
420 /// may be appending a bunch of data to the `String`, reducing the number of
421 /// reallocations it needs to do.
422 ///
423 /// [`capacity`]: String::capacity
424 ///
425 /// If the given capacity is `0`, no allocation will occur, and this method
426 /// is identical to the [`new`] method.
427 ///
428 /// [`new`]: String::new
429 ///
430 /// # Examples
431 ///
432 /// Basic usage:
433 ///
434 /// ```
435 /// use rune::alloc::String;
436 ///
437 /// let mut s = String::try_with_capacity(10)?;
438 ///
439 /// // The String contains no chars, even though it has capacity for more
440 /// assert_eq!(s.len(), 0);
441 ///
442 /// // These are all done without reallocating...
443 /// let cap = s.capacity();
444 ///
445 /// for _ in 0..10 {
446 /// s.try_push('a')?;
447 /// }
448 ///
449 /// assert_eq!(s.capacity(), cap);
450 ///
451 /// // ...but this may make the string reallocate
452 /// s.try_push('a')?;
453 /// # Ok::<_, rune::alloc::Error>(())
454 /// ```
455 #[inline]
456 pub fn try_with_capacity(capacity: usize) -> Result<Self, Error> {
457 Ok(String {
458 vec: Vec::try_with_capacity_in(capacity, Global)?,
459 })
460 }
461
462 /// Convert a [`String`] into a std `String`.
463 ///
464 /// The result is allocated on the heap, using the default global allocator
465 /// so this is a zero-copy operation.
466 ///
467 /// The memory previously occupied by this vector will be released.
468 #[cfg(feature = "alloc")]
469 pub fn into_std(self) -> ::rust_alloc::string::String {
470 // SAFETY: The interior vector is valid UTF-8.
471 unsafe { ::rust_alloc::string::String::from_utf8_unchecked(self.vec.into_std()) }
472 }
473
474 #[cfg(test)]
475 pub fn from(value: &str) -> Self {
476 Self::try_from(value).abort()
477 }
478}
479
480/// A possible error value when converting a `String` from a UTF-8 byte vector.
481///
482/// This type is the error type for the [`from_utf8`] method on [`String`]. It
483/// is designed in such a way to carefully avoid reallocations: the
484/// [`into_bytes`] method will give back the byte vector that was used in the
485/// conversion attempt.
486///
487/// [`from_utf8`]: String::from_utf8
488/// [`into_bytes`]: FromUtf8Error::into_bytes
489///
490/// The [`Utf8Error`] type provided by [`std::str`] represents an error that may
491/// occur when converting a slice of [`u8`]s to a [`&str`]. In this sense, it's
492/// an analogue to `FromUtf8Error`, and you can get one from a `FromUtf8Error`
493/// through the [`utf8_error`] method.
494///
495/// [`Utf8Error`]: core::str::Utf8Error "std::str::Utf8Error"
496/// [`std::str`]: core::str "std::str"
497/// [`&str`]: prim@str "&str"
498/// [`utf8_error`]: FromUtf8Error::utf8_error
499///
500/// # Examples
501///
502/// ```
503/// use rune::alloc::{try_vec, String};
504///
505/// // some invalid bytes, in a vector
506/// let bytes = try_vec![0, 159];
507///
508/// let value = String::from_utf8(bytes);
509///
510/// assert!(value.is_err());
511/// assert_eq!(try_vec![0, 159], value.unwrap_err().into_bytes());
512/// # Ok::<_, rune::alloc::Error>(())
513/// ```
514pub struct FromUtf8Error<A: Allocator = Global> {
515 bytes: Vec<u8, A>,
516 error: Utf8Error,
517}
518
519impl<A: Allocator> fmt::Debug for FromUtf8Error<A> {
520 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
521 f.debug_struct("FromUtf8Error")
522 .field("bytes", &self.bytes)
523 .field("error", &self.error)
524 .finish()
525 }
526}
527
528impl<A: Allocator> PartialEq for FromUtf8Error<A> {
529 fn eq(&self, other: &Self) -> bool {
530 self.bytes == other.bytes && self.error == other.error
531 }
532}
533
534impl<A: Allocator> Eq for FromUtf8Error<A> {}
535
536impl<A: Allocator> String<A> {
537 /// Creates a new empty `String`.
538 ///
539 /// Given that the `String` is empty, this will not allocate any initial
540 /// buffer. While that means that this initial operation is very
541 /// inexpensive, it may cause excessive allocation later when you add data.
542 /// If you have an idea of how much data the `String` will hold, consider
543 /// the [`try_with_capacity_in`] method to prevent excessive re-allocation.
544 ///
545 /// [`try_with_capacity_in`]: String::try_with_capacity_in
546 ///
547 /// # Examples
548 ///
549 /// ```
550 /// use rune::alloc::String;
551 /// use rune::alloc::alloc::Global;
552 ///
553 /// let s = String::new_in(Global);
554 /// ```
555 #[inline]
556 #[must_use]
557 pub fn new_in(alloc: A) -> String<A> {
558 String {
559 vec: Vec::new_in(alloc),
560 }
561 }
562
563 /// Returns a reference to the underlying allocator.
564 ///
565 /// # Examples
566 ///
567 /// ```
568 /// use rune::alloc::String;
569 /// use rune::alloc::alloc::Global;
570 ///
571 /// let s = String::new_in(Global);
572 /// let alloc: &Global = s.allocator();
573 /// ```
574 #[inline]
575 pub fn allocator(&self) -> &A {
576 self.vec.allocator()
577 }
578
579 /// Creates a new empty `String` with at least the specified capacity.
580 ///
581 /// `String`s have an internal buffer to hold their data. The capacity is
582 /// the length of that buffer, and can be queried with the [`capacity`]
583 /// method. This method creates an empty `String`, but one with an initial
584 /// buffer that can hold at least `capacity` bytes. This is useful when you
585 /// may be appending a bunch of data to the `String`, reducing the number of
586 /// reallocations it needs to do.
587 ///
588 /// [`capacity`]: String::capacity
589 ///
590 /// If the given capacity is `0`, no allocation will occur, and this method
591 /// is identical to the [`new_in`] method.
592 ///
593 /// [`new_in`]: String::new_in
594 ///
595 /// # Examples
596 ///
597 /// ```
598 /// use rune::alloc::String;
599 /// use rune::alloc::alloc::Global;
600 ///
601 /// let mut s = String::try_with_capacity_in(10, Global)?;
602 ///
603 /// // The String contains no chars, even though it has capacity for more
604 /// assert_eq!(s.len(), 0);
605 ///
606 /// // These are all done without reallocating...
607 /// let cap = s.capacity();
608 ///
609 /// for _ in 0..10 {
610 /// s.try_push('a')?;
611 /// }
612 ///
613 /// assert_eq!(s.capacity(), cap);
614 ///
615 /// // ...but this may make the string reallocate
616 /// s.try_push('a')?;
617 /// # Ok::<_, rune::alloc::Error>(())
618 /// ```
619 #[inline]
620 pub fn try_with_capacity_in(capacity: usize, alloc: A) -> Result<String<A>, Error> {
621 Ok(String {
622 vec: Vec::try_with_capacity_in(capacity, alloc)?,
623 })
624 }
625
626 /// Converts a vector of bytes to a `String`.
627 ///
628 /// A string ([`String`]) is made of bytes ([`u8`]), and a vector of bytes
629 /// ([`Vec<u8>`]) is made of bytes, so this function converts between the
630 /// two. Not all byte slices are valid `String`s, however: `String` requires
631 /// that it is valid UTF-8. `from_utf8()` checks to ensure that the bytes
632 /// are valid UTF-8, and then does the conversion.
633 ///
634 /// If you are sure that the byte slice is valid UTF-8, and you don't want
635 /// to incur the overhead of the validity check, there is an unsafe version
636 /// of this function, [`from_utf8_unchecked`], which has the same behavior
637 /// but skips the check.
638 ///
639 /// This method will take care to not copy the vector, for efficiency's
640 /// sake.
641 ///
642 /// If you need a [`&str`] instead of a `String`, consider
643 /// [`str::from_utf8`].
644 ///
645 /// The inverse of this method is [`into_bytes`].
646 ///
647 /// [`str::from_utf8`]: core::str::from_utf8
648 ///
649 /// # Errors
650 ///
651 /// Returns [`Err`] if the slice is not UTF-8 with a description as to why
652 /// the provided bytes are not UTF-8. The vector you moved in is also
653 /// included.
654 ///
655 /// # Examples
656 ///
657 /// Basic usage:
658 ///
659 /// ```
660 /// use rune::alloc::{try_vec, String};
661 ///
662 /// // some bytes, in a vector
663 /// let sparkle_heart = try_vec![240, 159, 146, 150];
664 /// let sparkle_heart = String::from_utf8(sparkle_heart)?;
665 ///
666 /// assert_eq!("💖", sparkle_heart);
667 /// # Ok::<_, Box<dyn core::error::Error>>(())
668 /// ```
669 ///
670 /// Incorrect bytes:
671 ///
672 /// ```
673 /// use rune::alloc::{try_vec, String};
674 ///
675 /// // some invalid bytes, in a vector
676 /// let sparkle_heart = try_vec![0, 159, 146, 150];
677 ///
678 /// assert!(String::from_utf8(sparkle_heart).is_err());
679 /// # Ok::<_, rune::alloc::Error>(())
680 /// ```
681 ///
682 /// See the docs for [`FromUtf8Error`] for more details on what you can do
683 /// with this error.
684 ///
685 /// [`from_utf8_unchecked`]: String::from_utf8_unchecked
686 /// [`Vec<u8>`]: crate::vec::Vec "Vec"
687 /// [`&str`]: prim@str "&str"
688 /// [`into_bytes`]: String::into_bytes
689 #[inline]
690 pub fn from_utf8(vec: Vec<u8, A>) -> Result<String<A>, FromUtf8Error<A>> {
691 match from_utf8(&vec) {
692 Ok(..) => Ok(String { vec }),
693 Err(e) => Err(FromUtf8Error {
694 bytes: vec,
695 error: e,
696 }),
697 }
698 }
699
700 /// Creates a new `String` from a length, capacity, and pointer.
701 ///
702 /// # Safety
703 ///
704 /// This is highly unsafe, due to the number of invariants that aren't
705 /// checked:
706 ///
707 /// * The memory at `buf` needs to have been previously allocated by the
708 /// same allocator the standard library uses, with a required alignment of exactly 1.
709 /// * `length` needs to be less than or equal to `capacity`.
710 /// * `capacity` needs to be the correct value.
711 /// * The first `length` bytes at `buf` need to be valid UTF-8.
712 ///
713 /// Violating these may cause problems like corrupting the allocator's
714 /// internal data structures. For example, it is normally **not** safe to
715 /// build a `String` from a pointer to a C `char` array containing UTF-8
716 /// _unless_ you are certain that array was originally allocated by the
717 /// Rust standard library's allocator.
718 ///
719 /// The ownership of `buf` is effectively transferred to the
720 /// `String` which may then deallocate, reallocate or change the
721 /// contents of memory pointed to by the pointer at will. Ensure
722 /// that nothing else uses the pointer after calling this
723 /// function.
724 ///
725 /// # Examples
726 ///
727 /// ```
728 /// use rune::alloc::String;
729 /// use core::mem;
730 ///
731 /// unsafe {
732 /// let s = String::try_from("hello")?;
733 ///
734 /// // Prevent automatically dropping the String's data
735 /// let mut s = mem::ManuallyDrop::new(s);
736 ///
737 /// let ptr = s.as_mut_ptr();
738 /// let len = s.len();
739 /// let capacity = s.capacity();
740 /// let allocator = s.allocator().clone();
741 ///
742 /// let s = String::from_raw_parts_in(ptr, len, capacity, allocator);
743 ///
744 /// assert_eq!("hello", s);
745 /// }
746 /// # Ok::<_, rune::alloc::Error>(())
747 /// ```
748 #[inline]
749 pub unsafe fn from_raw_parts_in(
750 buf: *mut u8,
751 length: usize,
752 capacity: usize,
753 alloc: A,
754 ) -> String<A> {
755 unsafe {
756 String {
757 vec: Vec::from_raw_parts_in(buf, length, capacity, alloc),
758 }
759 }
760 }
761
762 /// Converts a vector of bytes to a `String` without checking that the
763 /// string contains valid UTF-8.
764 ///
765 /// See the safe version, [`from_utf8`], for more details.
766 ///
767 /// [`from_utf8`]: String::from_utf8
768 ///
769 /// # Safety
770 ///
771 /// This function is unsafe because it does not check that the bytes passed
772 /// to it are valid UTF-8. If this constraint is violated, it may cause
773 /// memory unsafety issues with future users of the `String`, as the rest of
774 /// the standard library assumes that `String`s are valid UTF-8.
775 ///
776 /// # Examples
777 ///
778 /// ```
779 /// use rune::alloc::{try_vec, String};
780 ///
781 /// // some bytes, in a vector
782 /// let sparkle_heart = try_vec![240, 159, 146, 150];
783 ///
784 /// let sparkle_heart = unsafe {
785 /// String::from_utf8_unchecked(sparkle_heart)
786 /// };
787 ///
788 /// assert_eq!("💖", sparkle_heart);
789 /// # Ok::<_, rune::alloc::Error>(())
790 /// ```
791 #[inline]
792 #[must_use]
793 pub unsafe fn from_utf8_unchecked(bytes: Vec<u8, A>) -> String<A> {
794 String { vec: bytes }
795 }
796
797 /// Converts a `String` into a byte vector.
798 ///
799 /// This consumes the `String`, so we do not need to copy its contents.
800 ///
801 /// # Examples
802 ///
803 /// ```
804 /// use rune::alloc::String;
805 ///
806 /// let s = String::try_from("hello")?;
807 /// let bytes = s.into_bytes();
808 ///
809 /// assert_eq!(&[104, 101, 108, 108, 111][..], &bytes[..]);
810 /// # Ok::<_, rune::alloc::Error>(())
811 /// ```
812 #[inline]
813 #[must_use = "`self` will be dropped if the result is not used"]
814 pub fn into_bytes(self) -> Vec<u8, A> {
815 self.vec
816 }
817
818 /// Extracts a string slice containing the entire `String`.
819 ///
820 /// # Examples
821 ///
822 /// ```
823 /// use rune::alloc::String;
824 ///
825 /// let s = String::try_from("foo")?;
826 ///
827 /// assert_eq!("foo", s.as_str());
828 /// # Ok::<_, rune::alloc::Error>(())
829 /// ```
830 #[inline]
831 #[must_use]
832 pub fn as_str(&self) -> &str {
833 self
834 }
835
836 /// Converts a `String` into a mutable string slice.
837 ///
838 /// # Examples
839 ///
840 /// ```
841 /// use rune::alloc::String;
842 ///
843 /// let mut s = String::try_from("foobar")?;
844 /// let s_mut_str = s.as_mut_str();
845 ///
846 /// s_mut_str.make_ascii_uppercase();
847 ///
848 /// assert_eq!("FOOBAR", s_mut_str);
849 /// # Ok::<_, rune::alloc::Error>(())
850 /// ```
851 #[inline]
852 #[must_use]
853 pub fn as_mut_str(&mut self) -> &mut str {
854 self
855 }
856
857 /// Appends a given string slice onto the end of this `String`.
858 ///
859 /// # Examples
860 ///
861 /// ```
862 /// use rune::alloc::String;
863 /// use rune::alloc::alloc::Global;
864 ///
865 /// let mut s = String::try_with_capacity_in(3, Global)?;
866 ///
867 /// s.try_push_str("foo")?;
868 /// s.try_push_str("bar")?;
869 ///
870 /// assert_eq!("foobar", s);
871 /// # Ok::<_, rune::alloc::Error>(())
872 /// ```
873 #[inline]
874 pub fn try_push_str(&mut self, string: &str) -> Result<(), Error> {
875 self.vec.try_extend_from_slice(string.as_bytes())
876 }
877
878 #[cfg(test)]
879 pub(crate) fn push_str(&mut self, string: &str) {
880 self.try_push_str(string).abort()
881 }
882
883 /// Returns this `String`'s capacity, in bytes.
884 ///
885 /// # Examples
886 ///
887 /// ```
888 /// use rune::alloc::String;
889 /// use rune::alloc::alloc::Global;
890 ///
891 /// let s = String::try_with_capacity_in(10, Global)?;
892 ///
893 /// assert!(s.capacity() >= 10);
894 /// # Ok::<_, rune::alloc::Error>(())
895 /// ```
896 #[inline]
897 #[must_use]
898 pub fn capacity(&self) -> usize {
899 self.vec.capacity()
900 }
901
902 /// Tries to reserve capacity for at least `additional` bytes more than the
903 /// current length. The allocator may reserve more space to speculatively
904 /// avoid frequent allocations. After calling `try_reserve`, capacity will be
905 /// greater than or equal to `self.len() + additional` if it returns
906 /// `Ok(())`. Does nothing if capacity is already sufficient. This method
907 /// preserves the contents even if an error occurs.
908 ///
909 /// # Errors
910 ///
911 /// If the capacity overflows, or the allocator reports a failure, then an error
912 /// is returned.
913 ///
914 /// # Examples
915 ///
916 /// ```
917 /// use rune::alloc::{String, Error};
918 ///
919 /// fn process_data(data: &str) -> Result<String, Error> {
920 /// let mut output = String::new();
921 ///
922 /// // Pre-reserve the memory, exiting if we can't
923 /// output.try_reserve(data.len())?;
924 ///
925 /// // Now we know this can't OOM in the middle of our complex work
926 /// output.try_push_str(data)?;
927 ///
928 /// Ok(output)
929 /// }
930 /// # process_data("rust").expect("why is the test harness OOMing on 4 bytes?");
931 /// ```
932 pub fn try_reserve(&mut self, additional: usize) -> Result<(), Error> {
933 self.vec.try_reserve(additional)
934 }
935
936 /// Tries to reserve the minimum capacity for at least `additional` bytes
937 /// more than the current length. Unlike [`try_reserve`], this will not
938 /// deliberately over-allocate to speculatively avoid frequent allocations.
939 /// After calling `try_reserve_exact`, capacity will be greater than or
940 /// equal to `self.len() + additional` if it returns `Ok(())`.
941 /// Does nothing if the capacity is already sufficient.
942 ///
943 /// Note that the allocator may give the collection more space than it
944 /// requests. Therefore, capacity can not be relied upon to be precisely
945 /// minimal. Prefer [`try_reserve`] if future insertions are expected.
946 ///
947 /// [`try_reserve`]: String::try_reserve
948 ///
949 /// # Errors
950 ///
951 /// If the capacity overflows, or the allocator reports a failure, then an error
952 /// is returned.
953 ///
954 /// # Examples
955 ///
956 /// ```
957 /// use rune::alloc::{String, Error};
958 ///
959 /// fn process_data(data: &str) -> Result<String, Error> {
960 /// let mut output = String::new();
961 ///
962 /// // Pre-reserve the memory, exiting if we can't
963 /// output.try_reserve_exact(data.len())?;
964 ///
965 /// // Now we know this can't OOM in the middle of our complex work
966 /// output.try_push_str(data);
967 ///
968 /// Ok(output)
969 /// }
970 /// # process_data("rust").expect("why is the test harness OOMing on 4 bytes?");
971 /// ```
972 pub fn try_reserve_exact(&mut self, additional: usize) -> Result<(), Error> {
973 self.vec.try_reserve_exact(additional)
974 }
975
976 /// Shrinks the capacity of this `String` to match its length.
977 ///
978 /// # Examples
979 ///
980 /// ```
981 /// use rune::alloc::String;
982 /// let mut s = String::try_from("foo")?;
983 ///
984 /// s.try_reserve(100)?;
985 /// assert!(s.capacity() >= 100);
986 ///
987 /// s.try_shrink_to_fit()?;
988 /// assert_eq!(3, s.capacity());
989 /// # Ok::<_, rune::alloc::Error>(())
990 /// ```
991 #[inline]
992 pub fn try_shrink_to_fit(&mut self) -> Result<(), Error> {
993 self.vec.try_shrink_to_fit()
994 }
995
996 /// Shrinks the capacity of this `String` with a lower bound.
997 ///
998 /// The capacity will remain at least as large as both the length
999 /// and the supplied value.
1000 ///
1001 /// If the current capacity is less than the lower limit, this is a no-op.
1002 ///
1003 /// # Examples
1004 ///
1005 /// ```
1006 /// use rune::alloc::String;
1007 ///
1008 /// let mut s = String::try_from("foo")?;
1009 ///
1010 /// s.try_reserve(100)?;
1011 /// assert!(s.capacity() >= 100);
1012 ///
1013 /// s.try_shrink_to(10)?;
1014 /// assert!(s.capacity() >= 10);
1015 /// s.try_shrink_to(0)?;
1016 /// assert!(s.capacity() >= 3);
1017 /// # Ok::<_, rune::alloc::Error>(())
1018 /// ```
1019 #[inline]
1020 pub fn try_shrink_to(&mut self, min_capacity: usize) -> Result<(), Error> {
1021 self.vec.try_shrink_to(min_capacity)
1022 }
1023
1024 /// Appends the given [`char`] to the end of this `String`.
1025 ///
1026 /// # Examples
1027 ///
1028 /// ```
1029 /// use rune::alloc::String;
1030 /// use rune::alloc::alloc::Global;
1031 ///
1032 /// let mut s = String::try_with_capacity_in(3, Global)?;
1033 /// s.try_push_str("abc")?;
1034 ///
1035 /// s.try_push('1')?;
1036 /// s.try_push('2')?;
1037 /// s.try_push('3')?;
1038 ///
1039 /// assert_eq!("abc123", s);
1040 /// # Ok::<_, rune::alloc::Error>(())
1041 /// ```
1042 #[inline]
1043 pub fn try_push(&mut self, ch: char) -> Result<(), Error> {
1044 match ch.len_utf8() {
1045 1 => self.vec.try_push(ch as u8),
1046 _ => self
1047 .vec
1048 .try_extend_from_slice(ch.encode_utf8(&mut [0; 4]).as_bytes()),
1049 }
1050 }
1051
1052 /// Returns a byte slice of this `String`'s contents.
1053 ///
1054 /// The inverse of this method is [`from_utf8`].
1055 ///
1056 /// [`from_utf8`]: String::from_utf8
1057 ///
1058 /// # Examples
1059 ///
1060 /// ```
1061 /// use rune::alloc::String;
1062 ///
1063 /// let s = String::try_from("hello")?;
1064 ///
1065 /// assert_eq!(&[104, 101, 108, 108, 111], s.as_bytes());
1066 /// # Ok::<_, rune::alloc::Error>(())
1067 /// ```
1068 #[inline]
1069 #[must_use]
1070 pub fn as_bytes(&self) -> &[u8] {
1071 &self.vec
1072 }
1073
1074 /// Shortens this `String` to the specified length.
1075 ///
1076 /// If `new_len` is greater than the string's current length, this has no
1077 /// effect.
1078 ///
1079 /// Note that this method has no effect on the allocated capacity
1080 /// of the string
1081 ///
1082 /// # Panics
1083 ///
1084 /// Panics if `new_len` does not lie on a [`char`] boundary.
1085 ///
1086 /// # Examples
1087 ///
1088 /// ```
1089 /// use rune::alloc::String;
1090 ///
1091 /// let mut s = String::try_from("hello")?;
1092 ///
1093 /// s.truncate(2);
1094 ///
1095 /// assert_eq!("he", s);
1096 /// # Ok::<_, rune::alloc::Error>(())
1097 /// ```
1098 #[inline]
1099 pub fn truncate(&mut self, new_len: usize) {
1100 if new_len <= self.len() {
1101 assert!(self.is_char_boundary(new_len));
1102 self.vec.truncate(new_len)
1103 }
1104 }
1105
1106 /// Removes the last character from the string buffer and returns it.
1107 ///
1108 /// Returns [`None`] if this `String` is empty.
1109 ///
1110 /// # Examples
1111 ///
1112 /// ```
1113 /// use rune::alloc::String;
1114 ///
1115 /// let mut s = String::try_from("abč")?;
1116 ///
1117 /// assert_eq!(s.pop(), Some('č'));
1118 /// assert_eq!(s.pop(), Some('b'));
1119 /// assert_eq!(s.pop(), Some('a'));
1120 ///
1121 /// assert_eq!(s.pop(), None);
1122 /// # Ok::<_, rune::alloc::Error>(())
1123 /// ```
1124 #[inline]
1125 pub fn pop(&mut self) -> Option<char> {
1126 let ch = self.chars().next_back()?;
1127 let newlen = self.len() - ch.len_utf8();
1128 unsafe {
1129 self.vec.set_len(newlen);
1130 }
1131 Some(ch)
1132 }
1133
1134 /// Removes a [`char`] from this `String` at a byte position and returns it.
1135 ///
1136 /// This is an *O*(*n*) operation, as it requires copying every element in the
1137 /// buffer.
1138 ///
1139 /// # Panics
1140 ///
1141 /// Panics if `idx` is larger than or equal to the `String`'s length,
1142 /// or if it does not lie on a [`char`] boundary.
1143 ///
1144 /// # Examples
1145 ///
1146 /// ```
1147 /// use rune::alloc::String;
1148 ///
1149 /// let mut s = String::try_from("abç")?;
1150 ///
1151 /// assert_eq!(s.remove(0), 'a');
1152 /// assert_eq!(s.remove(1), 'ç');
1153 /// assert_eq!(s.remove(0), 'b');
1154 /// # Ok::<_, rune::alloc::Error>(())
1155 /// ```
1156 #[inline]
1157 pub fn remove(&mut self, idx: usize) -> char {
1158 let ch = match self[idx..].chars().next() {
1159 Some(ch) => ch,
1160 None => panic!("cannot remove a char from the end of a string"),
1161 };
1162
1163 let next = idx + ch.len_utf8();
1164 let len = self.len();
1165 unsafe {
1166 ptr::copy(
1167 self.vec.as_ptr().add(next),
1168 self.vec.as_mut_ptr().add(idx),
1169 len - next,
1170 );
1171 self.vec.set_len(len - (next - idx));
1172 }
1173 ch
1174 }
1175
1176 /// Retains only the characters specified by the predicate.
1177 ///
1178 /// In other words, remove all characters `c` such that `f(c)` returns `false`.
1179 /// This method operates in place, visiting each character exactly once in the
1180 /// original order, and preserves the order of the retained characters.
1181 ///
1182 /// # Examples
1183 ///
1184 /// ```
1185 /// use rune::alloc::String;
1186 ///
1187 /// let mut s = String::try_from("f_o_ob_ar")?;
1188 ///
1189 /// s.retain(|c| c != '_');
1190 ///
1191 /// assert_eq!(s, "foobar");
1192 /// # Ok::<_, rune::alloc::Error>(())
1193 /// ```
1194 ///
1195 /// Because the elements are visited exactly once in the original order,
1196 /// external state may be used to decide which elements to keep.
1197 ///
1198 /// ```
1199 /// use rune::alloc::String;
1200 ///
1201 /// let mut s = String::try_from("abcde")?;
1202 /// let keep = [false, true, true, false, true];
1203 /// let mut iter = keep.iter();
1204 /// s.retain(|_| *iter.next().unwrap());
1205 /// assert_eq!(s, "bce");
1206 /// # Ok::<_, rune::alloc::Error>(())
1207 /// ```
1208 #[inline]
1209 pub fn retain<F>(&mut self, mut f: F)
1210 where
1211 F: FnMut(char) -> bool,
1212 {
1213 struct SetLenOnDrop<'a, A: Allocator> {
1214 s: &'a mut String<A>,
1215 idx: usize,
1216 del_bytes: usize,
1217 }
1218
1219 impl<A: Allocator> Drop for SetLenOnDrop<'_, A> {
1220 fn drop(&mut self) {
1221 let new_len = self.idx - self.del_bytes;
1222 debug_assert!(new_len <= self.s.len());
1223 unsafe { self.s.vec.set_len(new_len) };
1224 }
1225 }
1226
1227 let len = self.len();
1228 let mut guard = SetLenOnDrop {
1229 s: self,
1230 idx: 0,
1231 del_bytes: 0,
1232 };
1233
1234 while guard.idx < len {
1235 let ch =
1236 // SAFETY: `guard.idx` is positive-or-zero and less that len so the `get_unchecked`
1237 // is in bound. `self` is valid UTF-8 like string and the returned slice starts at
1238 // a unicode code point so the `Chars` always return one character.
1239 unsafe { guard.s.get_unchecked(guard.idx..len).chars().next().unwrap_unchecked() };
1240 let ch_len = ch.len_utf8();
1241
1242 if !f(ch) {
1243 guard.del_bytes += ch_len;
1244 } else if guard.del_bytes > 0 {
1245 // SAFETY: `guard.idx` is in bound and `guard.del_bytes` represent the number of
1246 // bytes that are erased from the string so the resulting `guard.idx -
1247 // guard.del_bytes` always represent a valid unicode code point.
1248 //
1249 // `guard.del_bytes` >= `ch.len_utf8()`, so taking a slice with `ch.len_utf8()` len
1250 // is safe.
1251 ch.encode_utf8(unsafe {
1252 slice::from_raw_parts_mut(
1253 guard.s.as_mut_ptr().add(guard.idx - guard.del_bytes),
1254 ch.len_utf8(),
1255 )
1256 });
1257 }
1258
1259 // Point idx to the next char
1260 guard.idx += ch_len;
1261 }
1262
1263 drop(guard);
1264 }
1265
1266 /// Inserts a character into this `String` at a byte position.
1267 ///
1268 /// This is an *O*(*n*) operation as it requires copying every element in the
1269 /// buffer.
1270 ///
1271 /// # Panics
1272 ///
1273 /// Panics if `idx` is larger than the `String`'s length, or if it does not
1274 /// lie on a [`char`] boundary.
1275 ///
1276 /// # Examples
1277 ///
1278 /// ```
1279 /// use rune::alloc::String;
1280 /// use rune::alloc::alloc::Global;
1281 ///
1282 /// let mut s = String::try_with_capacity_in(3, Global)?;
1283 ///
1284 /// s.try_insert(0, 'f')?;
1285 /// s.try_insert(1, 'o')?;
1286 /// s.try_insert(2, 'o')?;
1287 ///
1288 /// assert_eq!(s, "foo");
1289 /// # Ok::<_, rune::alloc::Error>(())
1290 /// ```
1291 #[inline]
1292 pub fn try_insert(&mut self, idx: usize, ch: char) -> Result<(), Error> {
1293 assert!(self.is_char_boundary(idx));
1294 let mut bits = [0; 4];
1295 let bits = ch.encode_utf8(&mut bits).as_bytes();
1296
1297 unsafe {
1298 self.insert_bytes(idx, bits)?;
1299 }
1300
1301 Ok(())
1302 }
1303
1304 unsafe fn insert_bytes(&mut self, idx: usize, bytes: &[u8]) -> Result<(), Error> {
1305 let len = self.len();
1306 let amt = bytes.len();
1307 self.vec.try_reserve(amt)?;
1308
1309 unsafe {
1310 ptr::copy(
1311 self.vec.as_ptr().add(idx),
1312 self.vec.as_mut_ptr().add(idx + amt),
1313 len - idx,
1314 );
1315 ptr::copy_nonoverlapping(bytes.as_ptr(), self.vec.as_mut_ptr().add(idx), amt);
1316 self.vec.set_len(len + amt);
1317 }
1318
1319 Ok(())
1320 }
1321
1322 /// Inserts a string slice into this `String` at a byte position.
1323 ///
1324 /// This is an *O*(*n*) operation as it requires copying every element in the
1325 /// buffer.
1326 ///
1327 /// # Panics
1328 ///
1329 /// Panics if `idx` is larger than the `String`'s length, or if it does not
1330 /// lie on a [`char`] boundary.
1331 ///
1332 /// # Examples
1333 ///
1334 /// ```
1335 /// use rune::alloc::String;
1336 ///
1337 /// let mut s = String::try_from("bar")?;
1338 ///
1339 /// s.try_insert_str(0, "foo")?;
1340 ///
1341 /// assert_eq!("foobar", s);
1342 /// # Ok::<_, rune::alloc::Error>(())
1343 /// ```
1344 #[inline]
1345 pub fn try_insert_str(&mut self, idx: usize, string: &str) -> Result<(), Error> {
1346 assert!(self.is_char_boundary(idx));
1347
1348 unsafe {
1349 self.insert_bytes(idx, string.as_bytes())?;
1350 }
1351
1352 Ok(())
1353 }
1354
1355 /// Returns a mutable reference to the contents of this `String`.
1356 ///
1357 /// # Safety
1358 ///
1359 /// This function is unsafe because the returned `&mut Vec` allows writing
1360 /// bytes which are not valid UTF-8. If this constraint is violated, using
1361 /// the original `String` after dropping the `&mut Vec` may violate memory
1362 /// safety, as the rest of the standard library assumes that `String`s are
1363 /// valid UTF-8.
1364 ///
1365 /// # Examples
1366 ///
1367 /// ```
1368 /// use rune::alloc::String;
1369 ///
1370 /// let mut s = String::try_from("hello")?;
1371 ///
1372 /// unsafe {
1373 /// let vec = s.as_mut_vec();
1374 /// assert_eq!(&[104, 101, 108, 108, 111][..], &vec[..]);
1375 ///
1376 /// vec.reverse();
1377 /// }
1378 /// assert_eq!(s, "olleh");
1379 /// # Ok::<_, rune::alloc::Error>(())
1380 /// ```
1381 #[inline]
1382 pub unsafe fn as_mut_vec(&mut self) -> &mut Vec<u8, A> {
1383 &mut self.vec
1384 }
1385
1386 /// Returns the length of this `String`, in bytes, not [`char`]s or
1387 /// graphemes. In other words, it might not be what a human considers the
1388 /// length of the string.
1389 ///
1390 /// # Examples
1391 ///
1392 /// ```
1393 /// use rune::alloc::String;
1394 ///
1395 /// let a = String::try_from("foo")?;
1396 /// assert_eq!(a.len(), 3);
1397 ///
1398 /// let fancy_f = String::try_from("ƒoo")?;
1399 /// assert_eq!(fancy_f.len(), 4);
1400 /// assert_eq!(fancy_f.chars().count(), 3);
1401 /// # Ok::<_, rune::alloc::Error>(())
1402 /// ```
1403 #[inline]
1404 #[must_use]
1405 pub fn len(&self) -> usize {
1406 self.vec.len()
1407 }
1408
1409 /// Returns `true` if this `String` has a length of zero, and `false`
1410 /// otherwise.
1411 ///
1412 /// # Examples
1413 ///
1414 /// ```
1415 /// use rune::alloc::String;
1416 ///
1417 /// let mut v = String::new();
1418 /// assert!(v.is_empty());
1419 ///
1420 /// v.try_push('a')?;
1421 /// assert!(!v.is_empty());
1422 /// # Ok::<_, rune::alloc::Error>(())
1423 /// ```
1424 #[inline]
1425 #[must_use]
1426 pub fn is_empty(&self) -> bool {
1427 self.len() == 0
1428 }
1429
1430 /// Splits the string into two at the given byte index.
1431 ///
1432 /// Returns a newly allocated `String`. `self` contains bytes `[0, at)`, and
1433 /// the returned `String` contains bytes `[at, len)`. `at` must be on the
1434 /// boundary of a UTF-8 code point.
1435 ///
1436 /// Note that the capacity of `self` does not change.
1437 ///
1438 /// # Panics
1439 ///
1440 /// Panics if `at` is not on a `UTF-8` code point boundary, or if it is beyond the last
1441 /// code point of the string.
1442 ///
1443 /// # Examples
1444 ///
1445 /// ```
1446 /// use rune::alloc::String;
1447 ///
1448 /// let mut hello = String::try_from("Hello, World!")?;
1449 /// let world = hello.try_split_off(7)?;
1450 /// assert_eq!(hello, "Hello, ");
1451 /// assert_eq!(world, "World!");
1452 /// # Ok::<_, rune::alloc::Error>(())
1453 /// ```
1454 #[inline]
1455 #[must_use = "use `.truncate()` if you don't need the other half"]
1456 pub fn try_split_off(&mut self, at: usize) -> Result<String<A>, Error>
1457 where
1458 A: Clone,
1459 {
1460 assert!(self.is_char_boundary(at));
1461 let other = self.vec.try_split_off(at)?;
1462 Ok(unsafe { String::from_utf8_unchecked(other) })
1463 }
1464
1465 /// Truncates this `String`, removing all contents.
1466 ///
1467 /// While this means the `String` will have a length of zero, it does not
1468 /// touch its capacity.
1469 ///
1470 /// # Examples
1471 ///
1472 /// ```
1473 /// use rune::alloc::String;
1474 ///
1475 /// let mut s = String::try_from("foo")?;
1476 ///
1477 /// s.clear();
1478 ///
1479 /// assert!(s.is_empty());
1480 /// assert_eq!(0, s.len());
1481 /// assert_eq!(3, s.capacity());
1482 /// # Ok::<_, rune::alloc::Error>(())
1483 /// ```
1484 #[inline]
1485 pub fn clear(&mut self) {
1486 self.vec.clear()
1487 }
1488
1489 /// Removes the specified range from the string in bulk, returning all
1490 /// removed characters as an iterator.
1491 ///
1492 /// The returned iterator keeps a mutable borrow on the string to optimize
1493 /// its implementation.
1494 ///
1495 /// # Panics
1496 ///
1497 /// Panics if the starting point or end point do not lie on a [`char`]
1498 /// boundary, or if they're out of bounds.
1499 ///
1500 /// # Leaking
1501 ///
1502 /// If the returned iterator goes out of scope without being dropped (due to
1503 /// [`core::mem::forget`], for example), the string may still contain a copy
1504 /// of any drained characters, or may have lost characters arbitrarily,
1505 /// including characters outside the range.
1506 ///
1507 /// # Examples
1508 ///
1509 /// ```
1510 /// use rune::alloc::String;
1511 /// use rune::alloc::prelude::*;
1512 ///
1513 /// let mut s = String::try_from("α is alpha, β is beta")?;
1514 /// let beta_offset = s.find('β').unwrap_or(s.len());
1515 ///
1516 /// // Remove the range up until the β from the string
1517 /// let t: String = s.drain(..beta_offset).try_collect()?;
1518 /// assert_eq!(t, "α is alpha, ");
1519 /// assert_eq!(s, "β is beta");
1520 ///
1521 /// // A full range clears the string, like `clear()` does
1522 /// s.drain(..);
1523 /// assert_eq!(s, "");
1524 /// # Ok::<_, rune::alloc::Error>(())
1525 /// ```
1526 pub fn drain<R>(&mut self, range: R) -> Drain<'_, A>
1527 where
1528 R: RangeBounds<usize>,
1529 {
1530 // Memory safety
1531 //
1532 // The String version of Drain does not have the memory safety issues
1533 // of the vector version. The data is just plain bytes.
1534 // Because the range removal happens in Drop, if the Drain iterator is leaked,
1535 // the removal will not happen.
1536 let Range { start, end } = slice_range(range, ..self.len());
1537 assert!(self.is_char_boundary(start));
1538 assert!(self.is_char_boundary(end));
1539
1540 // Take out two simultaneous borrows. The &mut String won't be accessed
1541 // until iteration is over, in Drop.
1542 let self_ptr = self as *mut _;
1543 // SAFETY: `slice::range` and `is_char_boundary` do the appropriate bounds checks.
1544 let chars_iter = unsafe { self.get_unchecked(start..end) }.chars();
1545
1546 Drain {
1547 start,
1548 end,
1549 iter: chars_iter,
1550 string: self_ptr,
1551 }
1552 }
1553
1554 /// Removes the specified range in the string,
1555 /// and replaces it with the given string.
1556 /// The given string doesn't need to be the same length as the range.
1557 ///
1558 /// # Panics
1559 ///
1560 /// Panics if the starting point or end point do not lie on a [`char`]
1561 /// boundary, or if they're out of bounds.
1562 ///
1563 /// # Examples
1564 ///
1565 /// ```
1566 /// use rune::alloc::String;
1567 ///
1568 /// let mut s = String::try_from("α is alpha, β is beta")?;
1569 /// let beta_offset = s.find('β').unwrap_or(s.len());
1570 ///
1571 /// // Replace the range up until the β from the string
1572 /// s.try_replace_range(..beta_offset, "Α is capital alpha; ")?;
1573 /// assert_eq!(s, "Α is capital alpha; β is beta");
1574 /// # Ok::<_, rune::alloc::Error>(())
1575 /// ```
1576 pub fn try_replace_range<R>(&mut self, range: R, replace_with: &str) -> Result<(), Error>
1577 where
1578 R: RangeBounds<usize>,
1579 {
1580 // Memory safety
1581 //
1582 // Replace_range does not have the memory safety issues of a vector Splice.
1583 // of the vector version. The data is just plain bytes.
1584
1585 // WARNING: Inlining this variable would be unsound (#81138)
1586 let start = range.start_bound();
1587 match start {
1588 Included(&n) => assert!(self.is_char_boundary(n)),
1589 Excluded(&n) => assert!(self.is_char_boundary(n + 1)),
1590 Unbounded => {}
1591 };
1592 // WARNING: Inlining this variable would be unsound (#81138)
1593 let end = range.end_bound();
1594 match end {
1595 Included(&n) => assert!(self.is_char_boundary(n + 1)),
1596 Excluded(&n) => assert!(self.is_char_boundary(n)),
1597 Unbounded => {}
1598 };
1599
1600 // Using `range` again would be unsound (#81138)
1601 // We assume the bounds reported by `range` remain the same, but
1602 // an adversarial implementation could change between calls
1603 unsafe { self.as_mut_vec() }.try_splice_in_place((start, end), replace_with.bytes())?;
1604 Ok(())
1605 }
1606
1607 /// Converts this `String` into a <code>[Box]<[str]></code>.
1608 ///
1609 /// This will drop any excess capacity.
1610 ///
1611 /// [str]: prim@str "str"
1612 ///
1613 /// # Examples
1614 ///
1615 /// ```
1616 /// use rune::alloc::String;
1617 /// let s = String::try_from("hello")?;
1618 ///
1619 /// let b = s.try_into_boxed_str()?;
1620 /// # Ok::<_, rune::alloc::Error>(())
1621 /// ```
1622 #[must_use = "`self` will be dropped if the result is not used"]
1623 #[inline]
1624 pub fn try_into_boxed_str(self) -> Result<Box<str, A>, Error> {
1625 let slice = self.vec.try_into_boxed_slice()?;
1626 Ok(unsafe { crate::str::from_boxed_utf8_unchecked(slice) })
1627 }
1628
1629 /// Consumes and leaks the `String`, returning a mutable reference to the contents,
1630 /// `&'a mut str`.
1631 ///
1632 /// The caller has free choice over the returned lifetime, including `'static`. Indeed,
1633 /// this function is ideally used for data that lives for the remainder of the program's life,
1634 /// as dropping the returned reference will cause a memory leak.
1635 ///
1636 /// It does not reallocate or shrink the `String`,
1637 /// so the leaked allocation may include unused capacity that is not part
1638 /// of the returned slice. If you don't want that, call [`try_into_boxed_str`],
1639 /// and then [`Box::leak`].
1640 ///
1641 /// [`try_into_boxed_str`]: Self::try_into_boxed_str
1642 ///
1643 /// # Examples
1644 ///
1645 /// ```
1646 /// # #[cfg(not(miri))]
1647 /// # fn main() -> Result<(), rune_alloc::Error> {
1648 /// use rune::alloc::String;
1649 ///
1650 /// let x = String::try_from("bucket")?;
1651 /// let static_ref: &'static mut str = x.leak();
1652 /// assert_eq!(static_ref, "bucket");
1653 /// # Ok(())
1654 /// # }
1655 /// # #[cfg(miri)] fn main() {}
1656 /// ```
1657 #[inline]
1658 pub fn leak<'a>(self) -> &'a mut str
1659 where
1660 A: 'a,
1661 {
1662 let slice = self.vec.leak();
1663 unsafe { from_utf8_unchecked_mut(slice) }
1664 }
1665}
1666
1667impl<A: Allocator> FromUtf8Error<A> {
1668 /// Returns a slice of [`u8`]s bytes that were attempted to convert to a `String`.
1669 ///
1670 /// # Examples
1671 ///
1672 /// ```
1673 /// use rune::alloc::{try_vec, String};
1674 ///
1675 /// // some invalid bytes, in a vector
1676 /// let bytes = try_vec![0, 159];
1677 ///
1678 /// let value = String::from_utf8(bytes);
1679 ///
1680 /// assert_eq!(&[0, 159], value.unwrap_err().as_bytes());
1681 /// # Ok::<_, rune::alloc::Error>(())
1682 /// ```
1683 #[must_use]
1684 pub fn as_bytes(&self) -> &[u8] {
1685 &self.bytes[..]
1686 }
1687
1688 /// Returns the bytes that were attempted to convert to a `String`.
1689 ///
1690 /// This method is carefully constructed to avoid allocation. It will
1691 /// consume the error, moving out the bytes, so that a copy of the bytes
1692 /// does not need to be made.
1693 ///
1694 /// # Examples
1695 ///
1696 /// ```
1697 /// use rune::alloc::{try_vec, String};
1698 ///
1699 /// // some invalid bytes, in a vector
1700 /// let bytes = try_vec![0, 159];
1701 ///
1702 /// let value = String::from_utf8(bytes);
1703 ///
1704 /// assert_eq!(try_vec![0, 159], value.unwrap_err().into_bytes());
1705 /// # Ok::<_, rune::alloc::Error>(())
1706 /// ```
1707 #[must_use = "`self` will be dropped if the result is not used"]
1708 pub fn into_bytes(self) -> Vec<u8, A> {
1709 self.bytes
1710 }
1711
1712 /// Fetch a `Utf8Error` to get more details about the conversion failure.
1713 ///
1714 /// The [`Utf8Error`] type provided by [`std::str`] represents an error that
1715 /// may occur when converting a slice of [`u8`]s to a [`&str`]. In this
1716 /// sense, it's an analogue to `FromUtf8Error`. See its documentation for
1717 /// more details on using it.
1718 ///
1719 /// [`std::str`]: core::str "std::str"
1720 /// [`&str`]: prim@str "&str"
1721 ///
1722 /// # Examples
1723 ///
1724 /// ```
1725 /// use rune::alloc::{try_vec, String};
1726 ///
1727 /// // some invalid bytes, in a vector
1728 /// let bytes = try_vec![0, 159];
1729 ///
1730 /// let error = String::from_utf8(bytes).unwrap_err().utf8_error();
1731 ///
1732 /// // the first byte is invalid here
1733 /// assert_eq!(1, error.valid_up_to());
1734 /// # Ok::<_, rune::alloc::Error>(())
1735 /// ```
1736 #[must_use]
1737 pub fn utf8_error(&self) -> Utf8Error {
1738 self.error
1739 }
1740}
1741
1742impl<A: Allocator> Default for String<A>
1743where
1744 A: Default,
1745{
1746 /// Construct a default string.
1747 ///
1748 /// # Examples
1749 ///
1750 /// ```
1751 /// use rune::alloc::String;
1752 /// let s = String::default();
1753 /// assert_eq!(s, "");
1754 /// ```
1755 fn default() -> Self {
1756 Self::new_in(A::default())
1757 }
1758}
1759
1760impl<A: Allocator> Borrow<str> for String<A> {
1761 #[inline]
1762 fn borrow(&self) -> &str {
1763 &self[..]
1764 }
1765}
1766
1767impl<A: Allocator> fmt::Display for FromUtf8Error<A> {
1768 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1769 fmt::Display::fmt(&self.error, f)
1770 }
1771}
1772
1773impl<A: Allocator> core::error::Error for FromUtf8Error<A> {}
1774
1775impl<A: Allocator + Clone> TryClone for String<A> {
1776 fn try_clone(&self) -> Result<Self, Error> {
1777 Ok(String {
1778 vec: self.vec.try_clone()?,
1779 })
1780 }
1781}
1782
1783#[cfg(test)]
1784impl<A: Allocator + Clone> Clone for String<A> {
1785 fn clone(&self) -> Self {
1786 self.try_clone().abort()
1787 }
1788}
1789
1790impl<A: Allocator> PartialEq for String<A> {
1791 #[inline]
1792 fn eq(&self, other: &Self) -> bool {
1793 self.vec == other.vec
1794 }
1795}
1796
1797impl<A: Allocator> Eq for String<A> {}
1798
1799impl<A: Allocator> PartialOrd for String<A> {
1800 #[inline]
1801 fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
1802 Some(self.cmp(other))
1803 }
1804}
1805
1806impl<A: Allocator> Ord for String<A> {
1807 #[inline]
1808 fn cmp(&self, other: &Self) -> Ordering {
1809 self.vec.cmp(&other.vec)
1810 }
1811}
1812
1813macro_rules! impl_eq {
1814 ($lhs:ty, $rhs: ty) => {
1815 #[allow(unused_lifetimes)]
1816 #[allow(clippy::partialeq_ne_impl)]
1817 impl<'a, 'b> PartialEq<$rhs> for $lhs {
1818 #[inline]
1819 fn eq(&self, other: &$rhs) -> bool {
1820 PartialEq::eq(&self[..], &other[..])
1821 }
1822 #[inline]
1823 fn ne(&self, other: &$rhs) -> bool {
1824 PartialEq::ne(&self[..], &other[..])
1825 }
1826 }
1827
1828 #[allow(unused_lifetimes)]
1829 #[allow(clippy::partialeq_ne_impl)]
1830 impl<'a, 'b> PartialEq<$lhs> for $rhs {
1831 #[inline]
1832 fn eq(&self, other: &$lhs) -> bool {
1833 PartialEq::eq(&self[..], &other[..])
1834 }
1835 #[inline]
1836 fn ne(&self, other: &$lhs) -> bool {
1837 PartialEq::ne(&self[..], &other[..])
1838 }
1839 }
1840 };
1841}
1842
1843impl_eq! { String, str }
1844impl_eq! { String, &'a str }
1845impl_eq! { Cow<'a, str>, str }
1846impl_eq! { Cow<'a, str>, &'b str }
1847impl_eq! { Cow<'a, str>, String }
1848
1849impl<A: Allocator> fmt::Display for String<A> {
1850 #[inline]
1851 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1852 fmt::Display::fmt(&**self, f)
1853 }
1854}
1855
1856impl<A: Allocator> fmt::Debug for String<A> {
1857 #[inline]
1858 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1859 fmt::Debug::fmt(&**self, f)
1860 }
1861}
1862
1863impl<A: Allocator> hash::Hash for String<A> {
1864 #[inline]
1865 fn hash<H: hash::Hasher>(&self, hasher: &mut H) {
1866 (**self).hash(hasher)
1867 }
1868}
1869
1870impl<A: Allocator> ops::Index<ops::Range<usize>> for String<A> {
1871 type Output = str;
1872
1873 #[inline]
1874 fn index(&self, index: ops::Range<usize>) -> &str {
1875 &self[..][index]
1876 }
1877}
1878
1879impl<A: Allocator> ops::Index<ops::RangeTo<usize>> for String<A> {
1880 type Output = str;
1881
1882 #[inline]
1883 fn index(&self, index: ops::RangeTo<usize>) -> &str {
1884 &self[..][index]
1885 }
1886}
1887
1888impl<A: Allocator> ops::Index<ops::RangeFrom<usize>> for String<A> {
1889 type Output = str;
1890
1891 #[inline]
1892 fn index(&self, index: ops::RangeFrom<usize>) -> &str {
1893 &self[..][index]
1894 }
1895}
1896
1897impl<A: Allocator> ops::Index<ops::RangeFull> for String<A> {
1898 type Output = str;
1899
1900 #[inline]
1901 fn index(&self, _index: ops::RangeFull) -> &str {
1902 unsafe { from_utf8_unchecked(&self.vec) }
1903 }
1904}
1905
1906impl<A: Allocator> ops::Index<ops::RangeInclusive<usize>> for String<A> {
1907 type Output = str;
1908
1909 #[inline]
1910 fn index(&self, index: ops::RangeInclusive<usize>) -> &str {
1911 Index::index(&**self, index)
1912 }
1913}
1914
1915impl<A: Allocator> ops::Index<ops::RangeToInclusive<usize>> for String<A> {
1916 type Output = str;
1917
1918 #[inline]
1919 fn index(&self, index: ops::RangeToInclusive<usize>) -> &str {
1920 Index::index(&**self, index)
1921 }
1922}
1923
1924impl<A: Allocator> ops::IndexMut<ops::Range<usize>> for String<A> {
1925 #[inline]
1926 fn index_mut(&mut self, index: ops::Range<usize>) -> &mut str {
1927 &mut self[..][index]
1928 }
1929}
1930
1931impl<A: Allocator> ops::IndexMut<ops::RangeTo<usize>> for String<A> {
1932 #[inline]
1933 fn index_mut(&mut self, index: ops::RangeTo<usize>) -> &mut str {
1934 &mut self[..][index]
1935 }
1936}
1937
1938impl<A: Allocator> ops::IndexMut<ops::RangeFrom<usize>> for String<A> {
1939 #[inline]
1940 fn index_mut(&mut self, index: ops::RangeFrom<usize>) -> &mut str {
1941 &mut self[..][index]
1942 }
1943}
1944
1945impl<A: Allocator> ops::IndexMut<ops::RangeFull> for String<A> {
1946 #[inline]
1947 fn index_mut(&mut self, _index: ops::RangeFull) -> &mut str {
1948 unsafe { from_utf8_unchecked_mut(&mut self.vec) }
1949 }
1950}
1951
1952impl<A: Allocator> ops::IndexMut<ops::RangeInclusive<usize>> for String<A> {
1953 #[inline]
1954 fn index_mut(&mut self, index: ops::RangeInclusive<usize>) -> &mut str {
1955 IndexMut::index_mut(&mut **self, index)
1956 }
1957}
1958
1959impl<A: Allocator> ops::IndexMut<ops::RangeToInclusive<usize>> for String<A> {
1960 #[inline]
1961 fn index_mut(&mut self, index: ops::RangeToInclusive<usize>) -> &mut str {
1962 IndexMut::index_mut(&mut **self, index)
1963 }
1964}
1965
1966impl<A: Allocator> ops::Deref for String<A> {
1967 type Target = str;
1968
1969 #[inline]
1970 fn deref(&self) -> &str {
1971 unsafe { from_utf8_unchecked(&self.vec) }
1972 }
1973}
1974
1975impl<A: Allocator> ops::DerefMut for String<A> {
1976 #[inline]
1977 fn deref_mut(&mut self) -> &mut str {
1978 unsafe { from_utf8_unchecked_mut(&mut self.vec) }
1979 }
1980}
1981
1982impl<A: Allocator> AsRef<str> for String<A> {
1983 #[inline]
1984 fn as_ref(&self) -> &str {
1985 self
1986 }
1987}
1988
1989impl<A: Allocator> AsMut<str> for String<A> {
1990 #[inline]
1991 fn as_mut(&mut self) -> &mut str {
1992 self
1993 }
1994}
1995
1996#[cfg(feature = "std")]
1997impl<A: Allocator> AsRef<std::ffi::OsStr> for String<A> {
1998 #[inline]
1999 fn as_ref(&self) -> &std::ffi::OsStr {
2000 (**self).as_ref()
2001 }
2002}
2003
2004impl<A: Allocator> AsRef<[u8]> for String<A> {
2005 #[inline]
2006 fn as_ref(&self) -> &[u8] {
2007 self.as_bytes()
2008 }
2009}
2010
2011impl<A: Allocator> From<Box<str, A>> for String<A> {
2012 /// Converts the given boxed `str` slice to a [`String`].
2013 /// It is notable that the `str` slice is owned.
2014 ///
2015 /// # Examples
2016 ///
2017 /// Basic usage:
2018 ///
2019 /// ```
2020 /// use rune::alloc::{Box, String};
2021 ///
2022 /// let s1: String = String::try_from("hello world")?;
2023 /// let s2: Box<str> = s1.try_into_boxed_str()?;
2024 /// let s3: String = String::from(s2);
2025 ///
2026 /// assert_eq!("hello world", s3);
2027 /// # Ok::<_, rune::alloc::Error>(())
2028 /// ```
2029 fn from(s: Box<str, A>) -> String<A> {
2030 crate::str::into_string(s)
2031 }
2032}
2033
2034#[cfg(feature = "alloc")]
2035impl TryFrom<::rust_alloc::boxed::Box<str>> for String<Global> {
2036 type Error = Error;
2037
2038 /// Try to convert a std `Box<str>` into a [`String`].
2039 ///
2040 /// The result is fallibly allocated on the heap.
2041 fn try_from(s: ::rust_alloc::boxed::Box<str>) -> Result<Self, Error> {
2042 Self::try_from(s.as_ref())
2043 }
2044}
2045
2046#[cfg(feature = "alloc")]
2047impl TryFrom<::rust_alloc::string::String> for String<Global> {
2048 type Error = Error;
2049
2050 /// Try to convert a std `String` into a [`String`].
2051 ///
2052 /// The result is fallibly allocated on the heap.
2053 ///
2054 /// # Examples
2055 ///
2056 /// ```
2057 /// use rune::alloc;
2058 ///
2059 /// let s1 = String::from("Hello World");
2060 /// let s2 = alloc::String::try_from(s1)?;
2061 ///
2062 /// assert_eq!("Hello World", s2);
2063 /// # Ok::<_, rune::alloc::Error>(())
2064 /// ```
2065 fn try_from(string: ::rust_alloc::string::String) -> Result<Self, Error> {
2066 let mut string = ManuallyDrop::new(string.into_bytes());
2067
2068 let buf = string.as_mut_ptr();
2069 let length = string.len();
2070 let capacity = string.capacity();
2071
2072 if let Ok(layout) = Layout::array::<u8>(capacity) {
2073 Global.take(layout)?;
2074 }
2075
2076 // SAFETY: The layout of the string is identical to the std string and
2077 // it uses the same underlying allocator.
2078 unsafe { Ok(String::from_raw_parts_in(buf, length, capacity, Global)) }
2079 }
2080}
2081
2082#[cfg(feature = "alloc")]
2083impl<A: Allocator> From<String<A>> for ::rust_alloc::string::String {
2084 /// Try to convert a [`String`] into a std `String`.
2085 ///
2086 /// The result is allocated on the heap.
2087 fn from(s: String<A>) -> Self {
2088 Self::from(s.as_str())
2089 }
2090}
2091
2092#[cfg(feature = "alloc")]
2093impl<A: Allocator> From<&String<A>> for ::rust_alloc::string::String {
2094 /// Try to convert a [`String`] reference into a std `String`.
2095 ///
2096 /// The result is allocated on the heap.
2097 fn from(s: &String<A>) -> Self {
2098 Self::from(s.as_str())
2099 }
2100}
2101
2102impl TryFrom<&str> for String<Global> {
2103 type Error = Error;
2104
2105 /// Converts a `&str` into a [`String`].
2106 ///
2107 /// The result is fallibly allocated on the heap.
2108 ///
2109 /// ```
2110 /// use rune::alloc::String;
2111 ///
2112 /// let s = String::try_from("Hello World")?;
2113 /// assert_eq!(s, "Hello World");
2114 /// # Ok::<_, rune::alloc::Error>(())
2115 /// ```
2116 fn try_from(s: &str) -> Result<Self, Error> {
2117 let mut out = String::try_with_capacity_in(s.len(), Global)?;
2118 out.try_push_str(s)?;
2119 Ok(out)
2120 }
2121}
2122
2123impl TryFrom<Cow<'_, str>> for String<Global> {
2124 type Error = Error;
2125
2126 /// Converts a `Cow<str>` into a [`String`].
2127 ///
2128 /// The result is fallibly allocated on the heap unless the values is
2129 /// `Cow::Owned`.
2130 ///
2131 /// ```
2132 /// use rune::alloc::String;
2133 /// use rune::alloc::borrow::Cow;
2134 ///
2135 /// let s = Cow::Borrowed("Hello World");
2136 /// let s = String::try_from(s)?;
2137 /// assert_eq!(s, "Hello World");
2138 ///
2139 /// let s = Cow::Owned(String::try_from("Hello World")?);
2140 /// let s = String::try_from(s)?;
2141 /// assert_eq!(s, "Hello World");
2142 /// # Ok::<_, rune::alloc::Error>(())
2143 /// ```
2144 fn try_from(s: Cow<'_, str>) -> Result<Self, Error> {
2145 match s {
2146 Cow::Borrowed(s) => Self::try_from(s),
2147 Cow::Owned(s) => Ok(s),
2148 }
2149 }
2150}
2151
2152impl<A: Allocator + Clone> TryFrom<&String<A>> for String<A> {
2153 type Error = Error;
2154
2155 /// Converts the given [`String`] to a boxed `str` slice that is owned.
2156 ///
2157 /// # Examples
2158 ///
2159 /// ```
2160 /// use rune::alloc::{String, Box};
2161 ///
2162 /// let s1: String = String::try_from("Hello World")?;
2163 /// let s2: String = String::try_from(&s1)?;
2164 ///
2165 /// assert_eq!(s2, "Hello World");
2166 /// # Ok::<_, rune::alloc::Error>(())
2167 /// ```
2168 #[inline]
2169 fn try_from(s: &String<A>) -> Result<Self, Error> {
2170 let mut this = String::new_in(s.allocator().clone());
2171 this.try_push_str(s.as_str())?;
2172 Ok(this)
2173 }
2174}
2175
2176impl<A: Allocator> TryFrom<String<A>> for Box<str, A> {
2177 type Error = Error;
2178
2179 /// Converts the given [`String`] to a boxed `str` slice that is owned.
2180 ///
2181 /// # Examples
2182 ///
2183 /// ```
2184 /// use rune::alloc::{String, Box};
2185 ///
2186 /// let s1: String = String::try_from("Hello World")?;
2187 /// let s2: Box<str> = Box::try_from("Hello World")?;
2188 ///
2189 /// assert_eq!("Hello World", s2.as_ref());
2190 /// # Ok::<_, rune::alloc::Error>(())
2191 /// ```
2192 #[inline]
2193 fn try_from(s: String<A>) -> Result<Self, Error> {
2194 s.try_into_boxed_str()
2195 }
2196}
2197
2198impl TryFrom<Cow<'_, str>> for Box<str> {
2199 type Error = Error;
2200
2201 /// Converts the given [`String`] to a boxed `str` slice that is owned.
2202 ///
2203 /// # Examples
2204 ///
2205 /// ```
2206 /// use rune::alloc::Box;
2207 /// use rune::alloc::borrow::Cow;
2208 ///
2209 /// let s2: Box<str> = Box::try_from(Cow::Borrowed("Hello World"))?;
2210 ///
2211 /// assert_eq!("Hello World", s2.as_ref());
2212 /// # Ok::<_, rune::alloc::Error>(())
2213 /// ```
2214 #[inline]
2215 fn try_from(s: Cow<'_, str>) -> Result<Self, Error> {
2216 Self::try_from(s.as_ref())
2217 }
2218}
2219
2220impl<A: Allocator> From<String<A>> for Vec<u8, A> {
2221 /// Converts the given [`String`] to a vector [`Vec`] that holds values of type [`u8`].
2222 ///
2223 /// # Examples
2224 ///
2225 /// ```
2226 /// use rune::alloc::{String, Vec};
2227 ///
2228 /// let s1 = String::try_from("hello world")?;
2229 /// let v1 = Vec::from(s1);
2230 ///
2231 /// for b in v1 {
2232 /// println!("{b}");
2233 /// }
2234 /// # Ok::<_, rune::alloc::Error>(())
2235 /// ```
2236 #[inline]
2237 fn from(string: String<A>) -> Vec<u8, A> {
2238 string.into_bytes()
2239 }
2240}
2241
2242/// A draining iterator for `String`.
2243///
2244/// This struct is created by the [`drain`] method on [`String`]. See its
2245/// documentation for more.
2246///
2247/// [`drain`]: String::drain
2248pub struct Drain<'a, A: Allocator> {
2249 /// Will be used as &'a mut String in the destructor
2250 string: *mut String<A>,
2251 /// Start of part to remove
2252 start: usize,
2253 /// End of part to remove
2254 end: usize,
2255 /// Current remaining range to remove
2256 iter: Chars<'a>,
2257}
2258
2259impl<A: Allocator> fmt::Debug for Drain<'_, A> {
2260 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
2261 f.debug_tuple("Drain").field(&self.as_str()).finish()
2262 }
2263}
2264
2265unsafe impl<A: Allocator> Sync for Drain<'_, A> {}
2266unsafe impl<A: Allocator> Send for Drain<'_, A> {}
2267
2268impl<A: Allocator> Drop for Drain<'_, A> {
2269 fn drop(&mut self) {
2270 unsafe {
2271 // Use Vec::drain. "Reaffirm" the bounds checks to avoid
2272 // panic code being inserted again.
2273 let self_vec = (*self.string).as_mut_vec();
2274
2275 if self.start <= self.end && self.end <= self_vec.len() {
2276 self_vec.drain(self.start..self.end);
2277 }
2278 }
2279 }
2280}
2281
2282impl<A: Allocator> Drain<'_, A> {
2283 /// Returns the remaining (sub)string of this iterator as a slice.
2284 ///
2285 /// # Examples
2286 ///
2287 /// ```
2288 /// use rune::alloc::String;
2289 ///
2290 /// let mut s = String::try_from("abc")?;
2291 /// let mut drain = s.drain(..);
2292 /// assert_eq!(drain.as_str(), "abc");
2293 /// assert!(drain.next().is_some());
2294 /// assert_eq!(drain.as_str(), "bc");
2295 /// # Ok::<_, rune::alloc::Error>(())
2296 /// ```
2297 #[must_use]
2298 pub fn as_str(&self) -> &str {
2299 self.iter.as_str()
2300 }
2301}
2302
2303impl<A: Allocator> AsRef<str> for Drain<'_, A> {
2304 fn as_ref(&self) -> &str {
2305 self.as_str()
2306 }
2307}
2308
2309impl<A: Allocator> AsRef<[u8]> for Drain<'_, A> {
2310 fn as_ref(&self) -> &[u8] {
2311 self.as_str().as_bytes()
2312 }
2313}
2314
2315impl<A: Allocator> Iterator for Drain<'_, A> {
2316 type Item = char;
2317
2318 #[inline]
2319 fn next(&mut self) -> Option<char> {
2320 self.iter.next()
2321 }
2322
2323 fn size_hint(&self) -> (usize, Option<usize>) {
2324 self.iter.size_hint()
2325 }
2326
2327 #[inline]
2328 fn last(mut self) -> Option<char> {
2329 self.next_back()
2330 }
2331}
2332
2333impl<A: Allocator> DoubleEndedIterator for Drain<'_, A> {
2334 #[inline]
2335 fn next_back(&mut self) -> Option<char> {
2336 self.iter.next_back()
2337 }
2338}
2339
2340impl<A: Allocator> FusedIterator for Drain<'_, A> {}
2341
2342impl<A: Allocator> TryWrite for String<A> {
2343 #[inline]
2344 fn try_write_str(&mut self, s: &str) -> Result<(), Error> {
2345 self.try_push_str(s)
2346 }
2347
2348 #[inline]
2349 fn try_write_char(&mut self, c: char) -> Result<(), Error> {
2350 self.try_push(c)
2351 }
2352}
2353
2354impl<A: Allocator> TryFromIteratorIn<char, A> for String<A> {
2355 /// Construct a string from an iterator of characters.
2356 ///
2357 /// ```
2358 /// use rune::alloc::String;
2359 /// use rune::alloc::prelude::*;
2360 ///
2361 /// let string = String::try_from_iter(['a', 'b', 'c'].into_iter())?;
2362 /// assert_eq!(string, "abc");
2363 /// # Ok::<_, rune::alloc::Error>(())
2364 /// ```
2365 fn try_from_iter_in<I>(iter: I, alloc: A) -> Result<Self, Error>
2366 where
2367 I: IntoIterator<Item = char>,
2368 {
2369 let mut this = String::new_in(alloc);
2370 this.try_extend(iter)?;
2371 Ok(this)
2372 }
2373}
2374
2375impl<'a, A: Allocator> TryFromIteratorIn<&'a str, A> for String<A> {
2376 /// Construct a string from an iterator of characters.
2377 ///
2378 /// ```
2379 /// use rune::alloc::String;
2380 /// use rune::alloc::prelude::*;
2381 ///
2382 /// let string = String::try_from_iter(["hello", " ", "world"].into_iter())?;
2383 /// assert_eq!(string, "hello world");
2384 /// # Ok::<_, rune::alloc::Error>(())
2385 /// ```
2386 fn try_from_iter_in<I>(iter: I, alloc: A) -> Result<Self, Error>
2387 where
2388 I: IntoIterator<Item = &'a str>,
2389 {
2390 let mut this = String::new_in(alloc);
2391 this.try_extend(iter)?;
2392 Ok(this)
2393 }
2394}
2395
2396impl<T, A: Allocator> TryJoin<char, T, A> for String<A>
2397where
2398 T: AsRef<str>,
2399{
2400 fn try_join_in<I>(iter: I, sep: char, alloc: A) -> Result<Self, Error>
2401 where
2402 I: IntoIterator<Item = T>,
2403 {
2404 let mut string = String::new_in(alloc);
2405
2406 let mut iter = iter.into_iter().peekable();
2407
2408 while let Some(value) = iter.next() {
2409 string.try_push_str(value.as_ref())?;
2410
2411 if iter.peek().is_some() {
2412 string.try_push(sep)?;
2413 }
2414 }
2415
2416 Ok(string)
2417 }
2418}
2419
2420impl<T, A: Allocator> TryJoin<&str, T, A> for String<A>
2421where
2422 T: AsRef<str>,
2423{
2424 fn try_join_in<I>(iter: I, sep: &str, alloc: A) -> Result<Self, Error>
2425 where
2426 I: IntoIterator<Item = T>,
2427 {
2428 let mut string = String::new_in(alloc);
2429
2430 let mut iter = iter.into_iter().peekable();
2431
2432 while let Some(value) = iter.next() {
2433 string.try_push_str(value.as_ref())?;
2434
2435 if iter.peek().is_some() {
2436 string.try_push_str(sep)?;
2437 }
2438 }
2439
2440 Ok(string)
2441 }
2442}
2443
2444impl<A: Allocator> TryExtend<char> for String<A> {
2445 /// Extend a string using a character iterator.
2446 ///
2447 /// ```
2448 /// use rune::alloc::String;
2449 /// use rune::alloc::prelude::*;
2450 ///
2451 /// let mut string = String::new();
2452 /// string.try_extend(['a', 'b', 'c'])?;
2453 /// assert_eq!(string, "abc");
2454 /// # Ok::<_, rune::alloc::Error>(())
2455 /// ```
2456 #[inline]
2457 fn try_extend<I: IntoIterator<Item = char>>(&mut self, iter: I) -> Result<(), Error> {
2458 for value in iter {
2459 self.try_push(value)?;
2460 }
2461
2462 Ok(())
2463 }
2464}
2465
2466impl<'a, A: Allocator> TryExtend<&'a str> for String<A> {
2467 /// Extend a string using a character iterator.
2468 ///
2469 /// ```
2470 /// use rune::alloc::String;
2471 /// use rune::alloc::prelude::*;
2472 ///
2473 /// let mut string = String::new();
2474 /// string.try_extend(["hello", " ", "world"])?;
2475 /// assert_eq!(string, "hello world");
2476 /// # Ok::<_, rune::alloc::Error>(())
2477 /// ```
2478 #[inline]
2479 fn try_extend<I: IntoIterator<Item = &'a str>>(&mut self, iter: I) -> Result<(), Error> {
2480 for value in iter {
2481 self.try_push_str(value)?;
2482 }
2483
2484 Ok(())
2485 }
2486}