rust/library/core/src/char/methods.rs

//! impl char {}

use crate::intrinsics::likely;
use crate::slice;
use crate::str::from_utf8_unchecked_mut;
use crate::unicode::printable::is_printable;
use crate::unicode::{self, conversions};

use super::*;

#[lang = "char"]
impl char {
    /// The highest valid code point a `char` can have.
    ///
    /// A `char` is a [Unicode Scalar Value], which means that it is a [Code
    /// Point], but only ones within a certain range. `MAX` is the highest valid
    /// code point that's a valid [Unicode Scalar Value], namely `U+10FFFF`.
    ///
    /// [Unicode Scalar Value]: http://www.unicode.org/glossary/#unicode_scalar_value
    /// [Code Point]: http://www.unicode.org/glossary/#code_point
    #[stable(feature = "assoc_char_consts", since = "1.52.0")]
    pub const MAX: char = '\u{10ffff}';

    /// `U+FFFD REPLACEMENT CHARACTER` (�) is used in Unicode to represent a
    /// decoding error.
    ///
    /// It can occur, for example, when giving ill-formed UTF-8 bytes to
    /// [`String::from_utf8_lossy`](string/struct.String.html#method.from_utf8_lossy).
    #[stable(feature = "assoc_char_consts", since = "1.52.0")]
    pub const REPLACEMENT_CHARACTER: char = '\u{FFFD}';

    /// The version of [Unicode](http://www.unicode.org/) that the Unicode parts of
    /// `char` and `str` methods are based on.
    ///
    /// New versions of Unicode are released regularly and subsequently all methods
    /// in the standard library depending on Unicode are updated. Therefore the
    /// behavior of some `char` and `str` methods and the value of this constant
    /// changes over time. This is *not* considered to be a breaking change.
    ///
    /// The version numbering scheme is explained in
    /// [Unicode 11.0 or later, Section 3.1 Versions of the Unicode Standard](https://www.unicode.org/versions/Unicode11.0.0/ch03.pdf#page=4).
    #[stable(feature = "assoc_char_consts", since = "1.52.0")]
    // Forwards the value of `crate::unicode::UNICODE_VERSION` rather than
    // hard-coding a version tuple here.
    pub const UNICODE_VERSION: (u8, u8, u8) = crate::unicode::UNICODE_VERSION;

    /// Creates an iterator over the UTF-16 encoded code points in `iter`,
    /// returning unpaired surrogates as `Err`s.
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// use std::char::decode_utf16;
    ///
    /// // 𝄞mus<invalid>ic<invalid>
    /// let v = [
    ///     0xD834, 0xDD1E, 0x006d, 0x0075, 0x0073, 0xDD1E, 0x0069, 0x0063, 0xD834,
    /// ];
    ///
    /// assert_eq!(
    ///     decode_utf16(v.iter().cloned())
    ///         .map(|r| r.map_err(|e| e.unpaired_surrogate()))
    ///         .collect::<Vec<_>>(),
    ///     vec![
    ///         Ok('𝄞'),
    ///         Ok('m'), Ok('u'), Ok('s'),
    ///         Err(0xDD1E),
    ///         Ok('i'), Ok('c'),
    ///         Err(0xD834)
    ///     ]
    /// );
    /// ```
    ///
    /// A lossy decoder can be obtained by replacing `Err` results with the replacement character:
    ///
    /// ```
    /// use std::char::{decode_utf16, REPLACEMENT_CHARACTER};
    ///
    /// // 𝄞mus<invalid>ic<invalid>
    /// let v = [
    ///     0xD834, 0xDD1E, 0x006d, 0x0075, 0x0073, 0xDD1E, 0x0069, 0x0063, 0xD834,
    /// ];
    ///
    /// assert_eq!(
    ///     decode_utf16(v.iter().cloned())
    ///        .map(|r| r.unwrap_or(REPLACEMENT_CHARACTER))
    ///        .collect::<String>(),
    ///     "𝄞mus�ic�"
    /// );
    /// ```
    #[stable(feature = "assoc_char_funcs", since = "1.52.0")]
    #[inline]
    pub fn decode_utf16<I: IntoIterator<Item = u16>>(iter: I) -> DecodeUtf16<I::IntoIter> {
        // Associated-function alias: forwards `iter` unchanged to the free
        // function of the same name in the sibling `decode` module.
        super::decode::decode_utf16(iter)
    }

    /// Converts a `u32` to a `char`.
    ///
    /// Note that all `char`s are valid [`u32`]s, and can be cast to one with
    /// `as`:
    ///
    /// ```
    /// let c = '💯';
    /// let i = c as u32;
    ///
    /// assert_eq!(128175, i);
    /// ```
    ///
    /// However, the reverse is not true: not all valid [`u32`]s are valid
    /// `char`s. `from_u32()` will return `None` if the input is not a valid value
    /// for a `char`.
    ///
    /// For an unsafe version of this function which ignores these checks, see
    /// [`from_u32_unchecked`].
    ///
    /// [`from_u32_unchecked`]: #method.from_u32_unchecked
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// use std::char;
    ///
    /// let c = char::from_u32(0x2764);
    ///
    /// assert_eq!(Some('❤'), c);
    /// ```
    ///
    /// Returning `None` when the input is not a valid `char`:
    ///
    /// ```
    /// use std::char;
    ///
    /// let c = char::from_u32(0x110000);
    ///
    /// assert_eq!(None, c);
    /// ```
    #[stable(feature = "assoc_char_funcs", since = "1.52.0")]
    #[inline]
    pub fn from_u32(i: u32) -> Option<char> {
        // Associated-function alias: no checking is done here, the result of
        // the free function in the sibling `convert` module is returned as-is.
        super::convert::from_u32(i)
    }

    /// Converts a `u32` to a `char`, ignoring validity.
    ///
    /// Note that all `char`s are valid [`u32`]s, and can be cast to one with
    /// `as`:
    ///
    /// ```
    /// let c = '💯';
    /// let i = c as u32;
    ///
    /// assert_eq!(128175, i);
    /// ```
    ///
    /// However, the reverse is not true: not all valid [`u32`]s are valid
    /// `char`s. `from_u32_unchecked()` will ignore this, and blindly cast to
    /// `char`, possibly creating an invalid one.
    ///
    /// # Safety
    ///
    /// This function is unsafe, as it may construct invalid `char` values.
    ///
    /// For a safe version of this function, see the [`from_u32`] function.
    ///
    /// [`from_u32`]: #method.from_u32
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// use std::char;
    ///
    /// let c = unsafe { char::from_u32_unchecked(0x2764) };
    ///
    /// assert_eq!('❤', c);
    /// ```
    #[stable(feature = "assoc_char_funcs", since = "1.52.0")]
    #[inline]
    pub unsafe fn from_u32_unchecked(i: u32) -> char {
        // This wrapper adds no validation of its own; `i` is handed straight to
        // the unchecked conversion in the sibling `convert` module.
        // SAFETY: the safety contract must be upheld by the caller.
        unsafe { super::convert::from_u32_unchecked(i) }
    }

    /// Converts a digit in the given radix to a `char`.
    ///
    /// A 'radix' here is sometimes also called a 'base'. A radix of two
    /// indicates a binary number, a radix of ten, decimal, and a radix of
    /// sixteen, hexadecimal, to give some common values. Arbitrary
    /// radices are supported.
    ///
    /// `from_digit()` will return `None` if the input is not a digit in
    /// the given radix.
    ///
    /// # Panics
    ///
    /// Panics if given a radix larger than 36.
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// use std::char;
    ///
    /// let c = char::from_digit(4, 10);
    ///
    /// assert_eq!(Some('4'), c);
    ///
    /// // Decimal 11 is a single digit in base 16
    /// let c = char::from_digit(11, 16);
    ///
    /// assert_eq!(Some('b'), c);
    /// ```
    ///
    /// Returning `None` when the input is not a digit:
    ///
    /// ```
    /// use std::char;
    ///
    /// let c = char::from_digit(20, 10);
    ///
    /// assert_eq!(None, c);
    /// ```
    ///
    /// Passing a large radix, causing a panic:
    ///
    /// ```should_panic
    /// use std::char;
    ///
    /// // this panics
    /// char::from_digit(1, 37);
    /// ```
    #[stable(feature = "assoc_char_funcs", since = "1.52.0")]
    #[inline]
    pub fn from_digit(num: u32, radix: u32) -> Option<char> {
        // Associated-function alias for the free function in the sibling
        // `convert` module. Nothing is checked here, so the documented panic
        // for a radix above 36 presumably originates there — TODO confirm.
        super::convert::from_digit(num, radix)
    }

    /// Checks if a `char` is a digit in the given radix.
    ///
    /// A 'radix' here is sometimes also called a 'base'. A radix of two
    /// indicates a binary number, a radix of ten, decimal, and a radix of
    /// sixteen, hexadecimal, to give some common values. Arbitrary
    /// radices are supported.
    ///
    /// Compared to [`is_numeric()`], this function only recognizes the characters
    /// `0-9`, `a-z` and `A-Z`.
    ///
    /// 'Digit' is defined to be only the following characters:
    ///
    /// * `0-9`
    /// * `a-z`
    /// * `A-Z`
    ///
    /// For a more comprehensive understanding of 'digit', see [`is_numeric()`].
    ///
    /// [`is_numeric()`]: #method.is_numeric
    ///
    /// # Panics
    ///
    /// Panics if given a radix larger than 36.
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// assert!('1'.is_digit(10));
    /// assert!('f'.is_digit(16));
    /// assert!(!'f'.is_digit(10));
    /// ```
    ///
    /// Passing a large radix, causing a panic:
    ///
    /// ```should_panic
    /// // this panics
    /// '1'.is_digit(37);
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn is_digit(self, radix: u32) -> bool {
        // A character is a digit exactly when it can be converted to one;
        // `to_digit` also performs the radix assertion, so the panic behavior
        // is inherited from it.
        matches!(self.to_digit(radix), Some(_))
    }

    /// Converts a `char` to a digit in the given radix.
    ///
    /// A 'radix' here is sometimes also called a 'base'. A radix of two
    /// indicates a binary number, a radix of ten, decimal, and a radix of
    /// sixteen, hexadecimal, to give some common values. Arbitrary
    /// radices are supported.
    ///
    /// 'Digit' is defined to be only the following characters:
    ///
    /// * `0-9`
    /// * `a-z`
    /// * `A-Z`
    ///
    /// # Errors
    ///
    /// Returns `None` if the `char` does not refer to a digit in the given radix.
    ///
    /// # Panics
    ///
    /// Panics if given a radix larger than 36.
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// assert_eq!('1'.to_digit(10), Some(1));
    /// assert_eq!('f'.to_digit(16), Some(15));
    /// ```
    ///
    /// Passing a non-digit results in failure:
    ///
    /// ```
    /// assert_eq!('f'.to_digit(10), None);
    /// assert_eq!('z'.to_digit(16), None);
    /// ```
    ///
    /// Passing a large radix, causing a panic:
    ///
    /// ```should_panic
    /// // this panics
    /// '1'.to_digit(37);
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn to_digit(self, radix: u32) -> Option<u32> {
        assert!(radix <= 36, "to_digit: radix is too high (maximum 36)");
        let code = self as u32;

        // Two paths: a branch-light one for radices of at most 10 (usually a
        // compile-time constant), where only `0-9` can ever be valid, and a
        // general one that also understands letters.
        let digit = if likely(radix <= 10) {
            // Characters below '0' wrap around to a huge value and characters
            // above '9' yield 10 or more, so the range check below rejects both.
            code.wrapping_sub('0' as u32)
        } else {
            // For each accepted range: its first character and the value that
            // first character stands for. Letters start at 10 in either case.
            let (first, offset) = match self {
                '0'..='9' => ('0', 0),
                'a'..='z' => ('a', 10),
                'A'..='Z' => ('A', 10),
                _ => return None,
            };
            code - (first as u32) + offset
        };

        // A value outside the radix is not a digit in that radix.
        if digit >= radix {
            return None;
        }
        Some(digit)
    }

    /// Returns an iterator that yields the hexadecimal Unicode escape of a
    /// character as `char`s.
    ///
    /// This will escape characters with the Rust syntax of the form
    /// `\u{NNNNNN}` where `NNNNNN` is a hexadecimal representation.
    ///
    /// # Examples
    ///
    /// As an iterator:
    ///
    /// ```
    /// for c in '❤'.escape_unicode() {
    ///     print!("{}", c);
    /// }
    /// println!();
    /// ```
    ///
    /// Using `println!` directly:
    ///
    /// ```
    /// println!("{}", '❤'.escape_unicode());
    /// ```
    ///
    /// Both are equivalent to:
    ///
    /// ```
    /// println!("\\u{{2764}}");
    /// ```
    ///
    /// Using `to_string`:
    ///
    /// ```
    /// assert_eq!('❤'.escape_unicode().to_string(), "\\u{2764}");
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn escape_unicode(self) -> EscapeUnicode {
        // Position of the highest set bit of the code point. Forcing bit 0 on
        // leaves that position unchanged for every non-zero value, and makes
        // zero behave like one: a single hex digit is printed and the
        // subtraction cannot underflow (`31 - 32`).
        let highest_bit = 31 - ((self as u32) | 1).leading_zeros();

        EscapeUnicode {
            // Each hex digit covers four bits, so this is the index of the
            // most significant hex digit.
            hex_digit_idx: (highest_bit / 4) as usize,
            state: EscapeUnicodeState::Backslash,
            c: self,
        }
    }

    /// An extended version of `escape_debug` that optionally permits escaping
    /// Extended Grapheme codepoints. This allows us to format characters like
    /// nonspacing marks better when they're at the start of a string.
    #[inline]
    pub(crate) fn escape_debug_ext(self, escape_grapheme_extended: bool) -> EscapeDebug {
        let state = match self {
            // Characters with a dedicated two-character escape.
            '\t' => EscapeDefaultState::Backslash('t'),
            '\r' => EscapeDefaultState::Backslash('r'),
            '\n' => EscapeDefaultState::Backslash('n'),
            '"' | '\'' | '\\' => EscapeDefaultState::Backslash(self),
            other => {
                // Grapheme extenders are only escaped when the caller asked for
                // it; the property lookup is skipped entirely otherwise.
                let force_escape = escape_grapheme_extended && other.is_grapheme_extended();
                if !force_escape && is_printable(other) {
                    EscapeDefaultState::Char(other)
                } else {
                    EscapeDefaultState::Unicode(other.escape_unicode())
                }
            }
        };
        EscapeDebug(EscapeDefault { state })
    }

    /// Returns an iterator that yields the literal escape code of a character
    /// as `char`s.
    ///
    /// This will escape the characters similar to the `Debug` implementations
    /// of `str` or `char`.
    ///
    /// # Examples
    ///
    /// As an iterator:
    ///
    /// ```
    /// for c in '\n'.escape_debug() {
    ///     print!("{}", c);
    /// }
    /// println!();
    /// ```
    ///
    /// Using `println!` directly:
    ///
    /// ```
    /// println!("{}", '\n'.escape_debug());
    /// ```
    ///
    /// Both are equivalent to:
    ///
    /// ```
    /// println!("\\n");
    /// ```
    ///
    /// Using `to_string`:
    ///
    /// ```
    /// assert_eq!('\n'.escape_debug().to_string(), "\\n");
    /// ```
    #[stable(feature = "char_escape_debug", since = "1.20.0")]
    #[inline]
    pub fn escape_debug(self) -> EscapeDebug {
        // The public entry point always enables escaping of characters with
        // the `Grapheme_Extend` property.
        self.escape_debug_ext(true)
    }

    /// Returns an iterator that yields the literal escape code of a character
    /// as `char`s.
    ///
    /// The default is chosen with a bias toward producing literals that are
    /// legal in a variety of languages, including C++11 and similar C-family
    /// languages. The exact rules are:
    ///
    /// * Tab is escaped as `\t`.
    /// * Carriage return is escaped as `\r`.
    /// * Line feed is escaped as `\n`.
    /// * Single quote is escaped as `\'`.
    /// * Double quote is escaped as `\"`.
    /// * Backslash is escaped as `\\`.
    /// * Any character in the 'printable ASCII' range `0x20` .. `0x7e`
    ///   inclusive is not escaped.
    /// * All other characters are given hexadecimal Unicode escapes; see
    ///   [`escape_unicode`].
    ///
    /// [`escape_unicode`]: #method.escape_unicode
    ///
    /// # Examples
    ///
    /// As an iterator:
    ///
    /// ```
    /// for c in '"'.escape_default() {
    ///     print!("{}", c);
    /// }
    /// println!();
    /// ```
    ///
    /// Using `println!` directly:
    ///
    /// ```
    /// println!("{}", '"'.escape_default());
    /// ```
    ///
    /// Both are equivalent to:
    ///
    /// ```
    /// println!("\\\"");
    /// ```
    ///
    /// Using `to_string`:
    ///
    /// ```
    /// assert_eq!('"'.escape_default().to_string(), "\\\"");
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn escape_default(self) -> EscapeDefault {
        // Characters with a dedicated two-character escape, mapped to the
        // character that follows the backslash.
        let short_escape = match self {
            '\t' => Some('t'),
            '\r' => Some('r'),
            '\n' => Some('n'),
            '\\' | '\'' | '"' => Some(self),
            _ => None,
        };

        let state = match short_escape {
            Some(tail) => EscapeDefaultState::Backslash(tail),
            // The remaining printable ASCII characters are emitted verbatim.
            None if matches!(self, '\x20'..='\x7e') => EscapeDefaultState::Char(self),
            // Everything else becomes a `\u{NNNNNN}` escape.
            None => EscapeDefaultState::Unicode(self.escape_unicode()),
        };
        EscapeDefault { state }
    }

    /// Returns the number of bytes this `char` would need if encoded in UTF-8.
    ///
    /// That number of bytes is always between 1 and 4, inclusive.
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// let len = 'A'.len_utf8();
    /// assert_eq!(len, 1);
    ///
    /// let len = 'ß'.len_utf8();
    /// assert_eq!(len, 2);
    ///
    /// let len = 'ℝ'.len_utf8();
    /// assert_eq!(len, 3);
    ///
    /// let len = '💣'.len_utf8();
    /// assert_eq!(len, 4);
    /// ```
    ///
    /// The `&str` type guarantees that its contents are UTF-8, and so we can compare the length it
    /// would take if each code point was represented as a `char` vs in the `&str` itself:
    ///
    /// ```
    /// // as chars
    /// let eastern = '東';
    /// let capital = '京';
    ///
    /// // both can be represented as three bytes
    /// assert_eq!(3, eastern.len_utf8());
    /// assert_eq!(3, capital.len_utf8());
    ///
    /// // as a &str, these two are encoded in UTF-8
    /// let tokyo = "東京";
    ///
    /// let len = eastern.len_utf8() + capital.len_utf8();
    ///
    /// // we can see that they take six bytes total...
    /// assert_eq!(6, tokyo.len());
    ///
    /// // ... just like the &str
    /// assert_eq!(len, tokyo.len());
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[rustc_const_stable(feature = "const_char_len_utf", since = "1.52.0")]
    #[inline]
    pub const fn len_utf8(self) -> usize {
        // Not a recursive call: an unqualified path never resolves to an
        // inherent method, so this invokes a free function named `len_utf8`
        // (defined outside this view) with the scalar value as a `u32`.
        len_utf8(self as u32)
    }

    /// Returns the number of 16-bit code units this `char` would need if
    /// encoded in UTF-16.
    ///
    /// See the documentation for [`len_utf8()`] for more explanation of this
    /// concept. This function is a mirror, but for UTF-16 instead of UTF-8.
    ///
    /// [`len_utf8()`]: #method.len_utf8
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// let n = 'ß'.len_utf16();
    /// assert_eq!(n, 1);
    ///
    /// let len = '💣'.len_utf16();
    /// assert_eq!(len, 2);
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[rustc_const_stable(feature = "const_char_len_utf", since = "1.52.0")]
    #[inline]
    pub const fn len_utf16(self) -> usize {
        // A scalar value that fits in 16 bits is a single code unit; anything
        // larger needs two.
        match self as u32 {
            0..=0xFFFF => 1,
            _ => 2,
        }
    }

    /// Encodes this character as UTF-8 into the provided byte buffer,
    /// and then returns the subslice of the buffer that contains the encoded character.
    ///
    /// # Panics
    ///
    /// Panics if the buffer is not large enough.
    /// A buffer of length four is large enough to encode any `char`.
    ///
    /// # Examples
    ///
    /// In both of these examples, 'ß' takes two bytes to encode.
    ///
    /// ```
    /// let mut b = [0; 2];
    ///
    /// let result = 'ß'.encode_utf8(&mut b);
    ///
    /// assert_eq!(result, "ß");
    ///
    /// assert_eq!(result.len(), 2);
    /// ```
    ///
    /// A buffer that's too small:
    ///
    /// ```should_panic
    /// let mut b = [0; 1];
    ///
    /// // this panics
    /// 'ß'.encode_utf8(&mut b);
    /// ```
    #[stable(feature = "unicode_encode_char", since = "1.15.0")]
    #[inline]
    pub fn encode_utf8(self, dst: &mut [u8]) -> &mut str {
        // `encode_utf8_raw` (defined outside this view) writes into `dst` and
        // yields the byte slice that is reinterpreted as `str` below; the
        // documented panic on a too-small buffer presumably originates there —
        // TODO confirm.
        // SAFETY: `char` is not a surrogate, so this is valid UTF-8.
        unsafe { from_utf8_unchecked_mut(encode_utf8_raw(self as u32, dst)) }
    }

    /// Encodes this character as UTF-16 into the provided `u16` buffer,
    /// and then returns the subslice of the buffer that contains the encoded character.
    ///
    /// # Panics
    ///
    /// Panics if the buffer is not large enough.
    /// A buffer of length 2 is large enough to encode any `char`.
    ///
    /// # Examples
    ///
    /// In both of these examples, '𝕊' takes two `u16`s to encode.
    ///
    /// ```
    /// let mut b = [0; 2];
    ///
    /// let result = '𝕊'.encode_utf16(&mut b);
    ///
    /// assert_eq!(result.len(), 2);
    /// ```
    ///
    /// A buffer that's too small:
    ///
    /// ```should_panic
    /// let mut b = [0; 1];
    ///
    /// // this panics
    /// '𝕊'.encode_utf16(&mut b);
    /// ```
    #[stable(feature = "unicode_encode_char", since = "1.15.0")]
    #[inline]
    pub fn encode_utf16(self, dst: &mut [u16]) -> &mut [u16] {
        // Forwards the scalar value and the buffer to `encode_utf16_raw`
        // (defined outside this view) and returns its result unchanged; the
        // documented panic on a too-small buffer presumably originates there —
        // TODO confirm.
        encode_utf16_raw(self as u32, dst)
    }

    /// Returns `true` if this `char` has the `Alphabetic` property.
    ///
    /// `Alphabetic` is described in Chapter 4 (Character Properties) of the [Unicode Standard] and
    /// specified in the [Unicode Character Database][ucd] [`DerivedCoreProperties.txt`].
    ///
    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`DerivedCoreProperties.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/DerivedCoreProperties.txt
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// assert!('a'.is_alphabetic());
    /// assert!('京'.is_alphabetic());
    ///
    /// let c = '💝';
    /// // love is many things, but it is not alphabetic
    /// assert!(!c.is_alphabetic());
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn is_alphabetic(self) -> bool {
        if self.is_ascii() {
            // ASCII is decided locally: only the Latin letters qualify.
            matches!(self, 'A'..='Z' | 'a'..='z')
        } else {
            // Everything above U+007F goes through the Unicode property lookup.
            unicode::Alphabetic(self)
        }
    }

    /// Returns `true` if this `char` has the `Lowercase` property.
    ///
    /// `Lowercase` is described in Chapter 4 (Character Properties) of the [Unicode Standard] and
    /// specified in the [Unicode Character Database][ucd] [`DerivedCoreProperties.txt`].
    ///
    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`DerivedCoreProperties.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/DerivedCoreProperties.txt
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// assert!('a'.is_lowercase());
    /// assert!('δ'.is_lowercase());
    /// assert!(!'A'.is_lowercase());
    /// assert!(!'Δ'.is_lowercase());
    ///
    /// // The various Chinese scripts and punctuation do not have case, and so:
    /// assert!(!'中'.is_lowercase());
    /// assert!(!' '.is_lowercase());
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn is_lowercase(self) -> bool {
        if self > '\x7f' {
            // Non-ASCII: consult the Unicode `Lowercase` property.
            unicode::Lowercase(self)
        } else {
            // ASCII: only `a-z` is lowercase, no lookup needed.
            matches!(self, 'a'..='z')
        }
    }

    /// Returns `true` if this `char` has the `Uppercase` property.
    ///
    /// `Uppercase` is described in Chapter 4 (Character Properties) of the [Unicode Standard] and
    /// specified in the [Unicode Character Database][ucd] [`DerivedCoreProperties.txt`].
    ///
    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`DerivedCoreProperties.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/DerivedCoreProperties.txt
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// assert!(!'a'.is_uppercase());
    /// assert!(!'δ'.is_uppercase());
    /// assert!('A'.is_uppercase());
    /// assert!('Δ'.is_uppercase());
    ///
    /// // The various Chinese scripts and punctuation do not have case, and so:
    /// assert!(!'中'.is_uppercase());
    /// assert!(!' '.is_uppercase());
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn is_uppercase(self) -> bool {
        // ASCII capitals are answered directly; the Unicode `Uppercase`
        // property is only consulted for characters above U+007F.
        matches!(self, 'A'..='Z') || (self > '\x7f' && unicode::Uppercase(self))
    }

    /// Returns `true` if this `char` has the `White_Space` property.
    ///
    /// `White_Space` is specified in the [Unicode Character Database][ucd] [`PropList.txt`].
    ///
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`PropList.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/PropList.txt
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// assert!(' '.is_whitespace());
    ///
    /// // a non-breaking space
    /// assert!('\u{A0}'.is_whitespace());
    ///
    /// assert!(!'越'.is_whitespace());
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn is_whitespace(self) -> bool {
        match self {
            // Space plus U+0009 through U+000D (tab, line feed, vertical tab,
            // form feed, carriage return).
            '\t' | '\n' | '\x0b' | '\x0c' | '\r' | ' ' => true,
            // No other ASCII character is treated as white space.
            '\0'..='\x7f' => false,
            // Everything else goes through the Unicode property lookup.
            _ => unicode::White_Space(self),
        }
    }

    /// Returns `true` if this `char` satisfies either [`is_alphabetic()`] or [`is_numeric()`].
    ///
    /// [`is_alphabetic()`]: #method.is_alphabetic
    /// [`is_numeric()`]: #method.is_numeric
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// assert!('٣'.is_alphanumeric());
    /// assert!('7'.is_alphanumeric());
    /// assert!('৬'.is_alphanumeric());
    /// assert!('¾'.is_alphanumeric());
    /// assert!('①'.is_alphanumeric());
    /// assert!('K'.is_alphanumeric());
    /// assert!('و'.is_alphanumeric());
    /// assert!('藏'.is_alphanumeric());
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn is_alphanumeric(self) -> bool {
        // `||` short-circuits, so `is_numeric` is only consulted when
        // `is_alphabetic` returned `false`.
        self.is_alphabetic() || self.is_numeric()
    }

    /// Returns `true` if this `char` has the general category for control codes.
    ///
    /// Control codes (code points with the general category of `Cc`) are described in Chapter 4
    /// (Character Properties) of the [Unicode Standard] and specified in the [Unicode Character
    /// Database][ucd] [`UnicodeData.txt`].
    ///
    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`UnicodeData.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// // U+009C, STRING TERMINATOR
    /// assert!('\u{009c}'.is_control());
    /// assert!(!'q'.is_control());
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn is_control(self) -> bool {
        // Delegates directly to the `Cc` predicate of the `unicode` module;
        // unlike the other `is_*` predicates in this impl there is no ASCII
        // fast path in front of the lookup.
        unicode::Cc(self)
    }

    /// Returns `true` if this `char` has the `Grapheme_Extend` property.
    ///
    /// `Grapheme_Extend` is described in [Unicode Standard Annex #29 (Unicode Text
    /// Segmentation)][uax29] and specified in the [Unicode Character Database][ucd]
    /// [`DerivedCoreProperties.txt`].
    ///
    /// [uax29]: https://www.unicode.org/reports/tr29/
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`DerivedCoreProperties.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/DerivedCoreProperties.txt
    #[inline]
    pub(crate) fn is_grapheme_extended(self) -> bool {
        // Crate-internal helper (used by `escape_debug_ext`); delegates
        // directly to the `Grapheme_Extend` predicate of the `unicode` module.
        unicode::Grapheme_Extend(self)
    }

    /// Returns `true` if this `char` has one of the general categories for numbers.
    ///
    /// The general categories for numbers (`Nd` for decimal digits, `Nl` for letter-like numeric
    /// characters, and `No` for other numeric characters) are specified in the [Unicode Character
    /// Database][ucd] [`UnicodeData.txt`].
    ///
    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`UnicodeData.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
    ///
    /// # Examples
    ///
    /// Basic usage:
    ///
    /// ```
    /// assert!('٣'.is_numeric());
    /// assert!('7'.is_numeric());
    /// assert!('৬'.is_numeric());
    /// assert!('¾'.is_numeric());
    /// assert!('①'.is_numeric());
    /// assert!(!'K'.is_numeric());
    /// assert!(!'و'.is_numeric());
    /// assert!(!'藏'.is_numeric());
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn is_numeric(self) -> bool {
        // The ASCII digits are the only numeric characters below U+0080 and
        // are answered without a table lookup.
        let ascii_digit = matches!(self, '0'..='9');
        // For non-ASCII characters, defer to the Unicode `N` predicate.
        ascii_digit || (self > '\x7f' && unicode::N(self))
    }

    /// Returns an iterator that yields the lowercase mapping of this `char` as one or more
    /// `char`s.
    ///
    /// If this `char` does not have a lowercase mapping, the iterator yields the same `char`.
    ///
    /// If this `char` has a one-to-one lowercase mapping given by the [Unicode Character
    /// Database][ucd] [`UnicodeData.txt`], the iterator yields that `char`.
    ///
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`UnicodeData.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
    ///
    /// If this `char` requires special considerations (e.g. multiple `char`s) the iterator yields
    /// the `char`(s) given by [`SpecialCasing.txt`].
    ///
    /// [`SpecialCasing.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/SpecialCasing.txt
    ///
    /// This operation performs an unconditional mapping without tailoring. That is, the conversion
    /// is independent of context and language.
    ///
    /// In the [Unicode Standard], Chapter 4 (Character Properties) discusses case mapping in
    /// general and Chapter 3 (Conformance) discusses the default algorithm for case conversion.
    ///
    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
    ///
    /// # Examples
    ///
    /// As an iterator:
    ///
    /// ```
    /// for c in 'İ'.to_lowercase() {
    ///     print!("{}", c);
    /// }
    /// println!();
    /// ```
    ///
    /// Using `println!` directly:
    ///
    /// ```
    /// println!("{}", 'İ'.to_lowercase());
    /// ```
    ///
    /// Both are equivalent to:
    ///
    /// ```
    /// println!("i\u{307}");
    /// ```
    ///
    /// Using `to_string`:
    ///
    /// ```
    /// assert_eq!('C'.to_lowercase().to_string(), "c");
    ///
    /// // Sometimes the result is more than one character:
    /// assert_eq!('İ'.to_lowercase().to_string(), "i\u{307}");
    ///
    /// // Characters that do not have both uppercase and lowercase
    /// // convert into themselves.
    /// assert_eq!('山'.to_lowercase().to_string(), "山");
    /// ```
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn to_lowercase(self) -> ToLowercase {
        // Compute the mapping via the `conversions` module, then wrap it in
        // the iterator type handed back to the caller.
        let mapped = conversions::to_lower(self);
        let inner = CaseMappingIter::new(mapped);
        ToLowercase(inner)
    }

    /// Returns an iterator that yields the uppercase mapping of this `char` as one or more
    /// `char`s.
    ///
    /// If this `char` does not have an uppercase mapping, the iterator yields the same `char`.
    ///
    /// If this `char` has a one-to-one uppercase mapping given by the [Unicode Character
    /// Database][ucd] [`UnicodeData.txt`], the iterator yields that `char`.
    ///
    /// [ucd]: https://www.unicode.org/reports/tr44/
    /// [`UnicodeData.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
    ///
    /// If this `char` requires special considerations (e.g. multiple `char`s) the iterator yields
    /// the `char`(s) given by [`SpecialCasing.txt`].
    ///
    /// [`SpecialCasing.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/SpecialCasing.txt
    ///
    /// This operation performs an unconditional mapping without tailoring. That is, the conversion
    /// is independent of context and language.
    ///
    /// In the [Unicode Standard], Chapter 4 (Character Properties) discusses case mapping in
    /// general and Chapter 3 (Conformance) discusses the default algorithm for case conversion.
    ///
    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
    ///
    /// # Examples
    ///
    /// As an iterator:
    ///
    /// ```
    /// for c in 'ß'.to_uppercase() {
    ///     print!("{}", c);
    /// }
    /// println!();
    /// ```
    ///
    /// Using `println!` directly:
    ///
    /// ```
    /// println!("{}", 'ß'.to_uppercase());
    /// ```
    ///
    /// Both are equivalent to:
    ///
    /// ```
    /// println!("SS");
    /// ```
    ///
    /// Using `to_string`:
    ///
    /// ```
    /// assert_eq!('c'.to_uppercase().to_string(), "C");
    ///
    /// // Sometimes the result is more than one character:
    /// assert_eq!('ß'.to_uppercase().to_string(), "SS");
    ///
    /// // Characters that do not have both uppercase and lowercase
    /// // convert into themselves.
    /// assert_eq!('山'.to_uppercase().to_string(), "山");
    /// ```
    ///
    /// # Note on locale
    ///
    /// In Turkish, the equivalent of 'i' in Latin has five forms instead of two:
    ///
    /// * 'Dotless': I / ı, sometimes written ï
    /// * 'Dotted': İ / i
    ///
    /// Note that the lowercase dotted 'i' is the same as the Latin. Therefore:
    ///
    /// ```
    /// let upper_i = 'i'.to_uppercase().to_string();
    /// ```
    ///
    /// The value of `upper_i` here relies on the language of the text: if we're
    /// in `en-US`, it should be `"I"`, but if we're in `tr_TR`, it should
    /// be `"İ"`. `to_uppercase()` does not take this into account, and so:
    ///
    /// ```
    /// let upper_i = 'i'.to_uppercase().to_string();
    ///
    /// assert_eq!(upper_i, "I");
    /// ```
    ///
    /// holds across languages.
    #[stable(feature = "rust1", since = "1.0.0")]
    #[inline]
    pub fn to_uppercase(self) -> ToUppercase {
        ToUppercase(CaseMappingIter::new(conversions::to_upper(self)))
    }

    /// Reports whether this `char` lies in the ASCII range (U+0000 ..= U+007F).
    ///
    /// # Examples
    ///
    /// ```
    /// let ascii = 'a';
    /// let non_ascii = '❤';
    ///
    /// assert!(ascii.is_ascii());
    /// assert!(!non_ascii.is_ascii());
    /// ```
    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
    #[rustc_const_stable(feature = "const_ascii_methods_on_intrinsics", since = "1.32.0")]
    #[inline]
    pub const fn is_ascii(&self) -> bool {
        let code = *self as u32;
        code < 0x80
    }

    /// Returns the ASCII upper case equivalent of this value as a new `char`.
    ///
    /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z';
    /// every other value, including non-ASCII letters, is returned unchanged.
    ///
    /// To uppercase the value in-place, use [`make_ascii_uppercase()`].
    ///
    /// To uppercase ASCII characters in addition to non-ASCII characters, use
    /// [`to_uppercase()`].
    ///
    /// # Examples
    ///
    /// ```
    /// let ascii = 'a';
    /// let non_ascii = '❤';
    ///
    /// assert_eq!('A', ascii.to_ascii_uppercase());
    /// assert_eq!('❤', non_ascii.to_ascii_uppercase());
    /// ```
    ///
    /// [`make_ascii_uppercase()`]: #method.make_ascii_uppercase
    /// [`to_uppercase()`]: #method.to_uppercase
    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
    #[rustc_const_stable(feature = "const_ascii_methods_on_intrinsics", since = "1.52.0")]
    #[inline]
    pub const fn to_ascii_uppercase(&self) -> char {
        if !self.is_ascii_lowercase() {
            return *self;
        }
        // Only reached for 'a'..='z', so the value fits in a `u8` without loss.
        let byte = *self as u8;
        byte.ascii_change_case_unchecked() as char
    }

    /// Returns the ASCII lower case equivalent of this value as a new `char`.
    ///
    /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z';
    /// every other value, including non-ASCII letters, is returned unchanged.
    ///
    /// To lowercase the value in-place, use [`make_ascii_lowercase()`].
    ///
    /// To lowercase ASCII characters in addition to non-ASCII characters, use
    /// [`to_lowercase()`].
    ///
    /// # Examples
    ///
    /// ```
    /// let ascii = 'A';
    /// let non_ascii = '❤';
    ///
    /// assert_eq!('a', ascii.to_ascii_lowercase());
    /// assert_eq!('❤', non_ascii.to_ascii_lowercase());
    /// ```
    ///
    /// [`make_ascii_lowercase()`]: #method.make_ascii_lowercase
    /// [`to_lowercase()`]: #method.to_lowercase
    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
    #[rustc_const_stable(feature = "const_ascii_methods_on_intrinsics", since = "1.52.0")]
    #[inline]
    pub const fn to_ascii_lowercase(&self) -> char {
        if !self.is_ascii_uppercase() {
            return *self;
        }
        // Only reached for 'A'..='Z', so the value fits in a `u8` without loss.
        let byte = *self as u8;
        byte.ascii_change_case_unchecked() as char
    }

    /// Compares two values for equality while ignoring ASCII case.
    ///
    /// Equivalent to `to_ascii_lowercase(a) == to_ascii_lowercase(b)`.
    ///
    /// # Examples
    ///
    /// ```
    /// let upper_a = 'A';
    /// let lower_a = 'a';
    /// let lower_z = 'z';
    ///
    /// assert!(upper_a.eq_ignore_ascii_case(&lower_a));
    /// assert!(upper_a.eq_ignore_ascii_case(&upper_a));
    /// assert!(!upper_a.eq_ignore_ascii_case(&lower_z));
    /// ```
    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
    #[rustc_const_stable(feature = "const_ascii_methods_on_intrinsics", since = "1.52.0")]
    #[inline]
    pub const fn eq_ignore_ascii_case(&self, other: &char) -> bool {
        let lhs = self.to_ascii_lowercase();
        let rhs = other.to_ascii_lowercase();
        lhs == rhs
    }

    /// Replaces this value, in place, with its ASCII upper case equivalent.
    ///
    /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z';
    /// every other value, including non-ASCII letters, is left unchanged.
    ///
    /// To return a new uppercased value without modifying the existing one, use
    /// [`to_ascii_uppercase()`].
    ///
    /// # Examples
    ///
    /// ```
    /// let mut ascii = 'a';
    ///
    /// ascii.make_ascii_uppercase();
    ///
    /// assert_eq!('A', ascii);
    /// ```
    ///
    /// [`to_ascii_uppercase()`]: #method.to_ascii_uppercase
    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
    #[inline]
    pub fn make_ascii_uppercase(&mut self) {
        let upper = self.to_ascii_uppercase();
        *self = upper;
    }

    /// Replaces this value, in place, with its ASCII lower case equivalent.
    ///
    /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z';
    /// every other value, including non-ASCII letters, is left unchanged.
    ///
    /// To return a new lowercased value without modifying the existing one, use
    /// [`to_ascii_lowercase()`].
    ///
    /// # Examples
    ///
    /// ```
    /// let mut ascii = 'A';
    ///
    /// ascii.make_ascii_lowercase();
    ///
    /// assert_eq!('a', ascii);
    /// ```
    ///
    /// [`to_ascii_lowercase()`]: #method.to_ascii_lowercase
    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
    #[inline]
    pub fn make_ascii_lowercase(&mut self) {
        let lower = self.to_ascii_lowercase();
        *self = lower;
    }

    /// Reports whether the value is an ASCII letter, i.e. lies in one of:
    ///
    /// - U+0041 'A' ..= U+005A 'Z', or
    /// - U+0061 'a' ..= U+007A 'z'.
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(uppercase_a.is_ascii_alphabetic());
    /// assert!(uppercase_g.is_ascii_alphabetic());
    /// assert!(a.is_ascii_alphabetic());
    /// assert!(g.is_ascii_alphabetic());
    /// assert!(!zero.is_ascii_alphabetic());
    /// assert!(!percent.is_ascii_alphabetic());
    /// assert!(!space.is_ascii_alphabetic());
    /// assert!(!lf.is_ascii_alphabetic());
    /// assert!(!esc.is_ascii_alphabetic());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_alphabetic(&self) -> bool {
        match *self {
            'A'..='Z' => true,
            'a'..='z' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII uppercase letter:
    /// U+0041 'A' ..= U+005A 'Z'.
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(uppercase_a.is_ascii_uppercase());
    /// assert!(uppercase_g.is_ascii_uppercase());
    /// assert!(!a.is_ascii_uppercase());
    /// assert!(!g.is_ascii_uppercase());
    /// assert!(!zero.is_ascii_uppercase());
    /// assert!(!percent.is_ascii_uppercase());
    /// assert!(!space.is_ascii_uppercase());
    /// assert!(!lf.is_ascii_uppercase());
    /// assert!(!esc.is_ascii_uppercase());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_uppercase(&self) -> bool {
        match *self {
            'A'..='Z' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII lowercase letter:
    /// U+0061 'a' ..= U+007A 'z'.
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(!uppercase_a.is_ascii_lowercase());
    /// assert!(!uppercase_g.is_ascii_lowercase());
    /// assert!(a.is_ascii_lowercase());
    /// assert!(g.is_ascii_lowercase());
    /// assert!(!zero.is_ascii_lowercase());
    /// assert!(!percent.is_ascii_lowercase());
    /// assert!(!space.is_ascii_lowercase());
    /// assert!(!lf.is_ascii_lowercase());
    /// assert!(!esc.is_ascii_lowercase());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_lowercase(&self) -> bool {
        match *self {
            'a'..='z' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII letter or decimal digit, i.e. lies in one of:
    ///
    /// - U+0041 'A' ..= U+005A 'Z', or
    /// - U+0061 'a' ..= U+007A 'z', or
    /// - U+0030 '0' ..= U+0039 '9'.
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(uppercase_a.is_ascii_alphanumeric());
    /// assert!(uppercase_g.is_ascii_alphanumeric());
    /// assert!(a.is_ascii_alphanumeric());
    /// assert!(g.is_ascii_alphanumeric());
    /// assert!(zero.is_ascii_alphanumeric());
    /// assert!(!percent.is_ascii_alphanumeric());
    /// assert!(!space.is_ascii_alphanumeric());
    /// assert!(!lf.is_ascii_alphanumeric());
    /// assert!(!esc.is_ascii_alphanumeric());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_alphanumeric(&self) -> bool {
        match *self {
            '0'..='9' => true,
            'A'..='Z' => true,
            'a'..='z' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII decimal digit:
    /// U+0030 '0' ..= U+0039 '9'.
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(!uppercase_a.is_ascii_digit());
    /// assert!(!uppercase_g.is_ascii_digit());
    /// assert!(!a.is_ascii_digit());
    /// assert!(!g.is_ascii_digit());
    /// assert!(zero.is_ascii_digit());
    /// assert!(!percent.is_ascii_digit());
    /// assert!(!space.is_ascii_digit());
    /// assert!(!lf.is_ascii_digit());
    /// assert!(!esc.is_ascii_digit());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_digit(&self) -> bool {
        match *self {
            '0'..='9' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII hexadecimal digit, i.e. lies in one of:
    ///
    /// - U+0030 '0' ..= U+0039 '9', or
    /// - U+0041 'A' ..= U+0046 'F', or
    /// - U+0061 'a' ..= U+0066 'f'.
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(uppercase_a.is_ascii_hexdigit());
    /// assert!(!uppercase_g.is_ascii_hexdigit());
    /// assert!(a.is_ascii_hexdigit());
    /// assert!(!g.is_ascii_hexdigit());
    /// assert!(zero.is_ascii_hexdigit());
    /// assert!(!percent.is_ascii_hexdigit());
    /// assert!(!space.is_ascii_hexdigit());
    /// assert!(!lf.is_ascii_hexdigit());
    /// assert!(!esc.is_ascii_hexdigit());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_hexdigit(&self) -> bool {
        match *self {
            '0'..='9' => true,
            'A'..='F' => true,
            'a'..='f' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII punctuation character, i.e. lies in one of:
    ///
    /// - U+0021 ..= U+002F `! " # $ % & ' ( ) * + , - . /`, or
    /// - U+003A ..= U+0040 `: ; < = > ? @`, or
    /// - U+005B ..= U+0060 ``[ \ ] ^ _ ` ``, or
    /// - U+007B ..= U+007E `{ | } ~`
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(!uppercase_a.is_ascii_punctuation());
    /// assert!(!uppercase_g.is_ascii_punctuation());
    /// assert!(!a.is_ascii_punctuation());
    /// assert!(!g.is_ascii_punctuation());
    /// assert!(!zero.is_ascii_punctuation());
    /// assert!(percent.is_ascii_punctuation());
    /// assert!(!space.is_ascii_punctuation());
    /// assert!(!lf.is_ascii_punctuation());
    /// assert!(!esc.is_ascii_punctuation());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_punctuation(&self) -> bool {
        match *self {
            // U+0021 ..= U+002F
            '!'..='/' => true,
            // U+003A ..= U+0040
            ':'..='@' => true,
            // U+005B ..= U+0060
            '['..='`' => true,
            // U+007B ..= U+007E
            '{'..='~' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII graphic character:
    /// U+0021 '!' ..= U+007E '~'.
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(uppercase_a.is_ascii_graphic());
    /// assert!(uppercase_g.is_ascii_graphic());
    /// assert!(a.is_ascii_graphic());
    /// assert!(g.is_ascii_graphic());
    /// assert!(zero.is_ascii_graphic());
    /// assert!(percent.is_ascii_graphic());
    /// assert!(!space.is_ascii_graphic());
    /// assert!(!lf.is_ascii_graphic());
    /// assert!(!esc.is_ascii_graphic());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_graphic(&self) -> bool {
        match *self {
            '!'..='~' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII whitespace character:
    /// U+0020 SPACE, U+0009 HORIZONTAL TAB, U+000A LINE FEED,
    /// U+000C FORM FEED, or U+000D CARRIAGE RETURN.
    ///
    /// Rust uses the WhatWG Infra Standard's [definition of ASCII
    /// whitespace][infra-aw]. There are several other definitions in
    /// wide use. For instance, [the POSIX locale][pct] includes
    /// U+000B VERTICAL TAB as well as all the above characters,
    /// but—from the very same specification—[the default rule for
    /// "field splitting" in the Bourne shell][bfs] considers *only*
    /// SPACE, HORIZONTAL TAB, and LINE FEED as whitespace.
    ///
    /// If your program processes an existing file format, check
    /// how that format defines whitespace before relying on this
    /// function.
    ///
    /// [infra-aw]: https://infra.spec.whatwg.org/#ascii-whitespace
    /// [pct]: http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap07.html#tag_07_03_01
    /// [bfs]: http://pubs.opengroup.org/onlinepubs/9699919799/utilities/V3_chap02.html#tag_18_06_05
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(!uppercase_a.is_ascii_whitespace());
    /// assert!(!uppercase_g.is_ascii_whitespace());
    /// assert!(!a.is_ascii_whitespace());
    /// assert!(!g.is_ascii_whitespace());
    /// assert!(!zero.is_ascii_whitespace());
    /// assert!(!percent.is_ascii_whitespace());
    /// assert!(space.is_ascii_whitespace());
    /// assert!(lf.is_ascii_whitespace());
    /// assert!(!esc.is_ascii_whitespace());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_whitespace(&self) -> bool {
        match *self {
            // HORIZONTAL TAB, LINE FEED, FORM FEED, CARRIAGE RETURN
            '\t' | '\n' | '\x0C' | '\r' => true,
            // SPACE
            ' ' => true,
            _ => false,
        }
    }

    /// Reports whether the value is an ASCII control character:
    /// U+0000 NUL ..= U+001F UNIT SEPARATOR, or U+007F DELETE.
    /// Note that most ASCII whitespace characters are control
    /// characters, but SPACE is not.
    ///
    /// # Examples
    ///
    /// ```
    /// let uppercase_a = 'A';
    /// let uppercase_g = 'G';
    /// let a = 'a';
    /// let g = 'g';
    /// let zero = '0';
    /// let percent = '%';
    /// let space = ' ';
    /// let lf = '\n';
    /// let esc: char = 0x1b_u8.into();
    ///
    /// assert!(!uppercase_a.is_ascii_control());
    /// assert!(!uppercase_g.is_ascii_control());
    /// assert!(!a.is_ascii_control());
    /// assert!(!g.is_ascii_control());
    /// assert!(!zero.is_ascii_control());
    /// assert!(!percent.is_ascii_control());
    /// assert!(!space.is_ascii_control());
    /// assert!(lf.is_ascii_control());
    /// assert!(esc.is_ascii_control());
    /// ```
    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
    #[inline]
    pub const fn is_ascii_control(&self) -> bool {
        match *self {
            // NUL ..= UNIT SEPARATOR
            '\0'..='\x1F' => true,
            // DELETE
            '\x7F' => true,
            _ => false,
        }
    }
}

/// Returns the number of bytes (1 to 4) used to encode `code` as UTF-8.
///
/// `MAX_ONE_B`, `MAX_TWO_B` and `MAX_THREE_B` act as exclusive upper bounds for the
/// one-, two- and three-byte forms; any value at or above `MAX_THREE_B` is given four bytes.
#[inline]
const fn len_utf8(code: u32) -> usize {
    if code < MAX_ONE_B {
        return 1;
    }
    if code < MAX_TWO_B {
        return 2;
    }
    if code < MAX_THREE_B {
        return 3;
    }
    4
}

/// Writes the UTF-8 encoding of a raw `u32` code point into the start of `dst`
/// and returns the subslice of `dst` holding the encoded bytes.
///
/// Unlike `char::encode_utf8`, this function also accepts code points in the surrogate range.
/// (Creating a `char` in the surrogate range is UB.)
/// For such input the result is valid [generalized UTF-8] but not valid UTF-8.
///
/// [generalized UTF-8]: https://simonsapin.github.io/wtf-8/#generalized-utf8
///
/// # Panics
///
/// Panics if the buffer is not large enough.
/// A buffer of length four is large enough to encode any `char`.
#[unstable(feature = "char_internals", reason = "exposed only for libstd", issue = "none")]
#[doc(hidden)]
#[inline]
pub fn encode_utf8_raw(code: u32, dst: &mut [u8]) -> &mut [u8] {
    let needed = len_utf8(code);
    let capacity = dst.len();
    // Reject a too-small buffer up front, before any byte is written.
    if capacity < needed {
        panic!(
            "encode_utf8: need {} bytes to encode U+{:X}, but the buffer has {}",
            needed, code, capacity,
        );
    }

    // Continuation byte carrying the six bits of `code` that start at bit `shift`.
    let cont = |shift: u32| (code >> shift & 0x3F) as u8 | TAG_CONT;

    let encoded = &mut dst[..needed];
    match needed {
        1 => encoded[0] = code as u8,
        2 => {
            encoded[0] = (code >> 6 & 0x1F) as u8 | TAG_TWO_B;
            encoded[1] = cont(0);
        }
        3 => {
            encoded[0] = (code >> 12 & 0x0F) as u8 | TAG_THREE_B;
            encoded[1] = cont(6);
            encoded[2] = cont(0);
        }
        // `len_utf8` only ever returns 1 through 4, so this is the four-byte form.
        _ => {
            encoded[0] = (code >> 18 & 0x07) as u8 | TAG_FOUR_B;
            encoded[1] = cont(12);
            encoded[2] = cont(6);
            encoded[3] = cont(0);
        }
    }
    encoded
}

/// Encodes a raw u32 value as UTF-16 into the provided `u16` buffer,
/// and then returns the subslice of the buffer that contains the encoded character.
///
/// Unlike `char::encode_utf16`, this method also handles codepoints in the surrogate range.
/// (Creating a `char` in the surrogate range is UB.)
///
/// # Panics
///
/// Panics if the buffer is not large enough.
/// A buffer of length 2 is large enough to encode any `char`.
#[unstable(feature = "char_internals", reason = "exposed only for libstd", issue = "none")]
#[doc(hidden)]
#[inline]
pub fn encode_utf16_raw(mut code: u32, dst: &mut [u16]) -> &mut [u16] {
    // SAFETY: each arm checks whether there are enough bits to write into
    unsafe {
        if (code & 0xFFFF) == code && !dst.is_empty() {
            // The BMP falls through
            *dst.get_unchecked_mut(0) = code as u16;
            slice::from_raw_parts_mut(dst.as_mut_ptr(), 1)
        } else if dst.len() >= 2 {
            // Supplementary planes break into surrogates.
            code -= 0x1_0000;
            *dst.get_unchecked_mut(0) = 0xD800 | ((code >> 10) as u16);
            *dst.get_unchecked_mut(1) = 0xDC00 | ((code as u16) & 0x3FF);
            slice::from_raw_parts_mut(dst.as_mut_ptr(), 2)
        } else {
            panic!(
                "encode_utf16: need {} units to encode U+{:X}, but the buffer has {}",
                from_u32_unchecked(code).len_utf16(),
                code,
                dst.len(),
            )
        }
    }
}
-												Move the rest of core::unicode::char to core::unicode

											
										
										
											2018-04-05 18:36:02 +02:00
+								//! impl char {}
-												std: Stabilize more of the `char` module

This commit performs another pass over the `std::char` module for stabilization.
Some minor cleanup is performed such as migrating documentation from libcore to
libunicode (where the `std`-facing trait resides) as well as a slight
reorganization in libunicode itself. Otherwise, the stability modifications made
are:

* `char::from_digit` is now stable
* `CharExt::is_digit` is now stable
* `CharExt::to_digit` is now stable
* `CharExt::to_{lower,upper}case` are now stable after being modified to return
  an iterator over characters. While the implementation today has not changed
  this should allow us to implement the full set of case conversions in unicode
  where some characters can map to multiple when doing an upper or lower case
  mapping.
* `StrExt::to_{lower,upper}case` was added as unstable for a convenience of not
  having to worry about characters expanding to more characters when you just
  want the whole string to get into upper or lower case.

This is a breaking change due to the change in the signatures of the
`CharExt::to_{upper,lower}case` methods. Code can be updated to use functions
like `flat_map` or `collect` to handle the difference.

[breaking-change]

											
										
										
											2015-03-06 03:23:57 +01:00
-												Simpler way to convert to digit

											
										
										
											2021-02-14 12:34:22 +01:00
+								use crate::intrinsics::likely;
-												libcore => 2018

											
										
										
											2019-04-15 04:23:21 +02:00
+								use crate::slice;
 								use crate::str::from_utf8_unchecked_mut;
 								use crate::unicode::printable::is_printable;
-												Replace old tables with new unicode data

											
										
										
											2020-01-13 22:59:33 +01:00
+								use crate::unicode::{self, conversions};
-												libcore => 2018

											
										
										
											2019-04-15 04:23:21 +02:00
-												Move the rest of core::unicode::char to core::unicode

											
										
										
											2018-04-05 18:36:02 +02:00
+								use super::*;
-												Add libunicode; move unicode functions from core

- created new crate, libunicode, below libstd
- split Char trait into Char (libcore) and UnicodeChar (libunicode)
  - Unicode-aware functions now live in libunicode
    - is_alphabetic, is_XID_start, is_XID_continue, is_lowercase,
      is_uppercase, is_whitespace, is_alphanumeric, is_control,
      is_digit, to_uppercase, to_lowercase
  - added width method in UnicodeChar trait
    - determines printed width of character in columns, or None if it is
      a non-NULL control character
    - takes a boolean argument indicating whether the present context is
      CJK or not (characters with 'A'mbiguous widths are double-wide in
      CJK contexts, single-wide otherwise)
- split StrSlice into StrSlice (libcore) and UnicodeStrSlice
  (libunicode)
  - functionality formerly in StrSlice that relied upon Unicode
    functionality from Char is now in UnicodeStrSlice
    - words, is_whitespace, is_alphanumeric, trim, trim_left, trim_right
  - also moved Words type alias into libunicode because words method is
    in UnicodeStrSlice
- unified Unicode tables from libcollections, libcore, and libregex into
  libunicode
- updated unicode.py in src/etc to generate aforementioned tables
- generated new tables based on latest Unicode data
- added UnicodeChar and UnicodeStrSlice traits to prelude
- libunicode is now the collection point for the std::char module,
  combining the libunicode functionality with the Char functionality
  from libcore
  - thus, moved doc comment for char from core::char to unicode::char
- libcollections remains the collection point for std::str

The Unicode-aware functions that previously lived in the Char and
StrSlice traits are no longer available to programs that only use
libcore. To regain use of these methods, include the libunicode crate
and use the UnicodeChar and/or UnicodeStrSlice traits:

    extern crate unicode;
    use unicode::UnicodeChar;
    use unicode::UnicodeStrSlice;
    use unicode::Words; // if you want to use the words() method

NOTE: this does *not* impact programs that use libstd, since UnicodeChar
and UnicodeStrSlice have been added to the prelude.

closes #15224
[breaking-change]

											
										
										
											2014-06-30 23:04:10 +02:00
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								#[lang = "char"]
 								impl char {
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    /// The highest valid code point a `char` can have.
 								    ///
-												Try to fix doc links in new `char` methods.

											
										
										
											2020-05-03 20:04:52 +02:00
+								    /// A `char` is a [Unicode Scalar Value], which means that it is a [Code
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    /// Point], but only ones within a certain range. `MAX` is the highest valid
 								    /// code point that's a valid [Unicode Scalar Value].
 								    ///
 								    /// [Unicode Scalar Value]: http://www.unicode.org/glossary/#unicode_scalar_value
 								    /// [Code Point]: http://www.unicode.org/glossary/#code_point
-												Stabilize `assoc_char_funcs` and `assoc_char_consts`

											
										
										
											2021-03-09 00:44:03 +01:00
+								    #[stable(feature = "assoc_char_consts", since = "1.52.0")]
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    pub const MAX: char = '\u{10ffff}';
 								    /// `U+FFFD REPLACEMENT CHARACTER` (�) is used in Unicode to represent a
 								    /// decoding error.
 								    ///
 								    /// It can occur, for example, when giving ill-formed UTF-8 bytes to
-												Try to fix doc links in new `char` methods.

											
										
										
											2020-05-03 20:04:52 +02:00
+								    /// [`String::from_utf8_lossy`](string/struct.String.html#method.from_utf8_lossy).
-												Stabilize `assoc_char_funcs` and `assoc_char_consts`

											
										
										
											2021-03-09 00:44:03 +01:00
+								    #[stable(feature = "assoc_char_consts", since = "1.52.0")]
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    pub const REPLACEMENT_CHARACTER: char = '\u{FFFD}';
 								    /// The version of [Unicode](http://www.unicode.org/) that the Unicode parts of
 								    /// `char` and `str` methods are based on.
 								    ///
 								    /// New versions of Unicode are released regularly and subsequently all methods
 								    /// in the standard library depending on Unicode are updated. Therefore the
 								    /// behavior of some `char` and `str` methods and the value of this constant
 								    /// changes over time. This is *not* considered to be a breaking change.
 								    ///
 								    /// The version numbering scheme is explained in
 								    /// [Unicode 11.0 or later, Section 3.1 Versions of the Unicode Standard](https://www.unicode.org/versions/Unicode11.0.0/ch03.pdf#page=4).
-												Stabilize `assoc_char_funcs` and `assoc_char_consts`

											
										
										
											2021-03-09 00:44:03 +01:00
+								    #[stable(feature = "assoc_char_consts", since = "1.52.0")]
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    pub const UNICODE_VERSION: (u8, u8, u8) = crate::unicode::UNICODE_VERSION;
 								    /// Creates an iterator over the UTF-16 encoded code points in `iter`,
 								    /// returning unpaired surrogates as `Err`s.
 								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
 								    /// use std::char::decode_utf16;
 								    ///
 								    /// // 𝄞mus<invalid>ic<invalid>
 								    /// let v = [
 								    ///     0xD834, 0xDD1E, 0x006d, 0x0075, 0x0073, 0xDD1E, 0x0069, 0x0063, 0xD834,
 								    /// ];
 								    ///
 								    /// assert_eq!(
 								    ///     decode_utf16(v.iter().cloned())
 								    ///         .map(|r| r.map_err(|e| e.unpaired_surrogate()))
 								    ///         .collect::<Vec<_>>(),
 								    ///     vec![
 								    ///         Ok('𝄞'),
 								    ///         Ok('m'), Ok('u'), Ok('s'),
 								    ///         Err(0xDD1E),
 								    ///         Ok('i'), Ok('c'),
 								    ///         Err(0xD834)
 								    ///     ]
 								    /// );
 								    /// ```
 								    ///
 								    /// A lossy decoder can be obtained by replacing `Err` results with the replacement character:
 								    ///
 								    /// ```
 								    /// use std::char::{decode_utf16, REPLACEMENT_CHARACTER};
 								    ///
 								    /// // 𝄞mus<invalid>ic<invalid>
 								    /// let v = [
 								    ///     0xD834, 0xDD1E, 0x006d, 0x0075, 0x0073, 0xDD1E, 0x0069, 0x0063, 0xD834,
 								    /// ];
 								    ///
 								    /// assert_eq!(
 								    ///     decode_utf16(v.iter().cloned())
 								    ///        .map(|r| r.unwrap_or(REPLACEMENT_CHARACTER))
 								    ///        .collect::<String>(),
 								    ///     "𝄞mus�ic�"
 								    /// );
 								    /// ```
-												Stabilize `assoc_char_funcs` and `assoc_char_consts`

											
										
										
											2021-03-09 00:44:03 +01:00
+								    #[stable(feature = "assoc_char_funcs", since = "1.52.0")]
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    #[inline]
 								    pub fn decode_utf16<I: IntoIterator<Item = u16>>(iter: I) -> DecodeUtf16<I::IntoIter> {
 								        super::decode::decode_utf16(iter)
 								    }
 								    /// Converts a `u32` to a `char`.
 								    ///
-												Try to fix doc links in new `char` methods.

											
										
										
											2020-05-03 20:04:52 +02:00
+								    /// Note that all `char`s are valid [`u32`]s, and can be cast to one with
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    /// `as`:
 								    ///
 								    /// ```
 								    /// let c = '💯';
 								    /// let i = c as u32;
 								    ///
 								    /// assert_eq!(128175, i);
 								    /// ```
 								    ///
 								    /// However, the reverse is not true: not all valid [`u32`]s are valid
-												Try to fix doc links in new `char` methods.

											
										
										
											2020-05-03 20:04:52 +02:00
+								    /// `char`s. `from_u32()` will return `None` if the input is not a valid value
 								    /// for a `char`.
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    ///
 								    /// For an unsafe version of this function which ignores these checks, see
 								    /// [`from_u32_unchecked`].
 								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`from_u32_unchecked`]: #method.from_u32_unchecked
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
 								    /// use std::char;
 								    ///
 								    /// let c = char::from_u32(0x2764);
 								    ///
 								    /// assert_eq!(Some('❤'), c);
 								    /// ```
 								    ///
-												Try to fix doc links in new `char` methods.

											
										
										
											2020-05-03 20:04:52 +02:00
+								    /// Returning `None` when the input is not a valid `char`:
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    ///
 								    /// ```
 								    /// use std::char;
 								    ///
 								    /// let c = char::from_u32(0x110000);
 								    ///
 								    /// assert_eq!(None, c);
 								    /// ```
-												Stabilize `assoc_char_funcs` and `assoc_char_consts`

											
										
										
											2021-03-09 00:44:03 +01:00
+								    #[stable(feature = "assoc_char_funcs", since = "1.52.0")]
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    #[inline]
 								    pub fn from_u32(i: u32) -> Option<char> {
 								        super::convert::from_u32(i)
 								    }
 								    /// Converts a `u32` to a `char`, ignoring validity.
 								    ///
-												Try to fix doc links in new `char` methods.

											
										
										
											2020-05-03 20:04:52 +02:00
+								    /// Note that all `char`s are valid [`u32`]s, and can be cast to one with
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    /// `as`:
 								    ///
 								    /// ```
 								    /// let c = '💯';
 								    /// let i = c as u32;
 								    ///
 								    /// assert_eq!(128175, i);
 								    /// ```
 								    ///
 								    /// However, the reverse is not true: not all valid [`u32`]s are valid
-												Try to fix doc links in new `char` methods.

											
										
										
											2020-05-03 20:04:52 +02:00
+								    /// `char`s. `from_u32_unchecked()` will ignore this, and blindly cast to
 								    /// `char`, possibly creating an invalid one.
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    ///
 								    /// # Safety
 								    ///
 								    /// This function is unsafe, as it may construct invalid `char` values.
 								    ///
 								    /// For a safe version of this function, see the [`from_u32`] function.
 								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`from_u32`]: #method.from_u32
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
 								    /// use std::char;
 								    ///
 								    /// let c = unsafe { char::from_u32_unchecked(0x2764) };
 								    ///
 								    /// assert_eq!('❤', c);
 								    /// ```
-												Stabilize `assoc_char_funcs` and `assoc_char_consts`

											
										
										
											2021-03-09 00:44:03 +01:00
+								    #[stable(feature = "assoc_char_funcs", since = "1.52.0")]
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    #[inline]
 								    pub unsafe fn from_u32_unchecked(i: u32) -> char {
-												Deny unsafe ops in unsafe fns, part 1

											
										
										
											2020-06-22 00:54:46 +02:00
+								        // SAFETY: the safety contract must be upheld by the caller.
 								        unsafe { super::convert::from_u32_unchecked(i) }
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    }
 								    /// Converts a digit in the given radix to a `char`.
 								    ///
 								    /// A 'radix' here is sometimes also called a 'base'. A radix of two
 								    /// indicates a binary number, a radix of ten, decimal, and a radix of
 								    /// sixteen, hexadecimal, to give some common values. Arbitrary
 								    /// radices are supported.
 								    ///
 								    /// `from_digit()` will return `None` if the input is not a digit in
 								    /// the given radix.
 								    ///
 								    /// # Panics
 								    ///
 								    /// Panics if given a radix larger than 36.
 								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
 								    /// use std::char;
 								    ///
 								    /// let c = char::from_digit(4, 10);
 								    ///
 								    /// assert_eq!(Some('4'), c);
 								    ///
 								    /// // Decimal 11 is a single digit in base 16
 								    /// let c = char::from_digit(11, 16);
 								    ///
 								    /// assert_eq!(Some('b'), c);
 								    /// ```
 								    ///
 								    /// Returning `None` when the input is not a digit:
 								    ///
 								    /// ```
 								    /// use std::char;
 								    ///
 								    /// let c = char::from_digit(20, 10);
 								    ///
 								    /// assert_eq!(None, c);
 								    /// ```
 								    ///
 								    /// Passing a large radix, causing a panic:
 								    ///
-												Adjusted some doctests in libcore to use `should_panic`.

Previously, some doctests were spawning new threads and joining them to
indicate that a particular call should panic; this hurt readability, so
the tests have been adjusted to simply call the method and use the
`should_panic` marker.

											
										
										
											2020-06-13 06:06:09 +02:00
+								    /// ```should_panic
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    /// use std::char;
 								    ///
-												Adjusted some doctests in libcore to use `should_panic`.

Previously, some doctests were spawning new threads and joining them to
indicate that a particular call should panic; this hurt readability, so
the tests have been adjusted to simply call the method and use the
`should_panic` marker.

											
										
										
											2020-06-13 06:06:09 +02:00
+								    /// // this panics
 								    /// char::from_digit(1, 37);
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    /// ```
-												Stabilize `assoc_char_funcs` and `assoc_char_consts`

											
										
										
											2021-03-09 00:44:03 +01:00
+								    #[stable(feature = "assoc_char_funcs", since = "1.52.0")]
-												Make `std::char` functions and constants associated to `char`.

											
										
										
											2020-05-03 18:12:00 +02:00
+								    #[inline]
 								    pub fn from_digit(num: u32, radix: u32) -> Option<char> {
 								        super::convert::from_digit(num, radix)
 								    }
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Checks if a `char` is a digit in the given radix.
 								    ///
 								    /// A 'radix' here is sometimes also called a 'base'. A radix of two
 								    /// indicates a binary number, a radix of ten, decimal, and a radix of
-												Fix the spelling of "hexadecimal"

											
										
										
											2016-01-05 16:40:40 +01:00
+								    /// sixteen, hexadecimal, to give some common values. Arbitrary
-												Use "radices" instead of "radicum"

											
										
										
											2016-11-23 14:49:35 +01:00
+								    /// radices are supported.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// Compared to [`is_numeric()`], this function only recognizes the characters
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// `0-9`, `a-z` and `A-Z`.
 								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// 'Digit' is defined to be only the following characters:
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// * `0-9`
 								    /// * `a-z`
 								    /// * `A-Z`
 								    ///
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// For a more comprehensive understanding of 'digit', see [`is_numeric()`].
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`is_numeric()`]: #method.is_numeric
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Panics
 								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Panics if given a radix larger than 36.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Examples
 								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Basic usage:
 								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!('1'.is_digit(10));
 								    /// assert!('f'.is_digit(16));
 								    /// assert!(!'f'.is_digit(10));
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
 								    ///
 								    /// Passing a large radix, causing a panic:
 								    ///
-												Adjusted some doctests in libcore to use `should_panic`.

Previously, some doctests were spawning new threads and joining them to
indicate that a particular call should panic; this hurt readability, so
the tests have been adjusted to simply call the method and use the
`should_panic` marker.

											
										
										
											2020-06-13 06:06:09 +02:00
+								    /// ```should_panic
 								    /// // this panics
 								    /// '1'.is_digit(37);
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    pub fn is_digit(self, radix: u32) -> bool {
-												Remove the CharExt trait, now that libcore has inherent methods for char

											
										
										
											2018-04-05 18:46:16 +02:00
+								        self.to_digit(radix).is_some()
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Converts a `char` to a digit in the given radix.
 								    ///
 								    /// A 'radix' here is sometimes also called a 'base'. A radix of two
 								    /// indicates a binary number, a radix of ten, decimal, and a radix of
-												Fix the spelling of "hexadecimal"

											
										
										
											2016-01-05 16:40:40 +01:00
+								    /// sixteen, hexadecimal, to give some common values. Arbitrary
-												Use "radices" instead of "radicum"

											
										
										
											2016-11-23 14:49:35 +01:00
+								    /// radices are supported.
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// 'Digit' is defined to be only the following characters:
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// * `0-9`
 								    /// * `a-z`
 								    /// * `A-Z`
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												docs: Standardize on 'Errors' header in std docs

											
										
										
											2016-02-02 03:41:29 +01:00
+								    /// # Errors
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// Returns `None` if the `char` does not refer to a digit in the given radix.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Panics
 								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Panics if given a radix larger than 36.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Examples
 								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Basic usage:
 								    ///
 								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert_eq!('1'.to_digit(10), Some(1));
 								    /// assert_eq!('f'.to_digit(16), Some(15));
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
 								    ///
 								    /// Passing a non-digit results in failure:
 								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert_eq!('f'.to_digit(10), None);
 								    /// assert_eq!('z'.to_digit(16), None);
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
 								    ///
 								    /// Passing a large radix, causing a panic:
 								    ///
-												Adjusted some doctests in libcore to use `should_panic`.

Previously, some doctests were spawning new threads and joining them to
indicate that a particular call should panic; this hurt readability, so
the tests have been adjusted to simply call the method and use the
`should_panic` marker.

											
										
										
											2020-06-13 06:06:09 +02:00
+								    /// ```should_panic
 								    /// // this panics
 								    /// '1'.to_digit(37);
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    #[stable(feature = "rust1", since = "1.0.0")]
-												Add missing #[inline] to methods related to char.

											
										
										
											2015-06-09 23:58:00 +02:00
+								    #[inline]
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    pub fn to_digit(self, radix: u32) -> Option<u32> {
-												Simpler way to convert to digit

											
										
										
											2021-02-14 12:34:22 +01:00
+								        assert!(radix <= 36, "to_digit: radix is too high (maximum 36)");
-												core/char: Add comment to `to_digit()`

											
										
										
											2018-11-14 11:26:00 +01:00
+								        // the code is split up here to improve execution speed for cases where
 								        // the `radix` is constant and 10 or smaller
-												Simpler way to convert to digit

											
										
										
											2021-02-14 12:34:22 +01:00
+								        let val = if likely(radix <= 10) {
 								            // If not a digit, a number greater than radix will be created.
-												Use wrapping sub

Co-authored-by: Mara <m-ou.se@m-ou.se>
											
										
										
											2021-02-15 08:35:28 +01:00
+								            (self as u32).wrapping_sub('0' as u32)
-												core/char: Speed up `to_digit()` for `radix <= 10`

### Before

```
# Run 1
test char::methods::bench_to_digit_radix_10                ... bench:      16,265 ns/iter (+/- 1,774)
test char::methods::bench_to_digit_radix_16                ... bench:      13,938 ns/iter (+/- 2,479)
test char::methods::bench_to_digit_radix_2                 ... bench:      13,090 ns/iter (+/- 524)
test char::methods::bench_to_digit_radix_36                ... bench:      14,236 ns/iter (+/- 1,949)

# Run 2
test char::methods::bench_to_digit_radix_10                ... bench:      16,176 ns/iter (+/- 1,589)
test char::methods::bench_to_digit_radix_16                ... bench:      13,896 ns/iter (+/- 3,140)
test char::methods::bench_to_digit_radix_2                 ... bench:      13,158 ns/iter (+/- 1,112)
test char::methods::bench_to_digit_radix_36                ... bench:      14,206 ns/iter (+/- 1,312)

# Run 3
test char::methods::bench_to_digit_radix_10                ... bench:      16,221 ns/iter (+/- 2,423)
test char::methods::bench_to_digit_radix_16                ... bench:      14,361 ns/iter (+/- 3,926)
test char::methods::bench_to_digit_radix_2                 ... bench:      13,097 ns/iter (+/- 671)
test char::methods::bench_to_digit_radix_36                ... bench:      14,388 ns/iter (+/- 1,068)
```

### After

```
# Run 1
test char::methods::bench_to_digit_radix_10      ... bench:      11,521 ns/iter (+/- 552)
test char::methods::bench_to_digit_radix_16      ... bench:      12,926 ns/iter (+/- 684)
test char::methods::bench_to_digit_radix_2       ... bench:      11,266 ns/iter (+/- 1,085)
test char::methods::bench_to_digit_radix_36      ... bench:      14,213 ns/iter (+/- 614)

# Run 2
test char::methods::bench_to_digit_radix_10      ... bench:      11,424 ns/iter (+/- 1,042)
test char::methods::bench_to_digit_radix_16      ... bench:      12,854 ns/iter (+/- 1,193)
test char::methods::bench_to_digit_radix_2       ... bench:      11,193 ns/iter (+/- 716)
test char::methods::bench_to_digit_radix_36      ... bench:      14,249 ns/iter (+/- 3,514)

# Run 3
test char::methods::bench_to_digit_radix_10      ... bench:      11,469 ns/iter (+/- 685)
test char::methods::bench_to_digit_radix_16      ... bench:      12,852 ns/iter (+/- 568)
test char::methods::bench_to_digit_radix_2       ... bench:      11,275 ns/iter (+/- 1,356)
test char::methods::bench_to_digit_radix_36      ... bench:      14,188 ns/iter (+/- 1,501)
```

											
										
										
											2018-11-13 18:05:46 +01:00
+								        } else {
 								            match self {
 								                '0'..='9' => self as u32 - '0' as u32,
 								                'a'..='z' => self as u32 - 'a' as u32 + 10,
 								                'A'..='Z' => self as u32 - 'A' as u32 + 10,
 								                _ => return None,
 								            }
-												Remove the CharExt trait, now that libcore has inherent methods for char

											
										
										
											2018-04-05 18:46:16 +02:00
+								        };
-												core/char: Speed up `to_digit()` for `radix <= 10`

### Before

```
# Run 1
test char::methods::bench_to_digit_radix_10                ... bench:      16,265 ns/iter (+/- 1,774)
test char::methods::bench_to_digit_radix_16                ... bench:      13,938 ns/iter (+/- 2,479)
test char::methods::bench_to_digit_radix_2                 ... bench:      13,090 ns/iter (+/- 524)
test char::methods::bench_to_digit_radix_36                ... bench:      14,236 ns/iter (+/- 1,949)

# Run 2
test char::methods::bench_to_digit_radix_10                ... bench:      16,176 ns/iter (+/- 1,589)
test char::methods::bench_to_digit_radix_16                ... bench:      13,896 ns/iter (+/- 3,140)
test char::methods::bench_to_digit_radix_2                 ... bench:      13,158 ns/iter (+/- 1,112)
test char::methods::bench_to_digit_radix_36                ... bench:      14,206 ns/iter (+/- 1,312)

# Run 3
test char::methods::bench_to_digit_radix_10                ... bench:      16,221 ns/iter (+/- 2,423)
test char::methods::bench_to_digit_radix_16                ... bench:      14,361 ns/iter (+/- 3,926)
test char::methods::bench_to_digit_radix_2                 ... bench:      13,097 ns/iter (+/- 671)
test char::methods::bench_to_digit_radix_36                ... bench:      14,388 ns/iter (+/- 1,068)
```

### After

```
# Run 1
test char::methods::bench_to_digit_radix_10      ... bench:      11,521 ns/iter (+/- 552)
test char::methods::bench_to_digit_radix_16      ... bench:      12,926 ns/iter (+/- 684)
test char::methods::bench_to_digit_radix_2       ... bench:      11,266 ns/iter (+/- 1,085)
test char::methods::bench_to_digit_radix_36      ... bench:      14,213 ns/iter (+/- 614)

# Run 2
test char::methods::bench_to_digit_radix_10      ... bench:      11,424 ns/iter (+/- 1,042)
test char::methods::bench_to_digit_radix_16      ... bench:      12,854 ns/iter (+/- 1,193)
test char::methods::bench_to_digit_radix_2       ... bench:      11,193 ns/iter (+/- 716)
test char::methods::bench_to_digit_radix_36      ... bench:      14,249 ns/iter (+/- 3,514)

# Run 3
test char::methods::bench_to_digit_radix_10      ... bench:      11,469 ns/iter (+/- 685)
test char::methods::bench_to_digit_radix_16      ... bench:      12,852 ns/iter (+/- 568)
test char::methods::bench_to_digit_radix_2       ... bench:      11,275 ns/iter (+/- 1,356)
test char::methods::bench_to_digit_radix_36      ... bench:      14,188 ns/iter (+/- 1,501)
```

											
										
										
											2018-11-13 18:05:46 +01:00
-												Format libcore with rustfmt

This commit applies rustfmt with default settings to files in
src/libcore *that are not involved in any currently open PR* to minimize
merge conflicts. The list of files involved in open PRs was determined
by querying GitHub's GraphQL API with this script:
https://gist.github.com/dtolnay/aa9c34993dc051a4f344d1b10e4487e8

With the list of files from the script in `outstanding_files`, the
relevant commands were:

    $ find src/libcore -name '*.rs' | xargs rustfmt --edition=2018
    $ rg libcore outstanding_files | xargs git checkout --

Repeating this process several months apart should get us coverage of
most of the rest of libcore.

											
										
										
											2019-11-24 10:43:32 +01:00
+								        if val < radix { Some(val) } else { None }
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
 								    /// Returns an iterator that yields the hexadecimal Unicode escape of a
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// character as `char`s.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// This will escape characters with the Rust syntax of the form
 								    /// `\u{NNNNNN}` where `NNNNNN` is a hexadecimal representation.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Examples
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// As an iterator:
-												Fix up docs for char

Part of https://github.com/rust-lang/rust/issues/29333

											
										
										
											2015-11-23 22:56:07 +01:00
+								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												doc: 'c' feels more suitable than 'i' for representing characters

											
										
										
											2015-06-13 00:01:16 +02:00
+								    /// for c in '❤'.escape_unicode() {
 								    ///     print!("{}", c);
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// }
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// println!();
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Using `println!` directly:
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// ```
 								    /// println!("{}", '❤'.escape_unicode());
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Both are equivalent to:
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// println!("\\u{{2764}}");
 								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Using `to_string`:
 								    ///
 								    /// ```
 								    /// assert_eq!('❤'.escape_unicode().to_string(), "\\u{2764}");
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    #[stable(feature = "rust1", since = "1.0.0")]
-												Add missing #[inline] to methods related to char.

											
										
										
											2015-06-09 23:58:00 +02:00
+								    #[inline]
-												Remove const from iterator fns

											
										
										
											2021-02-14 00:16:48 +01:00
+								    pub fn escape_unicode(self) -> EscapeUnicode {
-												Remove the CharExt trait, now that libcore has inherent methods for char

											
										
										
											2018-04-05 18:46:16 +02:00
+								        let c = self as u32;
 								        // or-ing 1 ensures that for c==0 the code computes that one
 								        // digit should be printed and (which is the same) avoids the
 								        // (31 - 32) underflow
 								        let msb = 31 - (c | 1).leading_zeros();
 								        // the index of the most significant hex digit
 								        let ms_hex_digit = msb / 4;
 								        EscapeUnicode {
 								            c: self,
 								            state: EscapeUnicodeState::Backslash,
 								            hex_digit_idx: ms_hex_digit as usize,
 								        }
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
-												Only escape extended grapheme characters in the first position

											
										
										
											2018-05-17 11:45:34 +02:00
+								    /// An extended version of `escape_debug` that optionally permits escaping
 								    /// Extended Grapheme codepoints. This allows us to format characters like
 								    /// nonspacing marks better when they're at the start of a string.
 								    #[inline]
-												Make the prema-unstable char::escape_debug_ext method crate-private

											
										
										
											2019-02-02 10:37:40 +01:00
+								    pub(crate) fn escape_debug_ext(self, escape_grapheme_extended: bool) -> EscapeDebug {
-												Only escape extended grapheme characters in the first position

											
										
										
											2018-05-17 11:45:34 +02:00
+								        let init_state = match self {
 								            '\t' => EscapeDefaultState::Backslash('t'),
 								            '\r' => EscapeDefaultState::Backslash('r'),
 								            '\n' => EscapeDefaultState::Backslash('n'),
 								            '\\' | '\'' | '"' => EscapeDefaultState::Backslash(self),
 								            _ if escape_grapheme_extended && self.is_grapheme_extended() => {
 								                EscapeDefaultState::Unicode(self.escape_unicode())
 								            }
 								            _ if is_printable(self) => EscapeDefaultState::Char(self),
 								            _ => EscapeDefaultState::Unicode(self.escape_unicode()),
 								        };
 								        EscapeDebug(EscapeDefault { state: init_state })
 								    }
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Returns an iterator that yields the literal escape code of a character
 								    /// as `char`s.
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    ///
 								    /// This will escape the characters similar to the `Debug` implementations
 								    /// of `str` or `char`.
 								    ///
 								    /// # Examples
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// As an iterator:
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    ///
 								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// for c in '\n'.escape_debug() {
 								    ///     print!("{}", c);
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    /// }
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// println!();
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    /// ```
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Using `println!` directly:
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// ```
 								    /// println!("{}", '\n'.escape_debug());
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    /// ```
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Both are equivalent to:
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    ///
 								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// println!("\\n");
 								    /// ```
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Using `to_string`:
 								    ///
 								    /// ```
 								    /// assert_eq!('\n'.escape_debug().to_string(), "\\n");
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    /// ```
-												std: Stabilize `char_escape_debug`

Stabilizes:

* `<char>::escape_debug`
* `std::char::EscapeDebug`

Closes #35068

											
										
										
											2017-07-21 00:38:59 +02:00
+								    #[stable(feature = "char_escape_debug", since = "1.20.0")]
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    #[inline]
-												Rename `char::escape` to `char::escape_debug` and add tracking issue

											
										
										
											2016-07-27 12:10:31 +02:00
+								    pub fn escape_debug(self) -> EscapeDebug {
-												Only escape extended grapheme characters in the first position

											
										
										
											2018-05-17 11:45:34 +02:00
+								        self.escape_debug_ext(true)
-												Restore `char::escape_default` and add `char::escape` instead

											
										
										
											2016-07-26 01:39:54 +02:00
+								    }
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Returns an iterator that yields the literal escape code of a character
 								    /// as `char`s.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// The default is chosen with a bias toward producing literals that are
 								    /// legal in a variety of languages, including C++11 and similar C-family
 								    /// languages. The exact rules are:
 								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// * Tab is escaped as `\t`.
 								    /// * Carriage return is escaped as `\r`.
 								    /// * Line feed is escaped as `\n`.
 								    /// * Single quote is escaped as `\'`.
 								    /// * Double quote is escaped as `\"`.
 								    /// * Backslash is escaped as `\\`.
 								    /// * Any character in the 'printable ASCII' range `0x20` .. `0x7e`
 								    ///   inclusive is not escaped.
 								    /// * All other characters are given hexadecimal Unicode escapes; see
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    ///   [`escape_unicode`].
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`escape_unicode`]: #method.escape_unicode
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Examples
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// As an iterator:
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// for c in '"'.escape_default() {
 								    ///     print!("{}", c);
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// }
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// println!();
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// Using `println!` directly:
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// println!("{}", '"'.escape_default());
 								    /// ```
 								    ///
 								    /// Both are equivalent to:
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// println!("\\\"");
 								    /// ```
 								    ///
 								    /// Using `to_string`:
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// ```
 								    /// assert_eq!('"'.escape_default().to_string(), "\\\"");
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    #[stable(feature = "rust1", since = "1.0.0")]
-												Add missing #[inline] to methods related to char.

											
										
										
											2015-06-09 23:58:00 +02:00
+								    #[inline]
-												Remove const from iterator fns

											
										
										
											2021-02-14 00:16:48 +01:00
+								    pub fn escape_default(self) -> EscapeDefault {
-												Remove the CharExt trait, now that libcore has inherent methods for char

											
										
										
											2018-04-05 18:46:16 +02:00
+								        let init_state = match self {
 								            '\t' => EscapeDefaultState::Backslash('t'),
 								            '\r' => EscapeDefaultState::Backslash('r'),
 								            '\n' => EscapeDefaultState::Backslash('n'),
 								            '\\' | '\'' | '"' => EscapeDefaultState::Backslash(self),
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								            '\x20'..='\x7e' => EscapeDefaultState::Char(self),
 								            _ => EscapeDefaultState::Unicode(self.escape_unicode()),
-												Remove the CharExt trait, now that libcore has inherent methods for char

											
										
										
											2018-04-05 18:46:16 +02:00
+								        };
 								        EscapeDefault { state: init_state }
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Returns the number of bytes this `char` would need if encoded in UTF-8.
 								    ///
 								    /// That number of bytes is always between 1 and 4, inclusive.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Examples
 								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Basic usage:
 								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// let len = 'A'.len_utf8();
 								    /// assert_eq!(len, 1);
 								    ///
 								    /// let len = 'ß'.len_utf8();
 								    /// assert_eq!(len, 2);
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// let len = 'ℝ'.len_utf8();
 								    /// assert_eq!(len, 3);
 								    ///
 								    /// let len = '💣'.len_utf8();
 								    /// assert_eq!(len, 4);
 								    /// ```
 								    ///
 								    /// The `&str` type guarantees that its contents are UTF-8, and so we can compare the length it
 								    /// would take if each code point was represented as a `char` vs in the `&str` itself:
 								    ///
 								    /// ```
 								    /// // as chars
 								    /// let eastern = '東';
-												Fix a typo
Fix a typo in `libcore/char/methods.rs`

											
										
										
											2019-06-29 19:02:03 +02:00
+								    /// let capital = '京';
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// // both can be represented as three bytes
 								    /// assert_eq!(3, eastern.len_utf8());
-												fix the same typo in doctest

											
										
										
											2019-06-29 19:46:45 +02:00
+								    /// assert_eq!(3, capital.len_utf8());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// // as a &str, these two are encoded in UTF-8
 								    /// let tokyo = "東京";
 								    ///
-												fix the same typo in doctest

											
										
										
											2019-06-29 19:46:45 +02:00
+								    /// let len = eastern.len_utf8() + capital.len_utf8();
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// // we can see that they take six bytes total...
 								    /// assert_eq!(6, tokyo.len());
 								    ///
 								    /// // ... just like the &str
 								    /// assert_eq!(len, tokyo.len());
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    #[stable(feature = "rust1", since = "1.0.0")]
-												Update since attributes for new const_ascii_methods_on_intrinsics to 1.52.0

											
										
										
											2021-02-14 00:17:44 +01:00
+								    #[rustc_const_stable(feature = "const_char_len_utf", since = "1.52.0")]
-												Add missing #[inline] to methods related to char.

											
										
										
											2015-06-09 23:58:00 +02:00
+								    #[inline]
-												Make char methods const

`escape_unicode`, `escape_default`, `len_utf8`, `len_utf16`, to_ascii_lowercase`, `eq_ignore_ascii_case`

`u8` methods `to_ascii_lowercase`, `to_ascii_uppercase` also must be made const

u8 methods made const

Update methods.rs

Update mod.rs

Update methods.rs

Fix `since` in rustc_const_stable to next stable

Fix `since` in rustc_const_stable to next stable

Update methods.rs

Update mod.rs

											
										
										
											2020-11-30 03:16:31 +01:00
+								    pub const fn len_utf8(self) -> usize {
-												expose char::encode_utf8_raw for libstd

											
										
										
											2020-05-30 11:49:31 +02:00
+								        len_utf8(self as u32)
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// Returns the number of 16-bit code units this `char` would need if
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// encoded in UTF-16.
 								    ///
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// See the documentation for [`len_utf8()`] for more explanation of this
-												Fix link in char docs

											
										
										
											2015-12-09 21:58:49 +01:00
+								    /// concept. This function is a mirror, but for UTF-16 instead of UTF-8.
 								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`len_utf8()`]: #method.len_utf8
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// # Examples
 								    ///
-												Fix up docs for char

Part of https://github.com/rust-lang/rust/issues/29333

											
										
										
											2015-11-23 22:56:07 +01:00
+								    /// Basic usage:
 								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    /// let n = 'ß'.len_utf16();
 								    /// assert_eq!(n, 1);
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// let len = '💣'.len_utf16();
 								    /// assert_eq!(len, 2);
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
 								    #[stable(feature = "rust1", since = "1.0.0")]
-												Update since attributes for new const_ascii_methods_on_intrinsics to 1.52.0

											
										
										
											2021-02-14 00:17:44 +01:00
+								    #[rustc_const_stable(feature = "const_char_len_utf", since = "1.52.0")]
-												Add missing #[inline] to methods related to char.

											
										
										
											2015-06-09 23:58:00 +02:00
+								    #[inline]
-												Make char methods const

`escape_unicode`, `escape_default`, `len_utf8`, `len_utf16`, to_ascii_lowercase`, `eq_ignore_ascii_case`

`u8` methods `to_ascii_lowercase`, `to_ascii_uppercase` also must be made const

u8 methods made const

Update methods.rs

Update mod.rs

Update methods.rs

Fix `since` in rustc_const_stable to next stable

Fix `since` in rustc_const_stable to next stable

Update methods.rs

Update mod.rs

											
										
										
											2020-11-30 03:16:31 +01:00
+								    pub const fn len_utf16(self) -> usize {
-												Remove the CharExt trait, now that libcore has inherent methods for char

											
										
										
											2018-04-05 18:46:16 +02:00
+								        let ch = self as u32;
 								        if (ch & 0xFFFF) == ch { 1 } else { 2 }
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// Encodes this character as UTF-8 into the provided byte buffer,
 								    /// and then returns the subslice of the buffer that contains the encoded character.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// # Panics
 								    ///
 								    /// Panics if the buffer is not large enough.
 								    /// A buffer of length four is large enough to encode any `char`.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Examples
 								    ///
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// In both of these examples, 'ß' takes two bytes to encode.
 								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// let mut b = [0; 2];
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// let result = 'ß'.encode_utf8(&mut b);
 								    ///
 								    /// assert_eq!(result, "ß");
 								    ///
 								    /// assert_eq!(result.len(), 2);
 								    /// ```
 								    ///
 								    /// A buffer that's too small:
 								    ///
-												Adjusted some doctests in libcore to use `should_panic`.

Previously, some doctests were spawning new threads and joining them to
indicate that a particular call should panic; this hurt readability, so
the tests have been adjusted to simply call the method and use the
`should_panic` marker.

											
										
										
											2020-06-13 06:06:09 +02:00
+								    /// ```should_panic
 								    /// let mut b = [0; 1];
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    ///
-												Adjusted some doctests in libcore to use `should_panic`.

Previously, some doctests were spawning new threads and joining them to
indicate that a particular call should panic; this hurt readability, so
the tests have been adjusted to simply call the method and use the
`should_panic` marker.

											
										
										
											2020-06-13 06:06:09 +02:00
+								    /// // this panics
 								    /// 'ß'.encode_utf8(&mut b);
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												Stabilize std::char::{encode_utf8, encode_utf16}

											
										
										
											2016-12-14 21:34:02 +01:00
+								    #[stable(feature = "unicode_encode_char", since = "1.15.0")]
-												Add missing #[inline] to methods related to char.

											
										
										
											2015-06-09 23:58:00 +02:00
+								    #[inline]
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    pub fn encode_utf8(self, dst: &mut [u8]) -> &mut str {
-												encode_utf8_raw is not always valid UTF-8; clarify comments

											
										
										
											2020-05-30 17:13:07 +02:00
+								        // SAFETY: `char` is not a surrogate, so this is valid UTF-8.
 								        unsafe { from_utf8_unchecked_mut(encode_utf8_raw(self as u32, dst)) }
-												collections: Split the `collections` feature

This commit also deprecates the `as_string` and `as_slice` free functions in the
`string` and `vec` modules.

											
										
										
											2015-06-09 23:39:23 +02:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// Encodes this character as UTF-16 into the provided `u16` buffer,
 								    /// and then returns the subslice of the buffer that contains the encoded character.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// # Panics
 								    ///
 								    /// Panics if the buffer is not large enough.
 								    /// A buffer of length 2 is large enough to encode any `char`.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
 								    /// # Examples
 								    ///
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// In both of these examples, '𝕊' takes two `u16`s to encode.
 								    ///
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// let mut b = [0; 2];
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    /// let result = '𝕊'.encode_utf16(&mut b);
 								    ///
 								    /// assert_eq!(result.len(), 2);
 								    /// ```
 								    ///
 								    /// A buffer that's too small:
 								    ///
-												Adjusted some doctests in libcore to use `should_panic`.

Previously, some doctests were spawning new threads and joining them to
indicate that a particular call should panic; this hurt readability, so
the tests have been adjusted to simply call the method and use the
`should_panic` marker.

											
										
										
											2020-06-13 06:06:09 +02:00
+								    /// ```should_panic
 								    /// let mut b = [0; 1];
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    ///
-												Adjusted some doctests in libcore to use `should_panic`.

Previously, some doctests were spawning new threads and joining them to
indicate that a particular call should panic; this hurt readability, so
the tests have been adjusted to simply call the method and use the
`should_panic` marker.

											
										
										
											2020-06-13 06:06:09 +02:00
+								    /// // this panics
 								    /// '𝕊'.encode_utf16(&mut b);
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    /// ```
-												Stabilize std::char::{encode_utf8, encode_utf16}

											
										
										
											2016-12-14 21:34:02 +01:00
+								    #[stable(feature = "unicode_encode_char", since = "1.15.0")]
-												Add missing #[inline] to methods related to char.

											
										
										
											2015-06-09 23:58:00 +02:00
+								    #[inline]
-												[breaking-change] std: change `encode_utf{8,16}()` to take a buffer and return a slice

They panic if the buffer is too small.

											
										
										
											2016-09-08 13:54:39 +02:00
+								    pub fn encode_utf16(self, dst: &mut [u16]) -> &mut [u16] {
-												also expose and use encode_utf16_raw for wtf8

											
										
										
											2020-05-30 12:08:55 +02:00
+								        encode_utf16_raw(self as u32, dst)
-												collections: Split the `collections` feature

This commit also deprecates the `as_string` and `as_slice` free functions in the
`string` and `vec` modules.

											
										
										
											2015-06-09 23:39:23 +02:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns `true` if this `char` has the `Alphabetic` property.
 								    ///
 								    /// `Alphabetic` is described in Chapter 4 (Character Properties) of the [Unicode Standard] and
 								    /// specified in the [Unicode Character Database][ucd] [`DerivedCoreProperties.txt`].
 								    ///
 								    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
 								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`DerivedCoreProperties.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/DerivedCoreProperties.txt
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!('a'.is_alphabetic());
 								    /// assert!('京'.is_alphabetic());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// let c = '💝';
 								    /// // love is many things, but it is not alphabetic
 								    /// assert!(!c.is_alphabetic());
 								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    pub fn is_alphabetic(self) -> bool {
 								        match self {
-												migrate codebase to `..=` inclusive range patterns

These were stabilized in March 2018's #47813, and are the Preferred Way
to Do It going forward (q.v. #51043).

											
										
										
											2018-05-29 04:42:11 +02:00
+								            'a'..='z' | 'A'..='Z' => true,
-												Replace old tables with new unicode data

											
										
										
											2020-01-13 22:59:33 +01:00
+								            c => c > '\x7f' && unicode::Alphabetic(c),
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								        }
 								    }
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns `true` if this `char` has the `Lowercase` property.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// `Lowercase` is described in Chapter 4 (Character Properties) of the [Unicode Standard] and
 								    /// specified in the [Unicode Character Database][ucd] [`DerivedCoreProperties.txt`].
 								    ///
 								    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
 								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`DerivedCoreProperties.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/DerivedCoreProperties.txt
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!('a'.is_lowercase());
 								    /// assert!('δ'.is_lowercase());
 								    /// assert!(!'A'.is_lowercase());
 								    /// assert!(!'Δ'.is_lowercase());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												FIX - Char documentation for unexperienced users

											
										
										
											2020-05-20 11:20:47 +02:00
+								    /// // The various Chinese scripts and punctuation do not have case, and so:
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!(!'中'.is_lowercase());
-												FIX - Char documentation for unexperienced users

											
										
										
											2020-05-20 11:20:47 +02:00
+								    /// assert!(!' '.is_lowercase());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    pub fn is_lowercase(self) -> bool {
 								        match self {
-												migrate codebase to `..=` inclusive range patterns

These were stabilized in March 2018's #47813, and are the Preferred Way
to Do It going forward (q.v. #51043).

											
										
										
											2018-05-29 04:42:11 +02:00
+								            'a'..='z' => true,
-												Replace old tables with new unicode data

											
										
										
											2020-01-13 22:59:33 +01:00
+								            c => c > '\x7f' && unicode::Lowercase(c),
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								        }
 								    }
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns `true` if this `char` has the `Uppercase` property.
 								    ///
 								    /// `Uppercase` is described in Chapter 4 (Character Properties) of the [Unicode Standard] and
 								    /// specified in the [Unicode Character Database][ucd] [`DerivedCoreProperties.txt`].
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
 								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`DerivedCoreProperties.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/DerivedCoreProperties.txt
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!(!'a'.is_uppercase());
 								    /// assert!(!'δ'.is_uppercase());
 								    /// assert!('A'.is_uppercase());
 								    /// assert!('Δ'.is_uppercase());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												FIX - Char documentation for unexperienced users

											
										
										
											2020-05-20 11:20:47 +02:00
+								    /// // The various Chinese scripts and punctuation do not have case, and so:
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!(!'中'.is_uppercase());
-												FIX - Char documentation for unexperienced users

											
										
										
											2020-05-20 11:20:47 +02:00
+								    /// assert!(!' '.is_uppercase());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    pub fn is_uppercase(self) -> bool {
 								        match self {
-												migrate codebase to `..=` inclusive range patterns

These were stabilized in March 2018's #47813, and are the Preferred Way
to Do It going forward (q.v. #51043).

											
										
										
											2018-05-29 04:42:11 +02:00
+								            'A'..='Z' => true,
-												Replace old tables with new unicode data

											
										
										
											2020-01-13 22:59:33 +01:00
+								            c => c > '\x7f' && unicode::Uppercase(c),
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								        }
 								    }
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns `true` if this `char` has the `White_Space` property.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// `White_Space` is specified in the [Unicode Character Database][ucd] [`PropList.txt`].
 								    ///
 								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`PropList.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/PropList.txt
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!(' '.is_whitespace());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// // a non-breaking space
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!('\u{A0}'.is_whitespace());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!(!'越'.is_whitespace());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    pub fn is_whitespace(self) -> bool {
 								        match self {
-												migrate codebase to `..=` inclusive range patterns

These were stabilized in March 2018's #47813, and are the Preferred Way
to Do It going forward (q.v. #51043).

											
										
										
											2018-05-29 04:42:11 +02:00
+								            ' ' | '\x09'..='\x0d' => true,
-												Replace old tables with new unicode data

											
										
										
											2020-01-13 22:59:33 +01:00
+								            c => c > '\x7f' && unicode::White_Space(c),
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								        }
 								    }
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns `true` if this `char` satisfies either [`is_alphabetic()`] or [`is_numeric()`].
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`is_alphabetic()`]: #method.is_alphabetic
 								    /// [`is_numeric()`]: #method.is_numeric
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!('٣'.is_alphanumeric());
 								    /// assert!('7'.is_alphanumeric());
 								    /// assert!('৬'.is_alphanumeric());
-												Treat gc=No characters as numeric

											
										
										
											2018-06-17 18:58:01 +02:00
+								    /// assert!('¾'.is_alphanumeric());
 								    /// assert!('①'.is_alphanumeric());
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!('K'.is_alphanumeric());
 								    /// assert!('و'.is_alphanumeric());
 								    /// assert!('藏'.is_alphanumeric());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    pub fn is_alphanumeric(self) -> bool {
 								        self.is_alphabetic() || self.is_numeric()
 								    }
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns `true` if this `char` has the general category for control codes.
 								    ///
 								    /// Control codes (code points with the general category of `Cc`) are described in Chapter 4
 								    /// (Character Properties) of the [Unicode Standard] and specified in the [Unicode Character
 								    /// Database][ucd] [`UnicodeData.txt`].
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
 								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`UnicodeData.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
 								    /// // U+009C, STRING TERMINATOR
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!('\u{009c}'.is_control());
 								    /// assert!(!'q'.is_control());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    pub fn is_control(self) -> bool {
-												Replace old tables with new unicode data

											
										
										
											2020-01-13 22:59:33 +01:00
+								        unicode::Cc(self)
-												rustfmt librustc_unicode

											
										
										
											2015-10-25 11:19:14 +01:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns `true` if this `char` has the `Grapheme_Extend` property.
-												Escape combining characters in escape_debug

											
										
										
											2018-04-12 12:39:18 +02:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// `Grapheme_Extend` is described in [Unicode Standard Annex #29 (Unicode Text
 								    /// Segmentation)][uax29] and specified in the [Unicode Character Database][ucd]
 								    /// [`DerivedCoreProperties.txt`].
 								    ///
 								    /// [uax29]: https://www.unicode.org/reports/tr29/
 								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`DerivedCoreProperties.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/DerivedCoreProperties.txt
-												Escape combining characters in escape_debug

											
										
										
											2018-04-12 12:39:18 +02:00
+								    #[inline]
-												Use Grapheme_Extend instead of Mn

											
										
										
											2018-05-17 00:19:58 +02:00
+								    pub(crate) fn is_grapheme_extended(self) -> bool {
-												Replace old tables with new unicode data

											
										
										
											2020-01-13 22:59:33 +01:00
+								        unicode::Grapheme_Extend(self)
-												Escape combining characters in escape_debug

											
										
										
											2018-04-12 12:39:18 +02:00
+								    }
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns `true` if this `char` has one of the general categories for numbers.
 								    ///
 								    /// The general categories for numbers (`Nd` for decimal digits, `Nl` for letter-like numeric
 								    /// characters, and `No` for other numeric characters) are specified in the [Unicode Character
 								    /// Database][ucd] [`UnicodeData.txt`].
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
 								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`UnicodeData.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// Basic usage:
 								    ///
 								    /// ```
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!('٣'.is_numeric());
 								    /// assert!('7'.is_numeric());
 								    /// assert!('৬'.is_numeric());
-												Treat gc=No characters as numeric

											
										
										
											2018-06-17 18:58:01 +02:00
+								    /// assert!('¾'.is_numeric());
 								    /// assert!('①'.is_numeric());
-												doc: remove needless bindings

											
										
										
											2016-03-22 22:09:43 +01:00
+								    /// assert!(!'K'.is_numeric());
 								    /// assert!(!'و'.is_numeric());
 								    /// assert!(!'藏'.is_numeric());
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    pub fn is_numeric(self) -> bool {
 								        match self {
-												migrate codebase to `..=` inclusive range patterns

These were stabilized in March 2018's #47813, and are the Preferred Way
to Do It going forward (q.v. #51043).

											
										
										
											2018-05-29 04:42:11 +02:00
+								            '0'..='9' => true,
-												Replace old tables with new unicode data

											
										
										
											2020-01-13 22:59:33 +01:00
+								            c => c > '\x7f' && unicode::N(c),
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								        }
 								    }
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns an iterator that yields the lowercase mapping of this `char` as one or more
 								    /// `char`s.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// If this `char` does not have a lowercase mapping, the iterator yields the same `char`.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// If this `char` has a one-to-one lowercase mapping given by the [Unicode Character
 								    /// Database][ucd] [`UnicodeData.txt`], the iterator yields that `char`.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`UnicodeData.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// If this `char` requires special considerations (e.g. multiple `char`s) the iterator yields
 								    /// the `char`(s) given by [`SpecialCasing.txt`].
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// [`SpecialCasing.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/SpecialCasing.txt
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// This operation performs an unconditional mapping without tailoring. That is, the conversion
 								    /// is independent of context and language.
 								    ///
 								    /// In the [Unicode Standard], Chapter 4 (Character Properties) discusses case mapping in
 								    /// general and Chapter 3 (Conformance) discusses the default algorithm for case conversion.
 								    ///
 								    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
-												doc: add examples for to_uppercase and to_lowercase

											
										
										
											2015-06-12 23:47:54 +02:00
+								    ///
 								    /// # Examples
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// As an iterator:
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												doc: add examples for to_uppercase and to_lowercase

											
										
										
											2015-06-12 23:47:54 +02:00
+								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// for c in 'İ'.to_lowercase() {
 								    ///     print!("{}", c);
 								    /// }
 								    /// println!();
 								    /// ```
 								    ///
 								    /// Using `println!` directly:
 								    ///
 								    /// ```
 								    /// println!("{}", 'İ'.to_lowercase());
 								    /// ```
 								    ///
 								    /// Both are equivalent to:
 								    ///
 								    /// ```
 								    /// println!("i\u{307}");
 								    /// ```
 								    ///
 								    /// Using `to_string`:
 								    ///
 								    /// ```
 								    /// assert_eq!('C'.to_lowercase().to_string(), "c");
-												docs: Improve char::to_{lower,upper}case examples

Collect the results to a String to make it clear that it will not always
return only one char and add examples showing that.

											
										
										
											2016-06-08 20:24:03 +02:00
+								    ///
 								    /// // Sometimes the result is more than one character:
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// assert_eq!('İ'.to_lowercase().to_string(), "i\u{307}");
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												Ammended minor documentation detail abour Unicode cases.

											
										
										
											2017-03-15 02:05:55 +01:00
+								    /// // Characters that do not have both uppercase and lowercase
 								    /// // convert into themselves.
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// assert_eq!('山'.to_lowercase().to_string(), "山");
-												doc: add examples for to_uppercase and to_lowercase

											
										
										
											2015-06-12 23:47:54 +02:00
+								    /// ```
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    pub fn to_lowercase(self) -> ToLowercase {
-												Add complex (but unconditional) Unicode case mapping. Fix #25800

As a result, the iterator returned by `char::to_uppercase` sometimes
yields two or three `char`s instead of just one.

											
										
										
											2015-06-05 17:40:09 +02:00
+								        ToLowercase(CaseMappingIter::new(conversions::to_lower(self)))
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    }
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// Returns an iterator that yields the uppercase mapping of this `char` as one or more
 								    /// `char`s.
 								    ///
 								    /// If this `char` does not have an uppercase mapping, the iterator yields the same `char`.
 								    ///
 								    /// If this `char` has a one-to-one uppercase mapping given by the [Unicode Character
 								    /// Database][ucd] [`UnicodeData.txt`], the iterator yields that `char`.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// [ucd]: https://www.unicode.org/reports/tr44/
 								    /// [`UnicodeData.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// If this `char` requires special considerations (e.g. multiple `char`s) the iterator yields
 								    /// the `char`(s) given by [`SpecialCasing.txt`].
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// [`SpecialCasing.txt`]: https://www.unicode.org/Public/UCD/latest/ucd/SpecialCasing.txt
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// This operation performs an unconditional mapping without tailoring. That is, the conversion
 								    /// is independent of context and language.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// In the [Unicode Standard], Chapter 4 (Character Properties) discusses case mapping in
 								    /// general and Chapter 3 (Conformance) discusses the default algorithm for case conversion.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    ///
-												Improve docs on some char boolean methods

											
										
										
											2019-10-06 15:59:49 +02:00
+								    /// [Unicode Standard]: https://www.unicode.org/versions/latest/
-												doc: add examples for to_uppercase and to_lowercase

											
										
										
											2015-06-12 23:47:54 +02:00
+								    ///
 								    /// # Examples
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// As an iterator:
 								    ///
 								    /// ```
 								    /// for c in 'ß'.to_uppercase() {
 								    ///     print!("{}", c);
 								    /// }
 								    /// println!();
 								    /// ```
 								    ///
 								    /// Using `println!` directly:
 								    ///
 								    /// ```
 								    /// println!("{}", 'ß'.to_uppercase());
 								    /// ```
 								    ///
 								    /// Both are equivalent to:
 								    ///
 								    /// ```
 								    /// println!("SS");
 								    /// ```
 								    ///
 								    /// Using `to_string`:
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// assert_eq!('c'.to_uppercase().to_string(), "C");
-												docs: Improve char::to_{lower,upper}case examples

Collect the results to a String to make it clear that it will not always
return only one char and add examples showing that.

											
										
										
											2016-06-08 20:24:03 +02:00
+								    ///
 								    /// // Sometimes the result is more than one character:
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// assert_eq!('ß'.to_uppercase().to_string(), "SS");
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												Ammended minor documentation detail abour Unicode cases.

											
										
										
											2017-03-15 02:05:55 +01:00
+								    /// // Characters that do not have both uppercase and lowercase
 								    /// // convert into themselves.
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// assert_eq!('山'.to_uppercase().to_string(), "山");
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
 								    ///
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// # Note on locale
 								    ///
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// In Turkish, the equivalent of 'i' in Latin has five forms instead of two:
 								    ///
 								    /// * 'Dotless': I / ı, sometimes written ï
 								    /// * 'Dotted': İ / i
 								    ///
 								    /// Note that the lowercase dotted 'i' is the same as the Latin. Therefore:
 								    ///
 								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// let upper_i = 'i'.to_uppercase().to_string();
-												doc: add examples for to_uppercase and to_lowercase

											
										
										
											2015-06-12 23:47:54 +02:00
+								    /// ```
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
 								    /// The value of `upper_i` here relies on the language of the text: if we're
-												docs: Improve char::to_{lower,upper}case examples

Collect the results to a String to make it clear that it will not always
return only one char and add examples showing that.

											
										
										
											2016-06-08 20:24:03 +02:00
+								    /// in `en-US`, it should be `"I"`, but if we're in `tr_TR`, it should
 								    /// be `"İ"`. `to_uppercase()` does not take this into account, and so:
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												doc: add examples for to_uppercase and to_lowercase

											
										
										
											2015-06-12 23:47:54 +02:00
+								    /// ```
-												Implement Display for char Escape*, To*case.

											
										
										
											2017-01-07 19:16:03 +01:00
+								    /// let upper_i = 'i'.to_uppercase().to_string();
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    ///
-												docs: Improve char::to_{lower,upper}case examples

Collect the results to a String to make it clear that it will not always
return only one char and add examples showing that.

											
										
										
											2016-06-08 20:24:03 +02:00
+								    /// assert_eq!(upper_i, "I");
-												Write a bunch of docs for char

Mostly adding examples, and reformatting for consistency.

											
										
										
											2015-10-06 00:09:31 +02:00
+								    /// ```
 								    ///
 								    /// holds across languages.
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    #[stable(feature = "rust1", since = "1.0.0")]
-												libunicode: Partially inline the fast paths in character class checking.

											
										
										
											2015-03-19 01:36:34 +01:00
+								    #[inline]
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    pub fn to_uppercase(self) -> ToUppercase {
-												Add complex (but unconditional) Unicode case mapping. Fix #25800

As a result, the iterator returned by `char::to_uppercase` sometimes
yields two or three `char`s instead of just one.

											
										
										
											2015-06-05 17:40:09 +02:00
+								        ToUppercase(CaseMappingIter::new(conversions::to_upper(self)))
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								    }
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
 								    /// Checks if the value is within the ASCII range.
 								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let ascii = 'a';
 								    /// let non_ascii = '❤';
 								    ///
 								    /// assert!(ascii.is_ascii());
 								    /// assert!(!non_ascii.is_ascii());
 								    /// ```
-												Mark ascii methods on primitive types stable in 1.23.0.

The ascii_methods_on_intrinsics feature stabilization
didn't land in time for 1.21.0. Update the annotation
so the documentation is correct about when these
methods became available.

											
										
										
											2017-11-30 20:20:11 +01:00
+								    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
-												Propagate cfg bootstrap

											
										
										
											2019-12-18 18:00:59 +01:00
+								    #[rustc_const_stable(feature = "const_ascii_methods_on_intrinsics", since = "1.32.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												constify parts of libcore.

											
										
										
											2018-10-23 02:04:14 +02:00
+								    pub const fn is_ascii(&self) -> bool {
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								        *self as u32 <= 0x7F
 								    }
 								    /// Makes a copy of the value in its ASCII upper case equivalent.
 								    ///
 								    /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
 								    /// but non-ASCII letters are unchanged.
 								    ///
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// To uppercase the value in-place, use [`make_ascii_uppercase()`].
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// To uppercase ASCII characters in addition to non-ASCII characters, use
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// [`to_uppercase()`].
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let ascii = 'a';
 								    /// let non_ascii = '❤';
 								    ///
 								    /// assert_eq!('A', ascii.to_ascii_uppercase());
 								    /// assert_eq!('❤', non_ascii.to_ascii_uppercase());
 								    /// ```
 								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`make_ascii_uppercase()`]: #method.make_ascii_uppercase
 								    /// [`to_uppercase()`]: #method.to_uppercase
-												Mark ascii methods on primitive types stable in 1.23.0.

The ascii_methods_on_intrinsics feature stabilization
didn't land in time for 1.21.0. Update the annotation
so the documentation is correct about when these
methods became available.

											
										
										
											2017-11-30 20:20:11 +01:00
+								    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
-												Update since attributes for new const_ascii_methods_on_intrinsics to 1.52.0

											
										
										
											2021-02-14 00:17:44 +01:00
+								    #[rustc_const_stable(feature = "const_ascii_methods_on_intrinsics", since = "1.52.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make char methods const

`escape_unicode`, `escape_default`, `len_utf8`, `len_utf16`, to_ascii_lowercase`, `eq_ignore_ascii_case`

`u8` methods `to_ascii_lowercase`, `to_ascii_uppercase` also must be made const

u8 methods made const

Update methods.rs

Update mod.rs

Update methods.rs

Fix `since` in rustc_const_stable to next stable

Fix `since` in rustc_const_stable to next stable

Update methods.rs

Update mod.rs

											
										
										
											2020-11-30 03:16:31 +01:00
+								    pub const fn to_ascii_uppercase(&self) -> char {
-												Slightly more explicit

											
										
										
											2021-02-12 14:42:42 +01:00
+								        if self.is_ascii_lowercase() {
 								            (*self as u8).ascii_change_case_unchecked() as char
 								        } else {
 								            *self
 								        }
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Makes a copy of the value in its ASCII lower case equivalent.
 								    ///
 								    /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z',
 								    /// but non-ASCII letters are unchanged.
 								    ///
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// To lowercase the value in-place, use [`make_ascii_lowercase()`].
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// To lowercase ASCII characters in addition to non-ASCII characters, use
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// [`to_lowercase()`].
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let ascii = 'A';
 								    /// let non_ascii = '❤';
 								    ///
 								    /// assert_eq!('a', ascii.to_ascii_lowercase());
 								    /// assert_eq!('❤', non_ascii.to_ascii_lowercase());
 								    /// ```
 								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`make_ascii_lowercase()`]: #method.make_ascii_lowercase
 								    /// [`to_lowercase()`]: #method.to_lowercase
-												Mark ascii methods on primitive types stable in 1.23.0.

The ascii_methods_on_intrinsics feature stabilization
didn't land in time for 1.21.0. Update the annotation
so the documentation is correct about when these
methods became available.

											
										
										
											2017-11-30 20:20:11 +01:00
+								    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
-												Update since attributes for new const_ascii_methods_on_intrinsics to 1.52.0

											
										
										
											2021-02-14 00:17:44 +01:00
+								    #[rustc_const_stable(feature = "const_ascii_methods_on_intrinsics", since = "1.52.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make char methods const

`escape_unicode`, `escape_default`, `len_utf8`, `len_utf16`, to_ascii_lowercase`, `eq_ignore_ascii_case`

`u8` methods `to_ascii_lowercase`, `to_ascii_uppercase` also must be made const

u8 methods made const

Update methods.rs

Update mod.rs

Update methods.rs

Fix `since` in rustc_const_stable to next stable

Fix `since` in rustc_const_stable to next stable

Update methods.rs

Update mod.rs

											
										
										
											2020-11-30 03:16:31 +01:00
+								    pub const fn to_ascii_lowercase(&self) -> char {
-												Slightly more explicit

											
										
										
											2021-02-12 14:42:42 +01:00
+								        if self.is_ascii_uppercase() {
 								            (*self as u8).ascii_change_case_unchecked() as char
 								        } else {
 								            *self
 								        }
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks that two values are an ASCII case-insensitive match.
 								    ///
 								    /// Equivalent to `to_ascii_lowercase(a) == to_ascii_lowercase(b)`.
 								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let upper_a = 'A';
 								    /// let lower_a = 'a';
 								    /// let lower_z = 'z';
 								    ///
 								    /// assert!(upper_a.eq_ignore_ascii_case(&lower_a));
 								    /// assert!(upper_a.eq_ignore_ascii_case(&upper_a));
 								    /// assert!(!upper_a.eq_ignore_ascii_case(&lower_z));
 								    /// ```
-												Mark ascii methods on primitive types stable in 1.23.0.

The ascii_methods_on_intrinsics feature stabilization
didn't land in time for 1.21.0. Update the annotation
so the documentation is correct about when these
methods became available.

											
										
										
											2017-11-30 20:20:11 +01:00
+								    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
-												Update since attributes for new const_ascii_methods_on_intrinsics to 1.52.0

											
										
										
											2021-02-14 00:17:44 +01:00
+								    #[rustc_const_stable(feature = "const_ascii_methods_on_intrinsics", since = "1.52.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make char methods const

`escape_unicode`, `escape_default`, `len_utf8`, `len_utf16`, to_ascii_lowercase`, `eq_ignore_ascii_case`

`u8` methods `to_ascii_lowercase`, `to_ascii_uppercase` also must be made const

u8 methods made const

Update methods.rs

Update mod.rs

Update methods.rs

Fix `since` in rustc_const_stable to next stable

Fix `since` in rustc_const_stable to next stable

Update methods.rs

Update mod.rs

											
										
										
											2020-11-30 03:16:31 +01:00
+								    pub const fn eq_ignore_ascii_case(&self, other: &char) -> bool {
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								        self.to_ascii_lowercase() == other.to_ascii_lowercase()
 								    }
 								    /// Converts this type to its ASCII upper case equivalent in-place.
 								    ///
 								    /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
 								    /// but non-ASCII letters are unchanged.
 								    ///
 								    /// To return a new uppercased value without modifying the existing one, use
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// [`to_ascii_uppercase()`].
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let mut ascii = 'a';
 								    ///
 								    /// ascii.make_ascii_uppercase();
 								    ///
 								    /// assert_eq!('A', ascii);
 								    /// ```
 								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`to_ascii_uppercase()`]: #method.to_ascii_uppercase
-												Mark ascii methods on primitive types stable in 1.23.0.

The ascii_methods_on_intrinsics feature stabilization
didn't land in time for 1.21.0. Update the annotation
so the documentation is correct about when these
methods became available.

											
										
										
											2017-11-30 20:20:11 +01:00
+								    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
 								    pub fn make_ascii_uppercase(&mut self) {
 								        *self = self.to_ascii_uppercase();
 								    }
 								    /// Converts this type to its ASCII lower case equivalent in-place.
 								    ///
 								    /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z',
 								    /// but non-ASCII letters are unchanged.
 								    ///
 								    /// To return a new lowercased value without modifying the existing one, use
-												Intra doc links for the char primitive

											
										
										
											2020-10-13 00:18:41 +02:00
+								    /// [`to_ascii_lowercase()`].
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let mut ascii = 'A';
 								    ///
 								    /// ascii.make_ascii_lowercase();
 								    ///
 								    /// assert_eq!('a', ascii);
 								    /// ```
 								    ///
-												Back to #method for links on char

											
										
										
											2020-11-19 14:55:57 +01:00
+								    /// [`to_ascii_lowercase()`]: #method.to_ascii_lowercase
-												Mark ascii methods on primitive types stable in 1.23.0.

The ascii_methods_on_intrinsics feature stabilization
didn't land in time for 1.21.0. Update the annotation
so the documentation is correct about when these
methods became available.

											
										
										
											2017-11-30 20:20:11 +01:00
+								    #[stable(feature = "ascii_methods_on_intrinsics", since = "1.23.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
 								    pub fn make_ascii_lowercase(&mut self) {
 								        *self = self.to_ascii_lowercase();
 								    }
 								    /// Checks if the value is an ASCII alphabetic character:
 								    ///
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// - U+0041 'A' ..= U+005A 'Z', or
 								    /// - U+0061 'a' ..= U+007A 'z'.
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(uppercase_a.is_ascii_alphabetic());
 								    /// assert!(uppercase_g.is_ascii_alphabetic());
 								    /// assert!(a.is_ascii_alphabetic());
 								    /// assert!(g.is_ascii_alphabetic());
 								    /// assert!(!zero.is_ascii_alphabetic());
 								    /// assert!(!percent.is_ascii_alphabetic());
 								    /// assert!(!space.is_ascii_alphabetic());
 								    /// assert!(!lf.is_ascii_alphabetic());
 								    /// assert!(!esc.is_ascii_alphabetic());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_alphabetic(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, 'A'..='Z' | 'a'..='z')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII uppercase character:
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// U+0041 'A' ..= U+005A 'Z'.
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(uppercase_a.is_ascii_uppercase());
 								    /// assert!(uppercase_g.is_ascii_uppercase());
 								    /// assert!(!a.is_ascii_uppercase());
 								    /// assert!(!g.is_ascii_uppercase());
 								    /// assert!(!zero.is_ascii_uppercase());
 								    /// assert!(!percent.is_ascii_uppercase());
 								    /// assert!(!space.is_ascii_uppercase());
 								    /// assert!(!lf.is_ascii_uppercase());
 								    /// assert!(!esc.is_ascii_uppercase());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_uppercase(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, 'A'..='Z')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII lowercase character:
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// U+0061 'a' ..= U+007A 'z'.
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(!uppercase_a.is_ascii_lowercase());
 								    /// assert!(!uppercase_g.is_ascii_lowercase());
 								    /// assert!(a.is_ascii_lowercase());
 								    /// assert!(g.is_ascii_lowercase());
 								    /// assert!(!zero.is_ascii_lowercase());
 								    /// assert!(!percent.is_ascii_lowercase());
 								    /// assert!(!space.is_ascii_lowercase());
 								    /// assert!(!lf.is_ascii_lowercase());
 								    /// assert!(!esc.is_ascii_lowercase());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_lowercase(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, 'a'..='z')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII alphanumeric character:
 								    ///
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// - U+0041 'A' ..= U+005A 'Z', or
 								    /// - U+0061 'a' ..= U+007A 'z', or
 								    /// - U+0030 '0' ..= U+0039 '9'.
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(uppercase_a.is_ascii_alphanumeric());
 								    /// assert!(uppercase_g.is_ascii_alphanumeric());
 								    /// assert!(a.is_ascii_alphanumeric());
 								    /// assert!(g.is_ascii_alphanumeric());
 								    /// assert!(zero.is_ascii_alphanumeric());
 								    /// assert!(!percent.is_ascii_alphanumeric());
 								    /// assert!(!space.is_ascii_alphanumeric());
 								    /// assert!(!lf.is_ascii_alphanumeric());
 								    /// assert!(!esc.is_ascii_alphanumeric());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_alphanumeric(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, '0'..='9' | 'A'..='Z' | 'a'..='z')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII decimal digit:
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// U+0030 '0' ..= U+0039 '9'.
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(!uppercase_a.is_ascii_digit());
 								    /// assert!(!uppercase_g.is_ascii_digit());
 								    /// assert!(!a.is_ascii_digit());
 								    /// assert!(!g.is_ascii_digit());
 								    /// assert!(zero.is_ascii_digit());
 								    /// assert!(!percent.is_ascii_digit());
 								    /// assert!(!space.is_ascii_digit());
 								    /// assert!(!lf.is_ascii_digit());
 								    /// assert!(!esc.is_ascii_digit());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_digit(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, '0'..='9')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII hexadecimal digit:
 								    ///
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// - U+0030 '0' ..= U+0039 '9', or
 								    /// - U+0041 'A' ..= U+0046 'F', or
 								    /// - U+0061 'a' ..= U+0066 'f'.
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(uppercase_a.is_ascii_hexdigit());
 								    /// assert!(!uppercase_g.is_ascii_hexdigit());
 								    /// assert!(a.is_ascii_hexdigit());
 								    /// assert!(!g.is_ascii_hexdigit());
 								    /// assert!(zero.is_ascii_hexdigit());
 								    /// assert!(!percent.is_ascii_hexdigit());
 								    /// assert!(!space.is_ascii_hexdigit());
 								    /// assert!(!lf.is_ascii_hexdigit());
 								    /// assert!(!esc.is_ascii_hexdigit());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_hexdigit(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, '0'..='9' | 'A'..='F' | 'a'..='f')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII punctuation character:
 								    ///
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// - U+0021 ..= U+002F `! " # $ % & ' ( ) * + , - . /`, or
 								    /// - U+003A ..= U+0040 `: ; < = > ? @`, or
 								    /// - U+005B ..= U+0060 ``[ \ ] ^ _ ` ``, or
 								    /// - U+007B ..= U+007E `{ | } ~`
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(!uppercase_a.is_ascii_punctuation());
 								    /// assert!(!uppercase_g.is_ascii_punctuation());
 								    /// assert!(!a.is_ascii_punctuation());
 								    /// assert!(!g.is_ascii_punctuation());
 								    /// assert!(!zero.is_ascii_punctuation());
 								    /// assert!(percent.is_ascii_punctuation());
 								    /// assert!(!space.is_ascii_punctuation());
 								    /// assert!(!lf.is_ascii_punctuation());
 								    /// assert!(!esc.is_ascii_punctuation());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_punctuation(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, '!'..='/' | ':'..='@' | '['..='`' | '{'..='~')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII graphic character:
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// U+0021 '!' ..= U+007E '~'.
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(uppercase_a.is_ascii_graphic());
 								    /// assert!(uppercase_g.is_ascii_graphic());
 								    /// assert!(a.is_ascii_graphic());
 								    /// assert!(g.is_ascii_graphic());
 								    /// assert!(zero.is_ascii_graphic());
 								    /// assert!(percent.is_ascii_graphic());
 								    /// assert!(!space.is_ascii_graphic());
 								    /// assert!(!lf.is_ascii_graphic());
 								    /// assert!(!esc.is_ascii_graphic());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_graphic(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, '!'..='~')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII whitespace character:
 								    /// U+0020 SPACE, U+0009 HORIZONTAL TAB, U+000A LINE FEED,
 								    /// U+000C FORM FEED, or U+000D CARRIAGE RETURN.
 								    ///
 								    /// Rust uses the WhatWG Infra Standard's [definition of ASCII
 								    /// whitespace][infra-aw]. There are several other definitions in
 								    /// wide use. For instance, [the POSIX locale][pct] includes
 								    /// U+000B VERTICAL TAB as well as all the above characters,
 								    /// but—from the very same specification—[the default rule for
 								    /// "field splitting" in the Bourne shell][bfs] considers *only*
 								    /// SPACE, HORIZONTAL TAB, and LINE FEED as whitespace.
 								    ///
 								    /// If you are writing a program that will process an existing
 								    /// file format, check what that format's definition of whitespace is
 								    /// before using this function.
 								    ///
 								    /// [infra-aw]: https://infra.spec.whatwg.org/#ascii-whitespace
 								    /// [pct]: http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap07.html#tag_07_03_01
 								    /// [bfs]: http://pubs.opengroup.org/onlinepubs/9699919799/utilities/V3_chap02.html#tag_18_06_05
 								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(!uppercase_a.is_ascii_whitespace());
 								    /// assert!(!uppercase_g.is_ascii_whitespace());
 								    /// assert!(!a.is_ascii_whitespace());
 								    /// assert!(!g.is_ascii_whitespace());
 								    /// assert!(!zero.is_ascii_whitespace());
 								    /// assert!(!percent.is_ascii_whitespace());
 								    /// assert!(space.is_ascii_whitespace());
 								    /// assert!(lf.is_ascii_whitespace());
 								    /// assert!(!esc.is_ascii_whitespace());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_whitespace(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, '\t' | '\n' | '\x0C' | '\r' | ' ')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
 								    /// Checks if the value is an ASCII control character:
-												Change `...` to `..=` where applicable

											
										
										
											2019-06-14 19:24:38 +02:00
+								    /// U+0000 NUL ..= U+001F UNIT SEPARATOR, or U+007F DELETE.
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    /// Note that most ASCII whitespace characters are control
 								    /// characters, but SPACE is not.
 								    ///
 								    /// # Examples
 								    ///
 								    /// ```
 								    /// let uppercase_a = 'A';
 								    /// let uppercase_g = 'G';
 								    /// let a = 'a';
 								    /// let g = 'g';
 								    /// let zero = '0';
 								    /// let percent = '%';
 								    /// let space = ' ';
 								    /// let lf = '\n';
 								    /// let esc: char = 0x1b_u8.into();
 								    ///
 								    /// assert!(!uppercase_a.is_ascii_control());
 								    /// assert!(!uppercase_g.is_ascii_control());
 								    /// assert!(!a.is_ascii_control());
 								    /// assert!(!g.is_ascii_control());
 								    /// assert!(!zero.is_ascii_control());
 								    /// assert!(!percent.is_ascii_control());
 								    /// assert!(!space.is_ascii_control());
 								    /// assert!(lf.is_ascii_control());
 								    /// assert!(esc.is_ascii_control());
 								    /// ```
-												Change `since` attribute from ctype methods from 1.23 to 1.24

The changes didn't land in time for 1.23 and stabilizations won't
be backported to beta.

											
										
										
											2017-11-28 08:50:40 +01:00
+								    #[stable(feature = "ascii_ctype_on_intrinsics", since = "1.24.0")]
-												mark methods as constant since 1.47.0 instead of 1.46.0

											
										
										
											2020-07-22 09:16:16 +02:00
+								    #[rustc_const_stable(feature = "const_ascii_ctype_on_intrinsics", since = "1.47.0")]
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    #[inline]
-												Make the ASCII ctype inherent methods const

											
										
										
											2020-02-09 06:29:16 +01:00
+								    pub const fn is_ascii_control(&self) -> bool {
-												Use matches! for core::char methods
											
										
										
											2020-10-05 16:29:07 +02:00
+								        matches!(*self, '\0'..='\x1F' | '\x7F')
-												Copy `AsciiExt` methods to `char` directly

This is done in order to deprecate AsciiExt eventually.

											
										
										
											2017-09-28 17:04:38 +02:00
+								    }
-												impl char

											
										
										
											2015-03-11 05:13:16 +01:00
+								}
-												expose char::encode_utf8_raw for libstd

											
										
										
											2020-05-30 11:49:31 +02:00
 								#[inline]
-												Make char methods const

`escape_unicode`, `escape_default`, `len_utf8`, `len_utf16`, to_ascii_lowercase`, `eq_ignore_ascii_case`

`u8` methods `to_ascii_lowercase`, `to_ascii_uppercase` also must be made const

u8 methods made const

Update methods.rs

Update mod.rs

Update methods.rs

Fix `since` in rustc_const_stable to next stable

Fix `since` in rustc_const_stable to next stable

Update methods.rs

Update mod.rs

											
										
										
											2020-11-30 03:16:31 +01:00
+								const fn len_utf8(code: u32) -> usize {
-												expose char::encode_utf8_raw for libstd

											
										
										
											2020-05-30 11:49:31 +02:00
+								    if code < MAX_ONE_B {
 
 								    } else if code < MAX_TWO_B {
 
 								    } else if code < MAX_THREE_B {
 
 								    } else {
 
 								    }
 								}
 								/// Encodes a raw u32 value as UTF-8 into the provided byte buffer,
 								/// and then returns the subslice of the buffer that contains the encoded character.
 								///
-												encode_utf8_raw is not always valid UTF-8; clarify comments

											
										
										
											2020-05-30 17:13:07 +02:00
+								/// Unlike `char::encode_utf8`, this method also handles codepoints in the surrogate range.
 								/// (Creating a `char` in the surrogate range is UB.)
 								/// The result is valid [generalized UTF-8] but not valid UTF-8.
 								///
 								/// [generalized UTF-8]: https://simonsapin.github.io/wtf-8/#generalized-utf8
-												expose char::encode_utf8_raw for libstd

											
										
										
											2020-05-30 11:49:31 +02:00
+								///
 								/// # Panics
 								///
 								/// Panics if the buffer is not large enough.
 								/// A buffer of length four is large enough to encode any `char`.
 								#[unstable(feature = "char_internals", reason = "exposed only for libstd", issue = "none")]
 								#[doc(hidden)]
 								#[inline]
-												encode_utf8_raw is not always valid UTF-8; clarify comments

											
										
										
											2020-05-30 17:13:07 +02:00
+								pub fn encode_utf8_raw(code: u32, dst: &mut [u8]) -> &mut [u8] {
-												expose char::encode_utf8_raw for libstd

											
										
										
											2020-05-30 11:49:31 +02:00
+								    let len = len_utf8(code);
 								    match (len, &mut dst[..]) {
 								        (1, [a, ..]) => {
 								            *a = code as u8;
 								        }
 								        (2, [a, b, ..]) => {
 								            *a = (code >> 6 & 0x1F) as u8 | TAG_TWO_B;
 								            *b = (code & 0x3F) as u8 | TAG_CONT;
 								        }
 								        (3, [a, b, c, ..]) => {
 								            *a = (code >> 12 & 0x0F) as u8 | TAG_THREE_B;
 								            *b = (code >> 6 & 0x3F) as u8 | TAG_CONT;
 								            *c = (code & 0x3F) as u8 | TAG_CONT;
 								        }
 								        (4, [a, b, c, d, ..]) => {
 								            *a = (code >> 18 & 0x07) as u8 | TAG_FOUR_B;
 								            *b = (code >> 12 & 0x3F) as u8 | TAG_CONT;
 								            *c = (code >> 6 & 0x3F) as u8 | TAG_CONT;
 								            *d = (code & 0x3F) as u8 | TAG_CONT;
 								        }
 								        _ => panic!(
 								            "encode_utf8: need {} bytes to encode U+{:X}, but the buffer has {}",
 								            len,
 								            code,
 								            dst.len(),
 								        ),
 								    };
-												encode_utf8_raw is not always valid UTF-8; clarify comments

											
										
										
											2020-05-30 17:13:07 +02:00
+								    &mut dst[..len]
-												expose char::encode_utf8_raw for libstd

											
										
										
											2020-05-30 11:49:31 +02:00
+								}
-												also expose and use encode_utf16_raw for wtf8

											
										
										
											2020-05-30 12:08:55 +02:00
 								/// Encodes a raw u32 value as UTF-16 into the provided `u16` buffer,
 								/// and then returns the subslice of the buffer that contains the encoded character.
 								///
-												encode_utf8_raw is not always valid UTF-8; clarify comments

											
										
										
											2020-05-30 17:13:07 +02:00
+								/// Unlike `char::encode_utf16`, this method also handles codepoints in the surrogate range.
 								/// (Creating a `char` in the surrogate range is UB.)
-												also expose and use encode_utf16_raw for wtf8

											
										
										
											2020-05-30 12:08:55 +02:00
+								///
 								/// # Panics
 								///
 								/// Panics if the buffer is not large enough.
 								/// A buffer of length 2 is large enough to encode any `char`.
 								#[unstable(feature = "char_internals", reason = "exposed only for libstd", issue = "none")]
 								#[doc(hidden)]
 								#[inline]
 								pub fn encode_utf16_raw(mut code: u32, dst: &mut [u16]) -> &mut [u16] {
 								    // SAFETY: each arm checks whether there are enough bits to write into
 								    unsafe {
 								        if (code & 0xFFFF) == code && !dst.is_empty() {
-												encode_utf8_raw is not always valid UTF-8; clarify comments

											
										
										
											2020-05-30 17:13:07 +02:00
+								            // The BMP falls through
-												also expose and use encode_utf16_raw for wtf8

											
										
										
											2020-05-30 12:08:55 +02:00
+								            *dst.get_unchecked_mut(0) = code as u16;
 								            slice::from_raw_parts_mut(dst.as_mut_ptr(), 1)
 								        } else if dst.len() >= 2 {
 								            // Supplementary planes break into surrogates.
 								            code -= 0x1_0000;
 								            *dst.get_unchecked_mut(0) = 0xD800 | ((code >> 10) as u16);
 								            *dst.get_unchecked_mut(1) = 0xDC00 | ((code as u16) & 0x3FF);
 								            slice::from_raw_parts_mut(dst.as_mut_ptr(), 2)
 								        } else {
 								            panic!(
 								                "encode_utf16: need {} units to encode U+{:X}, but the buffer has {}",
 								                from_u32_unchecked(code).len_utf16(),
 								                code,
 								                dst.len(),
 								            )
 								        }
 								    }
 								}