rust/src/libstd/ascii.rs

// Copyright 2013-2014 The Rust Project Developers. See the COPYRIGHT
// file at the top-level directory of this distribution and at
// http://rust-lang.org/COPYRIGHT.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
//
// ignore-lexer-test FIXME #15679

//! Operations on ASCII strings and characters

#![unstable = "unsure about placement and naming"]
#![allow(deprecated)]

use core::kinds::Sized;
use iter::IteratorExt;
use ops::FnMut;
use slice::SliceExt;
use str::StrExt;
use string::String;
use vec::Vec;

/// Extension methods for ASCII-subset only operations on owned strings
///
/// Every method takes `self` by value and hands back a value of the same
/// type. In this file the trait is implemented for `String` and `Vec<u8>`;
/// the `Vec<u8>` implementation rewrites the bytes in place.
#[experimental = "would prefer to do this in a more general way"]
pub trait OwnedAsciiExt {
    /// Convert the string to ASCII upper case:
    /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
    /// but non-ASCII letters are unchanged.
    ///
    /// Consumes `self` and returns the converted value.
    fn into_ascii_uppercase(self) -> Self;

    /// Convert the string to ASCII lower case:
    /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z',
    /// but non-ASCII letters are unchanged.
    ///
    /// Consumes `self` and returns the converted value.
    fn into_ascii_lowercase(self) -> Self;
}

/// Extension methods for ASCII-subset only operations on string slices
///
/// The type parameter `T` is the type returned by the copying conversions
/// (`to_ascii_uppercase` / `to_ascii_lowercase`). It defaults to `Self`,
/// which is what the `u8` and `char` implementations in this file use; the
/// unsized implementors name an owned type instead (`String` for `str`,
/// `Vec<u8>` for `[u8]`). The `for Sized?` bound is what allows the trait
/// to be implemented for those unsized types.
#[experimental = "would prefer to do this in a more general way"]
pub trait AsciiExt<T = Self> for Sized? {
    /// Check if within the ASCII range.
    ///
    /// For the slice implementations in this file this means that every
    /// byte of the slice is within the ASCII range.
    fn is_ascii(&self) -> bool;

    /// Makes a copy of the string in ASCII upper case:
    /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
    /// but non-ASCII letters are unchanged.
    fn to_ascii_uppercase(&self) -> T;

    /// Makes a copy of the string in ASCII lower case:
    /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z',
    /// but non-ASCII letters are unchanged.
    fn to_ascii_lowercase(&self) -> T;

    /// Check that two strings are an ASCII case-insensitive match.
    /// Same as `to_ascii_lowercase(a) == to_ascii_lowercase(b)`,
    /// but without allocating and copying temporary strings.
    fn eq_ignore_ascii_case(&self, other: &Self) -> bool;
}

#[experimental = "would prefer to do this in a more general way"]
impl AsciiExt<String> for str {
    /// A string slice is ASCII exactly when each of its bytes is ASCII.
    #[inline]
    fn is_ascii(&self) -> bool {
        // Hand the check to the byte-slice implementation.
        self.as_bytes().is_ascii()
    }

    /// Returns a newly allocated `String` with 'a'..'z' upper-cased.
    #[inline]
    fn to_ascii_uppercase(&self) -> String {
        let upper: Vec<u8> = self.as_bytes().to_ascii_uppercase();
        // The byte-level conversion only rewrites bytes below 0x80, so the
        // buffer is still valid UTF-8 and the unchecked constructor is sound.
        unsafe { String::from_utf8_unchecked(upper) }
    }

    /// Returns a newly allocated `String` with 'A'..'Z' lower-cased.
    #[inline]
    fn to_ascii_lowercase(&self) -> String {
        let lower: Vec<u8> = self.as_bytes().to_ascii_lowercase();
        // The byte-level conversion only rewrites bytes below 0x80, so the
        // buffer is still valid UTF-8 and the unchecked constructor is sound.
        unsafe { String::from_utf8_unchecked(lower) }
    }

    /// Compares the two slices byte by byte, ignoring ASCII case only.
    #[inline]
    fn eq_ignore_ascii_case(&self, other: &str) -> bool {
        let (lhs, rhs) = (self.as_bytes(), other.as_bytes());
        lhs.eq_ignore_ascii_case(rhs)
    }
}

#[experimental = "would prefer to do this in a more general way"]
impl OwnedAsciiExt for String {
    /// Upper-cases 'a'..'z' by converting the string's own byte buffer.
    #[inline]
    fn into_ascii_uppercase(self) -> String {
        let upper: Vec<u8> = self.into_bytes().into_ascii_uppercase();
        // Bytes at or above 0x80 map to themselves, so multi-byte UTF-8
        // sequences survive untouched and the result is still valid UTF-8.
        unsafe { String::from_utf8_unchecked(upper) }
    }

    /// Lower-cases 'A'..'Z' by converting the string's own byte buffer.
    #[inline]
    fn into_ascii_lowercase(self) -> String {
        let lower: Vec<u8> = self.into_bytes().into_ascii_lowercase();
        // Bytes at or above 0x80 map to themselves, so multi-byte UTF-8
        // sequences survive untouched and the result is still valid UTF-8.
        unsafe { String::from_utf8_unchecked(lower) }
    }
}

#[experimental = "would prefer to do this in a more general way"]
impl AsciiExt<Vec<u8>> for [u8] {
    /// True when every byte of the slice is ASCII (vacuously true if empty).
    #[inline]
    fn is_ascii(&self) -> bool {
        self.iter().all(|&byte| byte.is_ascii())
    }

    /// Builds a new vector holding the upper-cased image of each byte.
    #[inline]
    fn to_ascii_uppercase(&self) -> Vec<u8> {
        let mut upper = Vec::with_capacity(self.len());
        for &byte in self.iter() {
            upper.push(ASCII_UPPER_MAP[byte as uint]);
        }
        upper
    }

    /// Builds a new vector holding the lower-cased image of each byte.
    #[inline]
    fn to_ascii_lowercase(&self) -> Vec<u8> {
        let mut lower = Vec::with_capacity(self.len());
        for &byte in self.iter() {
            lower.push(ASCII_LOWER_MAP[byte as uint]);
        }
        lower
    }

    /// Slices match when they have equal length and every pair of bytes
    /// agrees after ASCII lower-casing.
    #[inline]
    fn eq_ignore_ascii_case(&self, other: &[u8]) -> bool {
        // Different lengths can never match; bail out before comparing bytes.
        if self.len() != other.len() {
            return false;
        }
        self.iter().zip(other.iter()).all(|(&lhs, &rhs)| {
            ASCII_LOWER_MAP[lhs as uint] == ASCII_LOWER_MAP[rhs as uint]
        })
    }
}

#[experimental = "would prefer to do this in a more general way"]
impl OwnedAsciiExt for Vec<u8> {
    /// Upper-cases 'a'..'z' in place and returns the same vector.
    #[inline]
    fn into_ascii_uppercase(mut self) -> Vec<u8> {
        for slot in self.iter_mut() {
            let upper = ASCII_UPPER_MAP[*slot as uint];
            *slot = upper;
        }
        self
    }

    /// Lower-cases 'A'..'Z' in place and returns the same vector.
    #[inline]
    fn into_ascii_lowercase(mut self) -> Vec<u8> {
        for slot in self.iter_mut() {
            let lower = ASCII_LOWER_MAP[*slot as uint];
            *slot = lower;
        }
        self
    }
}

#[experimental = "would prefer to do this in a more general way"]
impl AsciiExt for u8 {
    /// ASCII is the range 0x00..0x7f, i.e. every byte with the high bit clear.
    #[inline]
    fn is_ascii(&self) -> bool {
        *self <= 0x7f
    }

    /// Looks the byte up in the upper-casing table.
    #[inline]
    fn to_ascii_uppercase(&self) -> u8 {
        let index = *self as uint;
        ASCII_UPPER_MAP[index]
    }

    /// Looks the byte up in the lower-casing table.
    #[inline]
    fn to_ascii_lowercase(&self) -> u8 {
        let index = *self as uint;
        ASCII_LOWER_MAP[index]
    }

    /// Two bytes match when their lower-cased images are equal.
    #[inline]
    fn eq_ignore_ascii_case(&self, other: &u8) -> bool {
        let (lhs, rhs) = (*self as uint, *other as uint);
        ASCII_LOWER_MAP[lhs] == ASCII_LOWER_MAP[rhs]
    }
}

#[experimental = "would prefer to do this in a more general way"]
impl AsciiExt for char {
    #[inline]
    fn is_ascii(&self) -> bool {
        *self as u32 <= 0x7F
    }

    #[inline]
    fn to_ascii_uppercase(&self) -> char {
        if self.is_ascii() {
            ASCII_UPPER_MAP[*self as uint] as char
        } else {
            *self
        }
    }

    #[inline]
    fn to_ascii_lowercase(&self) -> char {
        if self.is_ascii() {
            ASCII_UPPER_MAP[*self as uint] as char
        } else {
            *self
        }
    }

    #[inline]
    fn eq_ignore_ascii_case(&self, other: &char) -> bool {
        self.to_ascii_lowercase() == other.to_ascii_lowercase()
    }
}

/// Produces the 'default' ASCII, C++11-like literal escape of a single `u8`.
///
/// The escaped form is not returned; instead `f` is invoked once for every
/// output byte, in order. The escaping is biased toward literals that are
/// accepted by a variety of languages, including C++11 and similar C-family
/// languages. The exact rules are:
///
/// - Tab, CR and LF become '\t', '\r' and '\n' respectively.
/// - Single-quote, double-quote and backslash are prefixed with a backslash.
/// - Any other byte in the range [0x20,0x7e] is passed through unescaped.
/// - Every remaining byte becomes a two-digit lower-case hex escape (`\xNN`).
/// - Unicode escapes are never generated by this function.
#[unstable = "needs to be updated to use an iterator"]
pub fn escape_default<F>(c: u8, mut f: F) where
    F: FnMut(u8),
{
    // Lower-case hexadecimal digit for a value in the range 0..16.
    fn hex_digit(nibble: u8) -> u8 {
        if nibble < 10 { b'0' + nibble } else { b'a' + (nibble - 10) }
    }

    match c {
        // These three escape to a backslash followed by themselves. They
        // must be matched before the printable range below, which also
        // contains them.
        b'\\' | b'\'' | b'"' => { f(b'\\'); f(c); }
        b'\t' => { f(b'\\'); f(b't'); }
        b'\r' => { f(b'\\'); f(b'r'); }
        b'\n' => { f(b'\\'); f(b'n'); }
        b'\x20' ... b'\x7e' => f(c),
        _ => {
            // Hex escape: high nibble first, then low nibble.
            f(b'\\');
            f(b'x');
            f(hex_digit(c >> 4));
            f(hex_digit(c & 0xf));
        }
    }
}

// Lower-casing lookup table, indexed by byte value (0..255).
// The entries for b'A'..b'Z' hold the matching lower-case letter; every
// other entry, including all bytes at or above 0x80, holds its own index.
static ASCII_LOWER_MAP: [u8, ..256] = [
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
    0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
    0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
    0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
    b' ', b'!', b'"', b'#', b'$', b'%', b'&', b'\'',
    b'(', b')', b'*', b'+', b',', b'-', b'.', b'/',
    b'0', b'1', b'2', b'3', b'4', b'5', b'6', b'7',
    b'8', b'9', b':', b';', b'<', b'=', b'>', b'?',
    b'@',

          // Slots for b'A'..b'Z': the only entries that differ from their index.
          b'a', b'b', b'c', b'd', b'e', b'f', b'g',
    b'h', b'i', b'j', b'k', b'l', b'm', b'n', b'o',
    b'p', b'q', b'r', b's', b't', b'u', b'v', b'w',
    b'x', b'y', b'z',

                      b'[', b'\\', b']', b'^', b'_',
    b'`', b'a', b'b', b'c', b'd', b'e', b'f', b'g',
    b'h', b'i', b'j', b'k', b'l', b'm', b'n', b'o',
    b'p', b'q', b'r', b's', b't', b'u', b'v', b'w',
    b'x', b'y', b'z', b'{', b'|', b'}', b'~', 0x7f,
    0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
    0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
    0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
    0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
    0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
    0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
    0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
    0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
    0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
    0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
    0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
    0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
    0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
    0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
    0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
    0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
];

// Upper-casing lookup table, indexed by byte value (0..255).
// The entries for b'a'..b'z' hold the matching upper-case letter; every
// other entry, including all bytes at or above 0x80, holds its own index.
static ASCII_UPPER_MAP: [u8, ..256] = [
    0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
    0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
    0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
    0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
    b' ', b'!', b'"', b'#', b'$', b'%', b'&', b'\'',
    b'(', b')', b'*', b'+', b',', b'-', b'.', b'/',
    b'0', b'1', b'2', b'3', b'4', b'5', b'6', b'7',
    b'8', b'9', b':', b';', b'<', b'=', b'>', b'?',
    b'@', b'A', b'B', b'C', b'D', b'E', b'F', b'G',
    b'H', b'I', b'J', b'K', b'L', b'M', b'N', b'O',
    b'P', b'Q', b'R', b'S', b'T', b'U', b'V', b'W',
    b'X', b'Y', b'Z', b'[', b'\\', b']', b'^', b'_',
    b'`',

          // Slots for b'a'..b'z': the only entries that differ from their index.
          b'A', b'B', b'C', b'D', b'E', b'F', b'G',
    b'H', b'I', b'J', b'K', b'L', b'M', b'N', b'O',
    b'P', b'Q', b'R', b'S', b'T', b'U', b'V', b'W',
    b'X', b'Y', b'Z',

                      b'{', b'|', b'}', b'~', 0x7f,
    0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
    0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
    0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
    0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
    0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
    0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
    0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
    0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
    0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
    0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
    0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
    0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
    0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
    0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
    0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
    0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
];


// Unit tests for the string-level ASCII helpers.
//
// NOTE(review): apart from `is_ascii` on `char`, nothing in this module
// exercises the `u8` / `char` implementations of `AsciiExt` directly
// (`to_ascii_uppercase`, `to_ascii_lowercase`, `eq_ignore_ascii_case`).
#[cfg(test)]
mod tests {
    use prelude::*;
    use super::*;
    use char::from_u32;

    // `is_ascii` on individual characters.
    #[test]
    fn test_ascii() {
        assert!("banana".chars().all(|c| c.is_ascii()));
        assert!(!"ประเทศไทย中华Việt Nam".chars().all(|c| c.is_ascii()));
    }

    // `is_ascii` on whole string slices, including the empty string.
    #[test]
    fn test_ascii_vec() {
        assert!("".is_ascii());
        assert!("a".is_ascii());
        assert!(!"\u{2009}".is_ascii());

    }

    #[test]
    fn test_to_ascii_uppercase() {
        assert_eq!("url()URL()uRl()ürl".to_ascii_uppercase(), "URL()URL()URL()üRL");
        assert_eq!("hıKß".to_ascii_uppercase(), "HıKß");

        // Every code point 0..=500 as a one-character string: only
        // 'a'..'z' may change, and only to the matching upper-case letter.
        let mut i = 0;
        while i <= 500 {
            let upper = if 'a' as u32 <= i && i <= 'z' as u32 { i + 'A' as u32 - 'a' as u32 }
                        else { i };
            assert_eq!((from_u32(i).unwrap()).to_string().to_ascii_uppercase(),
                       (from_u32(upper).unwrap()).to_string());
            i += 1;
        }
    }

    #[test]
    fn test_to_ascii_lowercase() {
        assert_eq!("url()URL()uRl()Ürl".to_ascii_lowercase(), "url()url()url()Ürl");
        // Dotted capital I, Kelvin sign, Sharp S.
        assert_eq!("HİKß".to_ascii_lowercase(), "hİKß");

        // Every code point 0..=500 as a one-character string: only
        // 'A'..'Z' may change, and only to the matching lower-case letter.
        let mut i = 0;
        while i <= 500 {
            let lower = if 'A' as u32 <= i && i <= 'Z' as u32 { i + 'a' as u32 - 'A' as u32 }
                        else { i };
            assert_eq!((from_u32(i).unwrap()).to_string().to_ascii_lowercase(),
                       (from_u32(lower).unwrap()).to_string());
            i += 1;
        }
    }

    // Same checks as `test_to_ascii_uppercase`, via the consuming method.
    #[test]
    fn test_into_ascii_uppercase() {
        assert_eq!(("url()URL()uRl()ürl".to_string()).into_ascii_uppercase(),
                   "URL()URL()URL()üRL".to_string());
        assert_eq!(("hıKß".to_string()).into_ascii_uppercase(), "HıKß");

        let mut i = 0;
        while i <= 500 {
            let upper = if 'a' as u32 <= i && i <= 'z' as u32 { i + 'A' as u32 - 'a' as u32 }
                        else { i };
            assert_eq!((from_u32(i).unwrap()).to_string().into_ascii_uppercase(),
                       (from_u32(upper).unwrap()).to_string());
            i += 1;
        }
    }

    // Same checks as `test_to_ascii_lowercase`, via the consuming method.
    #[test]
    fn test_into_ascii_lowercase() {
        assert_eq!(("url()URL()uRl()Ürl".to_string()).into_ascii_lowercase(),
                   "url()url()url()Ürl");
        // Dotted capital I, Kelvin sign, Sharp S.
        assert_eq!(("HİKß".to_string()).into_ascii_lowercase(), "hİKß");

        let mut i = 0;
        while i <= 500 {
            let lower = if 'A' as u32 <= i && i <= 'Z' as u32 { i + 'a' as u32 - 'A' as u32 }
                        else { i };
            assert_eq!((from_u32(i).unwrap()).to_string().into_ascii_lowercase(),
                       (from_u32(lower).unwrap()).to_string());
            i += 1;
        }
    }

    #[test]
    fn test_eq_ignore_ascii_case() {
        assert!("url()URL()uRl()Ürl".eq_ignore_ascii_case("url()url()url()Ürl"));
        // Non-ASCII letters are compared exactly, so 'Ü' and 'ü' differ.
        assert!(!"Ürl".eq_ignore_ascii_case("ürl"));
        // Dotted capital I, Kelvin sign, Sharp S.
        assert!("HİKß".eq_ignore_ascii_case("hİKß"));
        // None of these non-ASCII characters may match an ASCII look-alike.
        assert!(!"İ".eq_ignore_ascii_case("i"));
        assert!(!"K".eq_ignore_ascii_case("k"));
        assert!(!"ß".eq_ignore_ascii_case("s"));

        // Each code point 0..=500 must match its own ASCII lower-cased form.
        let mut i = 0;
        while i <= 500 {
            let c = i;
            let lower = if 'A' as u32 <= c && c <= 'Z' as u32 { c + 'a' as u32 - 'A' as u32 }
                        else { c };
            assert!((from_u32(i).unwrap()).to_string().eq_ignore_ascii_case(
                    (from_u32(lower).unwrap()).to_string().as_slice()));
            i += 1;
        }
    }
}
-												Fix minor doc typos

											
										
										
											2014-01-30 12:29:35 -06:00
+								// Copyright 2013-2014 The Rust Project Developers. See the COPYRIGHT
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
+								// file at the top-level directory of this distribution and at
 								// http://rust-lang.org/COPYRIGHT.
 								//
 								// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
 								// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
 								// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
 								// option. This file may not be copied, modified, or distributed
 								// except according to those terms.
-												ignore-lexer-test to broken files and remove some tray hyphens

I blame @ChrisMorgan for the hyphens.

											
										
										
											2014-07-14 22:46:04 -05:00
+								//
 								// ignore-lexer-test FIXME #15679
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
-												std: uniform modules titles for doc

This commit uniforms the short title of modules provided by libstd,
in order to make their roles more explicit when glancing at the index.

Signed-off-by: Luca Bruno <lucab@debian.org>

											
										
										
											2013-12-24 10:08:28 -06:00
+								//! Operations on ASCII strings and characters
-												Add a brief description to show up in http://static.rust-lang.org/doc/core/index.html
											
										
										
											2013-05-03 01:20:01 -05:00
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								#![unstable = "unsure about placement and naming"]
-												Fallout from deprecation

											
										
										
											2014-11-21 14:51:22 -06:00
+								#![allow(deprecated)]
-												libstd: set baseline stability levels.

Earlier commits have established a baseline of `experimental` stability
for all crates under the facade (so their contents are considered
experimental within libstd). Since `experimental` is `allow` by
default, we should use the same baseline stability for libstd itself.

This commit adds `experimental` tags to all of the modules defined in
`std`, and `unstable` to `std` itself.

											
										
										
											2014-06-30 19:22:40 -05:00
-												DSTify [T]/str extension traits

This PR changes the signature of several methods from `foo(self, ...)` to
`foo(&self, ...)`/`foo(&mut self, ...)`, but there is no breakage of the usage
of these methods due to the autoref nature of `method.call()`s. This PR also
removes the lifetime parameter from some traits (`Trait<'a>` -> `Trait`). These
changes break any use of the extension traits for generic programming, but
those traits are not meant to be used for generic programming in the first
place. In the whole rust distribution there was only one misuse of a extension
trait as a bound, which got corrected (the bound was unnecessary and got
removed) as part of this PR.

[breaking-change]

											
										
										
											2014-10-23 10:43:18 -05:00
+								use core::kinds::Sized;
-												Fallout from stabilization

											
										
										
											2014-11-06 11:32:37 -06:00
+								use iter::IteratorExt;
-												libstd: use unboxed closures

											
										
										
											2014-12-07 13:15:25 -06:00
+								use ops::FnMut;
-												Remove Ascii, AsciiCast, OwnedAsciiCast, AsciiStr, IntoBytes, IntoString.

As a replacement, add is_ascii() to AsciiExt, and implement AsciiExt for u8 and char.

[breaking-change]

											
										
										
											2014-12-06 19:55:34 -06:00
+								use slice::SliceExt;
 								use str::StrExt;
 								use string::String;
-												rename std::vec_ng -> std::vec

Closes #12771

											
										
										
											2014-03-20 02:35:51 -05:00
+								use vec::Vec;
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								/// Extension methods for ASCII-subset only operations on owned strings
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								#[experimental = "would prefer to do this in a more general way"]
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								pub trait OwnedAsciiExt {
-												Methodyfied the string ascii extionsion functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
+								    /// Convert the string to ASCII upper case:
 								    /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
 								    /// but non-ASCII letters are unchanged.
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn into_ascii_uppercase(self) -> Self;
-												Methodyfied the string ascii extionsion functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
 								    /// Convert the string to ASCII lower case:
 								    /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z',
 								    /// but non-ASCII letters are unchanged.
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn into_ascii_lowercase(self) -> Self;
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								}
 								/// Extension methods for ASCII-subset only operations on string slices
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								#[experimental = "would prefer to do this in a more general way"]
-												Remove Ascii, AsciiCast, OwnedAsciiCast, AsciiStr, IntoBytes, IntoString.

As a replacement, add is_ascii() to AsciiExt, and implement AsciiExt for u8 and char.

[breaking-change]

											
										
										
											2014-12-06 19:55:34 -06:00
+								pub trait AsciiExt<T = Self> for Sized? {
 								    /// Check if within the ASCII range.
 								    fn is_ascii(&self) -> bool;
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								    /// Makes a copy of the string in ASCII upper case:
 								    /// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
 								    /// but non-ASCII letters are unchanged.
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn to_ascii_uppercase(&self) -> T;
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
 								    /// Makes a copy of the string in ASCII lower case:
 								    /// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z',
 								    /// but non-ASCII letters are unchanged.
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn to_ascii_lowercase(&self) -> T;
-												Methodyfied the string ascii extionsion functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
 								    /// Check that two strings are an ASCII case-insensitive match.
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    /// Same as `to_ascii_lowercase(a) == to_ascii_lower(b)`,
-												Methodyfied the string ascii extionsion functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
+								    /// but without allocating and copying temporary strings.
-												DSTify [T]/str extension traits

This PR changes the signature of several methods from `foo(self, ...)` to
`foo(&self, ...)`/`foo(&mut self, ...)`, but there is no breakage of the usage
of these methods due to the autoref nature of `method.call()`s. This PR also
removes the lifetime parameter from some traits (`Trait<'a>` -> `Trait`). These
changes break any use of the extension traits for generic programming, but
those traits are not meant to be used for generic programming in the first
place. In the whole rust distribution there was only one misuse of a extension
trait as a bound, which got corrected (the bound was unnecessary and got
removed) as part of this PR.

[breaking-change]

											
										
										
											2014-10-23 10:43:18 -05:00
+								    fn eq_ignore_ascii_case(&self, other: &Self) -> bool;
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								}
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								#[experimental = "would prefer to do this in a more general way"]
-												DSTify [T]/str extension traits

This PR changes the signature of several methods from `foo(self, ...)` to
`foo(&self, ...)`/`foo(&mut self, ...)`, but there is no breakage of the usage
of these methods due to the autoref nature of `method.call()`s. This PR also
removes the lifetime parameter from some traits (`Trait<'a>` -> `Trait`). These
changes break any use of the extension traits for generic programming, but
those traits are not meant to be used for generic programming in the first
place. In the whole rust distribution there was only one misuse of a extension
trait as a bound, which got corrected (the bound was unnecessary and got
removed) as part of this PR.

[breaking-change]

											
										
										
											2014-10-23 10:43:18 -05:00
+								impl AsciiExt<String> for str {
-												Remove Ascii, AsciiCast, OwnedAsciiCast, AsciiStr, IntoBytes, IntoString.

As a replacement, add is_ascii() to AsciiExt, and implement AsciiExt for u8 and char.

[breaking-change]

											
										
										
											2014-12-06 19:55:34 -06:00
+								    #[inline]
 								    fn is_ascii(&self) -> bool {
 								        self.bytes().all(|b| b.is_ascii())
 								    }
-												Methodyfied the string ascii extionsion functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
+								    #[inline]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn to_ascii_uppercase(&self) -> String {
 								        // Vec<u8>::to_ascii_uppercase() preserves the UTF-8 invariant.
 								        unsafe { String::from_utf8_unchecked(self.as_bytes().to_ascii_uppercase()) }
-												Methodyfied the string ascii extionsion functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
+								    }
 								    #[inline]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn to_ascii_lowercase(&self) -> String {
 								        // Vec<u8>::to_ascii_lowercase() preserves the UTF-8 invariant.
 								        unsafe { String::from_utf8_unchecked(self.as_bytes().to_ascii_lowercase()) }
-												Methodyfied the string ascii extionsion functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
+								    }
 								    #[inline]
 								    fn eq_ignore_ascii_case(&self, other: &str) -> bool {
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								        self.as_bytes().eq_ignore_ascii_case(other.as_bytes())
-												Methodyfied the string ascii extionsion functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
+								    }
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								}
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								#[experimental = "would prefer to do this in a more general way"]
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								impl OwnedAsciiExt for String {
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								    #[inline]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn into_ascii_uppercase(self) -> String {
 								        // Vec<u8>::into_ascii_uppercase() preserves the UTF-8 invariant.
 								        unsafe { String::from_utf8_unchecked(self.into_bytes().into_ascii_uppercase()) }
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								    }
 								    #[inline]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn into_ascii_lowercase(self) -> String {
 								        // Vec<u8>::into_ascii_lowercase() preserves the UTF-8 invariant.
 								        unsafe { String::from_utf8_unchecked(self.into_bytes().into_ascii_lowercase()) }
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								    }
 								}
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								#[experimental = "would prefer to do this in a more general way"]
-												DSTify [T]/str extension traits

This PR changes the signature of several methods from `foo(self, ...)` to
`foo(&self, ...)`/`foo(&mut self, ...)`, but there is no breakage of the usage
of these methods due to the autoref nature of `method.call()`s. This PR also
removes the lifetime parameter from some traits (`Trait<'a>` -> `Trait`). These
changes break any use of the extension traits for generic programming, but
those traits are not meant to be used for generic programming in the first
place. In the whole rust distribution there was only one misuse of a extension
trait as a bound, which got corrected (the bound was unnecessary and got
removed) as part of this PR.

[breaking-change]

											
										
										
											2014-10-23 10:43:18 -05:00
+								impl AsciiExt<Vec<u8>> for [u8] {
-												Remove Ascii, AsciiCast, OwnedAsciiCast, AsciiStr, IntoBytes, IntoString.

As a replacement, add is_ascii() to AsciiExt, and implement AsciiExt for u8 and char.

[breaking-change]

											
										
										
											2014-12-06 19:55:34 -06:00
+								    #[inline]
 								    fn is_ascii(&self) -> bool {
 								        // The slice is ASCII exactly when no byte fails the per-byte check
 								        // (an empty slice therefore counts as ASCII).
 								        !self.iter().any(|byte| !byte.is_ascii())
 								    }
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								    #[inline]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn to_ascii_uppercase(&self) -> Vec<u8> {
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								        self.iter().map(|&byte| ASCII_UPPER_MAP[byte as uint]).collect()
 								    }
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								    #[inline]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn to_ascii_lowercase(&self) -> Vec<u8> {
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								        self.iter().map(|&byte| ASCII_LOWER_MAP[byte as uint]).collect()
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								    }
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								    #[inline]
 								    fn eq_ignore_ascii_case(&self, other: &[u8]) -> bool {
 								        // Slices of different lengths can never compare equal.
 								        if self.len() != other.len() {
 								            return false;
 								        }
 								        // Compare byte-by-byte after folding both sides through the
 								        // lower-case table, so only ASCII letters are case-insensitive.
 								        self.iter().zip(other.iter()).all(|(lhs, rhs)| {
 								            ASCII_LOWER_MAP[*lhs as uint] == ASCII_LOWER_MAP[*rhs as uint]
 								        })
 								    }
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								}
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								#[experimental = "would prefer to do this in a more general way"]
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								impl OwnedAsciiExt for Vec<u8> {
 								    #[inline]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn into_ascii_uppercase(mut self) -> Vec<u8> {
-												Fallout from renaming

											
										
										
											2014-09-14 22:27:36 -05:00
+								        for byte in self.iter_mut() {
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								            *byte = ASCII_UPPER_MAP[*byte as uint];
 								        }
 								        self
 								    }
 								    #[inline]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn into_ascii_lowercase(mut self) -> Vec<u8> {
-												Fallout from renaming

											
										
										
											2014-09-14 22:27:36 -05:00
+								        for byte in self.iter_mut() {
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
+								            *byte = ASCII_LOWER_MAP[*byte as uint];
 								        }
 								        self
-												Handle fallout in std::ascii and std::strconv

API changes:

- OwnedAsciiCast returns Vec<Ascii> instead of ~[Ascii]
- OwnedAsciiCast is implemented on Vec<u8>
- AsciiStr.to_lower/upper() returns Vec<Ascii>
- IntoBytes::into_bytes() returns Vec<u8>
- float_to_str_bytes_common() returns (Vec<u8>, bool)

											
										
										
											2014-05-04 00:02:59 -05:00
+								    }
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								}
-												Remove Ascii, AsciiCast, OwnedAsciiCast, AsciiStr, IntoBytes, IntoString.

As a replacement, add is_ascii() to AsciiExt, and implement AsciiExt for u8 and char.

[breaking-change]

											
										
										
											2014-12-06 19:55:34 -06:00
+								#[experimental = "would prefer to do this in a more general way"]
 								impl AsciiExt for u8 {
 								    // A byte is ASCII when its high bit (0x80) is clear.
 								    #[inline]
 								    fn is_ascii(&self) -> bool {
 								        (*self & 0x80) == 0u8
 								    }
 								    // Table lookup: b'a'..b'z' become b'A'..b'Z', every other byte maps to itself.
 								    #[inline]
 								    fn to_ascii_uppercase(&self) -> u8 {
 								        let index = *self as uint;
 								        ASCII_UPPER_MAP[index]
 								    }
 								    // Table lookup: b'A'..b'Z' become b'a'..b'z', every other byte maps to itself.
 								    #[inline]
 								    fn to_ascii_lowercase(&self) -> u8 {
 								        let index = *self as uint;
 								        ASCII_LOWER_MAP[index]
 								    }
 								    // Two bytes match when their lower-case table entries are identical.
 								    #[inline]
 								    fn eq_ignore_ascii_case(&self, other: &u8) -> bool {
 								        let folded_self = ASCII_LOWER_MAP[*self as uint];
 								        let folded_other = ASCII_LOWER_MAP[*other as uint];
 								        folded_self == folded_other
 								    }
 								}
 								#[experimental = "would prefer to do this in a more general way"]
 								impl AsciiExt for char {
 								    #[inline]
 								    fn is_ascii(&self) -> bool {
 								        *self as u32 <= 0x7F
 								    }
 								    #[inline]
 								    fn to_ascii_uppercase(&self) -> char {
 								        if self.is_ascii() {
 								            ASCII_UPPER_MAP[*self as uint] as char
 								        } else {
 								            *self
 								        }
 								    }
 								    #[inline]
 								    fn to_ascii_lowercase(&self) -> char {
 								        if self.is_ascii() {
 								            ASCII_UPPER_MAP[*self as uint] as char
 								        } else {
 								            *self
 								        }
 								    }
 								    #[inline]
 								    fn eq_ignore_ascii_case(&self, other: &char) -> bool {
 								        self.to_ascii_lowercase() == other.to_ascii_lowercase()
 								    }
 								}
-												libsyntax: Forbid escapes in the inclusive range `\x80`-`\xff` in
Unicode characters and strings.

Use `\u0080`-`\u00ff` instead. ASCII/byte literals are unaffected.

This PR introduces a new function, `escape_default`, into the ASCII
module. This was necessary for the pretty printer to continue to
function.

RFC #326.

Closes #18062.

[breaking-change]

											
										
										
											2014-10-27 11:13:51 -05:00
+								/// Returns a 'default' ASCII and C++11-like literal escape of a `u8`
 								///
 								/// The default is chosen with a bias toward producing literals that are
 								/// legal in a variety of languages, including C++11 and similar C-family
 								/// languages. The exact rules are:
 								///
 								/// - Tab, CR and LF are escaped as '\t', '\r' and '\n' respectively.
 								/// - Single-quote, double-quote and backslash chars are backslash-escaped.
 								/// - Any other chars in the range [0x20,0x7e] are not escaped.
 								/// - Any other chars are given hex escapes.
 								/// - Unicode escapes are never generated by this function.
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								#[unstable = "needs to be updated to use an iterator"]
-												libstd: use unboxed closures

											
										
										
											2014-12-07 13:15:25 -06:00
+								pub fn escape_default<F>(c: u8, mut f: F) where
 								    F: FnMut(u8),
 								{
-												libsyntax: Forbid escapes in the inclusive range `\x80`-`\xff` in
Unicode characters and strings.

Use `\u0080`-`\u00ff` instead. ASCII/byte literals are unaffected.

This PR introduces a new function, `escape_default`, into the ASCII
module. This was necessary for the pretty printer to continue to
function.

RFC #326.

Closes #18062.

[breaking-change]

											
										
										
											2014-10-27 11:13:51 -05:00
+								    match c {
 								        b'\t' => { f(b'\\'); f(b't'); }
 								        b'\r' => { f(b'\\'); f(b'r'); }
 								        b'\n' => { f(b'\\'); f(b'n'); }
 								        b'\\' => { f(b'\\'); f(b'\\'); }
 								        b'\'' => { f(b'\\'); f(b'\''); }
 								        b'"'  => { f(b'\\'); f(b'"'); }
 								        b'\x20' ... b'\x7e' => { f(c); }
 								        _ => {
 								            f(b'\\');
 								            f(b'x');
 								            for &offset in [4u, 0u].iter() {
 								                match ((c as i32) >> offset) & 0xf {
 								                    i @ 0 ... 9 => f(b'0' + (i as u8)),
 								                    i => f(b'a' + (i as u8 - 10)),
 								                }
 								            }
 								        }
 								    }
 								}
-												Rename the std::ascii::{Owned,}StrAsciiExt traits to {Owned,}AsciiExt

… and implement them on Vec<u8> / &[u8].

[breaking-change]

											
										
										
											2014-07-18 08:53:29 -05:00
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								static ASCII_LOWER_MAP: [u8, ..256] = [
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
 x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
 x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
 x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
-												Use byte literals in std::ascii::ASCII_{UPPER,LOWER}_MAP for readability.

											
										
										
											2014-07-18 08:11:40 -05:00
+								    b' ', b'!', b'"', b'#', b'$', b'%', b'&', b'\'',
 								    b'(', b')', b'*', b'+', b',', b'-', b'.', b'/',
 								    b'0', b'1', b'2', b'3', b'4', b'5', b'6', b'7',
 								    b'8', b'9', b':', b';', b'<', b'=', b'>', b'?',
 								    b'@',
 								          b'a', b'b', b'c', b'd', b'e', b'f', b'g',
 								    b'h', b'i', b'j', b'k', b'l', b'm', b'n', b'o',
 								    b'p', b'q', b'r', b's', b't', b'u', b'v', b'w',
 								    b'x', b'y', b'z',
 								                      b'[', b'\\', b']', b'^', b'_',
 								    b'`', b'a', b'b', b'c', b'd', b'e', b'f', b'g',
 								    b'h', b'i', b'j', b'k', b'l', b'm', b'n', b'o',
 								    b'p', b'q', b'r', b's', b't', b'u', b'v', b'w',
 								    b'x', b'y', b'z', b'{', b'|', b'}', b'~', 0x7f,
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
 x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
 x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
 x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
 xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
 xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
 xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
 xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
 xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
 xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
 xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
 xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
 xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
 xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
 xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
 xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
 								];
-												libs: stabilize ascii module

This is an initial API stabilization pass for `std::ascii`. Aside from
some renaming to match conversion conventions, and deprecations in favor
of using iterators directly, almost nothing is changed here. However,
the static case conversion tables that were previously public are now private.

The stabilization of the (rather large!) set of extension traits is left
to a follow-up pass, because we hope to land some more general machinery
that will provide the same functionality without custom traits.

[breaking-change]

											
										
										
											2014-11-21 14:00:05 -06:00
+								static ASCII_UPPER_MAP: [u8, ..256] = [
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
 x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
 x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
 x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
-												Use byte literals in std::ascii::ASCII_{UPPER,LOWER}_MAP for readability.

											
										
										
											2014-07-18 08:11:40 -05:00
+								    b' ', b'!', b'"', b'#', b'$', b'%', b'&', b'\'',
 								    b'(', b')', b'*', b'+', b',', b'-', b'.', b'/',
 								    b'0', b'1', b'2', b'3', b'4', b'5', b'6', b'7',
 								    b'8', b'9', b':', b';', b'<', b'=', b'>', b'?',
 								    b'@', b'A', b'B', b'C', b'D', b'E', b'F', b'G',
 								    b'H', b'I', b'J', b'K', b'L', b'M', b'N', b'O',
 								    b'P', b'Q', b'R', b'S', b'T', b'U', b'V', b'W',
 								    b'X', b'Y', b'Z', b'[', b'\\', b']', b'^', b'_',
 								    b'`',
 								          b'A', b'B', b'C', b'D', b'E', b'F', b'G',
 								    b'H', b'I', b'J', b'K', b'L', b'M', b'N', b'O',
 								    b'P', b'Q', b'R', b'S', b'T', b'U', b'V', b'W',
 								    b'X', b'Y', b'Z',
 								                      b'{', b'|', b'}', b'~', 0x7f,
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
 x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
 x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
 x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
 xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
 xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
 xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
 xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
 xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
 xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
 xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
 xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
 xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
 xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
 xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
 xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
 								];
-												Fixing some various warnings about unused imports

											
										
										
											2013-04-23 18:38:49 -05:00
+								#[cfg(test)]
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
+								mod tests {
-												stdtest: Fix all leaked trait imports

											
										
										
											2014-01-07 00:33:37 -06:00
+								    use prelude::*;
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
+								    use super::*;
-												stop treating char as an integer type

Closes #7609

											
										
										
											2013-09-03 18:24:12 -05:00
+								    use char::from_u32;
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
 								    #[test]
 								    fn test_ascii() {
-												Removed unnecessary `_iter` suffixes from various APIs

											
										
										
											2013-11-23 04:18:51 -06:00
+								        assert!("banana".chars().all(|c| c.is_ascii()));
 								        assert!(!"ประเทศไทย中华Việt Nam".chars().all(|c| c.is_ascii()));
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
+								    }
 								    #[test]
 								    fn test_ascii_vec() {
-												Removed ascii functions from other modules

Replaced str::to_lowercase and str::to_uppercase

											
										
										
											2013-04-23 04:08:13 -05:00
+								        assert!("".is_ascii());
 								        assert!("a".is_ascii());
-												Register new snapshots

											
										
										
											2014-12-09 16:08:10 -06:00
+								        assert!(!"\u{2009}".is_ascii());
-												Removed ascii functions from other modules

Replaced str::to_lowercase and str::to_uppercase

											
										
										
											2013-04-23 04:08:13 -05:00
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
+								    }
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								    #[test]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn test_to_ascii_uppercase() {
 								        assert_eq!("url()URL()uRl()ürl".to_ascii_uppercase(), "URL()URL()URL()üRL");
 								        assert_eq!("hıKß".to_ascii_uppercase(), "HıKß");
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
 								        let mut i = 0;
 								        while i <= 500 {
-												stop treating char as an integer type

Closes #7609

											
										
										
											2013-09-03 18:24:12 -05:00
+								            let upper = if 'a' as u32 <= i && i <= 'z' as u32 { i + 'A' as u32 - 'a' as u32 }
 								                        else { i };
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								            assert_eq!((from_u32(i).unwrap()).to_string().to_ascii_uppercase(),
-												librustc: Always parse `macro!()`/`macro![]` as expressions if not
followed by a semicolon.

This allows code like `vec![1i, 2, 3].len();` to work.

This breaks code that uses macros as statements without putting
semicolons after them, such as:

    fn main() {
        ...
        assert!(a == b)
        assert!(c == d)
        println(...);
    }

It also breaks code that uses macros as items without semicolons:

    local_data_key!(foo)

    fn main() {
        println("hello world")
    }

Add semicolons to fix this code. Those two examples can be fixed as
follows:

    fn main() {
        ...
        assert!(a == b);
        assert!(c == d);
        println(...);
    }

    local_data_key!(foo);

    fn main() {
        println("hello world")
    }

RFC #378.

Closes #18635.

[breaking-change]

											
										
										
											2014-11-14 11:18:10 -06:00
+								                       (from_u32(upper).unwrap()).to_string());
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								            i += 1;
 								        }
 								    }
 								    #[test]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn test_to_ascii_lowercase() {
 								        assert_eq!("url()URL()uRl()Ürl".to_ascii_lowercase(), "url()url()url()Ürl");
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								        // Dotted capital I, Kelvin sign, Sharp S.
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								        assert_eq!("HİKß".to_ascii_lowercase(), "hİKß");
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
 								        let mut i = 0;
 								        while i <= 500 {
-												stop treating char as an integer type

Closes #7609

											
										
										
											2013-09-03 18:24:12 -05:00
+								            let lower = if 'A' as u32 <= i && i <= 'Z' as u32 { i + 'a' as u32 - 'A' as u32 }
 								                        else { i };
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								            assert_eq!((from_u32(i).unwrap()).to_string().to_ascii_lowercase(),
-												librustc: Always parse `macro!()`/`macro![]` as expressions if not
followed by a semicolon.

This allows code like `vec![1i, 2, 3].len();` to work.

This breaks code that uses macros as statements without putting
semicolons after them, such as:

    fn main() {
        ...
        assert!(a == b)
        assert!(c == d)
        println(...);
    }

It also breaks code that uses macros as items without semicolons:

    local_data_key!(foo)

    fn main() {
        println("hello world")
    }

Add semicolons to fix this code. Those two examples can be fixed as
follows:

    fn main() {
        ...
        assert!(a == b);
        assert!(c == d);
        println(...);
    }

    local_data_key!(foo);

    fn main() {
        println("hello world")
    }

RFC #378.

Closes #18635.

[breaking-change]

											
										
										
											2014-11-14 11:18:10 -06:00
+								                       (from_u32(lower).unwrap()).to_string());
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								            i += 1;
 								        }
 								    }
 								    #[test]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn test_into_ascii_uppercase() {
 								        assert_eq!(("url()URL()uRl()ürl".to_string()).into_ascii_uppercase(),
-												std: Rename strbuf operations to string

[breaking-change]

											
										
										
											2014-05-25 05:17:19 -05:00
+								                   "URL()URL()URL()üRL".to_string());
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								        assert_eq!(("hıKß".to_string()).into_ascii_uppercase(), "HıKß");
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
 								        let mut i = 0;
 								        while i <= 500 {
 								            let upper = if 'a' as u32 <= i && i <= 'z' as u32 { i + 'A' as u32 - 'a' as u32 }
 								                        else { i };
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								            assert_eq!((from_u32(i).unwrap()).to_string().into_ascii_uppercase(),
-												librustc: Always parse `macro!()`/`macro![]` as expressions if not
followed by a semicolon.

This allows code like `vec![1i, 2, 3].len();` to work.

This breaks code that uses macros as statements without putting
semicolons after them, such as:

    fn main() {
        ...
        assert!(a == b)
        assert!(c == d)
        println(...);
    }

It also breaks code that uses macros as items without semicolons:

    local_data_key!(foo)

    fn main() {
        println("hello world")
    }

Add semicolons to fix this code. Those two examples can be fixed as
follows:

    fn main() {
        ...
        assert!(a == b);
        assert!(c == d);
        println(...);
    }

    local_data_key!(foo);

    fn main() {
        println("hello world")
    }

RFC #378.

Closes #18635.

[breaking-change]

											
										
										
											2014-11-14 11:18:10 -06:00
+								                       (from_u32(upper).unwrap()).to_string());
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								            i += 1;
 								        }
 								    }
 								    #[test]
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								    fn test_into_ascii_lowercase() {
 								        assert_eq!(("url()URL()uRl()Ürl".to_string()).into_ascii_lowercase(),
-												libstd: remove unnecessary `to_string()` calls

											
										
										
											2014-11-27 18:45:47 -06:00
+								                   "url()url()url()Ürl");
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
+								        // Dotted capital I, Kelvin sign, Sharp S.
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								        assert_eq!(("HİKß".to_string()).into_ascii_lowercase(), "hİKß");
-												Some work on std::ascii: Marked unsafe function unsafe, added moving implementations

											
										
										
											2013-09-08 18:45:14 -05:00
 								        let mut i = 0;
 								        while i <= 500 {
 								            let lower = if 'A' as u32 <= i && i <= 'Z' as u32 { i + 'a' as u32 - 'A' as u32 }
 								                        else { i };
-												Rename to_ascii_{lower,upper} to to_ascii_{lower,upper}case, per #14401

[breaking-change]

											
										
										
											2014-12-05 11:57:42 -06:00
+								            assert_eq!((from_u32(i).unwrap()).to_string().into_ascii_lowercase(),
-												librustc: Always parse `macro!()`/`macro![]` as expressions if not
followed by a semicolon.

This allows code like `vec![1i, 2, 3].len();` to work.

This breaks code that uses macros as statements without putting
semicolons after them, such as:

    fn main() {
        ...
        assert!(a == b)
        assert!(c == d)
        println(...);
    }

It also breaks code that uses macros as items without semicolons:

    local_data_key!(foo)

    fn main() {
        println("hello world")
    }

Add semicolons to fix this code. Those two examples can be fixed as
follows:

    fn main() {
        ...
        assert!(a == b);
        assert!(c == d);
        println(...);
    }

    local_data_key!(foo);

    fn main() {
        println("hello world")
    }

RFC #378.

Closes #18635.

[breaking-change]

											
										
										
											2014-11-14 11:18:10 -06:00
+								                       (from_u32(lower).unwrap()).to_string());
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								            i += 1;
 								        }
 								    }
 								    #[test]
 								    fn test_eq_ignore_ascii_case() {
-												Methodified the string ascii extension functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
+								        assert!("url()URL()uRl()Ürl".eq_ignore_ascii_case("url()url()url()Ürl"));
 								        assert!(!"Ürl".eq_ignore_ascii_case("ürl"));
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								        // Dotted capital I, Kelvin sign, Sharp S.
-												Methodified the string ascii extension functions
Added into_owned() method for vectors
Added DoubleEnded Iterator impl to Option
Renamed nil.rs to unit.rs

											
										
										
											2013-08-10 21:21:31 -05:00
+								        assert!("HİKß".eq_ignore_ascii_case("hİKß"));
 								        assert!(!"İ".eq_ignore_ascii_case("i"));
 								        assert!(!"K".eq_ignore_ascii_case("k"));
 								        assert!(!"ß".eq_ignore_ascii_case("s"));
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
 								        let mut i = 0;
 								        while i <= 500 {
-												stop treating char as an integer type

Closes #7609

											
										
										
											2013-09-03 18:24:12 -05:00
+								            let c = i;
 								            let lower = if 'A' as u32 <= c && c <= 'Z' as u32 { c + 'a' as u32 - 'A' as u32 }
 								                        else { c };
-												libstd: remove unnecessary `as_slice()` calls

											
										
										
											2014-11-27 13:43:55 -06:00
+								            assert!((from_u32(i).unwrap()).to_string().eq_ignore_ascii_case(
-												Fix errors

											
										
										
											2014-07-04 15:38:13 -05:00
+								                    (from_u32(lower).unwrap()).to_string().as_slice()));
-												Add to_ascii_upper, to_ascii_lower and eq_ignore_ascii_case in std::ascii

											
										
										
											2013-08-02 15:39:57 -05:00
+								            i += 1;
 								        }
 								    }
-												Added Ascii type

											
										
										
											2013-04-20 12:39:15 -05:00
+								}