2014-01-30 12:29:35 -06:00
|
|
|
|
// Copyright 2013-2014 The Rust Project Developers. See the COPYRIGHT
|
2013-04-20 12:39:15 -05:00
|
|
|
|
// file at the top-level directory of this distribution and at
|
|
|
|
|
// http://rust-lang.org/COPYRIGHT.
|
|
|
|
|
//
|
|
|
|
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
|
|
|
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
|
|
|
|
// option. This file may not be copied, modified, or distributed
|
|
|
|
|
// except according to those terms.
|
2014-07-14 22:46:04 -05:00
|
|
|
|
//
|
|
|
|
|
// ignore-lexer-test FIXME #15679
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
2013-12-24 10:08:28 -06:00
|
|
|
|
//! Operations on ASCII strings and characters
|
2013-05-03 01:20:01 -05:00
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#![unstable = "unsure about placement and naming"]
|
2014-11-21 14:51:22 -06:00
|
|
|
|
#![allow(deprecated)]
|
2014-06-30 19:22:40 -05:00
|
|
|
|
|
2014-10-23 10:43:18 -05:00
|
|
|
|
use core::kinds::Sized;
|
2014-02-12 13:41:34 -06:00
|
|
|
|
use fmt;
|
2014-11-06 11:32:37 -06:00
|
|
|
|
use iter::IteratorExt;
|
librustc: Make `Copy` opt-in.
This change makes the compiler no longer infer whether types (structures
and enumerations) implement the `Copy` trait (and thus are implicitly
copyable). Rather, you must implement `Copy` yourself via `impl Copy for
MyType {}`.
A new warning has been added, `missing_copy_implementations`, to warn
you if a non-generic public type has been added that could have
implemented `Copy` but didn't.
For convenience, you may *temporarily* opt out of this behavior by using
`#![feature(opt_out_copy)]`. Note though that this feature gate will never be
accepted and will be removed by the time that 1.0 is released, so you should
transition your code away from using it.
This breaks code like:
#[deriving(Show)]
struct Point2D {
x: int,
y: int,
}
fn main() {
let mypoint = Point2D {
x: 1,
y: 1,
};
let otherpoint = mypoint;
println!("{}{}", mypoint, otherpoint);
}
Change this code to:
#[deriving(Show)]
struct Point2D {
x: int,
y: int,
}
impl Copy for Point2D {}
fn main() {
let mypoint = Point2D {
x: 1,
y: 1,
};
let otherpoint = mypoint;
println!("{}{}", mypoint, otherpoint);
}
This is the backwards-incompatible part of #13231.
Part of RFC #3.
[breaking-change]
2014-12-05 19:01:33 -06:00
|
|
|
|
use kinds::Copy;
|
core: Remove the cast module
This commit revisits the `cast` module in libcore and libstd, and scrutinizes
all functions inside of it. The result was to remove the `cast` module entirely,
folding all functionality into the `mem` module. Specifically, this is the fate
of each function in the `cast` module.
* transmute - This function was moved to `mem`, but it is now marked as
#[unstable]. This is due to planned changes to the `transmute`
function and how it can be invoked (see the #[unstable] comment).
For more information, see RFC 5 and #12898
* transmute_copy - This function was moved to `mem`, with clarification that is
is not an error to invoke it with T/U that are different
sizes, but rather that it is strongly discouraged. This
function is now #[stable]
* forget - This function was moved to `mem` and marked #[stable]
* bump_box_refcount - This function was removed due to the deprecation of
managed boxes as well as its questionable utility.
* transmute_mut - This function was previously deprecated, and removed as part
of this commit.
* transmute_mut_unsafe - This function doesn't serve much of a purpose when it
can be achieved with an `as` in safe code, so it was
removed.
* transmute_lifetime - This function was removed because it is likely a strong
indication that code is incorrect in the first place.
* transmute_mut_lifetime - This function was removed for the same reasons as
`transmute_lifetime`
* copy_lifetime - This function was moved to `mem`, but it is marked
`#[unstable]` now due to the likelihood of being removed in
the future if it is found to not be very useful.
* copy_mut_lifetime - This function was also moved to `mem`, but had the same
treatment as `copy_lifetime`.
* copy_lifetime_vec - This function was removed because it is not used today,
and its existence is not necessary with DST
(copy_lifetime will suffice).
In summary, the cast module was stripped down to these functions, and then the
functions were moved to the `mem` module.
transmute - #[unstable]
transmute_copy - #[stable]
forget - #[stable]
copy_lifetime - #[unstable]
copy_mut_lifetime - #[unstable]
[breaking-change]
2014-05-09 12:34:51 -05:00
|
|
|
|
use mem;
|
2014-11-28 10:57:41 -06:00
|
|
|
|
use option::Option;
|
|
|
|
|
use option::Option::{Some, None};
|
2014-11-02 19:04:32 -06:00
|
|
|
|
use slice::{SlicePrelude, AsSlice};
|
|
|
|
|
use str::{Str, StrPrelude};
|
2014-11-20 12:11:15 -06:00
|
|
|
|
use string::{String, IntoString};
|
2014-03-20 02:35:51 -05:00
|
|
|
|
use vec::Vec;
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
2013-06-16 04:04:53 -05:00
|
|
|
|
/// Datatype to hold one ascii character. It wraps a `u8`, with the highest bit always zero.
|
2014-05-31 12:43:52 -05:00
|
|
|
|
#[deriving(Clone, PartialEq, PartialOrd, Ord, Eq, Hash)]
|
2014-03-27 17:09:47 -05:00
|
|
|
|
pub struct Ascii { chr: u8 }
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
librustc: Make `Copy` opt-in.
This change makes the compiler no longer infer whether types (structures
and enumerations) implement the `Copy` trait (and thus are implicitly
copyable). Rather, you must implement `Copy` yourself via `impl Copy for
MyType {}`.
A new warning has been added, `missing_copy_implementations`, to warn
you if a non-generic public type has been added that could have
implemented `Copy` but didn't.
For convenience, you may *temporarily* opt out of this behavior by using
`#![feature(opt_out_copy)]`. Note though that this feature gate will never be
accepted and will be removed by the time that 1.0 is released, so you should
transition your code away from using it.
This breaks code like:
#[deriving(Show)]
struct Point2D {
x: int,
y: int,
}
fn main() {
let mypoint = Point2D {
x: 1,
y: 1,
};
let otherpoint = mypoint;
println!("{}{}", mypoint, otherpoint);
}
Change this code to:
#[deriving(Show)]
struct Point2D {
x: int,
y: int,
}
impl Copy for Point2D {}
fn main() {
let mypoint = Point2D {
x: 1,
y: 1,
};
let otherpoint = mypoint;
println!("{}{}", mypoint, otherpoint);
}
This is the backwards-incompatible part of #13231.
Part of RFC #3.
[breaking-change]
2014-12-05 19:01:33 -06:00
|
|
|
|
impl Copy for Ascii {}
|
|
|
|
|
|
2013-05-31 17:17:22 -05:00
|
|
|
|
impl Ascii {
|
2014-01-30 12:29:35 -06:00
|
|
|
|
/// Converts an ascii character into a `u8`.
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[unstable = "recently renamed"]
|
|
|
|
|
pub fn as_byte(&self) -> u8 {
|
2013-04-20 12:39:15 -05:00
|
|
|
|
self.chr
|
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:51:22 -06:00
|
|
|
|
/// Deprecated: use `as_byte` isntead.
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[deprecated = "use as_byte"]
|
|
|
|
|
pub fn to_byte(self) -> u8 {
|
|
|
|
|
self.as_byte()
|
|
|
|
|
}
|
|
|
|
|
|
2014-01-30 12:29:35 -06:00
|
|
|
|
/// Converts an ascii character into a `char`.
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[unstable = "recently renamed"]
|
|
|
|
|
pub fn as_char(&self) -> char {
|
2013-04-20 12:39:15 -05:00
|
|
|
|
self.chr as char
|
|
|
|
|
}
|
2013-04-20 15:50:50 -05:00
|
|
|
|
|
2014-11-21 14:51:22 -06:00
|
|
|
|
/// Deprecated: use `as_char` isntead.
|
|
|
|
|
#[deprecated = "use as_char"]
|
|
|
|
|
pub fn to_char(self) -> char {
|
|
|
|
|
self.as_char()
|
|
|
|
|
}
|
|
|
|
|
|
2014-05-24 05:24:50 -05:00
|
|
|
|
/// Convert to lowercase.
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
|
|
|
|
pub fn to_lowercase(&self) -> Ascii {
|
2014-04-01 22:39:26 -05:00
|
|
|
|
Ascii{chr: ASCII_LOWER_MAP[self.chr as uint]}
|
2013-04-20 15:50:50 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-05-24 05:24:50 -05:00
|
|
|
|
/// Convert to uppercase.
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
|
|
|
|
pub fn to_uppercase(&self) -> Ascii {
|
2014-04-01 22:39:26 -05:00
|
|
|
|
Ascii{chr: ASCII_UPPER_MAP[self.chr as uint]}
|
2013-04-20 15:50:50 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-05-31 17:17:22 -05:00
|
|
|
|
/// Compares two ascii characters of equality, ignoring case.
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[deprecated = "normalize with to_lowercase"]
|
2013-05-31 17:17:22 -05:00
|
|
|
|
pub fn eq_ignore_case(self, other: Ascii) -> bool {
|
2014-04-01 22:39:26 -05:00
|
|
|
|
ASCII_LOWER_MAP[self.chr as uint] == ASCII_LOWER_MAP[other.chr as uint]
|
2013-04-20 15:50:50 -05:00
|
|
|
|
}
|
2013-11-22 10:38:50 -06:00
|
|
|
|
|
|
|
|
|
// the following methods are like ctype, and the implementation is inspired by musl
|
|
|
|
|
|
2014-05-24 05:24:50 -05:00
|
|
|
|
/// Check if the character is a letter (a-z, A-Z)
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
2014-05-24 05:24:50 -05:00
|
|
|
|
pub fn is_alphabetic(&self) -> bool {
|
2013-11-22 10:38:50 -06:00
|
|
|
|
(self.chr >= 0x41 && self.chr <= 0x5A) || (self.chr >= 0x61 && self.chr <= 0x7A)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Check if the character is a number (0-9)
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[unstable = "may be renamed"]
|
2013-11-22 10:38:50 -06:00
|
|
|
|
pub fn is_digit(&self) -> bool {
|
2013-11-26 20:13:25 -06:00
|
|
|
|
self.chr >= 0x30 && self.chr <= 0x39
|
2013-11-22 10:38:50 -06:00
|
|
|
|
}
|
|
|
|
|
|
2014-05-24 05:24:50 -05:00
|
|
|
|
/// Check if the character is a letter or number
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
2014-05-24 05:24:50 -05:00
|
|
|
|
pub fn is_alphanumeric(&self) -> bool {
|
2014-09-17 12:47:05 -05:00
|
|
|
|
self.is_alphabetic() || self.is_digit()
|
2013-11-22 10:38:50 -06:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Check if the character is a space or horizontal tab
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "likely to be removed"]
|
2013-11-22 10:38:50 -06:00
|
|
|
|
pub fn is_blank(&self) -> bool {
|
2014-08-06 01:02:50 -05:00
|
|
|
|
self.chr == b' ' || self.chr == b'\t'
|
2013-11-22 10:38:50 -06:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Check if the character is a control character
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
2013-11-22 10:38:50 -06:00
|
|
|
|
pub fn is_control(&self) -> bool {
|
2013-11-26 20:13:25 -06:00
|
|
|
|
self.chr < 0x20 || self.chr == 0x7F
|
2013-11-22 10:38:50 -06:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Checks if the character is printable (except space)
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "unsure about naming, or whether this is needed"]
|
2013-11-22 10:38:50 -06:00
|
|
|
|
pub fn is_graph(&self) -> bool {
|
|
|
|
|
(self.chr - 0x21) < 0x5E
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Checks if the character is printable (including space)
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[unstable = "unsure about naming"]
|
2013-11-22 10:38:50 -06:00
|
|
|
|
pub fn is_print(&self) -> bool {
|
|
|
|
|
(self.chr - 0x20) < 0x5F
|
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
/// Checks if the character is alphabetic and lowercase
|
2014-05-24 05:24:50 -05:00
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
2014-05-24 05:24:50 -05:00
|
|
|
|
pub fn is_lowercase(&self) -> bool {
|
2014-08-06 01:02:50 -05:00
|
|
|
|
(self.chr - b'a') < 26
|
2013-11-22 10:38:50 -06:00
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
/// Checks if the character is alphabetic and uppercase
|
2014-05-24 05:24:50 -05:00
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
2014-05-24 05:24:50 -05:00
|
|
|
|
pub fn is_uppercase(&self) -> bool {
|
2014-08-06 01:02:50 -05:00
|
|
|
|
(self.chr - b'A') < 26
|
2013-11-22 10:38:50 -06:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Checks if the character is punctuation
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
2013-11-22 10:38:50 -06:00
|
|
|
|
pub fn is_punctuation(&self) -> bool {
|
2014-09-17 12:47:05 -05:00
|
|
|
|
self.is_graph() && !self.is_alphanumeric()
|
2013-11-22 10:38:50 -06:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Checks if the character is a valid hex digit
|
|
|
|
|
#[inline]
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[stable]
|
2013-11-22 10:38:50 -06:00
|
|
|
|
pub fn is_hex(&self) -> bool {
|
2014-08-06 01:02:50 -05:00
|
|
|
|
self.is_digit() || ((self.chr | 32u8) - b'a') < 6
|
2013-11-22 10:38:50 -06:00
|
|
|
|
}
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-02-12 13:41:34 -06:00
|
|
|
|
impl<'a> fmt::Show for Ascii {
|
|
|
|
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
|
|
|
|
(self.chr as char).fmt(f)
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2013-04-20 12:39:15 -05:00
|
|
|
|
/// Trait for converting into an ascii type.
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
pub trait AsciiCast<T> {
|
2014-10-09 14:17:22 -05:00
|
|
|
|
/// Convert to an ascii type, panic on non-ASCII input.
|
2013-12-05 14:38:04 -06:00
|
|
|
|
#[inline]
|
|
|
|
|
fn to_ascii(&self) -> T {
|
|
|
|
|
assert!(self.is_ascii());
|
|
|
|
|
unsafe {self.to_ascii_nocheck()}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Convert to an ascii type, return None on non-ASCII input.
|
|
|
|
|
#[inline]
|
|
|
|
|
fn to_ascii_opt(&self) -> Option<T> {
|
|
|
|
|
if self.is_ascii() {
|
|
|
|
|
Some(unsafe { self.to_ascii_nocheck() })
|
|
|
|
|
} else {
|
|
|
|
|
None
|
|
|
|
|
}
|
|
|
|
|
}
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
2013-06-16 04:04:53 -05:00
|
|
|
|
/// Convert to an ascii type, not doing any range asserts
|
|
|
|
|
unsafe fn to_ascii_nocheck(&self) -> T;
|
|
|
|
|
|
2013-04-20 12:39:15 -05:00
|
|
|
|
/// Check if convertible to ascii
|
|
|
|
|
fn is_ascii(&self) -> bool;
|
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2013-12-10 01:16:18 -06:00
|
|
|
|
impl<'a> AsciiCast<&'a[Ascii]> for &'a [u8] {
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2013-12-10 01:16:18 -06:00
|
|
|
|
unsafe fn to_ascii_nocheck(&self) -> &'a[Ascii] {
|
core: Remove the cast module
This commit revisits the `cast` module in libcore and libstd, and scrutinizes
all functions inside of it. The result was to remove the `cast` module entirely,
folding all functionality into the `mem` module. Specifically, this is the fate
of each function in the `cast` module.
* transmute - This function was moved to `mem`, but it is now marked as
#[unstable]. This is due to planned changes to the `transmute`
function and how it can be invoked (see the #[unstable] comment).
For more information, see RFC 5 and #12898
* transmute_copy - This function was moved to `mem`, with clarification that is
is not an error to invoke it with T/U that are different
sizes, but rather that it is strongly discouraged. This
function is now #[stable]
* forget - This function was moved to `mem` and marked #[stable]
* bump_box_refcount - This function was removed due to the deprecation of
managed boxes as well as its questionable utility.
* transmute_mut - This function was previously deprecated, and removed as part
of this commit.
* transmute_mut_unsafe - This function doesn't serve much of a purpose when it
can be achieved with an `as` in safe code, so it was
removed.
* transmute_lifetime - This function was removed because it is likely a strong
indication that code is incorrect in the first place.
* transmute_mut_lifetime - This function was removed for the same reasons as
`transmute_lifetime`
* copy_lifetime - This function was moved to `mem`, but it is marked
`#[unstable]` now due to the likelihood of being removed in
the future if it is found to not be very useful.
* copy_mut_lifetime - This function was also moved to `mem`, but had the same
treatment as `copy_lifetime`.
* copy_lifetime_vec - This function was removed because it is not used today,
and its existence is not necessary with DST
(copy_lifetime will suffice).
In summary, the cast module was stripped down to these functions, and then the
functions were moved to the `mem` module.
transmute - #[unstable]
transmute_copy - #[stable]
forget - #[stable]
copy_lifetime - #[unstable]
copy_mut_lifetime - #[unstable]
[breaking-change]
2014-05-09 12:34:51 -05:00
|
|
|
|
mem::transmute(*self)
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
fn is_ascii(&self) -> bool {
|
2013-08-03 11:45:23 -05:00
|
|
|
|
for b in self.iter() {
|
2013-04-20 12:39:15 -05:00
|
|
|
|
if !b.is_ascii() { return false; }
|
|
|
|
|
}
|
|
|
|
|
true
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2013-12-10 01:16:18 -06:00
|
|
|
|
impl<'a> AsciiCast<&'a [Ascii]> for &'a str {
|
2013-08-04 15:22:56 -05:00
|
|
|
|
#[inline]
|
2013-12-10 01:16:18 -06:00
|
|
|
|
unsafe fn to_ascii_nocheck(&self) -> &'a [Ascii] {
|
core: Remove the cast module
This commit revisits the `cast` module in libcore and libstd, and scrutinizes
all functions inside of it. The result was to remove the `cast` module entirely,
folding all functionality into the `mem` module. Specifically, this is the fate
of each function in the `cast` module.
* transmute - This function was moved to `mem`, but it is now marked as
#[unstable]. This is due to planned changes to the `transmute`
function and how it can be invoked (see the #[unstable] comment).
For more information, see RFC 5 and #12898
* transmute_copy - This function was moved to `mem`, with clarification that is
is not an error to invoke it with T/U that are different
sizes, but rather that it is strongly discouraged. This
function is now #[stable]
* forget - This function was moved to `mem` and marked #[stable]
* bump_box_refcount - This function was removed due to the deprecation of
managed boxes as well as its questionable utility.
* transmute_mut - This function was previously deprecated, and removed as part
of this commit.
* transmute_mut_unsafe - This function doesn't serve much of a purpose when it
can be achieved with an `as` in safe code, so it was
removed.
* transmute_lifetime - This function was removed because it is likely a strong
indication that code is incorrect in the first place.
* transmute_mut_lifetime - This function was removed for the same reasons as
`transmute_lifetime`
* copy_lifetime - This function was moved to `mem`, but it is marked
`#[unstable]` now due to the likelihood of being removed in
the future if it is found to not be very useful.
* copy_mut_lifetime - This function was also moved to `mem`, but had the same
treatment as `copy_lifetime`.
* copy_lifetime_vec - This function was removed because it is not used today,
and its existence is not necessary with DST
(copy_lifetime will suffice).
In summary, the cast module was stripped down to these functions, and then the
functions were moved to the `mem` module.
transmute - #[unstable]
transmute_copy - #[stable]
forget - #[stable]
copy_lifetime - #[unstable]
copy_mut_lifetime - #[unstable]
[breaking-change]
2014-05-09 12:34:51 -05:00
|
|
|
|
mem::transmute(*self)
|
2013-08-04 15:22:56 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
fn is_ascii(&self) -> bool {
|
2013-11-23 04:18:51 -06:00
|
|
|
|
self.bytes().all(|b| b.is_ascii())
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
impl AsciiCast<Ascii> for u8 {
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2013-06-16 04:04:53 -05:00
|
|
|
|
unsafe fn to_ascii_nocheck(&self) -> Ascii {
|
2013-04-20 12:39:15 -05:00
|
|
|
|
Ascii{ chr: *self }
|
|
|
|
|
}
|
|
|
|
|
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
fn is_ascii(&self) -> bool {
|
|
|
|
|
*self & 128 == 0u8
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
impl AsciiCast<Ascii> for char {
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2013-06-16 04:04:53 -05:00
|
|
|
|
unsafe fn to_ascii_nocheck(&self) -> Ascii {
|
2013-04-20 12:39:15 -05:00
|
|
|
|
Ascii{ chr: *self as u8 }
|
|
|
|
|
}
|
|
|
|
|
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
fn is_ascii(&self) -> bool {
|
2013-09-03 18:24:12 -05:00
|
|
|
|
*self as u32 - ('\x7F' as u32 & *self as u32) == 0
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Trait for copyless casting to an ascii vector.
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
pub trait OwnedAsciiCast {
|
2013-12-05 14:38:04 -06:00
|
|
|
|
/// Check if convertible to ascii
|
|
|
|
|
fn is_ascii(&self) -> bool;
|
|
|
|
|
|
2014-11-08 09:47:51 -06:00
|
|
|
|
/// Take ownership and cast to an ascii vector.
|
|
|
|
|
/// # Panics
|
|
|
|
|
///
|
|
|
|
|
/// Panic on non-ASCII input.
|
2013-12-05 14:38:04 -06:00
|
|
|
|
#[inline]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
fn into_ascii(self) -> Vec<Ascii> {
|
2013-12-05 14:38:04 -06:00
|
|
|
|
assert!(self.is_ascii());
|
|
|
|
|
unsafe {self.into_ascii_nocheck()}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Take ownership and cast to an ascii vector. Return None on non-ASCII input.
|
|
|
|
|
#[inline]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
fn into_ascii_opt(self) -> Option<Vec<Ascii>> {
|
2013-12-05 14:38:04 -06:00
|
|
|
|
if self.is_ascii() {
|
|
|
|
|
Some(unsafe { self.into_ascii_nocheck() })
|
|
|
|
|
} else {
|
|
|
|
|
None
|
|
|
|
|
}
|
|
|
|
|
}
|
2013-06-16 04:04:53 -05:00
|
|
|
|
|
2013-11-07 01:59:40 -06:00
|
|
|
|
/// Take ownership and cast to an ascii vector.
|
2013-06-16 04:04:53 -05:00
|
|
|
|
/// Does not perform validation checks.
|
2014-05-04 00:02:59 -05:00
|
|
|
|
unsafe fn into_ascii_nocheck(self) -> Vec<Ascii>;
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2014-05-22 18:57:53 -05:00
|
|
|
|
impl OwnedAsciiCast for String {
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2013-12-05 14:38:04 -06:00
|
|
|
|
fn is_ascii(&self) -> bool {
|
|
|
|
|
self.as_slice().is_ascii()
|
2013-06-16 04:04:53 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-08-04 15:22:56 -05:00
|
|
|
|
#[inline]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
unsafe fn into_ascii_nocheck(self) -> Vec<Ascii> {
|
2014-10-27 10:04:55 -05:00
|
|
|
|
self.into_bytes().into_ascii_nocheck()
|
2014-05-04 00:02:59 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
impl OwnedAsciiCast for Vec<u8> {
|
|
|
|
|
#[inline]
|
|
|
|
|
fn is_ascii(&self) -> bool {
|
|
|
|
|
self.as_slice().is_ascii()
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
|
unsafe fn into_ascii_nocheck(self) -> Vec<Ascii> {
|
2014-10-27 11:11:07 -05:00
|
|
|
|
let v = Vec::from_raw_parts(self.as_ptr() as *mut Ascii,
|
|
|
|
|
self.len(),
|
|
|
|
|
self.capacity());
|
2014-10-27 10:04:55 -05:00
|
|
|
|
|
|
|
|
|
// We forget `self` to avoid freeing it at the end of the scope
|
|
|
|
|
// Otherwise, the returned `Vec` would point to freed memory
|
|
|
|
|
mem::forget(self);
|
|
|
|
|
v
|
2013-08-04 15:22:56 -05:00
|
|
|
|
}
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-11-07 01:59:40 -06:00
|
|
|
|
/// Trait for converting an ascii type to a string. Needed to convert
|
|
|
|
|
/// `&[Ascii]` to `&str`.
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2014-10-23 10:43:18 -05:00
|
|
|
|
pub trait AsciiStr for Sized? {
|
2013-04-20 12:39:15 -05:00
|
|
|
|
/// Convert to a string.
|
2013-11-07 01:59:40 -06:00
|
|
|
|
fn as_str_ascii<'a>(&'a self) -> &'a str;
|
2013-04-22 14:42:25 -05:00
|
|
|
|
|
2014-10-11 05:50:35 -05:00
|
|
|
|
/// Deprecated: use `to_lowercase`
|
|
|
|
|
#[deprecated="renamed `to_lowercase`"]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
fn to_lower(&self) -> Vec<Ascii>;
|
2013-04-22 14:42:25 -05:00
|
|
|
|
|
2014-10-11 05:50:35 -05:00
|
|
|
|
/// Convert to vector representing a lower cased ascii string.
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[deprecated = "use iterators instead"]
|
2014-10-11 05:50:35 -05:00
|
|
|
|
fn to_lowercase(&self) -> Vec<Ascii>;
|
|
|
|
|
|
|
|
|
|
/// Deprecated: use `to_uppercase`
|
|
|
|
|
#[deprecated="renamed `to_uppercase`"]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
fn to_upper(&self) -> Vec<Ascii>;
|
2013-04-22 14:42:25 -05:00
|
|
|
|
|
2014-10-11 05:50:35 -05:00
|
|
|
|
/// Convert to vector representing a upper cased ascii string.
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[deprecated = "use iterators instead"]
|
2014-10-11 05:50:35 -05:00
|
|
|
|
fn to_uppercase(&self) -> Vec<Ascii>;
|
|
|
|
|
|
2013-11-07 01:59:40 -06:00
|
|
|
|
/// Compares two Ascii strings ignoring case.
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[deprecated = "use iterators instead"]
|
2014-10-23 10:43:18 -05:00
|
|
|
|
fn eq_ignore_case(&self, other: &[Ascii]) -> bool;
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2014-10-23 10:43:18 -05:00
|
|
|
|
impl AsciiStr for [Ascii] {
|
2013-08-04 15:22:56 -05:00
|
|
|
|
#[inline]
|
2013-11-07 01:59:40 -06:00
|
|
|
|
fn as_str_ascii<'a>(&'a self) -> &'a str {
|
2014-10-23 10:43:18 -05:00
|
|
|
|
unsafe { mem::transmute(self) }
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
2013-04-22 14:42:25 -05:00
|
|
|
|
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
fn to_lower(&self) -> Vec<Ascii> {
|
2014-10-11 05:50:35 -05:00
|
|
|
|
self.to_lowercase()
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
|
fn to_lowercase(&self) -> Vec<Ascii> {
|
2014-09-17 12:47:05 -05:00
|
|
|
|
self.iter().map(|a| a.to_lowercase()).collect()
|
2013-04-22 14:42:25 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
fn to_upper(&self) -> Vec<Ascii> {
|
2014-10-11 05:50:35 -05:00
|
|
|
|
self.to_uppercase()
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
|
fn to_uppercase(&self) -> Vec<Ascii> {
|
2014-09-17 12:47:05 -05:00
|
|
|
|
self.iter().map(|a| a.to_uppercase()).collect()
|
2013-04-22 14:42:25 -05:00
|
|
|
|
}
|
2013-06-16 04:04:53 -05:00
|
|
|
|
|
2013-06-18 16:45:18 -05:00
|
|
|
|
#[inline]
|
2014-10-23 10:43:18 -05:00
|
|
|
|
fn eq_ignore_case(&self, other: &[Ascii]) -> bool {
|
2013-11-20 16:17:12 -06:00
|
|
|
|
self.iter().zip(other.iter()).all(|(&a, &b)| a.eq_ignore_case(b))
|
2013-06-16 04:04:53 -05:00
|
|
|
|
}
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-11-15 05:09:26 -06:00
|
|
|
|
impl IntoString for Vec<Ascii> {
|
2014-03-17 01:30:27 -05:00
|
|
|
|
#[inline]
|
2014-06-21 05:39:03 -05:00
|
|
|
|
fn into_string(self) -> String {
|
2014-11-20 12:11:15 -06:00
|
|
|
|
unsafe { String::from_utf8_unchecked(self.into_bytes()) }
|
2014-03-17 01:30:27 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2014-05-04 00:02:59 -05:00
|
|
|
|
/// Trait to convert to an owned byte vector by consuming self
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2013-12-14 08:04:22 -06:00
|
|
|
|
pub trait IntoBytes {
|
2014-05-04 00:02:59 -05:00
|
|
|
|
/// Converts to an owned byte vector by consuming self
|
|
|
|
|
fn into_bytes(self) -> Vec<u8>;
|
2013-06-16 04:04:53 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "may be replaced by generic conversion traits"]
|
2014-05-04 00:02:59 -05:00
|
|
|
|
impl IntoBytes for Vec<Ascii> {
|
|
|
|
|
fn into_bytes(self) -> Vec<u8> {
|
2014-10-27 10:04:55 -05:00
|
|
|
|
unsafe {
|
2014-10-27 11:11:07 -05:00
|
|
|
|
let v = Vec::from_raw_parts(self.as_ptr() as *mut u8,
|
|
|
|
|
self.len(),
|
|
|
|
|
self.capacity());
|
2014-10-27 10:04:55 -05:00
|
|
|
|
|
|
|
|
|
// We forget `self` to avoid freeing it at the end of the scope
|
|
|
|
|
// Otherwise, the returned `Vec` would point to freed memory
|
|
|
|
|
mem::forget(self);
|
|
|
|
|
v
|
|
|
|
|
}
|
2013-06-16 04:04:53 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2014-07-18 08:53:29 -05:00
|
|
|
|
|
2013-09-08 18:45:14 -05:00
|
|
|
|
/// Extension methods for ASCII-subset only operations on owned strings
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "would prefer to do this in a more general way"]
|
2014-07-18 08:53:29 -05:00
|
|
|
|
pub trait OwnedAsciiExt {
|
2013-08-10 21:21:31 -05:00
|
|
|
|
/// Convert the string to ASCII upper case:
|
|
|
|
|
/// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
|
|
|
|
|
/// but non-ASCII letters are unchanged.
|
2014-07-18 08:53:29 -05:00
|
|
|
|
fn into_ascii_upper(self) -> Self;
|
2013-08-10 21:21:31 -05:00
|
|
|
|
|
|
|
|
|
/// Convert the string to ASCII lower case:
|
|
|
|
|
/// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z',
|
|
|
|
|
/// but non-ASCII letters are unchanged.
|
2014-07-18 08:53:29 -05:00
|
|
|
|
fn into_ascii_lower(self) -> Self;
|
2013-09-08 18:45:14 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// Extension methods for ASCII-subset only operations on string slices
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "would prefer to do this in a more general way"]
|
2014-10-23 10:43:18 -05:00
|
|
|
|
pub trait AsciiExt<T> for Sized? {
|
2013-09-08 18:45:14 -05:00
|
|
|
|
/// Makes a copy of the string in ASCII upper case:
|
|
|
|
|
/// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
|
|
|
|
|
/// but non-ASCII letters are unchanged.
|
2014-07-18 08:53:29 -05:00
|
|
|
|
fn to_ascii_upper(&self) -> T;
|
2013-09-08 18:45:14 -05:00
|
|
|
|
|
|
|
|
|
/// Makes a copy of the string in ASCII lower case:
|
|
|
|
|
/// ASCII letters 'A' to 'Z' are mapped to 'a' to 'z',
|
|
|
|
|
/// but non-ASCII letters are unchanged.
|
2014-07-18 08:53:29 -05:00
|
|
|
|
fn to_ascii_lower(&self) -> T;
|
2013-08-10 21:21:31 -05:00
|
|
|
|
|
|
|
|
|
/// Check that two strings are an ASCII case-insensitive match.
|
|
|
|
|
/// Same as `to_ascii_lower(a) == to_ascii_lower(b)`,
|
|
|
|
|
/// but without allocating and copying temporary strings.
|
2014-10-23 10:43:18 -05:00
|
|
|
|
fn eq_ignore_ascii_case(&self, other: &Self) -> bool;
|
2013-08-02 15:39:57 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "would prefer to do this in a more general way"]
|
2014-10-23 10:43:18 -05:00
|
|
|
|
impl AsciiExt<String> for str {
|
2013-08-10 21:21:31 -05:00
|
|
|
|
#[inline]
|
2014-05-22 18:57:53 -05:00
|
|
|
|
fn to_ascii_upper(&self) -> String {
|
2014-07-18 08:53:29 -05:00
|
|
|
|
// Vec<u8>::to_ascii_upper() preserves the UTF-8 invariant.
|
2014-11-20 12:11:15 -06:00
|
|
|
|
unsafe { String::from_utf8_unchecked(self.as_bytes().to_ascii_upper()) }
|
2013-08-10 21:21:31 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[inline]
|
2014-05-22 18:57:53 -05:00
|
|
|
|
fn to_ascii_lower(&self) -> String {
|
2014-07-18 08:53:29 -05:00
|
|
|
|
// Vec<u8>::to_ascii_lower() preserves the UTF-8 invariant.
|
2014-11-20 12:11:15 -06:00
|
|
|
|
unsafe { String::from_utf8_unchecked(self.as_bytes().to_ascii_lower()) }
|
2013-08-10 21:21:31 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
|
fn eq_ignore_ascii_case(&self, other: &str) -> bool {
|
2014-07-18 08:53:29 -05:00
|
|
|
|
self.as_bytes().eq_ignore_ascii_case(other.as_bytes())
|
2013-08-10 21:21:31 -05:00
|
|
|
|
}
|
2013-08-02 15:39:57 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "would prefer to do this in a more general way"]
|
2014-07-18 08:53:29 -05:00
|
|
|
|
impl OwnedAsciiExt for String {
|
2013-09-08 18:45:14 -05:00
|
|
|
|
#[inline]
|
2014-05-22 18:57:53 -05:00
|
|
|
|
fn into_ascii_upper(self) -> String {
|
2014-07-18 08:53:29 -05:00
|
|
|
|
// Vec<u8>::into_ascii_upper() preserves the UTF-8 invariant.
|
2014-11-20 12:11:15 -06:00
|
|
|
|
unsafe { String::from_utf8_unchecked(self.into_bytes().into_ascii_upper()) }
|
2013-09-08 18:45:14 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[inline]
|
2014-05-22 18:57:53 -05:00
|
|
|
|
fn into_ascii_lower(self) -> String {
|
2014-07-18 08:53:29 -05:00
|
|
|
|
// Vec<u8>::into_ascii_lower() preserves the UTF-8 invariant.
|
2014-11-20 12:11:15 -06:00
|
|
|
|
unsafe { String::from_utf8_unchecked(self.into_bytes().into_ascii_lower()) }
|
2013-09-08 18:45:14 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "would prefer to do this in a more general way"]
|
2014-10-23 10:43:18 -05:00
|
|
|
|
impl AsciiExt<Vec<u8>> for [u8] {
|
2014-07-18 08:53:29 -05:00
|
|
|
|
#[inline]
|
|
|
|
|
fn to_ascii_upper(&self) -> Vec<u8> {
|
|
|
|
|
self.iter().map(|&byte| ASCII_UPPER_MAP[byte as uint]).collect()
|
|
|
|
|
}
|
2013-09-08 18:45:14 -05:00
|
|
|
|
|
2014-07-18 08:53:29 -05:00
|
|
|
|
#[inline]
|
|
|
|
|
fn to_ascii_lower(&self) -> Vec<u8> {
|
|
|
|
|
self.iter().map(|&byte| ASCII_LOWER_MAP[byte as uint]).collect()
|
2013-08-02 15:39:57 -05:00
|
|
|
|
}
|
2013-09-08 18:45:14 -05:00
|
|
|
|
|
2014-07-18 08:53:29 -05:00
|
|
|
|
#[inline]
|
|
|
|
|
fn eq_ignore_ascii_case(&self, other: &[u8]) -> bool {
|
|
|
|
|
self.len() == other.len() &&
|
|
|
|
|
self.iter().zip(other.iter()).all(
|
|
|
|
|
|(byte_self, byte_other)| {
|
|
|
|
|
ASCII_LOWER_MAP[*byte_self as uint] ==
|
|
|
|
|
ASCII_LOWER_MAP[*byte_other as uint]
|
|
|
|
|
})
|
|
|
|
|
}
|
2013-09-08 18:45:14 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[experimental = "would prefer to do this in a more general way"]
|
2014-07-18 08:53:29 -05:00
|
|
|
|
impl OwnedAsciiExt for Vec<u8> {
|
|
|
|
|
#[inline]
|
|
|
|
|
fn into_ascii_upper(mut self) -> Vec<u8> {
|
2014-09-14 22:27:36 -05:00
|
|
|
|
for byte in self.iter_mut() {
|
2014-07-18 08:53:29 -05:00
|
|
|
|
*byte = ASCII_UPPER_MAP[*byte as uint];
|
|
|
|
|
}
|
|
|
|
|
self
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[inline]
|
|
|
|
|
fn into_ascii_lower(mut self) -> Vec<u8> {
|
2014-09-14 22:27:36 -05:00
|
|
|
|
for byte in self.iter_mut() {
|
2014-07-18 08:53:29 -05:00
|
|
|
|
*byte = ASCII_LOWER_MAP[*byte as uint];
|
|
|
|
|
}
|
|
|
|
|
self
|
2014-05-04 00:02:59 -05:00
|
|
|
|
}
|
2013-08-02 15:39:57 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-10-27 11:13:51 -05:00
|
|
|
|
/// Returns a 'default' ASCII and C++11-like literal escape of a `u8`
|
|
|
|
|
///
|
|
|
|
|
/// The default is chosen with a bias toward producing literals that are
|
|
|
|
|
/// legal in a variety of languages, including C++11 and similar C-family
|
|
|
|
|
/// languages. The exact rules are:
|
|
|
|
|
///
|
|
|
|
|
/// - Tab, CR and LF are escaped as '\t', '\r' and '\n' respectively.
|
|
|
|
|
/// - Single-quote, double-quote and backslash chars are backslash-escaped.
|
|
|
|
|
/// - Any other chars in the range [0x20,0x7e] are not escaped.
|
|
|
|
|
/// - Any other chars are given hex escapes.
|
|
|
|
|
/// - Unicode escapes are never generated by this function.
|
2014-11-21 14:00:05 -06:00
|
|
|
|
#[unstable = "needs to be updated to use an iterator"]
|
2014-10-27 11:13:51 -05:00
|
|
|
|
pub fn escape_default(c: u8, f: |u8|) {
|
|
|
|
|
match c {
|
|
|
|
|
b'\t' => { f(b'\\'); f(b't'); }
|
|
|
|
|
b'\r' => { f(b'\\'); f(b'r'); }
|
|
|
|
|
b'\n' => { f(b'\\'); f(b'n'); }
|
|
|
|
|
b'\\' => { f(b'\\'); f(b'\\'); }
|
|
|
|
|
b'\'' => { f(b'\\'); f(b'\''); }
|
|
|
|
|
b'"' => { f(b'\\'); f(b'"'); }
|
|
|
|
|
b'\x20' ... b'\x7e' => { f(c); }
|
|
|
|
|
_ => {
|
|
|
|
|
f(b'\\');
|
|
|
|
|
f(b'x');
|
|
|
|
|
for &offset in [4u, 0u].iter() {
|
|
|
|
|
match ((c as i32) >> offset) & 0xf {
|
|
|
|
|
i @ 0 ... 9 => f(b'0' + (i as u8)),
|
|
|
|
|
i => f(b'a' + (i as u8 - 10)),
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
2014-07-18 08:53:29 -05:00
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
static ASCII_LOWER_MAP: [u8, ..256] = [
|
2013-08-02 15:39:57 -05:00
|
|
|
|
0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
|
|
|
|
|
0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
|
|
|
|
|
0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
|
|
|
|
|
0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
|
2014-07-18 08:11:40 -05:00
|
|
|
|
b' ', b'!', b'"', b'#', b'$', b'%', b'&', b'\'',
|
|
|
|
|
b'(', b')', b'*', b'+', b',', b'-', b'.', b'/',
|
|
|
|
|
b'0', b'1', b'2', b'3', b'4', b'5', b'6', b'7',
|
|
|
|
|
b'8', b'9', b':', b';', b'<', b'=', b'>', b'?',
|
|
|
|
|
b'@',
|
|
|
|
|
|
|
|
|
|
b'a', b'b', b'c', b'd', b'e', b'f', b'g',
|
|
|
|
|
b'h', b'i', b'j', b'k', b'l', b'm', b'n', b'o',
|
|
|
|
|
b'p', b'q', b'r', b's', b't', b'u', b'v', b'w',
|
|
|
|
|
b'x', b'y', b'z',
|
|
|
|
|
|
|
|
|
|
b'[', b'\\', b']', b'^', b'_',
|
|
|
|
|
b'`', b'a', b'b', b'c', b'd', b'e', b'f', b'g',
|
|
|
|
|
b'h', b'i', b'j', b'k', b'l', b'm', b'n', b'o',
|
|
|
|
|
b'p', b'q', b'r', b's', b't', b'u', b'v', b'w',
|
|
|
|
|
b'x', b'y', b'z', b'{', b'|', b'}', b'~', 0x7f,
|
2013-08-02 15:39:57 -05:00
|
|
|
|
0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
|
|
|
|
|
0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
|
|
|
|
|
0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
|
|
|
|
|
0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
|
|
|
|
|
0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
|
|
|
|
|
0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
|
|
|
|
|
0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
|
|
|
|
|
0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
|
|
|
|
|
0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
|
|
|
|
|
0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
|
|
|
|
|
0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
|
|
|
|
|
0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
|
|
|
|
|
0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
|
|
|
|
|
0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
|
|
|
|
|
0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
|
|
|
|
|
0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
|
|
|
|
|
];
|
|
|
|
|
|
2014-11-21 14:00:05 -06:00
|
|
|
|
static ASCII_UPPER_MAP: [u8, ..256] = [
|
2013-08-02 15:39:57 -05:00
|
|
|
|
0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
|
|
|
|
|
0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
|
|
|
|
|
0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
|
|
|
|
|
0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
|
2014-07-18 08:11:40 -05:00
|
|
|
|
b' ', b'!', b'"', b'#', b'$', b'%', b'&', b'\'',
|
|
|
|
|
b'(', b')', b'*', b'+', b',', b'-', b'.', b'/',
|
|
|
|
|
b'0', b'1', b'2', b'3', b'4', b'5', b'6', b'7',
|
|
|
|
|
b'8', b'9', b':', b';', b'<', b'=', b'>', b'?',
|
|
|
|
|
b'@', b'A', b'B', b'C', b'D', b'E', b'F', b'G',
|
|
|
|
|
b'H', b'I', b'J', b'K', b'L', b'M', b'N', b'O',
|
|
|
|
|
b'P', b'Q', b'R', b'S', b'T', b'U', b'V', b'W',
|
|
|
|
|
b'X', b'Y', b'Z', b'[', b'\\', b']', b'^', b'_',
|
|
|
|
|
b'`',
|
|
|
|
|
|
|
|
|
|
b'A', b'B', b'C', b'D', b'E', b'F', b'G',
|
|
|
|
|
b'H', b'I', b'J', b'K', b'L', b'M', b'N', b'O',
|
|
|
|
|
b'P', b'Q', b'R', b'S', b'T', b'U', b'V', b'W',
|
|
|
|
|
b'X', b'Y', b'Z',
|
|
|
|
|
|
|
|
|
|
b'{', b'|', b'}', b'~', 0x7f,
|
2013-08-02 15:39:57 -05:00
|
|
|
|
0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
|
|
|
|
|
0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
|
|
|
|
|
0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
|
|
|
|
|
0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
|
|
|
|
|
0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
|
|
|
|
|
0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
|
|
|
|
|
0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
|
|
|
|
|
0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
|
|
|
|
|
0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
|
|
|
|
|
0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
|
|
|
|
|
0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
|
|
|
|
|
0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
|
|
|
|
|
0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
|
|
|
|
|
0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
|
|
|
|
|
0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
|
|
|
|
|
0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
|
|
|
|
|
];
|
|
|
|
|
|
|
|
|
|
|
2013-04-23 18:38:49 -05:00
|
|
|
|
#[cfg(test)]
|
2013-04-20 12:39:15 -05:00
|
|
|
|
mod tests {
|
2014-01-07 00:33:37 -06:00
|
|
|
|
use prelude::*;
|
2013-04-20 12:39:15 -05:00
|
|
|
|
use super::*;
|
2013-09-03 18:24:12 -05:00
|
|
|
|
use char::from_u32;
|
2014-11-02 19:04:32 -06:00
|
|
|
|
use str::StrPrelude;
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
|
|
|
|
macro_rules! v2ascii (
|
2014-02-28 03:23:06 -06:00
|
|
|
|
( [$($e:expr),*]) => (&[$(Ascii{chr:$e}),*]);
|
2013-12-05 14:38:04 -06:00
|
|
|
|
(&[$($e:expr),*]) => (&[$(Ascii{chr:$e}),*]);
|
2013-04-20 12:39:15 -05:00
|
|
|
|
)
|
|
|
|
|
|
2014-03-17 01:30:27 -05:00
|
|
|
|
macro_rules! vec2ascii (
|
2014-10-15 01:05:01 -05:00
|
|
|
|
($($e:expr),*) => ([$(Ascii{chr:$e}),*].to_vec());
|
2014-03-17 01:30:27 -05:00
|
|
|
|
)
|
|
|
|
|
|
2013-04-20 12:39:15 -05:00
|
|
|
|
#[test]
|
|
|
|
|
fn test_ascii() {
|
|
|
|
|
assert_eq!(65u8.to_ascii().to_byte(), 65u8);
|
|
|
|
|
assert_eq!(65u8.to_ascii().to_char(), 'A');
|
|
|
|
|
assert_eq!('A'.to_ascii().to_char(), 'A');
|
|
|
|
|
assert_eq!('A'.to_ascii().to_byte(), 65u8);
|
2013-04-20 15:50:50 -05:00
|
|
|
|
|
2014-10-11 05:50:35 -05:00
|
|
|
|
assert_eq!('A'.to_ascii().to_lowercase().to_char(), 'a');
|
|
|
|
|
assert_eq!('Z'.to_ascii().to_lowercase().to_char(), 'z');
|
|
|
|
|
assert_eq!('a'.to_ascii().to_uppercase().to_char(), 'A');
|
|
|
|
|
assert_eq!('z'.to_ascii().to_uppercase().to_char(), 'Z');
|
2013-04-20 15:50:50 -05:00
|
|
|
|
|
2014-10-11 05:50:35 -05:00
|
|
|
|
assert_eq!('@'.to_ascii().to_lowercase().to_char(), '@');
|
|
|
|
|
assert_eq!('['.to_ascii().to_lowercase().to_char(), '[');
|
|
|
|
|
assert_eq!('`'.to_ascii().to_uppercase().to_char(), '`');
|
|
|
|
|
assert_eq!('{'.to_ascii().to_uppercase().to_char(), '{');
|
2013-04-23 04:08:13 -05:00
|
|
|
|
|
2013-11-27 09:54:54 -06:00
|
|
|
|
assert!('0'.to_ascii().is_digit());
|
|
|
|
|
assert!('9'.to_ascii().is_digit());
|
|
|
|
|
assert!(!'/'.to_ascii().is_digit());
|
|
|
|
|
assert!(!':'.to_ascii().is_digit());
|
|
|
|
|
|
|
|
|
|
assert!((0x1fu8).to_ascii().is_control());
|
|
|
|
|
assert!(!' '.to_ascii().is_control());
|
|
|
|
|
assert!((0x7fu8).to_ascii().is_control());
|
|
|
|
|
|
2013-11-23 04:18:51 -06:00
|
|
|
|
assert!("banana".chars().all(|c| c.is_ascii()));
|
|
|
|
|
assert!(!"ประเทศไทย中华Việt Nam".chars().all(|c| c.is_ascii()));
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
fn test_ascii_vec() {
|
2014-01-15 13:39:08 -06:00
|
|
|
|
let test = &[40u8, 32u8, 59u8];
|
2014-08-04 07:19:02 -05:00
|
|
|
|
let b: &[_] = v2ascii!([40, 32, 59]);
|
|
|
|
|
assert_eq!(test.to_ascii(), b);
|
|
|
|
|
assert_eq!("( ;".to_ascii(), b);
|
2014-06-06 12:27:49 -05:00
|
|
|
|
let v = vec![40u8, 32u8, 59u8];
|
2014-11-27 13:43:55 -06:00
|
|
|
|
assert_eq!(v.to_ascii(), b);
|
|
|
|
|
assert_eq!("( ;".to_string().to_ascii(), b);
|
2013-04-22 14:42:25 -05:00
|
|
|
|
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!("abCDef&?#".to_ascii().to_lowercase().into_string(), "abcdef&?#");
|
|
|
|
|
assert_eq!("abCDef&?#".to_ascii().to_uppercase().into_string(), "ABCDEF&?#");
|
2013-04-23 04:08:13 -05:00
|
|
|
|
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!("".to_ascii().to_lowercase().into_string(), "");
|
|
|
|
|
assert_eq!("YMCA".to_ascii().to_lowercase().into_string(), "ymca");
|
2014-10-11 05:50:35 -05:00
|
|
|
|
let mixed = "abcDEFxyz:.;".to_ascii();
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!(mixed.to_uppercase().into_string(), "ABCDEFXYZ:.;");
|
2013-04-23 04:08:13 -05:00
|
|
|
|
|
2013-06-16 04:04:53 -05:00
|
|
|
|
assert!("aBcDeF&?#".to_ascii().eq_ignore_case("AbCdEf&?#".to_ascii()));
|
|
|
|
|
|
2013-04-23 04:08:13 -05:00
|
|
|
|
assert!("".is_ascii());
|
|
|
|
|
assert!("a".is_ascii());
|
|
|
|
|
assert!(!"\u2009".is_ascii());
|
|
|
|
|
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-03-17 01:30:27 -05:00
|
|
|
|
#[test]
|
|
|
|
|
fn test_ascii_vec_ng() {
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!("abCDef&?#".to_ascii().to_lowercase().into_string(), "abcdef&?#");
|
|
|
|
|
assert_eq!("abCDef&?#".to_ascii().to_uppercase().into_string(), "ABCDEF&?#");
|
|
|
|
|
assert_eq!("".to_ascii().to_lowercase().into_string(), "");
|
|
|
|
|
assert_eq!("YMCA".to_ascii().to_lowercase().into_string(), "ymca");
|
2014-10-11 05:50:35 -05:00
|
|
|
|
let mixed = "abcDEFxyz:.;".to_ascii();
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!(mixed.to_uppercase().into_string(), "ABCDEFXYZ:.;");
|
2014-03-17 01:30:27 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-04-20 12:39:15 -05:00
|
|
|
|
#[test]
|
|
|
|
|
fn test_owned_ascii_vec() {
|
2014-05-25 05:17:19 -05:00
|
|
|
|
assert_eq!(("( ;".to_string()).into_ascii(), vec2ascii![40, 32, 59]);
|
2014-06-06 12:27:49 -05:00
|
|
|
|
assert_eq!((vec![40u8, 32u8, 59u8]).into_ascii(), vec2ascii![40, 32, 59]);
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
2013-11-07 01:59:40 -06:00
|
|
|
|
fn test_ascii_as_str() {
|
|
|
|
|
let v = v2ascii!([40, 32, 59]);
|
|
|
|
|
assert_eq!(v.as_str_ascii(), "( ;");
|
|
|
|
|
}
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
|
|
|
|
#[test]
|
2014-06-21 05:39:03 -05:00
|
|
|
|
fn test_ascii_into_string() {
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!(vec2ascii![40, 32, 59].into_string(), "( ;");
|
|
|
|
|
assert_eq!(vec2ascii!(40, 32, 59).into_string(), "( ;");
|
2013-06-16 04:04:53 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
fn test_ascii_to_bytes() {
|
2014-05-04 00:02:59 -05:00
|
|
|
|
assert_eq!(vec2ascii![40, 32, 59].into_bytes(), vec![40u8, 32u8, 59u8]);
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test] #[should_fail]
|
2014-10-09 14:17:22 -05:00
|
|
|
|
fn test_ascii_vec_panic_u8_slice() { (&[127u8, 128u8, 255u8]).to_ascii(); }
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
|
|
|
|
#[test] #[should_fail]
|
2014-10-09 14:17:22 -05:00
|
|
|
|
fn test_ascii_vec_panic_str_slice() { "zoä华".to_ascii(); }
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
|
|
|
|
#[test] #[should_fail]
|
2014-10-09 14:17:22 -05:00
|
|
|
|
fn test_ascii_panic_u8_slice() { 255u8.to_ascii(); }
|
2013-04-20 12:39:15 -05:00
|
|
|
|
|
|
|
|
|
#[test] #[should_fail]
|
2014-10-09 14:17:22 -05:00
|
|
|
|
fn test_ascii_panic_char_slice() { 'λ'.to_ascii(); }
|
2013-08-02 15:39:57 -05:00
|
|
|
|
|
2014-01-05 12:05:02 -06:00
|
|
|
|
#[test]
|
2013-12-05 14:38:04 -06:00
|
|
|
|
fn test_opt() {
|
|
|
|
|
assert_eq!(65u8.to_ascii_opt(), Some(Ascii { chr: 65u8 }));
|
|
|
|
|
assert_eq!(255u8.to_ascii_opt(), None);
|
|
|
|
|
|
|
|
|
|
assert_eq!('A'.to_ascii_opt(), Some(Ascii { chr: 65u8 }));
|
|
|
|
|
assert_eq!('λ'.to_ascii_opt(), None);
|
|
|
|
|
|
|
|
|
|
assert_eq!("zoä华".to_ascii_opt(), None);
|
|
|
|
|
|
2014-01-15 13:39:08 -06:00
|
|
|
|
let test1 = &[127u8, 128u8, 255u8];
|
|
|
|
|
assert_eq!((test1).to_ascii_opt(), None);
|
2013-12-05 14:38:04 -06:00
|
|
|
|
|
|
|
|
|
let v = [40u8, 32u8, 59u8];
|
2014-08-04 07:19:02 -05:00
|
|
|
|
let v2: &[_] = v2ascii!(&[40, 32, 59]);
|
2014-01-15 13:39:08 -06:00
|
|
|
|
assert_eq!(v.to_ascii_opt(), Some(v2));
|
2013-12-05 14:38:04 -06:00
|
|
|
|
let v = [127u8, 128u8, 255u8];
|
|
|
|
|
assert_eq!(v.to_ascii_opt(), None);
|
|
|
|
|
|
2014-01-15 13:39:08 -06:00
|
|
|
|
let v = "( ;";
|
|
|
|
|
assert_eq!(v.to_ascii_opt(), Some(v2));
|
2013-12-05 14:38:04 -06:00
|
|
|
|
assert_eq!("zoä华".to_ascii_opt(), None);
|
|
|
|
|
|
2014-05-04 00:02:59 -05:00
|
|
|
|
assert_eq!((vec![40u8, 32u8, 59u8]).into_ascii_opt(), Some(vec2ascii![40, 32, 59]));
|
|
|
|
|
assert_eq!((vec![127u8, 128u8, 255u8]).into_ascii_opt(), None);
|
2013-12-05 14:38:04 -06:00
|
|
|
|
|
2014-05-25 05:17:19 -05:00
|
|
|
|
assert_eq!(("( ;".to_string()).into_ascii_opt(), Some(vec2ascii![40, 32, 59]));
|
|
|
|
|
assert_eq!(("zoä华".to_string()).into_ascii_opt(), None);
|
2013-12-05 14:38:04 -06:00
|
|
|
|
}
|
|
|
|
|
|
2013-08-02 15:39:57 -05:00
|
|
|
|
#[test]
|
|
|
|
|
fn test_to_ascii_upper() {
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!("url()URL()uRl()ürl".to_ascii_upper(), "URL()URL()URL()üRL");
|
|
|
|
|
assert_eq!("hıKß".to_ascii_upper(), "HıKß");
|
2013-08-02 15:39:57 -05:00
|
|
|
|
|
|
|
|
|
let mut i = 0;
|
|
|
|
|
while i <= 500 {
|
2013-09-03 18:24:12 -05:00
|
|
|
|
let upper = if 'a' as u32 <= i && i <= 'z' as u32 { i + 'A' as u32 - 'a' as u32 }
|
|
|
|
|
else { i };
|
2014-11-27 13:43:55 -06:00
|
|
|
|
assert_eq!((from_u32(i).unwrap()).to_string().to_ascii_upper(),
|
2014-07-04 15:38:13 -05:00
|
|
|
|
(from_u32(upper).unwrap()).to_string())
|
2013-08-02 15:39:57 -05:00
|
|
|
|
i += 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
fn test_to_ascii_lower() {
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!("url()URL()uRl()Ürl".to_ascii_lower(), "url()url()url()Ürl");
|
2013-08-02 15:39:57 -05:00
|
|
|
|
// Dotted capital I, Kelvin sign, Sharp S.
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!("HİKß".to_ascii_lower(), "hİKß");
|
2013-08-02 15:39:57 -05:00
|
|
|
|
|
|
|
|
|
let mut i = 0;
|
|
|
|
|
while i <= 500 {
|
2013-09-03 18:24:12 -05:00
|
|
|
|
let lower = if 'A' as u32 <= i && i <= 'Z' as u32 { i + 'a' as u32 - 'A' as u32 }
|
|
|
|
|
else { i };
|
2014-11-27 13:43:55 -06:00
|
|
|
|
assert_eq!((from_u32(i).unwrap()).to_string().to_ascii_lower(),
|
2014-07-04 15:38:13 -05:00
|
|
|
|
(from_u32(lower).unwrap()).to_string())
|
2013-09-08 18:45:14 -05:00
|
|
|
|
i += 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
fn test_into_ascii_upper() {
|
2014-05-25 05:17:19 -05:00
|
|
|
|
assert_eq!(("url()URL()uRl()ürl".to_string()).into_ascii_upper(),
|
|
|
|
|
"URL()URL()URL()üRL".to_string());
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!(("hıKß".to_string()).into_ascii_upper(), "HıKß");
|
2013-09-08 18:45:14 -05:00
|
|
|
|
|
|
|
|
|
let mut i = 0;
|
|
|
|
|
while i <= 500 {
|
|
|
|
|
let upper = if 'a' as u32 <= i && i <= 'z' as u32 { i + 'A' as u32 - 'a' as u32 }
|
|
|
|
|
else { i };
|
2014-07-04 15:38:13 -05:00
|
|
|
|
assert_eq!((from_u32(i).unwrap()).to_string().into_ascii_upper(),
|
|
|
|
|
(from_u32(upper).unwrap()).to_string())
|
2013-09-08 18:45:14 -05:00
|
|
|
|
i += 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
fn test_into_ascii_lower() {
|
2014-05-25 05:17:19 -05:00
|
|
|
|
assert_eq!(("url()URL()uRl()Ürl".to_string()).into_ascii_lower(),
|
2014-11-27 18:45:47 -06:00
|
|
|
|
"url()url()url()Ürl");
|
2013-09-08 18:45:14 -05:00
|
|
|
|
// Dotted capital I, Kelvin sign, Sharp S.
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!(("HİKß".to_string()).into_ascii_lower(), "hİKß");
|
2013-09-08 18:45:14 -05:00
|
|
|
|
|
|
|
|
|
let mut i = 0;
|
|
|
|
|
while i <= 500 {
|
|
|
|
|
let lower = if 'A' as u32 <= i && i <= 'Z' as u32 { i + 'a' as u32 - 'A' as u32 }
|
|
|
|
|
else { i };
|
2014-07-04 15:38:13 -05:00
|
|
|
|
assert_eq!((from_u32(i).unwrap()).to_string().into_ascii_lower(),
|
|
|
|
|
(from_u32(lower).unwrap()).to_string())
|
2013-08-02 15:39:57 -05:00
|
|
|
|
i += 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
fn test_eq_ignore_ascii_case() {
|
2013-08-10 21:21:31 -05:00
|
|
|
|
assert!("url()URL()uRl()Ürl".eq_ignore_ascii_case("url()url()url()Ürl"));
|
|
|
|
|
assert!(!"Ürl".eq_ignore_ascii_case("ürl"));
|
2013-08-02 15:39:57 -05:00
|
|
|
|
// Dotted capital I, Kelvin sign, Sharp S.
|
2013-08-10 21:21:31 -05:00
|
|
|
|
assert!("HİKß".eq_ignore_ascii_case("hİKß"));
|
|
|
|
|
assert!(!"İ".eq_ignore_ascii_case("i"));
|
|
|
|
|
assert!(!"K".eq_ignore_ascii_case("k"));
|
|
|
|
|
assert!(!"ß".eq_ignore_ascii_case("s"));
|
2013-08-02 15:39:57 -05:00
|
|
|
|
|
|
|
|
|
let mut i = 0;
|
|
|
|
|
while i <= 500 {
|
2013-09-03 18:24:12 -05:00
|
|
|
|
let c = i;
|
|
|
|
|
let lower = if 'A' as u32 <= c && c <= 'Z' as u32 { c + 'a' as u32 - 'A' as u32 }
|
|
|
|
|
else { c };
|
2014-11-27 13:43:55 -06:00
|
|
|
|
assert!((from_u32(i).unwrap()).to_string().eq_ignore_ascii_case(
|
2014-07-04 15:38:13 -05:00
|
|
|
|
(from_u32(lower).unwrap()).to_string().as_slice()));
|
2013-08-02 15:39:57 -05:00
|
|
|
|
i += 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
2013-09-03 20:04:36 -05:00
|
|
|
|
|
|
|
|
|
#[test]
|
2014-06-21 05:39:03 -05:00
|
|
|
|
fn test_to_string() {
|
2014-08-06 01:02:50 -05:00
|
|
|
|
let s = Ascii{ chr: b't' }.to_string();
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!(s, "t");
|
2013-09-03 20:04:36 -05:00
|
|
|
|
}
|
|
|
|
|
|
2014-02-12 13:41:34 -06:00
|
|
|
|
#[test]
|
|
|
|
|
fn test_show() {
|
2014-08-06 01:02:50 -05:00
|
|
|
|
let c = Ascii { chr: b't' };
|
2014-11-27 18:45:47 -06:00
|
|
|
|
assert_eq!(format!("{}", c), "t");
|
2014-02-12 13:41:34 -06:00
|
|
|
|
}
|
2013-04-20 12:39:15 -05:00
|
|
|
|
}
|