2013-08-04 14:42:39 -04:00
|
|
|
|
// Copyright 2013 The Rust Project Developers. See the COPYRIGHT
|
|
|
|
|
// file at the top-level directory of this distribution and at
|
|
|
|
|
// http://rust-lang.org/COPYRIGHT.
|
|
|
|
|
//
|
|
|
|
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
|
|
|
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
|
|
|
|
// option. This file may not be copied, modified, or distributed
|
|
|
|
|
// except according to those terms.
|
|
|
|
|
|
|
|
|
|
//! Hex binary-to-text encoding
|
|
|
|
|
use std::str;
|
|
|
|
|
use std::vec;
|
|
|
|
|
|
|
|
|
|
/// A trait for converting a value to hexadecimal encoding
|
|
|
|
|
pub trait ToHex {
|
|
|
|
|
/// Converts the value of `self` to a hex value, returning the owned
|
|
|
|
|
/// string.
|
|
|
|
|
fn to_hex(&self) -> ~str;
|
|
|
|
|
}
|
|
|
|
|
|
2013-08-04 23:51:26 -04:00
|
|
|
|
// Lowercase hex digits as ASCII bytes; indexed by a nibble value (0-15).
static CHARS: &'static[u8] = bytes!("0123456789abcdef");
|
2013-08-04 14:42:39 -04:00
|
|
|
|
|
|
|
|
|
impl<'self> ToHex for &'self [u8] {
|
|
|
|
|
/**
|
|
|
|
|
* Turn a vector of `u8` bytes into a hexadecimal string.
|
|
|
|
|
*
|
|
|
|
|
* # Example
|
|
|
|
|
*
|
2013-09-23 17:20:36 -07:00
|
|
|
|
* ```rust
|
2013-08-04 14:42:39 -04:00
|
|
|
|
* extern mod extra;
|
|
|
|
|
* use extra::hex::ToHex;
|
|
|
|
|
*
|
|
|
|
|
* fn main () {
|
|
|
|
|
* let str = [52,32].to_hex();
|
2013-09-24 22:16:43 -07:00
|
|
|
|
* println!("{}", str);
|
2013-08-04 14:42:39 -04:00
|
|
|
|
* }
|
2013-09-23 17:20:36 -07:00
|
|
|
|
* ```
|
2013-08-04 14:42:39 -04:00
|
|
|
|
*/
|
|
|
|
|
fn to_hex(&self) -> ~str {
|
2013-08-05 00:08:13 -04:00
|
|
|
|
let mut v = vec::with_capacity(self.len() * 2);
|
2013-08-04 14:42:39 -04:00
|
|
|
|
for &byte in self.iter() {
|
2013-08-04 23:51:26 -04:00
|
|
|
|
v.push(CHARS[byte >> 4]);
|
|
|
|
|
v.push(CHARS[byte & 0xf]);
|
2013-08-04 14:42:39 -04:00
|
|
|
|
}
|
|
|
|
|
|
2013-08-04 23:51:26 -04:00
|
|
|
|
unsafe {
|
2013-09-05 14:17:24 +02:00
|
|
|
|
str::raw::from_utf8_owned(v)
|
2013-08-04 23:51:26 -04:00
|
|
|
|
}
|
2013-08-04 14:42:39 -04:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// A trait for converting hexadecimal encoded values
|
|
|
|
|
pub trait FromHex {
|
2013-08-04 16:09:04 -04:00
|
|
|
|
/// Converts the value of `self`, interpreted as hexadecimal encoded data,
|
|
|
|
|
/// into an owned vector of bytes, returning the vector.
|
2013-08-04 14:42:39 -04:00
|
|
|
|
fn from_hex(&self) -> Result<~[u8], ~str>;
|
|
|
|
|
}
|
|
|
|
|
|
2013-08-05 01:25:15 -04:00
|
|
|
|
impl<'self> FromHex for &'self str {
|
2013-08-04 14:42:39 -04:00
|
|
|
|
/**
|
2013-08-05 01:25:15 -04:00
|
|
|
|
* Convert any hexadecimal encoded string (literal, `@`, `&`, or `~`)
|
|
|
|
|
* to the byte values it encodes.
|
|
|
|
|
*
|
2013-09-05 14:17:24 +02:00
|
|
|
|
* You can use the `from_utf8` function in `std::str`
|
2013-08-05 01:25:15 -04:00
|
|
|
|
* to turn a `[u8]` into a string with characters corresponding to those
|
|
|
|
|
* values.
|
2013-08-04 14:42:39 -04:00
|
|
|
|
*
|
|
|
|
|
* # Example
|
|
|
|
|
*
|
2013-08-05 01:25:15 -04:00
|
|
|
|
* This converts a string literal to hexadecimal and back.
|
|
|
|
|
*
|
2013-09-23 17:20:36 -07:00
|
|
|
|
* ```rust
|
2013-08-04 14:42:39 -04:00
|
|
|
|
* extern mod extra;
|
2013-08-05 01:25:15 -04:00
|
|
|
|
* use extra::hex::{FromHex, ToHex};
|
|
|
|
|
* use std::str;
|
2013-08-04 14:42:39 -04:00
|
|
|
|
*
|
|
|
|
|
* fn main () {
|
2013-08-05 01:25:15 -04:00
|
|
|
|
* let hello_str = "Hello, World".to_hex();
|
2013-09-24 22:16:43 -07:00
|
|
|
|
* println!("{}", hello_str);
|
2013-08-06 10:42:06 -07:00
|
|
|
|
* let bytes = hello_str.from_hex().unwrap();
|
2013-09-24 22:16:43 -07:00
|
|
|
|
* println!("{:?}", bytes);
|
2013-09-05 14:17:24 +02:00
|
|
|
|
* let result_str = str::from_utf8(bytes);
|
2013-09-24 22:16:43 -07:00
|
|
|
|
* println!("{}", result_str);
|
2013-08-04 14:42:39 -04:00
|
|
|
|
* }
|
2013-09-23 17:20:36 -07:00
|
|
|
|
* ```
|
2013-08-04 14:42:39 -04:00
|
|
|
|
*/
|
|
|
|
|
fn from_hex(&self) -> Result<~[u8], ~str> {
|
|
|
|
|
// This may be an overestimate if there is any whitespace
|
|
|
|
|
let mut b = vec::with_capacity(self.len() / 2);
|
|
|
|
|
let mut modulus = 0;
|
|
|
|
|
let mut buf = 0u8;
|
|
|
|
|
|
2013-08-05 01:25:15 -04:00
|
|
|
|
for (idx, byte) in self.byte_iter().enumerate() {
|
2013-08-04 14:42:39 -04:00
|
|
|
|
buf <<= 4;
|
|
|
|
|
|
|
|
|
|
match byte as char {
|
|
|
|
|
'A'..'F' => buf |= byte - ('A' as u8) + 10,
|
|
|
|
|
'a'..'f' => buf |= byte - ('a' as u8) + 10,
|
|
|
|
|
'0'..'9' => buf |= byte - ('0' as u8),
|
2013-08-04 16:09:04 -04:00
|
|
|
|
' '|'\r'|'\n'|'\t' => {
|
2013-08-04 14:42:39 -04:00
|
|
|
|
buf >>= 4;
|
2013-10-01 14:31:03 -07:00
|
|
|
|
continue
|
2013-08-04 14:42:39 -04:00
|
|
|
|
}
|
2013-09-27 20:18:50 -07:00
|
|
|
|
_ => return Err(format!("Invalid character '{}' at position {}",
|
|
|
|
|
self.char_at(idx), idx))
|
2013-08-04 14:42:39 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
modulus += 1;
|
|
|
|
|
if modulus == 2 {
|
|
|
|
|
modulus = 0;
|
|
|
|
|
b.push(buf);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
match modulus {
|
|
|
|
|
0 => Ok(b),
|
|
|
|
|
_ => Err(~"Invalid input length")
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[cfg(test)]
|
|
|
|
|
mod tests {
|
|
|
|
|
use test::BenchHarness;
|
|
|
|
|
use hex::*;
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
pub fn test_to_hex() {
|
2013-08-05 01:25:15 -04:00
|
|
|
|
assert_eq!("foobar".as_bytes().to_hex(), ~"666f6f626172");
|
2013-08-04 14:42:39 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
pub fn test_from_hex_okay() {
|
2013-08-06 10:42:06 -07:00
|
|
|
|
assert_eq!("666f6f626172".from_hex().unwrap(),
|
2013-08-04 14:42:39 -04:00
|
|
|
|
"foobar".as_bytes().to_owned());
|
2013-08-06 10:42:06 -07:00
|
|
|
|
assert_eq!("666F6F626172".from_hex().unwrap(),
|
2013-08-04 14:42:39 -04:00
|
|
|
|
"foobar".as_bytes().to_owned());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
pub fn test_from_hex_odd_len() {
|
|
|
|
|
assert!("666".from_hex().is_err());
|
|
|
|
|
assert!("66 6".from_hex().is_err());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
pub fn test_from_hex_invalid_char() {
|
|
|
|
|
assert!("66y6".from_hex().is_err());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
pub fn test_from_hex_ignores_whitespace() {
|
2013-08-06 10:42:06 -07:00
|
|
|
|
assert_eq!("666f 6f6\r\n26172 ".from_hex().unwrap(),
|
2013-08-04 14:42:39 -04:00
|
|
|
|
"foobar".as_bytes().to_owned());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
pub fn test_to_hex_all_bytes() {
|
|
|
|
|
for i in range(0, 256) {
|
2013-09-27 20:18:50 -07:00
|
|
|
|
assert_eq!([i as u8].to_hex(), format!("{:02x}", i as uint));
|
2013-08-04 14:42:39 -04:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
|
pub fn test_from_hex_all_bytes() {
|
|
|
|
|
for i in range(0, 256) {
|
2013-09-27 20:18:50 -07:00
|
|
|
|
assert_eq!(format!("{:02x}", i as uint).from_hex().unwrap(), ~[i as u8]);
|
|
|
|
|
assert_eq!(format!("{:02X}", i as uint).from_hex().unwrap(), ~[i as u8]);
|
2013-08-04 14:42:39 -04:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
|
pub fn bench_to_hex(bh: & mut BenchHarness) {
|
|
|
|
|
let s = "イロハニホヘト チリヌルヲ ワカヨタレソ ツネナラム \
|
|
|
|
|
ウヰノオクヤマ ケフコエテ アサキユメミシ ヱヒモセスン";
|
|
|
|
|
do bh.iter {
|
2013-08-05 01:25:15 -04:00
|
|
|
|
s.as_bytes().to_hex();
|
2013-08-04 14:42:39 -04:00
|
|
|
|
}
|
|
|
|
|
bh.bytes = s.len() as u64;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
|
pub fn bench_from_hex(bh: & mut BenchHarness) {
|
|
|
|
|
let s = "イロハニホヘト チリヌルヲ ワカヨタレソ ツネナラム \
|
|
|
|
|
ウヰノオクヤマ ケフコエテ アサキユメミシ ヱヒモセスン";
|
2013-08-05 01:25:15 -04:00
|
|
|
|
let b = s.as_bytes().to_hex();
|
2013-08-04 14:42:39 -04:00
|
|
|
|
do bh.iter {
|
|
|
|
|
b.from_hex();
|
|
|
|
|
}
|
|
|
|
|
bh.bytes = b.len() as u64;
|
|
|
|
|
}
|
|
|
|
|
}
|