3f6e8ffe64
and add a test.
49 lines
1.0 KiB
Rust
49 lines
1.0 KiB
Rust
import rustrt.sbuf;
|
|
|
|
// Declarations of the string-related items supplied by the native "rust"
// runtime module. No bodies are visible here, so the notes below are limited
// to what the signatures themselves show.
native "rust" mod rustrt {
|
|
// Opaque type declared by the runtime; it is the return type of str_buf.
type sbuf;
|
|
// Takes a str and yields an sbuf (presumably a handle to the string's
// underlying byte buffer -- confirm against the runtime).
fn str_buf(str s) -> sbuf;
|
|
// Takes a str and yields a uint; wrapped by byte_len in this file.
fn str_byte_len(str s) -> uint;
|
|
// Takes a byte count and yields a str; wrapped by alloc in this file.
fn str_alloc(uint n_bytes) -> str;
|
|
// NOTE(review): the type parameter T does not appear in the argument or
// return types of this declaration -- confirm it is intentional.
fn refcount[T](str s) -> uint;
|
|
}
|
|
|
|
// Placeholder: this function is not implemented. Every call fails
// unconditionally, so no bool is ever returned and v is never inspected.
// Judging by the name it is meant to report whether v holds well-formed
// UTF-8 -- TODO implement.
fn is_utf8(vec[u8] v) -> bool {
|
|
fail; // FIXME: unimplemented stub; always fails.
|
|
}
|
|
|
|
fn is_ascii(str s) -> bool {
|
|
let uint i = byte_len(s);
|
|
while (i > 0u) {
|
|
i -= 1u;
|
|
if ((s.(i) & 0x80u8) != 0u8) {
|
|
ret false;
|
|
}
|
|
}
|
|
ret true;
|
|
}
|
|
|
|
// Returns the str produced by the runtime's str_alloc for the requested
// byte count. Presumably this is a fresh string with room for n_bytes
// bytes -- confirm against the runtime implementation.
fn alloc(uint n_bytes) -> str {
|
|
ret rustrt.str_alloc(n_bytes);
|
|
}
|
|
|
|
// Returns the number of bytes (a.k.a. UTF-8 code units) in s.
|
|
// Contrast with a function that would return the number of code
|
|
// points (char's), combining character sequences, words, etc. See
|
|
// http://icu-project.org/apiref/icu4c/classBreakIterator.html for a
|
|
// way to implement those.
|
|
// The count itself is obtained from the runtime's str_byte_len.
fn byte_len(str s) -> uint {
|
|
ret rustrt.str_byte_len(s);
|
|
}
|
|
|
|
// Returns the sbuf that the runtime's str_buf yields for s. The sbuf type
// is opaque in this file; presumably it refers to the string's underlying
// byte storage -- confirm against the runtime.
fn buf(str s) -> sbuf {
|
|
ret rustrt.str_buf(s);
|
|
}
|
|
|
|
// Produces a vec[u8] from s by handing _vec.init_fn a per-index byte getter
// together with the byte length of s. Presumably element i of the result is
// byte i of s -- confirm against _vec.init_fn.
fn bytes(&str s) -> vec[u8] {
    // Fetches the byte stored at position idx of src.
    fn byte_at(str src, uint idx) -> u8 {
        ret src.(idx);
    }
    let uint n = _str.byte_len(s);
    // Fix the string argument now; the index is left open for init_fn.
    ret _vec.init_fn[u8](bind byte_at(s, _), n);
}
|