diff options
Diffstat (limited to 'base32/src')
-rw-r--r-- | base32/src/lib.rs | 221 |
1 files changed, 221 insertions, 0 deletions
diff --git a/base32/src/lib.rs b/base32/src/lib.rs new file mode 100644 index 0000000..e21cf97 --- /dev/null +++ b/base32/src/lib.rs @@ -0,0 +1,221 @@ +#[cfg(test)] +extern crate quickcheck; +#[cfg(test)] +extern crate rand; + +use std::cmp::min; + +#[derive(Copy,Clone)] +pub enum Alphabet { + RFC4648 { padding: bool }, + Crockford, +} + +const RFC4648_ALPHABET: &'static [u8] = b"ABCDEFGHIJKLMNOPQRSTUVWXYZ234567"; +const CROCKFORD_ALPHABET: &'static [u8] = b"0123456789ABCDEFGHJKMNPQRSTVWXYZ"; + +pub fn encode(alphabet: Alphabet, data: &[u8]) -> String { + let (alphabet, padding) = match alphabet { + Alphabet::RFC4648 { padding } => (RFC4648_ALPHABET, padding), + Alphabet::Crockford => (CROCKFORD_ALPHABET, false), + }; + let mut ret = Vec::with_capacity((data.len()+3)/4*5); + + for chunk in data.chunks(5) { + let buf = { + let mut buf = [0u8; 5]; + for (i, &b) in chunk.iter().enumerate() { + buf[i] = b; + } + buf + }; + ret.push(alphabet[((buf[0] & 0xF8) >> 3) as usize]); + ret.push(alphabet[(((buf[0] & 0x07) << 2) | ((buf[1] & 0xC0) >> 6)) as usize]); + ret.push(alphabet[((buf[1] & 0x3E) >> 1) as usize]); + ret.push(alphabet[(((buf[1] & 0x01) << 4) | ((buf[2] & 0xF0) >> 4)) as usize]); + ret.push(alphabet[(((buf[2] & 0x0F) << 1) | (buf[3] >> 7)) as usize]); + ret.push(alphabet[((buf[3] & 0x7C) >> 2) as usize]); + ret.push(alphabet[(((buf[3] & 0x03) << 3) | ((buf[4] & 0xE0) >> 5)) as usize]); + ret.push(alphabet[(buf[4] & 0x1F) as usize]); + } + + if data.len() % 5 != 0 { + let len = ret.len(); + let num_extra = 8-(data.len()%5*8+4)/5; + if padding { + for i in 1..num_extra+1 { + ret[len-i] = b'='; + } + } else { + ret.truncate(len-num_extra); + } + } + + String::from_utf8(ret).unwrap() +} + +const RFC4648_INV_ALPHABET: [i8; 43] = [-1, -1, 26, 27, 28, 29, 30, 31, -1, -1, -1, -1, -1, 0, -1, -1, -1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25]; +const CROCKFORD_INV_ALPHABET: [i8; 43] = [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, -1, -1, -1, -1, -1, -1, -1, 10, 11, 12, 13, 14, 15, 16, 17, 1, 18, 19, 1, 20, 21, 0, 22, 23, 24, 25, 26, -1, 27, 28, 29, 30, 31]; + +pub fn decode(alphabet: Alphabet, data: &str) -> Option<Vec<u8>> { + if !data.is_ascii() { + return None; + } + let data = data.as_bytes(); + let alphabet = match alphabet { + Alphabet::RFC4648 {..} => RFC4648_INV_ALPHABET, + Alphabet::Crockford => CROCKFORD_INV_ALPHABET + }; + let mut unpadded_data_length = data.len(); + for i in 1..min(6, data.len())+1 { + if data[data.len() - i] != b'=' { + break; + } + unpadded_data_length -= 1; + } + let output_length = unpadded_data_length*5/8; + let mut ret = Vec::with_capacity((output_length+4)/5*5); + for chunk in data.chunks(8) { + let buf = { + let mut buf = [0u8; 8]; + for (i, &c) in chunk.iter().enumerate() { + match alphabet.get(c.to_ascii_uppercase().wrapping_sub(b'0') as usize) { + Some(&-1) | None => return None, + Some(&value) => buf[i] = value as u8, + }; + } + buf + }; + ret.push((buf[0] << 3) | (buf[1] >> 2)); + ret.push((buf[1] << 6) | (buf[2] << 1) | (buf[3] >> 4)); + ret.push((buf[3] << 4) | (buf[4] >> 1)); + ret.push((buf[4] << 7) | (buf[5] << 2) | (buf[6] >> 3)); + ret.push((buf[6] << 5) | buf[7]); + } + ret.truncate(output_length); + Some(ret) +} + +#[cfg(test)] +#[allow(dead_code, unused_attributes)] +mod test { + use super::{encode, decode}; + use super::Alphabet::{Crockford, RFC4648}; + use quickcheck; + use std; + use rand::Rng; + + #[derive(Clone)] + struct B32 { + c: u8 + } + + impl quickcheck::Arbitrary for B32 { + fn arbitrary<G: quickcheck::Gen>(g: &mut G) -> B32 { + let alphabet = b"0123456789ABCDEFGHJKMNPQRSTVWXYZ"; + B32 { + c: alphabet[g.gen_range(0, alphabet.len())] + } + } + } + + impl std::fmt::Debug for B32 { + fn fmt(&self, f: &mut std::fmt::Formatter) -> Result<(), std::fmt::Error> { + (self.c as char).fmt(f) + } + } + + #[test] + fn masks_crockford() { + assert_eq!(encode(Crockford, &[0xF8, 0x3E, 0x0F, 0x83, 0xE0]), "Z0Z0Z0Z0"); + assert_eq!(encode(Crockford, &[0x07, 0xC1, 0xF0, 0x7C, 0x1F]), "0Z0Z0Z0Z"); + assert_eq!(decode(Crockford, "Z0Z0Z0Z0").unwrap(), [0xF8, 0x3E, 0x0F, 0x83, 0xE0]); + assert_eq!(decode(Crockford, "0Z0Z0Z0Z").unwrap(), [0x07, 0xC1, 0xF0, 0x7C, 0x1F]); + } + + #[test] + fn masks_rfc4648() { + assert_eq!(encode(RFC4648 { padding: true }, &[0xF8, 0x3E, 0x7F, 0x83, 0xE7]), "7A7H7A7H"); + assert_eq!(encode(RFC4648 { padding: true }, &[0x77, 0xC1, 0xF7, 0x7C, 0x1F]), "O7A7O7A7"); + assert_eq!(decode(RFC4648 { padding: true }, "7A7H7A7H").unwrap(), [0xF8, 0x3E, 0x7F, 0x83, 0xE7]); + assert_eq!(decode(RFC4648 { padding: true }, "O7A7O7A7").unwrap(), [0x77, 0xC1, 0xF7, 0x7C, 0x1F]); + assert_eq!(encode(RFC4648 { padding: true }, &[0xF8, 0x3E, 0x7F, 0x83]), "7A7H7AY="); + } + + #[test] + fn masks_unpadded_rfc4648() { + assert_eq!(encode(RFC4648 { padding: false }, &[0xF8, 0x3E, 0x7F, 0x83, 0xE7]), "7A7H7A7H"); + assert_eq!(encode(RFC4648 { padding: false }, &[0x77, 0xC1, 0xF7, 0x7C, 0x1F]), "O7A7O7A7"); + assert_eq!(decode(RFC4648 { padding: false }, "7A7H7A7H").unwrap(), [0xF8, 0x3E, 0x7F, 0x83, 0xE7]); + assert_eq!(decode(RFC4648 { padding: false }, "O7A7O7A7").unwrap(), [0x77, 0xC1, 0xF7, 0x7C, 0x1F]); + assert_eq!(encode(RFC4648 { padding: false }, &[0xF8, 0x3E, 0x7F, 0x83]), "7A7H7AY"); + } + + #[test] + fn padding() { + let num_padding = [0, 6, 4, 3, 1]; + for i in 1..6 { + let encoded = encode(RFC4648 { padding: true }, (0..(i as u8)).collect::<Vec<u8>>().as_ref()); + assert_eq!(encoded.len(), 8); + for j in 0..(num_padding[i % 5]) { + assert_eq!(encoded.as_bytes()[encoded.len()-j-1], b'='); + } + for j in 0..(8 - num_padding[i % 5]) { + assert!(encoded.as_bytes()[j] != b'='); + } + } + } + + #[test] + fn invertible_crockford() { + fn test(data: Vec<u8>) -> bool { + decode(Crockford, encode(Crockford, data.as_ref()).as_ref()).unwrap() == data + } + quickcheck::quickcheck(test as fn(Vec<u8>) -> bool) + } + + #[test] + fn invertible_rfc4648() { + fn test(data: Vec<u8>) -> bool { + decode(RFC4648 { padding: true }, encode(RFC4648 { padding: true }, data.as_ref()).as_ref()).unwrap() == data + } + quickcheck::quickcheck(test as fn(Vec<u8>) -> bool) + } + #[test] + fn invertible_unpadded_rfc4648() { + fn test(data: Vec<u8>) -> bool { + decode(RFC4648 { padding: false }, encode(RFC4648 { padding: false }, data.as_ref()).as_ref()).unwrap() == data + } + quickcheck::quickcheck(test as fn(Vec<u8>) -> bool) + } + + #[test] + fn lower_case() { + fn test(data: Vec<B32>) -> bool { + let data: String = data.iter().map(|e| e.c as char).collect(); + decode(Crockford, data.as_ref()) == decode(Crockford, data.to_ascii_lowercase().as_ref()) + } + quickcheck::quickcheck(test as fn(Vec<B32>) -> bool) + } + + #[test] + #[allow(non_snake_case)] + fn iIlL1_oO0() { + assert_eq!(decode(Crockford, "IiLlOo"), decode(Crockford, "111100")); + } + + #[test] + fn invalid_chars_crockford() { + assert_eq!(decode(Crockford, ","), None) + } + + #[test] + fn invalid_chars_rfc4648() { + assert_eq!(decode(RFC4648 { padding: true }, ","), None) + } + + #[test] + fn invalid_chars_unpadded_rfc4648() { + assert_eq!(decode(RFC4648 { padding: false }, ","), None) + } +} |