2024-04-03 20:35:05 +11:00
|
|
|
use std::{slice::ChunksExact, sync::OnceLock};
|
|
|
|
|
|
|
|
const ALPHABET: &[u8] = b"0123456789=ABCDEFGHIJKLMNOPQRSTUVWXYZ_abcdefghijklmnopqrstuvwxyz";
|
|
|
|
|
|
|
|
// pub fn encode_16(input: u16) -> [u8; 3] {
|
|
|
|
// let input = input as usize;
|
|
|
|
// [
|
|
|
|
// ALPHABET[input >> (16 - 5)],
|
|
|
|
// ALPHABET[(input >> (16 - 10)) & 0b11111],
|
|
|
|
// ALPHABET[input & 0b111111],
|
|
|
|
// ]
|
|
|
|
// }
|
|
|
|
|
|
|
|
// pub fn encode_32(input: u32) -> [u8; 6] {
|
|
|
|
// let input = input as usize;
|
|
|
|
// let output_16 = encode_16(input as u16);
|
|
|
|
// [
|
|
|
|
// ALPHABET[(input >> (32 - 5)) | 0b100000],
|
|
|
|
// ALPHABET[(input >> (32 - 10)) & 0b11111],
|
|
|
|
// ALPHABET[(input >> (32 - 16)) & 0b111111],
|
|
|
|
// output_16[0],
|
|
|
|
// output_16[1],
|
|
|
|
// output_16[2],
|
|
|
|
// ]
|
|
|
|
// }
|
|
|
|
|
|
|
|
pub fn gwilym_decode(input: &str) -> anyhow::Result<GwilymDecodeIter<'_>> {
|
|
|
|
GwilymDecodeIter::new(input)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub struct GwilymDecodeIter<'a> {
|
|
|
|
chunks: ChunksExact<'a, u8>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<'a> GwilymDecodeIter<'a> {
|
|
|
|
fn new(input: &'a str) -> anyhow::Result<Self> {
|
|
|
|
let Some((input, version)) = input.rsplit_once('v') else {
|
|
|
|
anyhow::bail!("Does not contain version");
|
|
|
|
};
|
|
|
|
|
|
|
|
if version != "1" {
|
|
|
|
anyhow::bail!("Only version 1 is supported");
|
|
|
|
}
|
|
|
|
|
|
|
|
if input.len() % 3 != 0 {
|
|
|
|
anyhow::bail!("Input string must have length a multiple of 3");
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(Self {
|
|
|
|
chunks: input.as_bytes().chunks_exact(3),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<'a> Iterator for GwilymDecodeIter<'a> {
|
|
|
|
type Item = u32;
|
|
|
|
|
|
|
|
fn next(&mut self) -> Option<Self::Item> {
|
|
|
|
let Some(chunk) = self.chunks.next() else {
|
|
|
|
return None;
|
|
|
|
};
|
|
|
|
|
|
|
|
let value = decode_chunk(chunk);
|
2024-04-03 20:57:34 +11:00
|
|
|
if value & (1 << 16) != 0 {
|
|
|
|
let upper_bits = value << 16;
|
|
|
|
let lower_bits = self.next().unwrap_or(0) & 0xffff;
|
|
|
|
|
|
|
|
return Some(upper_bits | lower_bits);
|
2024-04-03 20:35:05 +11:00
|
|
|
}
|
|
|
|
|
|
|
|
Some(value | 0x0800_0000)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn decode_chunk(chunk: &[u8]) -> u32 {
|
|
|
|
let a = get_value_for_char(chunk[0]);
|
|
|
|
let b = get_value_for_char(chunk[1]);
|
|
|
|
let c = get_value_for_char(chunk[2]);
|
|
|
|
|
|
|
|
(a << (16 - 5)) | (b << (16 - 10)) | c
|
|
|
|
}
|
|
|
|
|
|
|
|
fn get_value_for_char(input: u8) -> u32 {
|
|
|
|
static REVERSE_ALHPABET: OnceLock<[u8; 128]> = OnceLock::new();
|
|
|
|
|
|
|
|
REVERSE_ALHPABET.get_or_init(|| {
|
|
|
|
let mut result = [0; 128];
|
|
|
|
for (i, &c) in ALPHABET.iter().enumerate() {
|
|
|
|
result[c as usize] = i as u8;
|
|
|
|
}
|
|
|
|
|
|
|
|
result
|
|
|
|
})[input as usize] as u32
|
|
|
|
}
|
2024-04-03 20:57:34 +11:00
|
|
|
|
|
|
|
#[cfg(test)]
|
|
|
|
mod test {
|
|
|
|
use super::{gwilym_decode, ALPHABET};
|
|
|
|
use std::fmt::Write;
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn should_correctly_decode_16s() -> anyhow::Result<()> {
|
|
|
|
assert_eq!(
|
|
|
|
&gwilym_decode("2QI65Q69306Kv1")?.collect::<Vec<_>>(),
|
|
|
|
&[0x0800_16d3, 0x0800_315b, 0x0800_3243, 0x0800_0195]
|
|
|
|
);
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
fn encode_16(input: u16) -> [u8; 3] {
|
|
|
|
let input = input as usize;
|
|
|
|
[
|
|
|
|
ALPHABET[input >> (16 - 5)],
|
|
|
|
ALPHABET[(input >> (16 - 10)) & 0b11111],
|
|
|
|
ALPHABET[input & 0b111111],
|
|
|
|
]
|
|
|
|
}
|
|
|
|
|
|
|
|
fn encode_32(input: u32) -> [u8; 6] {
|
|
|
|
let input = input as usize;
|
|
|
|
let output_lower_16 = encode_16(input as u16);
|
|
|
|
let input_upper_16 = input >> 16;
|
|
|
|
[
|
|
|
|
ALPHABET[(input_upper_16 >> (16 - 5)) | (1 << 5)],
|
|
|
|
ALPHABET[(input_upper_16 >> (16 - 10)) & 0b11111],
|
|
|
|
ALPHABET[input_upper_16 & 0b111111],
|
|
|
|
output_lower_16[0],
|
|
|
|
output_lower_16[1],
|
|
|
|
output_lower_16[2],
|
|
|
|
]
|
|
|
|
}
|
|
|
|
|
|
|
|
#[test]
|
|
|
|
fn should_correctly_decode_16s_and_32s() -> anyhow::Result<()> {
|
|
|
|
let trace: &[u32] = &[
|
|
|
|
0x0300_2990,
|
|
|
|
0x0800_3289,
|
|
|
|
0x0500_2993,
|
|
|
|
0x3829_2910,
|
|
|
|
0xffff_ffff,
|
|
|
|
0x0000_0000,
|
|
|
|
];
|
|
|
|
|
|
|
|
let mut result = String::new();
|
|
|
|
for &ip in trace {
|
|
|
|
if ip & 0xFFFF_0000 == 0x0800_0000 {
|
|
|
|
let encoded = encode_16(ip as u16);
|
|
|
|
let encoded_s = std::str::from_utf8(&encoded)?;
|
|
|
|
write!(&mut result, "{encoded_s}")?
|
|
|
|
} else {
|
|
|
|
let encoded = encode_32(ip);
|
|
|
|
let encoded_s = std::str::from_utf8(&encoded)?;
|
|
|
|
write!(&mut result, "{encoded_s}")?
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
write!(&mut result, "v1")?;
|
|
|
|
|
|
|
|
assert_eq!(&gwilym_decode(&result)?.collect::<Vec<_>>(), trace);
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|