cat2text-rs/src/anybase.rs
2025-01-15 12:22:50 -06:00

141 lines
4.8 KiB
Rust

//! This module translates text
use crate::core;
/// Encodes text into catspeak using any base up to [`max_base()`]
///
/// `char_length` is set manually, but the minimum can be generated using [`char_length()`]
///
/// ```
/// use cat2text::{anybase::encode, core::char_length};
///
/// let text = "i love cats".to_string();
/// let base = 10;
/// let char_length = char_length(base);
///
/// assert_eq!("meow mewo; mrrp mreow mrrp nyaaaa~ mreow mreow meow nyaaaa~; meow mrow meow mrrp mreow meow mrrp mewo", encode(text, base, char_length));
/// ```
pub fn encode(text: String, base: u32, char_length: u32) -> String {
let mut shortened_alphabet = core::alphabet();
shortened_alphabet.truncate(base as usize);
// makes it lowercase and split by spaces
let words: Vec<String> = text
.to_ascii_lowercase()
.split(" ")
.map(|item| return item.to_string())
.collect();
let mut words_as_bytes: Vec<Vec<u8>> = Vec::new();
for word in words {
// convert to bytes then subtract by 96
words_as_bytes.push(word.as_bytes().into_iter().map(|item| item - 96).collect());
}
let mut results: Vec<Vec<String>> = Vec::new();
for i in 0..words_as_bytes.len() {
results.push(Vec::new());
for j in 0..words_as_bytes[i].len() {
results[i].push(core::num_to_cat(
words_as_bytes[i][j] as u32,
shortened_alphabet.clone(),
char_length,
));
}
}
let results: Vec<String> = results.into_iter().map(|item| item.join(" ")).collect();
let results = results.join("; ");
return results;
}
/// Decodes catspeak into text using any base up to [`max_base()`]
///
/// `char_length` is set manually, but the minimum can be generated using [`char_length()`]
///
/// ```
/// use cat2text::{anybase::decode, core::char_length};
///
/// let text = "meow mewo; mrrp mreow mrrp nyaaaa~ mreow mreow meow nyaaaa~; meow mrow meow mrrp mreow meow mrrp mewo".to_string();
/// let base = 10;
/// let char_length = char_length(base);
/// assert_eq!("i love cats", decode(text, base, char_length));
/// ```
pub fn decode(text: String, base: u32, char_length: u32) -> String {
let catspeak_words: Vec<String> = text.split("; ").map(|item| item.to_string()).collect();
let mut output: String = String::new();
let mut shortened_alphabet = core::alphabet();
shortened_alphabet.truncate(base as usize);
for engl_word in catspeak_words {
let mut word = String::new();
for engl_letter in core::split_every_x(engl_word, char_length) {
let char_num = core::cat_to_num(
engl_letter
.split(" ")
.map(|item| item.to_string())
.collect(),
shortened_alphabet.clone(),
char_length,
);
word += String::from_utf8(vec![(char_num + 96) as u8])
.unwrap()
.as_str();
}
word += " ";
output += word.as_str();
}
return output.trim().to_string();
}
pub mod bytes {
use crate::core;
/// Encodes from bytes into catspeak
///
/// ```
/// use cat2text::{anybase::bytes::encode, core::bytes::char_length};
///
/// let bytes = &[243, 10];
/// let base = 16;
/// let char_length = char_length(base);
///
/// assert_eq!("mrow~ mrow meow purrrr", encode(bytes, base, char_length));
/// ```
pub fn encode(bytes: impl AsRef<[u8]>, base: u32, char_length: u32) -> String {
let mut output = String::new();
let mut shortened_alphabet = core::alphabet();
shortened_alphabet.truncate(base as usize);
for byte in bytes.as_ref() {
output +=
core::num_to_cat(*byte as u32, shortened_alphabet.clone(), char_length).as_str();
output += " ";
}
return output.trim().to_string();
}
/// Decodes catspeak into bytes
///
/// ```
/// use cat2text::{anybase::bytes::decode, core::bytes::char_length};
///
/// let text = "mrow~ mrow meow purrrr".to_string();
/// let base = 16;
/// let char_length = char_length(base);
///
/// assert_eq!(
/// vec![243, 10],
/// decode(text, base, char_length)
/// );
/// ```
pub fn decode(text: String, base: u32, char_length: u32) -> Vec<u8> {
let mut output: Vec<u8> = Vec::new();
let mut shortened_alphabet = core::alphabet();
shortened_alphabet.truncate(base as usize);
for byte in core::split_every_x(text.clone(), char_length) {
output.push(core::cat_to_num(
byte.split(" ").map(|item| item.to_string()).collect(),
shortened_alphabet.clone(),
char_length,
) as u8);
}
return output.into();
}
}