use sha2::{Sha256, Digest};
pub fn inchi_key(inchi_str: &str) -> String {
let inchi_content = if let Some(pos) = inchi_str.find("/") {
&inchi_str[pos..]
} else {
inchi_str
};
let parts: Vec<&str> = inchi_content.split('/').collect();
let connectivity_input = if parts.len() >= 3 {
format!("{}/{}", parts[1], parts[2])
} else if parts.len() >= 2 {
parts[1].to_string()
} else {
inchi_content.to_string()
};
let remaining_input = if parts.len() > 3 {
parts[3..].join("/")
} else {
String::new()
};
let hash1_bytes = sha256_hash(&connectivity_input);
let hash2_bytes = sha256_hash(&remaining_input);
let block1 = bytes_to_base26(&hash1_bytes[..12]); let block2 = bytes_to_base26(&hash2_bytes[..9]);
let block1_padded = format!("{:<14}", block1);
let block2_padded = format!("{:<9}", block2);
let block1_final = &block1_padded[..14];
let block2_final = &block2_padded[..10];
format!("{}-{}-N", block1_final, block2_final)
}
fn sha256_hash(input: &str) -> Vec<u8> {
let mut hasher = Sha256::new();
hasher.update(input.as_bytes());
hasher.finalize().to_vec()
}
fn bytes_to_base26(bytes: &[u8]) -> String {
let mut result = String::new();
for &byte in bytes {
let d1 = (byte / 26) % 26;
let d2 = byte % 26;
result.push((b'A' + d1) as char);
result.push((b'A' + d2) as char);
}
result
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn test_inchi_key_format() {
let inchi = "InChI=1S/C6H6/c1-2-3-4-5-6-1/h1-6H";
let key = inchi_key(inchi);
assert_eq!(key.len(), 27);
assert_eq!(&key[14..15], "-");
assert_eq!(&key[25..26], "-");
assert_eq!(&key[26..27], "N");
}
#[test]
fn test_inchi_key_deterministic() {
let inchi = "InChI=1S/C6H6/c1-2-3-4-5-6-1/h1-6H";
let key1 = inchi_key(inchi);
let key2 = inchi_key(inchi);
assert_eq!(key1, key2);
}
#[test]
fn test_inchi_key_different_for_different_inchi() {
let inchi1 = "InChI=1S/CH4/h1H4";
let inchi2 = "InChI=1S/C2H6/c1-2/h1-2H3";
let key1 = inchi_key(inchi1);
let key2 = inchi_key(inchi2);
assert_ne!(key1, key2);
}
}