pub fn process_data_from_string(
    word_list: Vec<String>,
    lemma_map: HashMap<String, String>
)