pub unsafe extern "C" fn spp_unk_id(
    spp: *mut SentencePieceProcessor
) -> c_int