Crate unic [] [src]

UNIC: Unicode and Internationalization Crates for Rust

The unic super-crate (this) is a collection of all UNIC components, providing an easy way of access to all functionalities, when all or many are needed, instead of importing components one-by-one, and ensuring all components imported are compatible in algorithms and consistent data-wise.

Components

  • ucd: Unicode Character Database.

  • bidi: Unicode Bidirectional Algorithm (USA#9).

  • normal: Unicode Normalization Forms (USA#15).

  • idna: Unicode IDNA Compatibility Processing (UTS#46).

A Basic Example

extern crate unic;

use unic::bidi::BidiInfo;
use unic::normal::StrNormalForm;
use unic::ucd::{Age, BidiClass, CharAge, CharBidiClass, StrBidiClass, UnicodeVersion};
use unic::ucd::normal::compose;

fn main() {

    // Age

    assert_eq!(Age::of('A'), Age::Assigned(UnicodeVersion { major: 1, minor: 1, micro: 0 }));
    assert_eq!(Age::of('\u{A0000}'), Age::Unassigned);
    assert_eq!(
        Age::of('\u{10FFFF}'),
        Age::Assigned(UnicodeVersion { major: 2, minor: 0, micro: 0 })
    );

    if let Some(uni_ver) = '🦊'.age().assigned() {
        assert_eq!(uni_ver.major, 9);
        assert_eq!(uni_ver.minor, 0);
        assert_eq!(uni_ver.micro, 0);
    }

    // Bidi

    let text = concat![
        "א",
        "ב",
        "ג",
        "a",
        "b",
        "c",
    ];

    assert!(!text.has_bidi_explicit());
    assert!(text.has_rtl());
    assert!(text.has_ltr());

    assert_eq!(text.chars().nth(0).unwrap().bidi_class(), BidiClass::RightToLeft);
    assert!(!text.chars().nth(0).unwrap().is_ltr());
    assert!(text.chars().nth(0).unwrap().is_rtl());

    assert_eq!(text.chars().nth(3).unwrap().bidi_class(), BidiClass::LeftToRight);
    assert!(text.chars().nth(3).unwrap().is_ltr());
    assert!(!text.chars().nth(3).unwrap().is_rtl());

    let bidi_info = BidiInfo::new(&text, None);
    assert_eq!(bidi_info.paragraphs.len(), 1);

    let para = &bidi_info.paragraphs[0];
    assert_eq!(para.level.number(), 1);
    assert_eq!(para.level.is_rtl(), true);

    let line = para.range.clone();
    let display = bidi_info.reorder_line(para, line);
    assert_eq!(
        display,
        concat![
            "a",
            "b",
            "c",
            "ג",
            "ב",
            "א",
        ]
    );

    // Normalization

    assert_eq!(compose('A', '\u{30a}'), Some('Å'));

    let s = "ÅΩ";
    let c = s.nfc().collect::<String>();
    assert_eq!(c, "ÅΩ");
}

Reexports

pub extern crate unic_bidi as bidi;
pub extern crate unic_idna as idna;
pub extern crate unic_normal as normal;
pub extern crate unic_ucd as ucd;

Constants

UNICODE_VERSION

The Unicode version of data