addr 0.15.6

A library for parsing domain names
Documentation
[
    {
        "description": "validation of internationalized host names",
        "schema": {"format": "idn-hostname"},
        "tests": [
            {
                "description": "a valid host name (example.test in Hangul)",
                "data": "실례.테스트",
                "valid": true
            },
            {
                "description": "illegal first char U+302E Hangul single dot tone mark",
                "data": "〮실례.테스트",
                "valid": false
            },
            {
                "description": "contains illegal char U+302E Hangul single dot tone mark",
                "data": "실〮례.테스트",
                "valid": false
            },
            {
                "description": "a host name with a component too long",
                "data": "실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실실례례테스트례례례례례례례례례례례례례례례례례테스트례례례례례례례례례례례례례례례례례례례테스트례례례례례례례례례례례례테스트례례실례.테스트",
                "valid": false
            },
            {
                "description": "invalid label, correct Punycode",
                "comment": "https://tools.ietf.org/html/rfc5890#section-2.3.2.1 https://tools.ietf.org/html/rfc5891#section-4.4 https://tools.ietf.org/html/rfc3492#section-7.1",
                "data": "-> $1.00 <--",
                "valid": false
            },
            {
                "description": "valid Chinese Punycode",
                "comment": "https://tools.ietf.org/html/rfc5890#section-2.3.2.1 https://tools.ietf.org/html/rfc5891#section-4.4",
                "data": "xn--ihqwcrb4cv8a8dqg056pqjye",
                "valid": true
            },
            {
                "description": "invalid Punycode",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.4 https://tools.ietf.org/html/rfc5890#section-2.3.2.1",
                "data": "xn--X",
                "valid": false
            },
            {
                "description": "U-label contains \"--\" in the 3rd and 4th position",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.1 https://tools.ietf.org/html/rfc5890#section-2.3.2.1",
                "data": "XN--aa---o47jg78q",
                "valid": false
            },
            {
                "description": "U-label starts with a dash",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.1",
                "data": "-hello",
                "valid": false
            },
            {
                "description": "U-label ends with a dash",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.1",
                "data": "hello-",
                "valid": false
            },
            {
                "description": "U-label starts and ends with a dash",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.1",
                "data": "-hello-",
                "valid": false
            },
            {
                "description": "Begins with a Spacing Combining Mark",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.2",
                "data": "\u0903hello",
                "valid": false
            },
            {
                "description": "Begins with a Nonspacing Mark",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.2",
                "data": "\u0300hello",
                "valid": false
            },
            {
                "description": "Begins with an Enclosing Mark",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.2",
                "data": "\u0488hello",
                "valid": false
            },
            {
                "description": "Exceptions that are PVALID, left-to-right chars",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.2 https://tools.ietf.org/html/rfc5892#section-2.6",
                "data": "\u00df\u03c2\u0f0b\u3007",
                "valid": true
            },
            {
                "description": "Exceptions that are PVALID, right-to-left chars",
                "comment": "https://tools.ietf.org/html/rfc/rfc5891#section-4.2.2 https://tools.ietf.org/html/rfc5892#section-2.6",
                "data": "\u06fd\u06fe",
                "valid": true
            },
            {
                "description": "Exceptions that are DISALLOWED, right-to-left chars",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.2 https://tools.ietf.org/html/rfc5892#section-2.6",
                "data": "\u0640\u07fa",
                "valid": false
            },
            {
                "description": "Exceptions that are DISALLOWED, left-to-right chars",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.2 https://tools.ietf.org/html/rfc5892#section-2.6 Note: The two combining marks (U+302E and U+302F) are in the middle and not at the start",
                "data": "\u3031\u3032\u3033\u3034\u3035\u302e\u302f\u303b",
                "valid": false
            },
            {
                "description": "MIDDLE DOT with no preceding 'l'",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.3",
                "data": "a\u00b7l",
                "valid": false
            },
            {
                "description": "MIDDLE DOT with nothing preceding",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.3",
                "data": "\u00b7l",
                "valid": false
            },
            {
                "description": "MIDDLE DOT with no following 'l'",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.3",
                "data": "l\u00b7a",
                "valid": false
            },
            {
                "description": "MIDDLE DOT with nothing following",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.3",
                "data": "l\u00b7",
                "valid": false
            },
            {
                "description": "MIDDLE DOT with surrounding 'l's",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.3",
                "data": "l\u00b7l",
                "valid": true
            },
            {
                "description": "Greek KERAIA not followed by Greek",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.4",
                "data": "\u03b1\u0375S",
                "valid": false
            },
            {
                "description": "Greek KERAIA not followed by anything",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.4",
                "data": "\u03b1\u0375",
                "valid": false
            },
            {
                "description": "Greek KERAIA followed by Greek",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.4",
                "data": "\u03b1\u0375\u03b2",
                "valid": true
            },
            {
                "description": "Hebrew GERESH not preceded by Hebrew",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.5",
                "data": "A\u05f3\u05d1",
                "valid": false
            },
            {
                "description": "Hebrew GERESH not preceded by anything",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.5",
                "data": "\u05f3\u05d1",
                "valid": false
            },
            {
                "description": "Hebrew GERESH preceded by Hebrew",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.5",
                "data": "\u05d0\u05f3\u05d1",
                "valid": true
            },
            {
                "description": "Hebrew GERSHAYIM not preceded by Hebrew",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.6",
                "data": "A\u05f4\u05d1",
                "valid": false
            },
            {
                "description": "Hebrew GERSHAYIM not preceded by anything",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.6",
                "data": "\u05f4\u05d1",
                "valid": false
            },
            {
                "description": "Hebrew GERSHAYIM preceded by Hebrew",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.6",
                "data": "\u05d0\u05f4\u05d1",
                "valid": true
            },
            {
                "description": "KATAKANA MIDDLE DOT with no Hiragana, Katakana, or Han",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.7",
                "data": "def\u30fbabc",
                "valid": false
            },
            {
                "description": "KATAKANA MIDDLE DOT with no other characters",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.7",
                "data": "\u30fb",
                "valid": false
            },
            {
                "description": "KATAKANA MIDDLE DOT with Hiragana",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.7",
                "data": "\u30fb\u3041",
                "valid": true
            },
            {
                "description": "KATAKANA MIDDLE DOT with Katakana",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.7",
                "data": "\u30fb\u30a1",
                "valid": true
            },
            {
                "description": "KATAKANA MIDDLE DOT with Han",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.7",
                "data": "\u30fb\u4e08",
                "valid": true
            },
            {
                "description": "Arabic-Indic digits mixed with Extended Arabic-Indic digits",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.8",
                "data": "\u0660\u06f0",
                "valid": false
            },
            {
                "description": "Arabic-Indic digits not mixed with Extended Arabic-Indic digits",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.8",
                "data": "\u0628\u0660\u0628",
                "valid": true
            },
            {
                "description": "Extended Arabic-Indic digits not mixed with Arabic-Indic digits",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.9",
                "data": "\u06f00",
                "valid": true
            },
            {
                "description": "ZERO WIDTH JOINER not preceded by Virama",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.2 https://www.unicode.org/review/pr-37.pdf",
                "data": "\u0915\u200d\u0937",
                "valid": false
            },
            {
                "description": "ZERO WIDTH JOINER not preceded by anything",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.2 https://www.unicode.org/review/pr-37.pdf",
                "data": "\u200d\u0937",
                "valid": false
            },
            {
                "description": "ZERO WIDTH JOINER preceded by Virama",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.2 https://www.unicode.org/review/pr-37.pdf",
                "data": "\u0915\u094d\u200d\u0937",
                "valid": true
            },
            {
                "description": "ZERO WIDTH NON-JOINER preceded by Virama",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.1",
                "data": "\u0915\u094d\u200c\u0937",
                "valid": true
            },
            {
                "description": "ZERO WIDTH NON-JOINER not preceded by Virama but matches regexp",
                "comment": "https://tools.ietf.org/html/rfc5891#section-4.2.3.3 https://tools.ietf.org/html/rfc5892#appendix-A.1 https://www.w3.org/TR/alreq/#h_disjoining_enforcement",
                "data": "\u0628\u064a\u200c\u0628\u064a",
                "valid": true
            }
        ]
    }
]