diff options
Diffstat (limited to 'src/u8c/main.h.d/uniblk.c')
-rw-r--r-- | src/u8c/main.h.d/uniblk.c | 517 |
1 files changed, 517 insertions, 0 deletions
diff --git a/src/u8c/main.h.d/uniblk.c b/src/u8c/main.h.d/uniblk.c new file mode 100644 index 0000000..332f8aa --- /dev/null +++ b/src/u8c/main.h.d/uniblk.c @@ -0,0 +1,517 @@ +/* + Copyright 2021 Gabriel Jensen + + This file is part of u8c. + + u8c is free software: you can redistribute it and/or modify it under the terms of the GNU Affero General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. + + u8c is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. + + See the GNU Affero General Public License for more details. + + You should have received a copy of the GNU Affero General Public License along with u8c. + + If not, see <https://www.gnu.org/licenses/>. +*/ +# include <stdbool.h> +# include <u8c/main.h> +# include <u8c/str.h> +# include <uchar.h> +# define u8c_uniblk_isinrng(val,start,end) (val >= start && val <= end) +struct u8c_uniblk_tuple u8c_uniblk(char32_t const _chr) { + struct u8c_uniblk_tuple ret = { + .stat = false, + }; + char32_t const * blk = U"UNDEFINED IN UNICODE"; + if(_chr <= U'\x7F') { + blk = U"BASIC LATIN"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\x80',U'\u00FF')) { + blk = U"LATIN-1 SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0100',U'\u017F')) { + blk = U"LATIN EXTENDED-A"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0180',U'\u024F')) { + blk = U"LATIN EXTENDED-B"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0250',U'\u02AF')) { + blk = U"IPA EXTENSIONS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u02B0',U'\u02FF')) { + blk = U"SPACING MODIFIER LETTERS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0300',U'\u036F')) { + blk = U"COMBINING DIRACITICAL MARKS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0370',U'\u03FF')) { + blk = U"GREEK AND COPTIC"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0400',U'\u04FF')) { + blk = U"CYRILLIC"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0500',U'\u052F')) { + blk = U"CYRILLIC SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0530',U'\u058F')) { + blk = U"ARMENIAN"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0590',U'\u05FF')) { + blk = U"HEBREW"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0600',U'\u06FF')) { + blk = U"ARABIC"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0700',U'\u074F')) { + blk = U"SYRIAC"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0750',U'\u077F')) { + blk = U"ARABIC SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0780',U'\u07BF')) { + blk = U"THAANA"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u07C0',U'\u07FF')) { + blk = U"NKO"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0800',U'\u083F')) { + blk = U"SAMARITAN"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0840',U'\u085F')) { + blk = U"MANDAIC"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0860',U'\u086F')) { + blk = U"SYRIAC SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u08A0',U'\u08FF')) { + blk = U"ARABIC EXTENDED-A"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0900',U'\u097F')) { + blk = U"DEVANAGARI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0980',U'\u09FF')) { + blk = U"BENGALI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0A00',U'\u0A7F')) { + blk = U"GURMUKHI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0A80',U'\u0AFF')) { + blk = U"GUJARATI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0B00',U'\u0B7F')) { + blk = U"ORIYAS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0B80',U'\u0BFF')) { + blk = U"TAMIL"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0C00',U'\u0C7F')) { + blk = U"TELUGU"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0C80',U'\u0CFF')) { + blk = U"KANNADA"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0D00',U'\u0D7F')) { + blk = U"MALAYALAM"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0D80',U'\u0DFF')) { + blk = U"SINHALA"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0E00',U'\u0E7F')) { + blk = U"THAI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0E80',U'\u0EFF')) { + blk = U"LAO"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u0F00',U'\u0FFF')) { + blk = U"TIBETAN"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u1000',U'\u109F')) { + blk = U"MYANMAR"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u10A0',U'\u10FF')) { + blk = U"GEORGIAN"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u1100',U'\u11FF')) { + blk = U"HANGUL JAMO"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u1200',U'\u137F')) { + blk = U"ETHIOPIC"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u1380',U'\u139F')) { + blk = U"ETHIOPIC SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u13A0',U'\u13FF')) { + blk = U"CHEROKEE"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u1400',U'\u167F')) { + blk = U"UNIFIED CANADIAN ABORIGINAL SYLLABICS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u1680',U'\u169F')) { + blk = U"OGHAM"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u16A0',U'\u16FF')) { + blk = U"RUNIC"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\u1700',U'\u171F')) { + blk = U"TAGALOG"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011A00',U'\U00011A4F')) { + blk = U"ZANABAZAR SQUARE"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011A50',U'\U00011AAF')) { + blk = U"SOYOMBO"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011AC0',U'\U00011AFF')) { + blk = U"PAU CIN HAU"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011C00',U'\U00011C6F')) { + blk = U"BHAIKSUKI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011C70',U'\U00011CBF')) { + blk = U"MARCHEN"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011D00',U'\U00011D5F')) { + blk = U"MASARAM GONDI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011D60',U'\U00011DAF')) { + blk = U"GUNJALA GONDI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011EE0',U'\U00011EFF')) { + blk = U"MAKASAR"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011FB0',U'\U00011FBF')) { + blk = U"LISU SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00011FC0',U'\U00011FFF')) { + blk = U"TAMIL SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00012000',U'\U000123FF')) { + blk = U"CUNEIFORM"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00012400',U'\U0001247F')) { + blk = U"CUNEIFORM NUMBERS AND PUNCTUATION"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00012480',U'\U0001254F')) { + blk = U"EARLY DYNASTIC CUNEIFORM"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00013000',U'\U0001342F')) { + blk = U"EGYPTIAN HIEROGLYPHS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00013430',U'\U0001343F')) { + blk = U"EGYPTIAN HIEROGLYPH FORMAT CONTROLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00014400',U'\U0001467F')) { + blk = U"ANATOLIAN HIEROGLYPHS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00016800',U'\U00016A3F')) { + blk = U"BAMUM SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00016A40',U'\U00016A6F')) { + blk = U"MRO"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00016AD0',U'\U00016AFF')) { + blk = U"BASSA VAH"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00016B00',U'\U00016B8F')) { + blk = U"PAHAWH HMONG"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00016E40',U'\U00016E9F')) { + blk = U"MEDEFAIDRIN"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00016F00',U'\U00016F9F')) { + blk = U"MIAO"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00016FE0',U'\U00016FFF')) { + blk = U"IDEOGRAPHIC SYMBOLS AND PUNCTUATION"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00017000',U'\U000187FF')) { + blk = U"TANGUT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00018800',U'\U00018AFF')) { + blk = U"TANGUT COMPONENTS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00018B00',U'\U00018CFF')) { + blk = U"KHITAN SMALL SCRIPT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00018D00',U'\U00018D8F')) { + blk = U"TANGUT SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001B000',U'\U0001B0FF')) { + blk = U"KANA SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001B100',U'\U0001B12F')) { + blk = U"KANA EXTENDED-A"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001B130',U'\U0001B16F')) { + blk = U"SMALL KANA EXTENSION"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001B170',U'\U0001B2FF')) { + blk = U"NUSHU"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001BC00',U'\U0001BC9F')) { + blk = U"DUPLOYAN"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001BCA0',U'\U0001BCAF')) { + blk = U"SHORTHAND FORMAT CONTROLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001D000',U'\U0001D0FF')) { + blk = U"BYZANTINE MUSICAL SYMBOLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001D100',U'\U0001D1FF')) { + blk = U"MUSICAL SYMBOLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001D200',U'\U0001D24F')) { + blk = U"ANCIENT GREEK MUSICAL NOTATION"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001D2E0',U'\U0001D2FF')) { + blk = U"MAYAN NUMERALS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001D300',U'\U0001D35F')) { + blk = U"TAI XUAN JING SYMBOLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001D360',U'\U0001D37F')) { + blk = U"COUNTING ROD NUMERALS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001D400',U'\U0001D7FF')) { + blk = U"MATHEMATICAL ALPHANUMERIC SYMBOLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001D800',U'\U0001DAAF')) { + blk = U"SUTTON SIGNWRITING"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001E000',U'\U0001E02F')) { + blk = U"GLAGOLITIC SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001E100',U'\U0001E14F')) { + blk = U"NYIAKENG PUACHUE HMONG"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001E2C0',U'\U0001E2FF')) { + blk = U"WANCHO"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001E800',U'\U0001E8DF')) { + blk = U"MENDE KIKAKUI"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001E900',U'\U0001E95F')) { + blk = U"ADLAM"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001EC70',U'\U0001ECBF')) { + blk = U"INDIC SIYAQ NUMBERS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001ED00',U'\U0001ED4F')) { + blk = U"OTTOMAN SIYAQ NUMBERS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001EE00',U'\U0001EEFF')) { + blk = U"ARABIC MATHEMATICAL ALPHABETIC SYMBOLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F000',U'\U0001F02F')) { + blk = U"MAHJONG TILES"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F030',U'\U0001F09F')) { + blk = U"DOMINO TILES"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F0A0',U'\U0001F0FF')) { + blk = U"PLAYING CARDS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F100',U'\U0001F1FF')) { + blk = U"ENCLOSED ALPHANUMERIC SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F200',U'\U0001F2FF')) { + blk = U"ENCLOSED IDEOGRAPHIC SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F300',U'\U0001F5FF')) { + blk = U"MISCELLANEOUS SYMBOLS AND PICTOGRAPHS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F600',U'\U0001F64F')) { + blk = U"EMOTICONS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F650',U'\U0001F67F')) { + blk = U"ORNAMENTAL DINGBATS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F680',U'\U0001F6FF')) { + blk = U"TRANSPORT AND MAP SYMBOLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F700',U'\U0001F77F')) { + blk = U"ALCHEMICAL SYMBOLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F780',U'\U0001F7FF')) { + blk = U"GEOMETRIC SHAPES EXTENDED"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F800',U'\U0001F8FF')) { + blk = U"SUPPLEMENTAL ARROWS-C"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001F900',U'\U0001F9FF')) { + blk = U"SUPPLEMENTAL SYMBOLS AND PICTOGRAPHS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001FA00',U'\U0001FA6F')) { + blk = U"CHESS SYMBOLS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001FA70',U'\U0001FAFF')) { + blk = U"SYMBOLS AND PICTOGRAPHS EXTENDED-A"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0001FB00',U'\U0001FBFF')) { + blk = U"SYMBOLS FOR LEGACY COMPUTING"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00020000',U'\U0002A6DF')) { + blk = U"CJK UNIFIED IDEOGRAPHS EXTENSION B"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0002A700',U'\U0002B73F')) { + blk = U"CJK UNIFIED IDEOGRAPHS EXTENSION C"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0002B740',U'\U0002B81F')) { + blk = U"CJK UNIFIED IDEOGRAPHS EXTENSION D"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0002B820',U'\U0002CEAF')) { + blk = U"CJK UNIFIED IDEOGRAPHS EXTENSION E"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0002CEB0',U'\U0002EBEF')) { + blk = U"CJK UNIFIED IDEOGRAPHS EXTENSION F"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U0002F800',U'\U0002FA1F')) { + blk = U"CJK COMPATIBILITY IDEOGRAPHS SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00030000',U'\U0003134F')) { + blk = U"CJK UNIFIED IDEOGRAPHS EXTENSION G"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U000E0000',U'\U000E007F')) { + blk = U"TAGS"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U000E0100',U'\U000E1EFF')) { + blk = U"VARIATION SELECTORS SUPPLEMENT"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U000F0000',U'\U000FFFFF')) { + blk = U"SUPPLEMENTARY PRIVATE USE AREA-A"; + goto end; + } + if(u8c_uniblk_isinrng(_chr,U'\U00100000',U'\U0010FFFF')) { + blk = U"SUPPLEMENTARY PRIVATE USE AREA-B"; + goto end; + } + if(_chr > u8c_unimax) { + ret.stat = true; + return ret; + } +end:; + { + struct u8c_strcp_tuple const tuple = u8c_strcp(blk); + ret.blk = tuple.str; + ret.blksz = tuple.strsz; + } + return ret; +} |