]> git.wh0rd.org - tt-rss.git/blame - plugins/af_lang_detect/languagedetect/data/unicode_blocks.php
Merge branch 'pullreq-fix-undefined-index-warning' of tkappe/tt-rss into master
[tt-rss.git] / plugins / af_lang_detect / languagedetect / data / unicode_blocks.php
CommitLineData
31b40448 1<?php
2return array (
3 0 =>
4 array (
5 0 => 0x0000,
6 1 => 0x007F,
7 2 => 'Basic Latin',
8 ),
9 1 =>
10 array (
11 0 => 0x0080,
12 1 => 0x00FF,
13 2 => 'Latin-1 Supplement',
14 ),
15 2 =>
16 array (
17 0 => 0x0100,
18 1 => 0x017F,
19 2 => 'Latin Extended-A',
20 ),
21 3 =>
22 array (
23 0 => 0x0180,
24 1 => 0x024F,
25 2 => 'Latin Extended-B',
26 ),
27 4 =>
28 array (
29 0 => 0x0250,
30 1 => 0x02AF,
31 2 => 'IPA Extensions',
32 ),
33 5 =>
34 array (
35 0 => 0x02B0,
36 1 => 0x02FF,
37 2 => 'Spacing Modifier Letters',
38 ),
39 6 =>
40 array (
41 0 => 0x0300,
42 1 => 0x036F,
43 2 => 'Combining Diacritical Marks',
44 ),
45 7 =>
46 array (
47 0 => 0x0370,
48 1 => 0x03FF,
49 2 => 'Greek and Coptic',
50 ),
51 8 =>
52 array (
53 0 => 0x0400,
54 1 => 0x04FF,
55 2 => 'Cyrillic',
56 ),
57 9 =>
58 array (
59 0 => 0x0500,
60 1 => 0x052F,
61 2 => 'Cyrillic Supplement',
62 ),
63 10 =>
64 array (
65 0 => 0x0530,
66 1 => 0x058F,
67 2 => 'Armenian',
68 ),
69 11 =>
70 array (
71 0 => 0x0590,
72 1 => 0x05FF,
73 2 => 'Hebrew',
74 ),
75 12 =>
76 array (
77 0 => 0x0600,
78 1 => 0x06FF,
79 2 => 'Arabic',
80 ),
81 13 =>
82 array (
83 0 => 0x0700,
84 1 => 0x074F,
85 2 => 'Syriac',
86 ),
87 14 =>
88 array (
89 0 => 0x0750,
90 1 => 0x077F,
91 2 => 'Arabic Supplement',
92 ),
93 15 =>
94 array (
95 0 => 0x0780,
96 1 => 0x07BF,
97 2 => 'Thaana',
98 ),
99 16 =>
100 array (
101 0 => 0x0900,
102 1 => 0x097F,
103 2 => 'Devanagari',
104 ),
105 17 =>
106 array (
107 0 => 0x0980,
108 1 => 0x09FF,
109 2 => 'Bengali',
110 ),
111 18 =>
112 array (
113 0 => 0x0A00,
114 1 => 0x0A7F,
115 2 => 'Gurmukhi',
116 ),
117 19 =>
118 array (
119 0 => 0x0A80,
120 1 => 0x0AFF,
121 2 => 'Gujarati',
122 ),
123 20 =>
124 array (
125 0 => 0x0B00,
126 1 => 0x0B7F,
127 2 => 'Oriya',
128 ),
129 21 =>
130 array (
131 0 => 0x0B80,
132 1 => 0x0BFF,
133 2 => 'Tamil',
134 ),
135 22 =>
136 array (
137 0 => 0x0C00,
138 1 => 0x0C7F,
139 2 => 'Telugu',
140 ),
141 23 =>
142 array (
143 0 => 0x0C80,
144 1 => 0x0CFF,
145 2 => 'Kannada',
146 ),
147 24 =>
148 array (
149 0 => 0x0D00,
150 1 => 0x0D7F,
151 2 => 'Malayalam',
152 ),
153 25 =>
154 array (
155 0 => 0x0D80,
156 1 => 0x0DFF,
157 2 => 'Sinhala',
158 ),
159 26 =>
160 array (
161 0 => 0x0E00,
162 1 => 0x0E7F,
163 2 => 'Thai',
164 ),
165 27 =>
166 array (
167 0 => 0x0E80,
168 1 => 0x0EFF,
169 2 => 'Lao',
170 ),
171 28 =>
172 array (
173 0 => 0x0F00,
174 1 => 0x0FFF,
175 2 => 'Tibetan',
176 ),
177 29 =>
178 array (
179 0 => 0x1000,
180 1 => 0x109F,
181 2 => 'Myanmar',
182 ),
183 30 =>
184 array (
185 0 => 0x10A0,
186 1 => 0x10FF,
187 2 => 'Georgian',
188 ),
189 31 =>
190 array (
191 0 => 0x1100,
192 1 => 0x11FF,
193 2 => 'Hangul Jamo',
194 ),
195 32 =>
196 array (
197 0 => 0x1200,
198 1 => 0x137F,
199 2 => 'Ethiopic',
200 ),
201 33 =>
202 array (
203 0 => 0x1380,
204 1 => 0x139F,
205 2 => 'Ethiopic Supplement',
206 ),
207 34 =>
208 array (
209 0 => 0x13A0,
210 1 => 0x13FF,
211 2 => 'Cherokee',
212 ),
213 35 =>
214 array (
215 0 => 0x1400,
216 1 => 0x167F,
217 2 => 'Unified Canadian Aboriginal Syllabics',
218 ),
219 36 =>
220 array (
221 0 => 0x1680,
222 1 => 0x169F,
223 2 => 'Ogham',
224 ),
225 37 =>
226 array (
227 0 => 0x16A0,
228 1 => 0x16FF,
229 2 => 'Runic',
230 ),
231 38 =>
232 array (
233 0 => 0x1700,
234 1 => 0x171F,
235 2 => 'Tagalog',
236 ),
237 39 =>
238 array (
239 0 => 0x1720,
240 1 => 0x173F,
241 2 => 'Hanunoo',
242 ),
243 40 =>
244 array (
245 0 => 0x1740,
246 1 => 0x175F,
247 2 => 'Buhid',
248 ),
249 41 =>
250 array (
251 0 => 0x1760,
252 1 => 0x177F,
253 2 => 'Tagbanwa',
254 ),
255 42 =>
256 array (
257 0 => 0x1780,
258 1 => 0x17FF,
259 2 => 'Khmer',
260 ),
261 43 =>
262 array (
263 0 => 0x1800,
264 1 => 0x18AF,
265 2 => 'Mongolian',
266 ),
267 44 =>
268 array (
269 0 => 0x1900,
270 1 => 0x194F,
271 2 => 'Limbu',
272 ),
273 45 =>
274 array (
275 0 => 0x1950,
276 1 => 0x197F,
277 2 => 'Tai Le',
278 ),
279 46 =>
280 array (
281 0 => 0x1980,
282 1 => 0x19DF,
283 2 => 'New Tai Lue',
284 ),
285 47 =>
286 array (
287 0 => 0x19E0,
288 1 => 0x19FF,
289 2 => 'Khmer Symbols',
290 ),
291 48 =>
292 array (
293 0 => 0x1A00,
294 1 => 0x1A1F,
295 2 => 'Buginese',
296 ),
297 49 =>
298 array (
299 0 => 0x1D00,
300 1 => 0x1D7F,
301 2 => 'Phonetic Extensions',
302 ),
303 50 =>
304 array (
305 0 => 0x1D80,
306 1 => 0x1DBF,
307 2 => 'Phonetic Extensions Supplement',
308 ),
309 51 =>
310 array (
311 0 => 0x1DC0,
312 1 => 0x1DFF,
313 2 => 'Combining Diacritical Marks Supplement',
314 ),
315 52 =>
316 array (
317 0 => 0x1E00,
318 1 => 0x1EFF,
319 2 => 'Latin Extended Additional',
320 ),
321 53 =>
322 array (
323 0 => 0x1F00,
324 1 => 0x1FFF,
325 2 => 'Greek Extended',
326 ),
327 54 =>
328 array (
329 0 => 0x2000,
330 1 => 0x206F,
331 2 => 'General Punctuation',
332 ),
333 55 =>
334 array (
335 0 => 0x2070,
336 1 => 0x209F,
337 2 => 'Superscripts and Subscripts',
338 ),
339 56 =>
340 array (
341 0 => 0x20A0,
342 1 => 0x20CF,
343 2 => 'Currency Symbols',
344 ),
345 57 =>
346 array (
347 0 => 0x20D0,
348 1 => 0x20FF,
349 2 => 'Combining Diacritical Marks for Symbols',
350 ),
351 58 =>
352 array (
353 0 => 0x2100,
354 1 => 0x214F,
355 2 => 'Letterlike Symbols',
356 ),
357 59 =>
358 array (
359 0 => 0x2150,
360 1 => 0x218F,
361 2 => 'Number Forms',
362 ),
363 60 =>
364 array (
365 0 => 0x2190,
366 1 => 0x21FF,
367 2 => 'Arrows',
368 ),
369 61 =>
370 array (
371 0 => 0x2200,
372 1 => 0x22FF,
373 2 => 'Mathematical Operators',
374 ),
375 62 =>
376 array (
377 0 => 0x2300,
378 1 => 0x23FF,
379 2 => 'Miscellaneous Technical',
380 ),
381 63 =>
382 array (
383 0 => 0x2400,
384 1 => 0x243F,
385 2 => 'Control Pictures',
386 ),
387 64 =>
388 array (
389 0 => 0x2440,
390 1 => 0x245F,
391 2 => 'Optical Character Recognition',
392 ),
393 65 =>
394 array (
395 0 => 0x2460,
396 1 => 0x24FF,
397 2 => 'Enclosed Alphanumerics',
398 ),
399 66 =>
400 array (
401 0 => 0x2500,
402 1 => 0x257F,
403 2 => 'Box Drawing',
404 ),
405 67 =>
406 array (
407 0 => 0x2580,
408 1 => 0x259F,
409 2 => 'Block Elements',
410 ),
411 68 =>
412 array (
413 0 => 0x25A0,
414 1 => 0x25FF,
415 2 => 'Geometric Shapes',
416 ),
417 69 =>
418 array (
419 0 => 0x2600,
420 1 => 0x26FF,
421 2 => 'Miscellaneous Symbols',
422 ),
423 70 =>
424 array (
425 0 => 0x2700,
426 1 => 0x27BF,
427 2 => 'Dingbats',
428 ),
429 71 =>
430 array (
431 0 => 0x27C0,
432 1 => 0x27EF,
433 2 => 'Miscellaneous Mathematical Symbols-A',
434 ),
435 72 =>
436 array (
437 0 => 0x27F0,
438 1 => 0x27FF,
439 2 => 'Supplemental Arrows-A',
440 ),
441 73 =>
442 array (
443 0 => 0x2800,
444 1 => 0x28FF,
445 2 => 'Braille Patterns',
446 ),
447 74 =>
448 array (
449 0 => 0x2900,
450 1 => 0x297F,
451 2 => 'Supplemental Arrows-B',
452 ),
453 75 =>
454 array (
455 0 => 0x2980,
456 1 => 0x29FF,
457 2 => 'Miscellaneous Mathematical Symbols-B',
458 ),
459 76 =>
460 array (
461 0 => 0x2A00,
462 1 => 0x2AFF,
463 2 => 'Supplemental Mathematical Operators',
464 ),
465 77 =>
466 array (
467 0 => 0x2B00,
468 1 => 0x2BFF,
469 2 => 'Miscellaneous Symbols and Arrows',
470 ),
471 78 =>
472 array (
473 0 => 0x2C00,
474 1 => 0x2C5F,
475 2 => 'Glagolitic',
476 ),
477 79 =>
478 array (
479 0 => 0x2C80,
480 1 => 0x2CFF,
481 2 => 'Coptic',
482 ),
483 80 =>
484 array (
485 0 => 0x2D00,
486 1 => 0x2D2F,
487 2 => 'Georgian Supplement',
488 ),
489 81 =>
490 array (
491 0 => 0x2D30,
492 1 => 0x2D7F,
493 2 => 'Tifinagh',
494 ),
495 82 =>
496 array (
497 0 => 0x2D80,
498 1 => 0x2DDF,
499 2 => 'Ethiopic Extended',
500 ),
501 83 =>
502 array (
503 0 => 0x2E00,
504 1 => 0x2E7F,
505 2 => 'Supplemental Punctuation',
506 ),
507 84 =>
508 array (
509 0 => 0x2E80,
510 1 => 0x2EFF,
511 2 => 'CJK Radicals Supplement',
512 ),
513 85 =>
514 array (
515 0 => 0x2F00,
516 1 => 0x2FDF,
517 2 => 'Kangxi Radicals',
518 ),
519 86 =>
520 array (
521 0 => 0x2FF0,
522 1 => 0x2FFF,
523 2 => 'Ideographic Description Characters',
524 ),
525 87 =>
526 array (
527 0 => 0x3000,
528 1 => 0x303F,
529 2 => 'CJK Symbols and Punctuation',
530 ),
531 88 =>
532 array (
533 0 => 0x3040,
534 1 => 0x309F,
535 2 => 'Hiragana',
536 ),
537 89 =>
538 array (
539 0 => 0x30A0,
540 1 => 0x30FF,
541 2 => 'Katakana',
542 ),
543 90 =>
544 array (
545 0 => 0x3100,
546 1 => 0x312F,
547 2 => 'Bopomofo',
548 ),
549 91 =>
550 array (
551 0 => 0x3130,
552 1 => 0x318F,
553 2 => 'Hangul Compatibility Jamo',
554 ),
555 92 =>
556 array (
557 0 => 0x3190,
558 1 => 0x319F,
559 2 => 'Kanbun',
560 ),
561 93 =>
562 array (
563 0 => 0x31A0,
564 1 => 0x31BF,
565 2 => 'Bopomofo Extended',
566 ),
567 94 =>
568 array (
569 0 => 0x31C0,
570 1 => 0x31EF,
571 2 => 'CJK Strokes',
572 ),
573 95 =>
574 array (
575 0 => 0x31F0,
576 1 => 0x31FF,
577 2 => 'Katakana Phonetic Extensions',
578 ),
579 96 =>
580 array (
581 0 => 0x3200,
582 1 => 0x32FF,
583 2 => 'Enclosed CJK Letters and Months',
584 ),
585 97 =>
586 array (
587 0 => 0x3300,
588 1 => 0x33FF,
589 2 => 'CJK Compatibility',
590 ),
591 98 =>
592 array (
593 0 => 0x3400,
594 1 => 0x4DBF,
595 2 => 'CJK Unified Ideographs Extension A',
596 ),
597 99 =>
598 array (
599 0 => 0x4DC0,
600 1 => 0x4DFF,
601 2 => 'Yijing Hexagram Symbols',
602 ),
603 100 =>
604 array (
605 0 => 0x4E00,
606 1 => 0x9FFF,
607 2 => 'CJK Unified Ideographs',
608 ),
609 101 =>
610 array (
611 0 => 0xA000,
612 1 => 0xA48F,
613 2 => 'Yi Syllables',
614 ),
615 102 =>
616 array (
617 0 => 0xA490,
618 1 => 0xA4CF,
619 2 => 'Yi Radicals',
620 ),
621 103 =>
622 array (
623 0 => 0xA700,
624 1 => 0xA71F,
625 2 => 'Modifier Tone Letters',
626 ),
627 104 =>
628 array (
629 0 => 0xA800,
630 1 => 0xA82F,
631 2 => 'Syloti Nagri',
632 ),
633 105 =>
634 array (
635 0 => 0xAC00,
636 1 => 0xD7AF,
637 2 => 'Hangul Syllables',
638 ),
639 106 =>
640 array (
641 0 => 0xD800,
642 1 => 0xDB7F,
643 2 => 'High Surrogates',
644 ),
645 107 =>
646 array (
647 0 => 0xDB80,
648 1 => 0xDBFF,
649 2 => 'High Private Use Surrogates',
650 ),
651 108 =>
652 array (
653 0 => 0xDC00,
654 1 => 0xDFFF,
655 2 => 'Low Surrogates',
656 ),
657 109 =>
658 array (
659 0 => 0xE000,
660 1 => 0xF8FF,
661 2 => 'Private Use Area',
662 ),
663 110 =>
664 array (
665 0 => 0xF900,
666 1 => 0xFAFF,
667 2 => 'CJK Compatibility Ideographs',
668 ),
669 111 =>
670 array (
671 0 => 0xFB00,
672 1 => 0xFB4F,
673 2 => 'Alphabetic Presentation Forms',
674 ),
675 112 =>
676 array (
677 0 => 0xFB50,
678 1 => 0xFDFF,
679 2 => 'Arabic Presentation Forms-A',
680 ),
681 113 =>
682 array (
683 0 => 0xFE00,
684 1 => 0xFE0F,
685 2 => 'Variation Selectors',
686 ),
687 114 =>
688 array (
689 0 => 0xFE10,
690 1 => 0xFE1F,
691 2 => 'Vertical Forms',
692 ),
693 115 =>
694 array (
695 0 => 0xFE20,
696 1 => 0xFE2F,
697 2 => 'Combining Half Marks',
698 ),
699 116 =>
700 array (
701 0 => 0xFE30,
702 1 => 0xFE4F,
703 2 => 'CJK Compatibility Forms',
704 ),
705 117 =>
706 array (
707 0 => 0xFE50,
708 1 => 0xFE6F,
709 2 => 'Small Form Variants',
710 ),
711 118 =>
712 array (
713 0 => 0xFE70,
714 1 => 0xFEFF,
715 2 => 'Arabic Presentation Forms-B',
716 ),
717 119 =>
718 array (
719 0 => 0xFF00,
720 1 => 0xFFEF,
721 2 => 'Halfwidth and Fullwidth Forms',
722 ),
723 120 =>
724 array (
725 0 => 0xFFF0,
726 1 => 0xFFFF,
727 2 => 'Specials',
728 ),
729 121 =>
730 array (
731 0 => 0x10000,
732 1 => 0x1007F,
733 2 => 'Linear B Syllabary',
734 ),
735 122 =>
736 array (
737 0 => 0x10080,
738 1 => 0x100FF,
739 2 => 'Linear B Ideograms',
740 ),
741 123 =>
742 array (
743 0 => 0x10100,
744 1 => 0x1013F,
745 2 => 'Aegean Numbers',
746 ),
747 124 =>
748 array (
749 0 => 0x10140,
750 1 => 0x1018F,
751 2 => 'Ancient Greek Numbers',
752 ),
753 125 =>
754 array (
755 0 => 0x10300,
756 1 => 0x1032F,
757 2 => 'Old Italic',
758 ),
759 126 =>
760 array (
761 0 => 0x10330,
762 1 => 0x1034F,
763 2 => 'Gothic',
764 ),
765 127 =>
766 array (
767 0 => 0x10380,
768 1 => 0x1039F,
769 2 => 'Ugaritic',
770 ),
771 128 =>
772 array (
773 0 => 0x103A0,
774 1 => 0x103DF,
775 2 => 'Old Persian',
776 ),
777 129 =>
778 array (
779 0 => 0x10400,
780 1 => 0x1044F,
781 2 => 'Deseret',
782 ),
783 130 =>
784 array (
785 0 => 0x10450,
786 1 => 0x1047F,
787 2 => 'Shavian',
788 ),
789 131 =>
790 array (
791 0 => 0x10480,
792 1 => 0x104AF,
793 2 => 'Osmanya',
794 ),
795 132 =>
796 array (
797 0 => 0x10800,
798 1 => 0x1083F,
799 2 => 'Cypriot Syllabary',
800 ),
801 133 =>
802 array (
803 0 => 0x10A00,
804 1 => 0x10A5F,
805 2 => 'Kharoshthi',
806 ),
807 134 =>
808 array (
809 0 => 0x1D000,
810 1 => 0x1D0FF,
811 2 => 'Byzantine Musical Symbols',
812 ),
813 135 =>
814 array (
815 0 => 0x1D100,
816 1 => 0x1D1FF,
817 2 => 'Musical Symbols',
818 ),
819 136 =>
820 array (
821 0 => 0x1D200,
822 1 => 0x1D24F,
823 2 => 'Ancient Greek Musical Notation',
824 ),
825 137 =>
826 array (
827 0 => 0x1D300,
828 1 => 0x1D35F,
829 2 => 'Tai Xuan Jing Symbols',
830 ),
831 138 =>
832 array (
833 0 => 0x1D400,
834 1 => 0x1D7FF,
835 2 => 'Mathematical Alphanumeric Symbols',
836 ),
837 139 =>
838 array (
839 0 => 0x20000,
840 1 => 0x2A6DF,
841 2 => 'CJK Unified Ideographs Extension B',
842 ),
843 140 =>
844 array (
845 0 => 0x2F800,
846 1 => 0x2FA1F,
847 2 => 'CJK Compatibility Ideographs Supplement',
848 ),
849 141 =>
850 array (
851 0 => 0xE0000,
852 1 => 0xE007F,
853 2 => 'Tags',
854 ),
855 142 =>
856 array (
857 0 => 0xE0100,
858 1 => 0xE01EF,
859 2 => 'Variation Selectors Supplement',
860 ),
861 143 =>
862 array (
863 0 => 0xF0000,
864 1 => 0xFFFFF,
865 2 => 'Supplementary Private Use Area-A',
866 ),
867 144 =>
868 array (
869 0 => 0x100000,
870 1 => 0x10FFFF,
871 2 => 'Supplementary Private Use Area-B',
872 ),
873);