xref: /openbsd-src/regress/usr.bin/mandoc/char/unicode/input.out_utf8 (revision c2eb3b8c127d64282143b29045ee1e714290db9e)
1CHAR-UNICODE-INPUT(1)       General Commands Manual      CHAR-UNICODE-INPUT(1)
2
3NNAAMMEE
4     char-unicode-input - Unicode characters in the input file
5
6DDEESSCCRRIIPPTTIIOONN
7     lowest valid: �
8
9   OOnnee--bbyyttee rraannggee
10     U+0000   0x00   �?   lowest ASCII
11     U+001f   0x1f   �?   highest ASCII control character
12     U+007f   0x7f   �?   highest ASCII
13              0x80   ?    leading lowest continuation
14              0xbf   ?    leading highest continuation
15
16   TTwwoo--bbyyttee rraannggee
17     U+0000   0xc080     ??   lowest obfuscated ASCII
18     U+007f   0xc1bf     ??   highest obfuscated ASCII
19     U+0080   0xc280     ��   lowest two-byte
20     U+07FF   0xdfbf     ߿߿   highest two-byte
21              0xc278     ?x   ASCII instead of continuation
22              0xc2c380   ?À   start byte instead of continuation
23
24   TThhrreeee--bbyyttee rraannggee
25     U+0000   0xe08080   ???    lowest obfuscated ASCII
26     U+007f   0xe081bf   ???    highest obfuscated ASCII
27     U+0080   0xe08280   ???    lowest obfuscated two-byte
28     U+07FF   0xe09fbf   ???    highest obfuscated two-byte
29     U+0800   0xe0a080   ࠀࠀ     lowest three-byte
30     U+0FFF   0xe0bfbf   ࿿࿿       end of first start byte
31     U+1000   0xe18080   ကက     begin of second start byte
32     U+CFFF   0xecbfbf   쿿쿿   end of last normal start byte
33     U+D000   0xed8080   퀀퀀   begin of last start byte
34     U+D7FB   0xed9fbb   ퟻퟻ   highest valid public three-byte
35     U+D7FF   0xed9fbf   ퟿퟿       highest public three-byte
36     U+D800   0xeda080   ???    lowest surrogate
37     U+DFFF   0xedbfbf   ???    highest surrogate
38     U+E000   0xee8080        lowest private use
39     U+F8FF   0xefa3bf        highest private use
40     U+F900   0xefa480   豈豈   lowest post-private
41     U+FEFF   0xefbbbf          byte-order mark
42     U+FFFC   0xefbfbc        object replacement character
43     U+FFFD   0xefbfbd   ��     replacement character
44     U+FFFE   0xefbfbe   ￾￾       reversed byte-order mark
45     U+FFFF   0xefbfbf   ￿￿       highest three-byte
46
47   FFoouurr--bbyyttee rraannggee
48     U+0000     0xf0808080     ????    lowest obfuscated ASCII
49     U+007f     0xf08081bf     ????    highest obfuscated ASCII
50     U+0080     0xf0808280     ????    lowest obfuscated two-byte
51     U+07FF     0xf0809fbf     ????    highest obfuscated two-byte
52     U+0800     0xf080a080     ????    lowest obfuscated three-byte
53     U+FFFF     0xf08fbfbf     ????    highest obfuscated three-byte
54     U+10000    0xf0908080     ����      lowest four-byte
55     U+3FFFF    0xf0bfbfbf     ����        end of first start byte
56     U+40000    0xf1808080     ����        begin of second start byte
57     U+EFFFF    0xf2bfbfbf     ����        highest public character
58     U+F0000    0xf3808080     ����       lowest plane 15 private use
59     U+FFFFF    0xf3bfbfbf     ����        highest plane 15 private use
60     U+100000   0xf4808080     ����      lowest plane 16 private use
61     U+10FFFF   0xf48fbfbf     ����        highest valid four-byte
62     U+110000   0xf4908080     ????    lowest beyond Unicode
63     U+13FFFF   0xf4bfbfbf     ????    end of last start byte
64     U+140000   0xf5808080     ????    lowest invalid start byte
65     U+1FFFFF   0xf7bfbfbf     ????    highest invalid four-byte
66     U+200000   0xf888808080   ?????   lowest five-byte
67
68OpenBSD                          May 16, 2024            CHAR-UNICODE-INPUT(1)
69