1*8ccd4a63SDavid du Colombier #include "u.h"
2*8ccd4a63SDavid du Colombier #include "libc.h"
37dd7cddfSDavid du Colombier
47dd7cddfSDavid du Colombier /*
57dd7cddfSDavid du Colombier * The code makes two assumptions: strlen(ld) is 1 or 2; latintab[i].ld can be a
67dd7cddfSDavid du Colombier * prefix of latintab[j].ld only when j<i.
77dd7cddfSDavid du Colombier */
87dd7cddfSDavid du Colombier struct cvlist
97dd7cddfSDavid du Colombier {
107dd7cddfSDavid du Colombier char *ld; /* must be seen before using this conversion */
117dd7cddfSDavid du Colombier char *si; /* options for last input characters */
127dd7cddfSDavid du Colombier Rune so[50]; /* the corresponding Rune for each si entry */
137dd7cddfSDavid du Colombier } latintab[] = {
147dd7cddfSDavid du Colombier " ", " i", { 0x2423, 0x0131 },
157dd7cddfSDavid du Colombier "w", "kqrbnp", { 0x2654, 0x2655, 0x2656, 0x2657, 0x2658, 0x2659, },
167dd7cddfSDavid du Colombier "x", "O", { 0x2297, },
177dd7cddfSDavid du Colombier "f", "a", { 0x2200, },
187dd7cddfSDavid du Colombier "=", "V:=O<>", { 0x21D2, 0x2255, 0x2261, 0x229C, 0x22DC, 0x22DD, },
197dd7cddfSDavid du Colombier "V", "=", { 0x21D0, },
207dd7cddfSDavid du Colombier "7", "8", { 0x215E, },
217dd7cddfSDavid du Colombier "5", "68", { 0x215A, 0x215D, },
227dd7cddfSDavid du Colombier "4", "5", { 0x2158, },
237dd7cddfSDavid du Colombier "R", "R", { 0x211D, },
247dd7cddfSDavid du Colombier "Q", "Q", { 0x211A, },
257dd7cddfSDavid du Colombier "P", "P", { 0x2119, },
267dd7cddfSDavid du Colombier "C", "CAU", { 0x2102, 0x22C2, 0x22C3, },
277dd7cddfSDavid du Colombier "e", "nmsl", { 0x2013, 0x2014, 0x2205, 0x22EF, },
287dd7cddfSDavid du Colombier "b", "u0123456789+-=()kqrbnp", { 0x2022, 0x2080, 0x2081, 0x2082, 0x2083, 0x2084, 0x2085, 0x2086, 0x2087, 0x2088, 0x2089, 0x208A, 0x208B, 0x208C, 0x208D, 0x208E, 0x265A, 0x265B, 0x265C, 0x265D, 0x265E, 0x265F, },
297dd7cddfSDavid du Colombier "@e", "h", { 0x44D, },
307dd7cddfSDavid du Colombier "@\'", "\'", { 0x44A, },
317dd7cddfSDavid du Colombier "@s", "hc", { 0x448, 0x449, },
327dd7cddfSDavid du Colombier "@c", "h", { 0x447, },
337dd7cddfSDavid du Colombier "@t", "s", { 0x446, },
347dd7cddfSDavid du Colombier "@k", "h", { 0x445, },
357dd7cddfSDavid du Colombier "@z", "h", { 0x436, },
367dd7cddfSDavid du Colombier "@y", "euao", { 0x435, 0x44E, 0x44F, 0x451, },
377dd7cddfSDavid du Colombier "@E", "Hh", { 0x42D, 0x42D, },
387dd7cddfSDavid du Colombier "@S", "HhCc", { 0x428, 0x428, 0x429, 0x429, },
397dd7cddfSDavid du Colombier "@C", "Hh", { 0x427, 0x427, },
407dd7cddfSDavid du Colombier "@T", "Ss", { 0x426, 0x426, },
417dd7cddfSDavid du Colombier "@K", "Hh", { 0x425, 0x425, },
427dd7cddfSDavid du Colombier "@Z", "Hh", { 0x416, 0x416, },
437dd7cddfSDavid du Colombier "@@", "EZKSTYezksty\'", { 0x415, 0x417, 0x41A, 0x421, 0x422, 0x42B, 0x435, 0x437, 0x43A, 0x441, 0x442, 0x44B, 0x44C, },
447dd7cddfSDavid du Colombier "@Y", "OoEeUuAa", { 0x401, 0x401, 0x415, 0x415, 0x42E, 0x42E, 0x42F, 0x42F, },
457dd7cddfSDavid du Colombier "@", "ABVGDIJLMNOPRUFXabvgdijlmnoprufx", { 0x410, 0x411, 0x412, 0x413, 0x414, 0x418, 0x419, 0x41B, 0x41C, 0x41D, 0x41E, 0x41F, 0x420, 0x423, 0x424, 0x425, 0x430, 0x431, 0x432, 0x433, 0x434, 0x438, 0x439, 0x43B, 0x43C, 0x43D, 0x43E, 0x43F, 0x440, 0x443, 0x444, 0x445, },
467dd7cddfSDavid du Colombier "*", "ABGDEZYHIKLMNCOPRSTUFXQWabgdezyhiklmncoprstufxqw*", { 0x391, 0x392, 0x393, 0x394, 0x395, 0x396, 0x397, 0x398, 0x399, 0x39A, 0x39B, 0x39C, 0x39D, 0x39E, 0x39F, 0x3A0, 0x3A1, 0x3A3, 0x3A4, 0x3A5, 0x3A6, 0x3A7, 0x3A8, 0x3A9, 0x3B1, 0x3B2, 0x3B3, 0x3B4, 0x3B5, 0x3B6, 0x3B7, 0x3B8, 0x3B9, 0x3BA, 0x3BB, 0x3BC, 0x3BD, 0x3BE, 0x3BF, 0x3C0, 0x3C1, 0x3C3, 0x3C4, 0x3C5, 0x3C6, 0x3C7, 0x3C8, 0x3C9, 0x2217, },
477dd7cddfSDavid du Colombier "G", "-", { 0x1E4, },
487dd7cddfSDavid du Colombier "N", "JjN", { 0x1CA, 0x1CB, 0x2115, },
497dd7cddfSDavid du Colombier "2", "-35", { 0x1BB, 0x2154, 0x2156, },
507dd7cddfSDavid du Colombier "z", "-", { 0x1B6, },
517dd7cddfSDavid du Colombier "Z", "-Z", { 0x1B5, 0x2124, },
527dd7cddfSDavid du Colombier "Y", "R", { 0x1A6, },
537dd7cddfSDavid du Colombier "h", "v-", { 0x195, 0x210F, },
547dd7cddfSDavid du Colombier "$*", "hfk", { 0x3D1, 0x3D5, 0x3F0, },
557dd7cddfSDavid du Colombier "$", "fVavgHILlpRBeEFMo", { 0x192, 0x1B2, 0x251, 0x28B, 0x210A, 0x210B, 0x2110, 0x2112, 0x2113, 0x2118, 0x211B, 0x212C, 0x212F, 0x2130, 0x2131, 0x2133, 0x2134, },
567dd7cddfSDavid du Colombier "t", "-smefu", { 0x167, 0x3C2, 0x2122, 0x2203, 0x2234, 0x22A2, },
577dd7cddfSDavid du Colombier "T", "-u", { 0x166, 0x22A8, },
587dd7cddfSDavid du Colombier "L", "-Jj&|", { 0x141, 0x1C7, 0x1C8, 0x22C0, 0x22C1, },
597dd7cddfSDavid du Colombier "i", "j-fsbp", { 0x133, 0x268, 0x221E, 0x222B, 0x2286, 0x2287, },
607dd7cddfSDavid du Colombier "I", "J-", { 0x132, 0x197, },
617dd7cddfSDavid du Colombier "H", "-H", { 0x126, 0x210D, },
627dd7cddfSDavid du Colombier "v\"", "Uu", { 0x1D9, 0x1DA, },
637dd7cddfSDavid du Colombier "v", "CcDdEeLlNnRrSsTtZzAaIiOoUuGgKkj", { 0x10C, 0x10D, 0x10E, 0x10F, 0x11A, 0x11B, 0x13D, 0x13E, 0x147, 0x148, 0x158, 0x159, 0x160, 0x161, 0x164, 0x165, 0x17D, 0x17E, 0x1CD, 0x1CE, 0x1CF, 0x1D0, 0x1D1, 0x1D2, 0x1D3, 0x1D4, 0x1E6, 0x1E7, 0x1E8, 0x1E9, 0x1F0, },
647dd7cddfSDavid du Colombier "u", "AEeGgIiOoUu-a", { 0x102, 0x114, 0x115, 0x11E, 0x11F, 0x12C, 0x12D, 0x14E, 0x14F, 0x16C, 0x16D, 0x289, 0x2191, },
659b943567SDavid du Colombier ":", "-=()", { 0xF7, 0x2254, 0x2639, 0x263A, },
667dd7cddfSDavid du Colombier "a", "ebn", { 0xE6, 0x2194, 0x2220, },
677dd7cddfSDavid du Colombier "/", "Oo", { 0xD8, 0xF8, },
687dd7cddfSDavid du Colombier "Dv", "Zz", { 0x1C4, 0x1C5, },
697dd7cddfSDavid du Colombier "D", "-e", { 0xD0, 0x2206, },
707dd7cddfSDavid du Colombier "A", "E", { 0xC6, },
717dd7cddfSDavid du Colombier "o", "AaeUuiO", { 0xC5, 0xE5, 0x153, 0x16E, 0x16F, 0x1A3, 0x229A, },
727dd7cddfSDavid du Colombier "~!", "=", { 0x2246, },
737dd7cddfSDavid du Colombier "~", "ANOanoIiUu-=~", { 0xC3, 0xD1, 0xD5, 0xE3, 0xF1, 0xF5, 0x128, 0x129, 0x168, 0x169, 0x2243, 0x2245, 0x2248, },
747dd7cddfSDavid du Colombier "^", "AEIOUaeiouCcGgHhJjSsWwYy", { 0xC2, 0xCA, 0xCE, 0xD4, 0xDB, 0xE2, 0xEA, 0xEE, 0xF4, 0xFB, 0x108, 0x109, 0x11C, 0x11D, 0x124, 0x125, 0x134, 0x135, 0x15C, 0x15D, 0x174, 0x175, 0x176, 0x177, },
757dd7cddfSDavid du Colombier "`\"", "Uu", { 0x1DB, 0x1DC, },
767dd7cddfSDavid du Colombier "`", "AEIOUaeiou", { 0xC0, 0xC8, 0xCC, 0xD2, 0xD9, 0xE0, 0xE8, 0xEC, 0xF2, 0xF9, },
777dd7cddfSDavid du Colombier "?", "?!", { 0xBF, 0x203D, },
787dd7cddfSDavid du Colombier "3", "458", { 0xBE, 0x2157, 0x215C, },
797dd7cddfSDavid du Colombier "1", "423568", { 0xBC, 0xBD, 0x2153, 0x2155, 0x2159, 0x215B, },
807dd7cddfSDavid du Colombier ">!", "=~", { 0x2269, 0x22E7, },
817dd7cddfSDavid du Colombier ">", ">=~<", { 0xBB, 0x2265, 0x2273, 0x2277, },
827dd7cddfSDavid du Colombier ",", ",CcAaEeGgIiKkLlNnRrSsTtUuOo", { 0xB8, 0xC7, 0xE7, 0x104, 0x105, 0x118, 0x119, 0x122, 0x123, 0x12E, 0x12F, 0x136, 0x137, 0x13B, 0x13C, 0x145, 0x146, 0x156, 0x157, 0x15E, 0x15F, 0x162, 0x163, 0x172, 0x173, 0x1EA, 0x1EB, },
837dd7cddfSDavid du Colombier ".", ".CcEeGgILlZzO", { 0xB7, 0x10A, 0x10B, 0x116, 0x117, 0x120, 0x121, 0x130, 0x13F, 0x140, 0x17B, 0x17C, 0x2299, },
847dd7cddfSDavid du Colombier "p", "gOdrt", { 0xB6, 0x2117, 0x2202, 0x220F, 0x221D, },
857dd7cddfSDavid du Colombier "m", "iuo", { 0xB5, 0xD7, 0x2208, },
867dd7cddfSDavid du Colombier "\'\"", "Uu", { 0x1D7, 0x1D8, },
877dd7cddfSDavid du Colombier "\'", "\'AEIOUYaeiouyCcgLlNnRrSsZz", { 0xB4, 0xC1, 0xC9, 0xCD, 0xD3, 0xDA, 0xDD, 0xE1, 0xE9, 0xED, 0xF3, 0xFA, 0xFD, 0x106, 0x107, 0x123, 0x139, 0x13A, 0x143, 0x144, 0x154, 0x155, 0x15A, 0x15B, 0x179, 0x17A, },
887dd7cddfSDavid du Colombier "+", "-O", { 0xB1, 0x2295, },
897dd7cddfSDavid du Colombier "dv", "z", { 0x1C6, },
907dd7cddfSDavid du Colombier "d", "e-zgda", { 0xB0, 0xF0, 0x2A3, 0x2020, 0x2021, 0x2193, },
917dd7cddfSDavid du Colombier "_,", "Oo", { 0x1EC, 0x1ED, },
927dd7cddfSDavid du Colombier "_.", "Aa", { 0x1E0, 0x1E1, },
937dd7cddfSDavid du Colombier "_\"", "UuAa", { 0x1D5, 0x1D6, 0x1DE, 0x1DF, },
947dd7cddfSDavid du Colombier "_", "_AaEeIiOoUu", { 0xAF, 0x100, 0x101, 0x112, 0x113, 0x12A, 0x12B, 0x14C, 0x14D, 0x16A, 0x16B, },
957dd7cddfSDavid du Colombier "r", "O\'\"", { 0xAE, 0x2019, 0x201D, },
967dd7cddfSDavid du Colombier "-*", "l", { 0x19B, },
977dd7cddfSDavid du Colombier "-", "-Dd:HLlTtbIZz2Ggiuh>+~O", { 0xAD, 0xD0, 0xF0, 0xF7, 0x126, 0x141, 0x142, 0x166, 0x167, 0x180, 0x197, 0x1B5, 0x1B6, 0x1BB, 0x1E4, 0x1E5, 0x268, 0x289, 0x210F, 0x2192, 0x2213, 0x2242, 0x2296, },
987dd7cddfSDavid du Colombier "n", "oj", { 0xAC, 0x1CC, },
997dd7cddfSDavid du Colombier "<!", "=~", { 0x2268, 0x22E6, },
1007dd7cddfSDavid du Colombier "<", "<-=~>", { 0xAB, 0x2190, 0x2264, 0x2272, 0x2276, },
1017dd7cddfSDavid du Colombier "s", "a231os0456789+-=()nturbp", { 0xAA, 0xB2, 0xB3, 0xB9, 0xBA, 0xDF, 0x2070, 0x2074, 0x2075, 0x2076, 0x2077, 0x2078, 0x2079, 0x207A, 0x207B, 0x207C, 0x207D, 0x207E, 0x207F, 0x220D, 0x2211, 0x221A, 0x2282, 0x2283, },
1027dd7cddfSDavid du Colombier "O", "crEIp+-x/.o*=", { 0xA9, 0xAE, 0x152, 0x1A2, 0x2117, 0x2295, 0x2296, 0x2297, 0x2298, 0x2299, 0x229A, 0x229B, 0x229C, },
1037dd7cddfSDavid du Colombier "\"*", "IUiu", { 0x3AA, 0x3AB, 0x3CA, 0x3CB, },
1047dd7cddfSDavid du Colombier "\"", "\"AEIOUaeiouyY", { 0xA8, 0xC4, 0xCB, 0xCF, 0xD6, 0xDC, 0xE4, 0xEB, 0xEF, 0xF6, 0xFC, 0xFF, 0x178, },
1057dd7cddfSDavid du Colombier "S", "S", { 0xA7, },
1067dd7cddfSDavid du Colombier "|", "|Pp", { 0xA6, 0xDE, 0xFE, },
1077dd7cddfSDavid du Colombier "y", "$", { 0xA5, },
1087dd7cddfSDavid du Colombier "g", "$-r", { 0xA4, 0x1E5, 0x2207, },
1097dd7cddfSDavid du Colombier "l", "$-j\'\"&|z", { 0xA3, 0x142, 0x1C9, 0x2018, 0x201C, 0x2227, 0x2228, 0x22C4, },
1107dd7cddfSDavid du Colombier "c", "$Oaug", { 0xA2, 0xA9, 0x2229, 0x222A, 0x2245, },
1117dd7cddfSDavid du Colombier "!~", "-=~", { 0x2244, 0x2247, 0x2249, },
1127dd7cddfSDavid du Colombier "!", "!?m=<>bp", { 0xA1, 0x203D, 0x2209, 0x2260, 0x226E, 0x226F, 0x2284, 0x2285, },
1137dd7cddfSDavid du Colombier 0, 0, { 0, }
1147dd7cddfSDavid du Colombier };
1157dd7cddfSDavid du Colombier
1167dd7cddfSDavid du Colombier /*
1177dd7cddfSDavid du Colombier * Given 5 characters k[0]..k[4], find the rune or return -1 for failure.
1187dd7cddfSDavid du Colombier */
1197dd7cddfSDavid du Colombier long
unicode(Rune * k)1207dd7cddfSDavid du Colombier unicode(Rune *k)
1217dd7cddfSDavid du Colombier {
1227dd7cddfSDavid du Colombier long i, c;
1237dd7cddfSDavid du Colombier
1247dd7cddfSDavid du Colombier k++; /* skip 'X' */
1257dd7cddfSDavid du Colombier c = 0;
1267dd7cddfSDavid du Colombier for(i=0; i<4; i++,k++){
1277dd7cddfSDavid du Colombier c <<= 4;
1287dd7cddfSDavid du Colombier if('0'<=*k && *k<='9')
1297dd7cddfSDavid du Colombier c += *k-'0';
1307dd7cddfSDavid du Colombier else if('a'<=*k && *k<='f')
1317dd7cddfSDavid du Colombier c += 10 + *k-'a';
1327dd7cddfSDavid du Colombier else if('A'<=*k && *k<='F')
1337dd7cddfSDavid du Colombier c += 10 + *k-'A';
1347dd7cddfSDavid du Colombier else
1357dd7cddfSDavid du Colombier return -1;
1367dd7cddfSDavid du Colombier }
1377dd7cddfSDavid du Colombier return c;
1387dd7cddfSDavid du Colombier }
1397dd7cddfSDavid du Colombier
1407dd7cddfSDavid du Colombier /*
1417dd7cddfSDavid du Colombier * Given n characters k[0]..k[n-1], find the corresponding rune or return -1 for
1427dd7cddfSDavid du Colombier * failure, or something < -1 if n is too small. In the latter case, the result
1437dd7cddfSDavid du Colombier * is minus the required n.
1447dd7cddfSDavid du Colombier */
1457dd7cddfSDavid du Colombier long
latin1(Rune * k,int n)1467dd7cddfSDavid du Colombier latin1(Rune *k, int n)
1477dd7cddfSDavid du Colombier {
1487dd7cddfSDavid du Colombier struct cvlist *l;
1497dd7cddfSDavid du Colombier int c;
1507dd7cddfSDavid du Colombier char* p;
1517dd7cddfSDavid du Colombier
1527dd7cddfSDavid du Colombier if(k[0] == 'X'){
1537dd7cddfSDavid du Colombier if(n>=5)
1547dd7cddfSDavid du Colombier return unicode(k);
1557dd7cddfSDavid du Colombier else
1567dd7cddfSDavid du Colombier return -5;
1577dd7cddfSDavid du Colombier }
1587dd7cddfSDavid du Colombier
1597dd7cddfSDavid du Colombier for(l=latintab; l->ld!=0; l++)
1607dd7cddfSDavid du Colombier if(k[0] == l->ld[0]){
1617dd7cddfSDavid du Colombier if(n == 1)
1627dd7cddfSDavid du Colombier return -2;
1637dd7cddfSDavid du Colombier if(l->ld[1] == 0)
1647dd7cddfSDavid du Colombier c = k[1];
1657dd7cddfSDavid du Colombier else if(l->ld[1] != k[1])
1667dd7cddfSDavid du Colombier continue;
1677dd7cddfSDavid du Colombier else if(n == 2)
1687dd7cddfSDavid du Colombier return -3;
1697dd7cddfSDavid du Colombier else
1707dd7cddfSDavid du Colombier c = k[2];
1717dd7cddfSDavid du Colombier for(p=l->si; *p!=0; p++)
1727dd7cddfSDavid du Colombier if(*p == c)
1737dd7cddfSDavid du Colombier return l->so[p - l->si];
1747dd7cddfSDavid du Colombier return -1;
1757dd7cddfSDavid du Colombier }
1767dd7cddfSDavid du Colombier return -1;
1777dd7cddfSDavid du Colombier }
178