blob: 613de0922e1c5189740ea68e0835d54d3ab49062 [file] [log] [blame]
/*
#include <sys/types.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <errno.h>
*/
/*
 * The our_* routines are implementations of the corresponding library
 * routines. For a while, I tried to actually name them wctomb etc.,
 * but stopped after I found a system which made wchar_t an
 * unsigned char.
 */
/*
 * Layout constants for the multi-byte encoding produced by our_wctomb.
 *
 *   Tn     tag bits placed in the first byte of an n-byte sequence
 *          (Tx is the tag of every following byte)
 *   Bitn   number of payload bits taken by that byte
 *   Maskn  mask selecting exactly those payload bits
 *   Wcharn largest value representable in an n-byte sequence
 *
 * All enumerators carry explicit values, so their order is irrelevant;
 * they are grouped here by sequence length.
 */
enum {
	/* following (continuation) bytes: 10xxxxxx */
	Tx = 0x80,
	Bitx = 6,
	Maskx = (1 << Bitx) - 1,

	/* 1 byte: 0xxxxxxx */
	T1 = 0x00,
	Bit1 = 7,
	Mask1 = (1 << Bit1) - 1,
	Wchar1 = (1UL << Bit1) - 1,

	/* 2 bytes: first byte 110xxxxx */
	T2 = 0xC0,
	Bit2 = 5,
	Mask2 = (1 << Bit2) - 1,
	Wchar2 = (1UL << (Bit2 + Bitx)) - 1,

	/* 3 bytes: first byte 1110xxxx */
	T3 = 0xE0,
	Bit3 = 4,
	Mask3 = (1 << Bit3) - 1,
	Wchar3 = (1UL << (Bit3 + 2 * Bitx)) - 1,

	/* 4 bytes: first byte 11110xxx */
	T4 = 0xF0,
	Bit4 = 3,
	Mask4 = (1 << Bit4) - 1,
	Wchar4 = (1UL << (Bit4 + 3 * Bitx)) - 1,

	/* 5 bytes: first byte 111110xx */
	T5 = 0xF8,
	Bit5 = 2,
	Mask5 = (1 << Bit5) - 1,
	Wchar5 = (1UL << (Bit5 + 4 * Bitx)) - 1,

	/*
	 * 6 bytes: first byte is T6 with Bit6 payload bits or'ed in.
	 * NOTE(review): Bit6 is 2, the same as Bit5, so the payload
	 * overlaps the low bit pair of T6 -- presumably so that a full
	 * 32-bit value fits; confirm before changing.
	 */
	T6 = 0xFC,
	Bit6 = 2,
	Mask6 = (1 << Bit6) - 1
#ifndef EILSEQ
	,	/* the separating comma must live inside the conditional */
	EILSEQ = 123	/* fallback value when no EILSEQ macro is visible */
#endif /* EILSEQ */
};
/*
 * our_wctomb: store the multi-byte encoding of wc at s.
 *
 * s   destination buffer.  Between 1 and 6 bytes are written and no
 *     terminating NUL is added, so the buffer must have room for 6.
 *     When s is a null pointer nothing is written and 0 is returned
 *     (the encoding has no shift states).
 * wc  value to encode.
 *
 * Returns the number of bytes stored.  There is no error return: in
 * the 6-byte form only Mask6 bits beyond the five following bytes are
 * kept, and anything above that is silently dropped.
 */
static int
our_wctomb(char *s, unsigned long wc)
{
	unsigned long lead;	/* tag bits for the first byte */
	unsigned long bits;	/* payload that has not been emitted yet */
	int len;		/* length of the whole sequence */
	int i;

	if (!s)
		return 0;	/* no shift states */

	/* choose the shortest form whose payload can hold wc */
	if (!(wc & ~Wchar1)) {
		len = 1;
		lead = T1;
	} else if (!(wc & ~Wchar2)) {
		len = 2;
		lead = T2;
	} else if (!(wc & ~Wchar3)) {
		len = 3;
		lead = T3;
	} else if (!(wc & ~Wchar4)) {
		len = 4;
		lead = T4;
	} else if (!(wc & ~Wchar5)) {
		len = 5;
		lead = T5;
	} else {
		len = 6;
		lead = T6;
	}

	/* fill the following bytes last-to-first, Bitx bits at a time */
	bits = wc;
	for (i = len - 1; i > 0; i--) {
		s[i] = Tx | (bits & Maskx);
		bits >>= Bitx;
	}

	/*
	 * In the shorter forms the range test above already bounds the
	 * remaining bits; only the 6-byte form has to mask them.
	 */
	if (len == 6)
		bits &= Mask6;
	s[0] = lead | bits;

	return len;
}