/programs/develop/libraries/iconv/cp1251.h |
---|
0,0 → 1,131 |
/* |
* Copyright (C) 1999-2001 Free Software Foundation, Inc. |
* This file is part of the GNU LIBICONV Library. |
* |
* The GNU LIBICONV Library is free software; you can redistribute it |
* and/or modify it under the terms of the GNU Library General Public |
* License as published by the Free Software Foundation; either version 2 |
* of the License, or (at your option) any later version. |
* |
* The GNU LIBICONV Library is distributed in the hope that it will be |
* useful, but WITHOUT ANY WARRANTY; without even the implied warranty of |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
* Library General Public License for more details. |
* |
* You should have received a copy of the GNU Library General Public |
* License along with the GNU LIBICONV Library; see the file COPYING.LIB. |
* If not, write to the Free Software Foundation, Inc., 51 Franklin Street, |
* Fifth Floor, Boston, MA 02110-1301, USA. |
*/ |
/* |
* CP1251 |
*/ |
static const unsigned short cp1251_2uni[128] = { |
/* 0x80 */ |
0x0402, 0x0403, 0x201a, 0x0453, 0x201e, 0x2026, 0x2020, 0x2021, |
0x20ac, 0x2030, 0x0409, 0x2039, 0x040a, 0x040c, 0x040b, 0x040f, |
/* 0x90 */ |
0x0452, 0x2018, 0x2019, 0x201c, 0x201d, 0x2022, 0x2013, 0x2014, |
0xfffd, 0x2122, 0x0459, 0x203a, 0x045a, 0x045c, 0x045b, 0x045f, |
/* 0xa0 */ |
0x00a0, 0x040e, 0x045e, 0x0408, 0x00a4, 0x0490, 0x00a6, 0x00a7, |
0x0401, 0x00a9, 0x0404, 0x00ab, 0x00ac, 0x00ad, 0x00ae, 0x0407, |
/* 0xb0 */ |
0x00b0, 0x00b1, 0x0406, 0x0456, 0x0491, 0x00b5, 0x00b6, 0x00b7, |
0x0451, 0x2116, 0x0454, 0x00bb, 0x0458, 0x0405, 0x0455, 0x0457, |
/* 0xc0 */ |
0x0410, 0x0411, 0x0412, 0x0413, 0x0414, 0x0415, 0x0416, 0x0417, |
0x0418, 0x0419, 0x041a, 0x041b, 0x041c, 0x041d, 0x041e, 0x041f, |
/* 0xd0 */ |
0x0420, 0x0421, 0x0422, 0x0423, 0x0424, 0x0425, 0x0426, 0x0427, |
0x0428, 0x0429, 0x042a, 0x042b, 0x042c, 0x042d, 0x042e, 0x042f, |
/* 0xe0 */ |
0x0430, 0x0431, 0x0432, 0x0433, 0x0434, 0x0435, 0x0436, 0x0437, |
0x0438, 0x0439, 0x043a, 0x043b, 0x043c, 0x043d, 0x043e, 0x043f, |
/* 0xf0 */ |
0x0440, 0x0441, 0x0442, 0x0443, 0x0444, 0x0445, 0x0446, 0x0447, |
0x0448, 0x0449, 0x044a, 0x044b, 0x044c, 0x044d, 0x044e, 0x044f, |
}; |
static int |
cp1251_mbtowc (conv_t conv, ucs4_t *pwc, const unsigned char *s, int n) |
{ |
unsigned char c = *s; |
if (c < 0x80) { |
*pwc = (ucs4_t) c; |
return 1; |
} |
else { |
unsigned short wc = cp1251_2uni[c-0x80]; |
if (wc != 0xfffd) { |
*pwc = (ucs4_t) wc; |
return 1; |
} |
} |
return RET_ILSEQ; |
} |
static const unsigned char cp1251_page00[32] = { |
0xa0, 0x00, 0x00, 0x00, 0xa4, 0x00, 0xa6, 0xa7, /* 0xa0-0xa7 */ |
0x00, 0xa9, 0x00, 0xab, 0xac, 0xad, 0xae, 0x00, /* 0xa8-0xaf */ |
0xb0, 0xb1, 0x00, 0x00, 0x00, 0xb5, 0xb6, 0xb7, /* 0xb0-0xb7 */ |
0x00, 0x00, 0x00, 0xbb, 0x00, 0x00, 0x00, 0x00, /* 0xb8-0xbf */ |
}; |
static const unsigned char cp1251_page04[152] = { |
0x00, 0xa8, 0x80, 0x81, 0xaa, 0xbd, 0xb2, 0xaf, /* 0x00-0x07 */ |
0xa3, 0x8a, 0x8c, 0x8e, 0x8d, 0x00, 0xa1, 0x8f, /* 0x08-0x0f */ |
0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7, /* 0x10-0x17 */ |
0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf, /* 0x18-0x1f */ |
0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, /* 0x20-0x27 */ |
0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf, /* 0x28-0x2f */ |
0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, /* 0x30-0x37 */ |
0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef, /* 0x38-0x3f */ |
0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, /* 0x40-0x47 */ |
0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff, /* 0x48-0x4f */ |
0x00, 0xb8, 0x90, 0x83, 0xba, 0xbe, 0xb3, 0xbf, /* 0x50-0x57 */ |
0xbc, 0x9a, 0x9c, 0x9e, 0x9d, 0x00, 0xa2, 0x9f, /* 0x58-0x5f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x60-0x67 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x68-0x6f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x70-0x77 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x78-0x7f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x80-0x87 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x88-0x8f */ |
0xa5, 0xb4, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x90-0x97 */ |
}; |
static const unsigned char cp1251_page20[48] = { |
0x00, 0x00, 0x00, 0x96, 0x97, 0x00, 0x00, 0x00, /* 0x10-0x17 */ |
0x91, 0x92, 0x82, 0x00, 0x93, 0x94, 0x84, 0x00, /* 0x18-0x1f */ |
0x86, 0x87, 0x95, 0x00, 0x00, 0x00, 0x85, 0x00, /* 0x20-0x27 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x28-0x2f */ |
0x89, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x30-0x37 */ |
0x00, 0x8b, 0x9b, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x38-0x3f */ |
}; |
static int |
cp1251_wctomb (conv_t conv, unsigned char *r, ucs4_t wc, int n) |
{ |
unsigned char c = 0; |
if (wc < 0x0080) { |
*r = wc; |
return 1; |
} |
else if (wc >= 0x00a0 && wc < 0x00c0) |
c = cp1251_page00[wc-0x00a0]; |
else if (wc >= 0x0400 && wc < 0x0498) |
c = cp1251_page04[wc-0x0400]; |
else if (wc >= 0x2010 && wc < 0x2040) |
c = cp1251_page20[wc-0x2010]; |
else if (wc == 0x20ac) |
c = 0x88; |
else if (wc == 0x2116) |
c = 0xb9; |
else if (wc == 0x2122) |
c = 0x99; |
if (c != 0) { |
*r = c; |
return 1; |
} |
return RET_ILUNI; |
} |
/programs/develop/libraries/iconv/cp1252.h |
---|
0,0 → 1,103 |
/* |
* Copyright (C) 1999-2001 Free Software Foundation, Inc. |
* This file is part of the GNU LIBICONV Library. |
* |
* The GNU LIBICONV Library is free software; you can redistribute it |
* and/or modify it under the terms of the GNU Library General Public |
* License as published by the Free Software Foundation; either version 2 |
* of the License, or (at your option) any later version. |
* |
* The GNU LIBICONV Library is distributed in the hope that it will be |
* useful, but WITHOUT ANY WARRANTY; without even the implied warranty of |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
* Library General Public License for more details. |
* |
* You should have received a copy of the GNU Library General Public |
* License along with the GNU LIBICONV Library; see the file COPYING.LIB. |
* If not, write to the Free Software Foundation, Inc., 51 Franklin Street, |
* Fifth Floor, Boston, MA 02110-1301, USA. |
*/ |
/* |
* CP1252 |
*/ |
static const unsigned short cp1252_2uni[32] = { |
/* 0x80 */ |
0x20ac, 0xfffd, 0x201a, 0x0192, 0x201e, 0x2026, 0x2020, 0x2021, |
0x02c6, 0x2030, 0x0160, 0x2039, 0x0152, 0xfffd, 0x017d, 0xfffd, |
/* 0x90 */ |
0xfffd, 0x2018, 0x2019, 0x201c, 0x201d, 0x2022, 0x2013, 0x2014, |
0x02dc, 0x2122, 0x0161, 0x203a, 0x0153, 0xfffd, 0x017e, 0x0178, |
}; |
static int |
cp1252_mbtowc (conv_t conv, ucs4_t *pwc, const unsigned char *s, int n) |
{ |
unsigned char c = *s; |
if (c < 0x80 || c >= 0xa0) { |
*pwc = (ucs4_t) c; |
return 1; |
} |
else { |
unsigned short wc = cp1252_2uni[c-0x80]; |
if (wc != 0xfffd) { |
*pwc = (ucs4_t) wc; |
return 1; |
} |
} |
return RET_ILSEQ; |
} |
static const unsigned char cp1252_page01[72] = { |
0x00, 0x00, 0x8c, 0x9c, 0x00, 0x00, 0x00, 0x00, /* 0x50-0x57 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x58-0x5f */ |
0x8a, 0x9a, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x60-0x67 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x68-0x6f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x70-0x77 */ |
0x9f, 0x00, 0x00, 0x00, 0x00, 0x8e, 0x9e, 0x00, /* 0x78-0x7f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x80-0x87 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x88-0x8f */ |
0x00, 0x00, 0x83, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x90-0x97 */ |
}; |
static const unsigned char cp1252_page02[32] = { |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x88, 0x00, /* 0xc0-0xc7 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xc8-0xcf */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xd0-0xd7 */ |
0x00, 0x00, 0x00, 0x00, 0x98, 0x00, 0x00, 0x00, /* 0xd8-0xdf */ |
}; |
static const unsigned char cp1252_page20[48] = { |
0x00, 0x00, 0x00, 0x96, 0x97, 0x00, 0x00, 0x00, /* 0x10-0x17 */ |
0x91, 0x92, 0x82, 0x00, 0x93, 0x94, 0x84, 0x00, /* 0x18-0x1f */ |
0x86, 0x87, 0x95, 0x00, 0x00, 0x00, 0x85, 0x00, /* 0x20-0x27 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x28-0x2f */ |
0x89, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x30-0x37 */ |
0x00, 0x8b, 0x9b, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x38-0x3f */ |
}; |
static int |
cp1252_wctomb (conv_t conv, unsigned char *r, ucs4_t wc, int n) |
{ |
unsigned char c = 0; |
if (wc < 0x0080) { |
*r = wc; |
return 1; |
} |
else if (wc >= 0x00a0 && wc < 0x0100) |
c = wc; |
else if (wc >= 0x0150 && wc < 0x0198) |
c = cp1252_page01[wc-0x0150]; |
else if (wc >= 0x02c0 && wc < 0x02e0) |
c = cp1252_page02[wc-0x02c0]; |
else if (wc >= 0x2010 && wc < 0x2040) |
c = cp1252_page20[wc-0x2010]; |
else if (wc == 0x20ac) |
c = 0x80; |
else if (wc == 0x2122) |
c = 0x99; |
if (c != 0) { |
*r = c; |
return 1; |
} |
return RET_ILUNI; |
} |
/programs/develop/libraries/iconv/cp866.h |
---|
0,0 → 1,125 |
/* |
* Copyright (C) 1999-2001 Free Software Foundation, Inc. |
* This file is part of the GNU LIBICONV Library. |
* |
* The GNU LIBICONV Library is free software; you can redistribute it |
* and/or modify it under the terms of the GNU Library General Public |
* License as published by the Free Software Foundation; either version 2 |
* of the License, or (at your option) any later version. |
* |
* The GNU LIBICONV Library is distributed in the hope that it will be |
* useful, but WITHOUT ANY WARRANTY; without even the implied warranty of |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
* Library General Public License for more details. |
* |
* You should have received a copy of the GNU Library General Public |
* License along with the GNU LIBICONV Library; see the file COPYING.LIB. |
* If not, write to the Free Software Foundation, Inc., 51 Franklin Street, |
* Fifth Floor, Boston, MA 02110-1301, USA. |
*/ |
/* |
* CP866 |
*/ |
static const unsigned short cp866_2uni[80] = { |
/* 0xb0 */ |
0x2591, 0x2592, 0x2593, 0x2502, 0x2524, 0x2561, 0x2562, 0x2556, |
0x2555, 0x2563, 0x2551, 0x2557, 0x255d, 0x255c, 0x255b, 0x2510, |
/* 0xc0 */ |
0x2514, 0x2534, 0x252c, 0x251c, 0x2500, 0x253c, 0x255e, 0x255f, |
0x255a, 0x2554, 0x2569, 0x2566, 0x2560, 0x2550, 0x256c, 0x2567, |
/* 0xd0 */ |
0x2568, 0x2564, 0x2565, 0x2559, 0x2558, 0x2552, 0x2553, 0x256b, |
0x256a, 0x2518, 0x250c, 0x2588, 0x2584, 0x258c, 0x2590, 0x2580, |
/* 0xe0 */ |
0x0440, 0x0441, 0x0442, 0x0443, 0x0444, 0x0445, 0x0446, 0x0447, |
0x0448, 0x0449, 0x044a, 0x044b, 0x044c, 0x044d, 0x044e, 0x044f, |
/* 0xf0 */ |
0x0401, 0x0451, 0x0404, 0x0454, 0x0407, 0x0457, 0x040e, 0x045e, |
0x00b0, 0x2219, 0x00b7, 0x221a, 0x2116, 0x00a4, 0x25a0, 0x00a0, |
}; |
static int |
cp866_mbtowc (conv_t conv, ucs4_t *pwc, const unsigned char *s, int n) |
{ |
unsigned char c = *s; |
if (c < 0x80) |
*pwc = (ucs4_t) c; |
else if (c < 0xb0) |
*pwc = (ucs4_t) c + 0x0390; |
else |
*pwc = (ucs4_t) cp866_2uni[c-0xb0]; |
return 1; |
} |
static const unsigned char cp866_page00[24] = { |
0xff, 0x00, 0x00, 0x00, 0xfd, 0x00, 0x00, 0x00, /* 0xa0-0xa7 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xa8-0xaf */ |
0xf8, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xfa, /* 0xb0-0xb7 */ |
}; |
static const unsigned char cp866_page04[96] = { |
0x00, 0xf0, 0x00, 0x00, 0xf2, 0x00, 0x00, 0xf4, /* 0x00-0x07 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xf6, 0x00, /* 0x08-0x0f */ |
0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, /* 0x10-0x17 */ |
0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f, /* 0x18-0x1f */ |
0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, /* 0x20-0x27 */ |
0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f, /* 0x28-0x2f */ |
0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, /* 0x30-0x37 */ |
0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf, /* 0x38-0x3f */ |
0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, /* 0x40-0x47 */ |
0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef, /* 0x48-0x4f */ |
0x00, 0xf1, 0x00, 0x00, 0xf3, 0x00, 0x00, 0xf5, /* 0x50-0x57 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xf7, 0x00, /* 0x58-0x5f */ |
}; |
static const unsigned char cp866_page22[8] = { |
0x00, 0xf9, 0xfb, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x18-0x1f */ |
}; |
static const unsigned char cp866_page25[168] = { |
0xc4, 0x00, 0xb3, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x00-0x07 */ |
0x00, 0x00, 0x00, 0x00, 0xda, 0x00, 0x00, 0x00, /* 0x08-0x0f */ |
0xbf, 0x00, 0x00, 0x00, 0xc0, 0x00, 0x00, 0x00, /* 0x10-0x17 */ |
0xd9, 0x00, 0x00, 0x00, 0xc3, 0x00, 0x00, 0x00, /* 0x18-0x1f */ |
0x00, 0x00, 0x00, 0x00, 0xb4, 0x00, 0x00, 0x00, /* 0x20-0x27 */ |
0x00, 0x00, 0x00, 0x00, 0xc2, 0x00, 0x00, 0x00, /* 0x28-0x2f */ |
0x00, 0x00, 0x00, 0x00, 0xc1, 0x00, 0x00, 0x00, /* 0x30-0x37 */ |
0x00, 0x00, 0x00, 0x00, 0xc5, 0x00, 0x00, 0x00, /* 0x38-0x3f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x40-0x47 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x48-0x4f */ |
0xcd, 0xba, 0xd5, 0xd6, 0xc9, 0xb8, 0xb7, 0xbb, /* 0x50-0x57 */ |
0xd4, 0xd3, 0xc8, 0xbe, 0xbd, 0xbc, 0xc6, 0xc7, /* 0x58-0x5f */ |
0xcc, 0xb5, 0xb6, 0xb9, 0xd1, 0xd2, 0xcb, 0xcf, /* 0x60-0x67 */ |
0xd0, 0xca, 0xd8, 0xd7, 0xce, 0x00, 0x00, 0x00, /* 0x68-0x6f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x70-0x77 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x78-0x7f */ |
0xdf, 0x00, 0x00, 0x00, 0xdc, 0x00, 0x00, 0x00, /* 0x80-0x87 */ |
0xdb, 0x00, 0x00, 0x00, 0xdd, 0x00, 0x00, 0x00, /* 0x88-0x8f */ |
0xde, 0xb0, 0xb1, 0xb2, 0x00, 0x00, 0x00, 0x00, /* 0x90-0x97 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x98-0x9f */ |
0xfe, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xa0-0xa7 */ |
}; |
static int |
cp866_wctomb (conv_t conv, unsigned char *r, ucs4_t wc, int n) |
{ |
unsigned char c = 0; |
if (wc < 0x0080) { |
*r = wc; |
return 1; |
} |
else if (wc >= 0x00a0 && wc < 0x00b8) |
c = cp866_page00[wc-0x00a0]; |
else if (wc >= 0x0400 && wc < 0x0460) |
c = cp866_page04[wc-0x0400]; |
else if (wc == 0x2116) |
c = 0xfc; |
else if (wc >= 0x2218 && wc < 0x2220) |
c = cp866_page22[wc-0x2218]; |
else if (wc >= 0x2500 && wc < 0x25a8) |
c = cp866_page25[wc-0x2500]; |
if (c != 0) { |
*r = c; |
return 1; |
} |
return RET_ILUNI; |
} |
/programs/develop/libraries/iconv/iconv.c |
---|
0,0 → 1,210 |
#include <string.h> |
#include <stdio.h> |
typedef int conv_t; |
typedef unsigned int ucs4_t; |
typedef int iconv_t; |
/* Return code if invalid input after a shift sequence of n bytes was read. |
(xxx_mbtowc) */ |
#define RET_SHIFT_ILSEQ(n) (-1-2*(n)) |
/* Return code if invalid. (xxx_mbtowc) */ |
#define RET_ILSEQ RET_SHIFT_ILSEQ(0) |
/* Return code if only a shift sequence of n bytes was read. (xxx_mbtowc) */ |
#define RET_TOOFEW(n) (-2-2*(n)) |
/* Return code if invalid. (xxx_wctomb) */ |
#define RET_ILUNI -1 |
/* Return code if output buffer is too small. (xxx_wctomb, xxx_reset) */ |
#define RET_TOOSMALL -2 |
#define CP866 0 |
#define CP1251 1 |
#define CP1252 2 |
#define KOI8_RU 3 |
#define ISO8859_5 4 |
#define UTF_8 5 |
int strcmp (const char* a, const char* b) |
{ |
return (*a && *b && (*a == *b)) ? ((*(a+1) || *(b+1)) ? (strcmp(a+1, b+1)) : (0)) : ((*a > *b) ? (1) : (-1)); |
} |
#include "cp866.h" |
#include "cp1251.h" |
#include "cp1252.h" |
#include "koi8_ru.h" |
#include "iso8859_5.h" |
#include "utf8.h" |
int encoding(const char *what) { |
if (!strcmp(what,"CP866")) return CP866; |
if (!strcmp(what,"CP1251")) return CP1251; |
if (!strcmp(what,"CP1252")) return CP1252; |
if (!strcmp(what,"KOI8-RU")) return KOI8_RU; |
if (!strcmp(what,"ISO8859-5")) return ISO8859_5; |
if (!strcmp(what,"UTF-8")) return UTF_8; |
return -1; |
} |
iconv_t iconv_open(const char *tocode, const char *fromcode) { |
int to, from; |
if ((to=encoding(tocode))==-1) return -1; |
if ((from=encoding(fromcode))==-1) return -1; |
to=to<<16&0xFFFF0000; |
from=from&0xFFFF; |
return to+from; |
} |
size_t iconv(iconv_t cd, const char **inbuf, size_t *inbytesleft, |
char **outbuf, size_t *outbytesleft) |
{ |
int n, to, from, count1,count2; |
int pwc, converted,written; |
int (*mbtowc)(conv_t, ucs4_t *, const unsigned char *, int); |
int (*wctomb)(conv_t, ucs4_t *, const unsigned char *, int); |
char *str; |
str=*outbuf; |
from=cd>>16; |
to=cd&0xFFFF; |
switch (from) |
{ |
case CP866: mbtowc=cp866_mbtowc; break; |
case CP1251: mbtowc=cp1251_mbtowc; break; |
case CP1252: mbtowc=cp1252_mbtowc; break; |
case ISO8859_5: mbtowc=iso8859_5_mbtowc; break; |
case KOI8_RU: mbtowc=koi8_ru_mbtowc; break; |
case UTF_8: mbtowc=utf8_mbtowc; break; |
default: return -2; |
} |
switch (to) |
{ |
case CP866: wctomb=cp866_wctomb; break; |
case CP1251: wctomb=cp1251_wctomb; break; |
case CP1252: wctomb=cp1252_wctomb; break; |
case ISO8859_5: wctomb=iso8859_5_wctomb; break; |
case KOI8_RU: wctomb=koi8_ru_wctomb; break; |
case UTF_8: wctomb=utf8_wctomb; break; |
default: return -3; |
} |
count1=0; |
count2=0; |
while ( *inbytesleft>0 && *outbytesleft>1) |
{ |
n=1; |
do { |
//converted= (utf8_mbtowc)(0,&pwc,((*inbuf)+count1),n); |
// printf("%d\n",n); |
converted= (mbtowc)(0,&pwc,((*inbuf)+count1),n); |
n++; |
} while (converted==RET_TOOFEW(0)); |
if (converted<0) return -10; |
//written= (cp866_wctomb)(0,str+count2,pwc,1); |
written= (wctomb)(0,str+count2,pwc,1); |
if (written<0) written=0;//return -11; |
//printf("Conv:%d Wri:%d In:%d Out:%d UTF:%x UCS:%x 866:%s\n",converted, written, *inbytesleft,*outbytesleft,*((*inbuf)+count1),pwc, str); |
(*inbytesleft)-=converted; |
(*outbytesleft)-=written; |
count1+=converted; |
count2+=written; |
} |
*(str+count2)='\0'; |
if (*inbytesleft>0 && *outbytesleft==0) return -12; |
return 0; |
} |
/* |
int main() |
{ |
char *s;// ="вертолет"; |
char *z; |
//unsigned int pwc; |
iconv_t cd; |
int in, out; |
FILE *infile; |
char *fname = "file.txt"; |
infile = fopen(fname,"r"); |
fseek(infile, 0, SEEK_END); |
size_t file_size = ftell(infile); |
rewind(infile); |
//printf ("LOL\n"); |
char *buffer = (char*)malloc(file_size * sizeof(char)); |
if (buffer == NULL) |
{ |
fclose(infile); |
printf("Error allocating %d bytes.\n", file_size * sizeof(char)); |
return -1; |
} |
size_t bytes_read = fread(buffer, sizeof(char), file_size, infile); |
if (bytes_read != file_size) |
{ |
printf("Have read only %d bytes of %d.\n", bytes_read, file_size); |
free(buffer); |
fclose(infile); |
return -1; |
} |
in=strlen(buffer); |
z=malloc(in+1); |
out=in+1; |
cd=iconv_open("CP1251","CP866"); |
// printf("%x\n",cd); |
int t; |
t=iconv(cd, &buffer, &in, &z, &out); |
printf("\nResult: %d", t); |
puts(z); |
//for (;s<s+strlen(s);s++) {cp866_mbtowc (0, &pwc, s, 1);printf("%c=%u\n",*s,pwc);} |
} |
*/ |
typedef struct |
{ |
char *name; |
void *f; |
} export_t; |
char szStart[] = "START"; |
char szVersion[] = "version"; |
char sziconv_open[] = "iconv_open"; |
char sziconv[] = "iconv"; |
export_t EXPORTS[] __asm__("EXPORTS") = |
{ |
{ szStart, (void*)0x0 }, |
{ szVersion, (void*)0x00010001 }, |
{ sziconv_open, iconv_open }, |
{ sziconv, iconv }, |
{ NULL, NULL }, |
}; |
/programs/develop/libraries/iconv/iso8859_5.h |
---|
0,0 → 1,95 |
/* |
* Copyright (C) 1999-2001 Free Software Foundation, Inc. |
* This file is part of the GNU LIBICONV Library. |
* |
* The GNU LIBICONV Library is free software; you can redistribute it |
* and/or modify it under the terms of the GNU Library General Public |
* License as published by the Free Software Foundation; either version 2 |
* of the License, or (at your option) any later version. |
* |
* The GNU LIBICONV Library is distributed in the hope that it will be |
* useful, but WITHOUT ANY WARRANTY; without even the implied warranty of |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
* Library General Public License for more details. |
* |
* You should have received a copy of the GNU Library General Public |
* License along with the GNU LIBICONV Library; see the file COPYING.LIB. |
* If not, write to the Free Software Foundation, Inc., 51 Franklin Street, |
* Fifth Floor, Boston, MA 02110-1301, USA. |
*/ |
/* |
* ISO-8859-5 |
*/ |
static const unsigned short iso8859_5_2uni[96] = { |
/* 0xa0 */ |
0x00a0, 0x0401, 0x0402, 0x0403, 0x0404, 0x0405, 0x0406, 0x0407, |
0x0408, 0x0409, 0x040a, 0x040b, 0x040c, 0x00ad, 0x040e, 0x040f, |
/* 0xb0 */ |
0x0410, 0x0411, 0x0412, 0x0413, 0x0414, 0x0415, 0x0416, 0x0417, |
0x0418, 0x0419, 0x041a, 0x041b, 0x041c, 0x041d, 0x041e, 0x041f, |
/* 0xc0 */ |
0x0420, 0x0421, 0x0422, 0x0423, 0x0424, 0x0425, 0x0426, 0x0427, |
0x0428, 0x0429, 0x042a, 0x042b, 0x042c, 0x042d, 0x042e, 0x042f, |
/* 0xd0 */ |
0x0430, 0x0431, 0x0432, 0x0433, 0x0434, 0x0435, 0x0436, 0x0437, |
0x0438, 0x0439, 0x043a, 0x043b, 0x043c, 0x043d, 0x043e, 0x043f, |
/* 0xe0 */ |
0x0440, 0x0441, 0x0442, 0x0443, 0x0444, 0x0445, 0x0446, 0x0447, |
0x0448, 0x0449, 0x044a, 0x044b, 0x044c, 0x044d, 0x044e, 0x044f, |
/* 0xf0 */ |
0x2116, 0x0451, 0x0452, 0x0453, 0x0454, 0x0455, 0x0456, 0x0457, |
0x0458, 0x0459, 0x045a, 0x045b, 0x045c, 0x00a7, 0x045e, 0x045f, |
}; |
static int |
iso8859_5_mbtowc (conv_t conv, ucs4_t *pwc, const unsigned char *s, int n) |
{ |
unsigned char c = *s; |
if (c < 0xa0) |
*pwc = (ucs4_t) c; |
else |
*pwc = (ucs4_t) iso8859_5_2uni[c-0xa0]; |
return 1; |
} |
static const unsigned char iso8859_5_page00[16] = { |
0xa0, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xfd, /* 0xa0-0xa7 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0xad, 0x00, 0x00, /* 0xa8-0xaf */ |
}; |
static const unsigned char iso8859_5_page04[96] = { |
0x00, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, /* 0x00-0x07 */ |
0xa8, 0xa9, 0xaa, 0xab, 0xac, 0x00, 0xae, 0xaf, /* 0x08-0x0f */ |
0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7, /* 0x10-0x17 */ |
0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf, /* 0x18-0x1f */ |
0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7, /* 0x20-0x27 */ |
0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf, /* 0x28-0x2f */ |
0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, /* 0x30-0x37 */ |
0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf, /* 0x38-0x3f */ |
0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, /* 0x40-0x47 */ |
0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef, /* 0x48-0x4f */ |
0x00, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, /* 0x50-0x57 */ |
0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0x00, 0xfe, 0xff, /* 0x58-0x5f */ |
}; |
static int |
iso8859_5_wctomb (conv_t conv, unsigned char *r, ucs4_t wc, int n) |
{ |
unsigned char c = 0; |
if (wc < 0x00a0) { |
*r = wc; |
return 1; |
} |
else if (wc >= 0x00a0 && wc < 0x00b0) |
c = iso8859_5_page00[wc-0x00a0]; |
else if (wc >= 0x0400 && wc < 0x0460) |
c = iso8859_5_page04[wc-0x0400]; |
else if (wc == 0x2116) |
c = 0xf0; |
if (c != 0) { |
*r = c; |
return 1; |
} |
return RET_ILUNI; |
} |
/programs/develop/libraries/iconv/koi8_ru.h |
---|
0,0 → 1,159 |
/* |
* Copyright (C) 1999-2001 Free Software Foundation, Inc. |
* This file is part of the GNU LIBICONV Library. |
* |
* The GNU LIBICONV Library is free software; you can redistribute it |
* and/or modify it under the terms of the GNU Library General Public |
* License as published by the Free Software Foundation; either version 2 |
* of the License, or (at your option) any later version. |
* |
* The GNU LIBICONV Library is distributed in the hope that it will be |
* useful, but WITHOUT ANY WARRANTY; without even the implied warranty of |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
* Library General Public License for more details. |
* |
* You should have received a copy of the GNU Library General Public |
* License along with the GNU LIBICONV Library; see the file COPYING.LIB. |
* If not, write to the Free Software Foundation, Inc., 51 Franklin Street, |
* Fifth Floor, Boston, MA 02110-1301, USA. |
*/ |
/* |
* KOI8-RU |
*/ |
static const unsigned short koi8_ru_2uni[128] = { |
/* 0x80 */ |
0x2500, 0x2502, 0x250c, 0x2510, 0x2514, 0x2518, 0x251c, 0x2524, |
0x252c, 0x2534, 0x253c, 0x2580, 0x2584, 0x2588, 0x258c, 0x2590, |
/* 0x90 */ |
0x2591, 0x2592, 0x2593, 0x2320, 0x25a0, 0x2219, 0x221a, 0x2248, |
0x2264, 0x2265, 0x00a0, 0x2321, 0x00b0, 0x00b2, 0x00b7, 0x00f7, |
/* 0xa0 */ |
0x2550, 0x2551, 0x2552, 0x0451, 0x0454, 0x2554, 0x0456, 0x0457, |
0x2557, 0x2558, 0x2559, 0x255a, 0x255b, 0x0491, 0x045e, 0x255e, |
/* 0xb0 */ |
0x255f, 0x2560, 0x2561, 0x0401, 0x0404, 0x2563, 0x0406, 0x0407, |
0x2566, 0x2567, 0x2568, 0x2569, 0x256a, 0x0490, 0x040e, 0x00a9, |
/* 0xc0 */ |
0x044e, 0x0430, 0x0431, 0x0446, 0x0434, 0x0435, 0x0444, 0x0433, |
0x0445, 0x0438, 0x0439, 0x043a, 0x043b, 0x043c, 0x043d, 0x043e, |
/* 0xd0 */ |
0x043f, 0x044f, 0x0440, 0x0441, 0x0442, 0x0443, 0x0436, 0x0432, |
0x044c, 0x044b, 0x0437, 0x0448, 0x044d, 0x0449, 0x0447, 0x044a, |
/* 0xe0 */ |
0x042e, 0x0410, 0x0411, 0x0426, 0x0414, 0x0415, 0x0424, 0x0413, |
0x0425, 0x0418, 0x0419, 0x041a, 0x041b, 0x041c, 0x041d, 0x041e, |
/* 0xf0 */ |
0x041f, 0x042f, 0x0420, 0x0421, 0x0422, 0x0423, 0x0416, 0x0412, |
0x042c, 0x042b, 0x0417, 0x0428, 0x042d, 0x0429, 0x0427, 0x042a, |
}; |
static int |
koi8_ru_mbtowc (conv_t conv, ucs4_t *pwc, const unsigned char *s, int n) |
{ |
unsigned char c = *s; |
if (c < 0x80) |
*pwc = (ucs4_t) c; |
else |
*pwc = (ucs4_t) koi8_ru_2uni[c-0x80]; |
return 1; |
} |
static const unsigned char koi8_ru_page00[88] = { |
0x9a, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xa0-0xa7 */ |
0x00, 0xbf, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xa8-0xaf */ |
0x9c, 0x00, 0x9d, 0x00, 0x00, 0x00, 0x00, 0x9e, /* 0xb0-0xb7 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xb8-0xbf */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xc0-0xc7 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xc8-0xcf */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xd0-0xd7 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xd8-0xdf */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xe0-0xe7 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xe8-0xef */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x9f, /* 0xf0-0xf7 */ |
}; |
static const unsigned char koi8_ru_page04[152] = { |
0x00, 0xb3, 0x00, 0x00, 0xb4, 0x00, 0xb6, 0xb7, /* 0x00-0x07 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xbe, 0x00, /* 0x08-0x0f */ |
0xe1, 0xe2, 0xf7, 0xe7, 0xe4, 0xe5, 0xf6, 0xfa, /* 0x10-0x17 */ |
0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef, 0xf0, /* 0x18-0x1f */ |
0xf2, 0xf3, 0xf4, 0xf5, 0xe6, 0xe8, 0xe3, 0xfe, /* 0x20-0x27 */ |
0xfb, 0xfd, 0xff, 0xf9, 0xf8, 0xfc, 0xe0, 0xf1, /* 0x28-0x2f */ |
0xc1, 0xc2, 0xd7, 0xc7, 0xc4, 0xc5, 0xd6, 0xda, /* 0x30-0x37 */ |
0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf, 0xd0, /* 0x38-0x3f */ |
0xd2, 0xd3, 0xd4, 0xd5, 0xc6, 0xc8, 0xc3, 0xde, /* 0x40-0x47 */ |
0xdb, 0xdd, 0xdf, 0xd9, 0xd8, 0xdc, 0xc0, 0xd1, /* 0x48-0x4f */ |
0x00, 0xa3, 0x00, 0x00, 0xa4, 0x00, 0xa6, 0xa7, /* 0x50-0x57 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xae, 0x00, /* 0x58-0x5f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x60-0x67 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x68-0x6f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x70-0x77 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x78-0x7f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x80-0x87 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x88-0x8f */ |
0xbd, 0xad, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x90-0x97 */ |
}; |
static const unsigned char koi8_ru_page22[80] = { |
0x00, 0x95, 0x96, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x18-0x1f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x20-0x27 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x28-0x2f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x30-0x37 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x38-0x3f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x40-0x47 */ |
0x97, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x48-0x4f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x50-0x57 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x58-0x5f */ |
0x00, 0x00, 0x00, 0x00, 0x98, 0x99, 0x00, 0x00, /* 0x60-0x67 */ |
}; |
static const unsigned char koi8_ru_page23[8] = { |
0x93, 0x9b, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x20-0x27 */ |
}; |
static const unsigned char koi8_ru_page25[168] = { |
0x80, 0x00, 0x81, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x00-0x07 */ |
0x00, 0x00, 0x00, 0x00, 0x82, 0x00, 0x00, 0x00, /* 0x08-0x0f */ |
0x83, 0x00, 0x00, 0x00, 0x84, 0x00, 0x00, 0x00, /* 0x10-0x17 */ |
0x85, 0x00, 0x00, 0x00, 0x86, 0x00, 0x00, 0x00, /* 0x18-0x1f */ |
0x00, 0x00, 0x00, 0x00, 0x87, 0x00, 0x00, 0x00, /* 0x20-0x27 */ |
0x00, 0x00, 0x00, 0x00, 0x88, 0x00, 0x00, 0x00, /* 0x28-0x2f */ |
0x00, 0x00, 0x00, 0x00, 0x89, 0x00, 0x00, 0x00, /* 0x30-0x37 */ |
0x00, 0x00, 0x00, 0x00, 0x8a, 0x00, 0x00, 0x00, /* 0x38-0x3f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x40-0x47 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x48-0x4f */ |
0xa0, 0xa1, 0xa2, 0x00, 0xa5, 0x00, 0x00, 0xa8, /* 0x50-0x57 */ |
0xa9, 0xaa, 0xab, 0xac, 0x00, 0x00, 0xaf, 0xb0, /* 0x58-0x5f */ |
0xb1, 0xb2, 0x00, 0xb5, 0x00, 0x00, 0xb8, 0xb9, /* 0x60-0x67 */ |
0xba, 0xbb, 0xbc, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x68-0x6f */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x70-0x77 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x78-0x7f */ |
0x8b, 0x00, 0x00, 0x00, 0x8c, 0x00, 0x00, 0x00, /* 0x80-0x87 */ |
0x8d, 0x00, 0x00, 0x00, 0x8e, 0x00, 0x00, 0x00, /* 0x88-0x8f */ |
0x8f, 0x90, 0x91, 0x92, 0x00, 0x00, 0x00, 0x00, /* 0x90-0x97 */ |
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x98-0x9f */ |
0x94, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0xa0-0xa7 */ |
}; |
static int |
koi8_ru_wctomb (conv_t conv, unsigned char *r, ucs4_t wc, int n) |
{ |
unsigned char c = 0; |
if (wc < 0x0080) { |
*r = wc; |
return 1; |
} |
else if (wc >= 0x00a0 && wc < 0x00f8) |
c = koi8_ru_page00[wc-0x00a0]; |
else if (wc >= 0x0400 && wc < 0x0498) |
c = koi8_ru_page04[wc-0x0400]; |
else if (wc >= 0x2218 && wc < 0x2268) |
c = koi8_ru_page22[wc-0x2218]; |
else if (wc >= 0x2320 && wc < 0x2328) |
c = koi8_ru_page23[wc-0x2320]; |
else if (wc >= 0x2500 && wc < 0x25a8) |
c = koi8_ru_page25[wc-0x2500]; |
if (c != 0) { |
*r = c; |
return 1; |
} |
return RET_ILUNI; |
} |
/programs/develop/libraries/iconv/readme.txt |
---|
0,0 → 1,4 |
Åñëè íóæíû äðóãèå êîäèðîâêè- ïðîñòî ñêà÷àé èñõîäíèêè gnu iconv, âûáåðè íóæíûå h-ôàéëû (ñêàæåì, mac_cyrillic.h), äîáàâü èõ â ïàïêó ñ iconv, è ñîîòâåòñòâåííî â iconv.ñ äîáàâü ýòè h-ôàéëû è óêàçàíèå òîãî, ÷òî êîäèðîâêà ïîääåðæèâàåòñÿ. |
Ëèöåíçèÿ GPLv2, ôàéëû ïåðåêîäèðîâùèêà èñïîëüçóþò GNU iconv |
iconv - ýòî obj, òàê ÷òî å¸ ñîáèðàåò mingw êîìàíäîé gcc -c iconv.c -o iconv.obj |
/programs/develop/libraries/iconv/utf8.h |
---|
0,0 → 1,128 |
/* |
* Copyright (C) 1999-2001, 2004 Free Software Foundation, Inc. |
* This file is part of the GNU LIBICONV Library. |
* |
* The GNU LIBICONV Library is free software; you can redistribute it |
* and/or modify it under the terms of the GNU Library General Public |
* License as published by the Free Software Foundation; either version 2 |
* of the License, or (at your option) any later version. |
* |
* The GNU LIBICONV Library is distributed in the hope that it will be |
* useful, but WITHOUT ANY WARRANTY; without even the implied warranty of |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
* Library General Public License for more details. |
* |
* You should have received a copy of the GNU Library General Public |
* License along with the GNU LIBICONV Library; see the file COPYING.LIB. |
* If not, write to the Free Software Foundation, Inc., 51 Franklin Street, |
* Fifth Floor, Boston, MA 02110-1301, USA. |
*/ |
/* |
* UTF-8 |
*/ |
/* Specification: RFC 3629 */ |
static int |
utf8_mbtowc (conv_t conv, ucs4_t *pwc, const unsigned char *s, int n) |
{ |
unsigned char c = s[0]; |
if (c < 0x80) { |
*pwc = c; |
return 1; |
} else if (c < 0xc2) { |
return RET_ILSEQ; |
} else if (c < 0xe0) { |
if (n < 2) |
return RET_TOOFEW(0); |
if (!((s[1] ^ 0x80) < 0x40)) |
return RET_ILSEQ; |
*pwc = ((ucs4_t) (c & 0x1f) << 6) |
| (ucs4_t) (s[1] ^ 0x80); |
return 2; |
} else if (c < 0xf0) { |
if (n < 3) |
return RET_TOOFEW(0); |
if (!((s[1] ^ 0x80) < 0x40 && (s[2] ^ 0x80) < 0x40 |
&& (c >= 0xe1 || s[1] >= 0xa0))) |
return RET_ILSEQ; |
*pwc = ((ucs4_t) (c & 0x0f) << 12) |
| ((ucs4_t) (s[1] ^ 0x80) << 6) |
| (ucs4_t) (s[2] ^ 0x80); |
return 3; |
} else if (c < 0xf8 && sizeof(ucs4_t)*8 >= 32) { |
if (n < 4) |
return RET_TOOFEW(0); |
if (!((s[1] ^ 0x80) < 0x40 && (s[2] ^ 0x80) < 0x40 |
&& (s[3] ^ 0x80) < 0x40 |
&& (c >= 0xf1 || s[1] >= 0x90))) |
return RET_ILSEQ; |
*pwc = ((ucs4_t) (c & 0x07) << 18) |
| ((ucs4_t) (s[1] ^ 0x80) << 12) |
| ((ucs4_t) (s[2] ^ 0x80) << 6) |
| (ucs4_t) (s[3] ^ 0x80); |
return 4; |
} else if (c < 0xfc && sizeof(ucs4_t)*8 >= 32) { |
if (n < 5) |
return RET_TOOFEW(0); |
if (!((s[1] ^ 0x80) < 0x40 && (s[2] ^ 0x80) < 0x40 |
&& (s[3] ^ 0x80) < 0x40 && (s[4] ^ 0x80) < 0x40 |
&& (c >= 0xf9 || s[1] >= 0x88))) |
return RET_ILSEQ; |
*pwc = ((ucs4_t) (c & 0x03) << 24) |
| ((ucs4_t) (s[1] ^ 0x80) << 18) |
| ((ucs4_t) (s[2] ^ 0x80) << 12) |
| ((ucs4_t) (s[3] ^ 0x80) << 6) |
| (ucs4_t) (s[4] ^ 0x80); |
return 5; |
} else if (c < 0xfe && sizeof(ucs4_t)*8 >= 32) { |
if (n < 6) |
return RET_TOOFEW(0); |
if (!((s[1] ^ 0x80) < 0x40 && (s[2] ^ 0x80) < 0x40 |
&& (s[3] ^ 0x80) < 0x40 && (s[4] ^ 0x80) < 0x40 |
&& (s[5] ^ 0x80) < 0x40 |
&& (c >= 0xfd || s[1] >= 0x84))) |
return RET_ILSEQ; |
*pwc = ((ucs4_t) (c & 0x01) << 30) |
| ((ucs4_t) (s[1] ^ 0x80) << 24) |
| ((ucs4_t) (s[2] ^ 0x80) << 18) |
| ((ucs4_t) (s[3] ^ 0x80) << 12) |
| ((ucs4_t) (s[4] ^ 0x80) << 6) |
| (ucs4_t) (s[5] ^ 0x80); |
return 6; |
} else |
return RET_ILSEQ; |
} |
static int |
utf8_wctomb (conv_t conv, unsigned char *r, ucs4_t wc, int n) /* n == 0 is acceptable */ |
{ |
int count; |
if (wc < 0x80) |
count = 1; |
else if (wc < 0x800) |
count = 2; |
else if (wc < 0x10000) |
count = 3; |
else if (wc < 0x200000) |
count = 4; |
else if (wc < 0x4000000) |
count = 5; |
else if (wc <= 0x7fffffff) |
count = 6; |
else |
return RET_ILUNI; |
if (n < count) |
return RET_TOOSMALL; |
switch (count) { /* note: code falls through cases! */ |
case 6: r[5] = 0x80 | (wc & 0x3f); wc = wc >> 6; wc |= 0x4000000; |
case 5: r[4] = 0x80 | (wc & 0x3f); wc = wc >> 6; wc |= 0x200000; |
case 4: r[3] = 0x80 | (wc & 0x3f); wc = wc >> 6; wc |= 0x10000; |
case 3: r[2] = 0x80 | (wc & 0x3f); wc = wc >> 6; wc |= 0x800; |
case 2: r[1] = 0x80 | (wc & 0x3f); wc = wc >> 6; wc |= 0xc0; |
case 1: r[0] = wc; |
} |
return count; |
} |