123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443 |
- /*
- * WideCharToMultiByte implementation
- *
- * Copyright 2000 Alexandre Julliard
- *
- * This library is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public
- * License as published by the Free Software Foundation; either
- * version 2.1 of the License, or (at your option) any later version.
- *
- * This library is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with this library; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
- */
- #include <string.h>
- #include "wine/asm.h"
- #ifdef __ASM_OBSOLETE
- #include "unicode.h"
- extern WCHAR wine_compose( const WCHAR *str ) DECLSPEC_HIDDEN;
- /****************************************************************/
- /* sbcs support */
- /* check if 'ch' is an acceptable sbcs mapping for 'wch' */
- static inline int is_valid_sbcs_mapping( const struct sbcs_table *table, int flags,
- WCHAR wch, unsigned char ch )
- {
- if ((flags & WC_NO_BEST_FIT_CHARS) || ch == (unsigned char)table->info.def_char)
- return (table->cp2uni[ch] == wch);
- return 1;
- }
- /* query necessary dst length for src string */
- static int get_length_sbcs( const struct sbcs_table *table, int flags,
- const WCHAR *src, unsigned int srclen, int *used )
- {
- const unsigned char * const uni2cp_low = table->uni2cp_low;
- const unsigned short * const uni2cp_high = table->uni2cp_high;
- int ret, tmp;
- WCHAR composed;
- if (!used) used = &tmp; /* avoid checking on every char */
- *used = 0;
- for (ret = 0; srclen; ret++, src++, srclen--)
- {
- WCHAR wch = *src;
- unsigned char ch;
- if ((flags & WC_COMPOSITECHECK) && (srclen > 1) && (composed = wine_compose(src)))
- {
- /* now check if we can use the composed char */
- ch = uni2cp_low[uni2cp_high[composed >> 8] + (composed & 0xff)];
- if (is_valid_sbcs_mapping( table, flags, composed, ch ))
- {
- /* we have a good mapping, use it */
- src++;
- srclen--;
- continue;
- }
- /* no mapping for the composed char, check the other flags */
- if (flags & WC_DEFAULTCHAR) /* use the default char instead */
- {
- *used = 1;
- src++; /* skip the non-spacing char */
- srclen--;
- continue;
- }
- if (flags & WC_DISCARDNS) /* skip the second char of the composition */
- {
- src++;
- srclen--;
- }
- /* WC_SEPCHARS is the default */
- }
- if (!*used)
- {
- ch = uni2cp_low[uni2cp_high[wch >> 8] + (wch & 0xff)];
- *used = !is_valid_sbcs_mapping( table, flags, wch, ch );
- }
- }
- return ret;
- }
- /* wcstombs for single-byte code page */
- static inline int wcstombs_sbcs( const struct sbcs_table *table,
- const WCHAR *src, unsigned int srclen,
- char *dst, unsigned int dstlen )
- {
- const unsigned char * const uni2cp_low = table->uni2cp_low;
- const unsigned short * const uni2cp_high = table->uni2cp_high;
- int ret = srclen;
- if (dstlen < srclen)
- {
- /* buffer too small: fill it up to dstlen and return error */
- srclen = dstlen;
- ret = -1;
- }
- while (srclen >= 16)
- {
- dst[0] = uni2cp_low[uni2cp_high[src[0] >> 8] + (src[0] & 0xff)];
- dst[1] = uni2cp_low[uni2cp_high[src[1] >> 8] + (src[1] & 0xff)];
- dst[2] = uni2cp_low[uni2cp_high[src[2] >> 8] + (src[2] & 0xff)];
- dst[3] = uni2cp_low[uni2cp_high[src[3] >> 8] + (src[3] & 0xff)];
- dst[4] = uni2cp_low[uni2cp_high[src[4] >> 8] + (src[4] & 0xff)];
- dst[5] = uni2cp_low[uni2cp_high[src[5] >> 8] + (src[5] & 0xff)];
- dst[6] = uni2cp_low[uni2cp_high[src[6] >> 8] + (src[6] & 0xff)];
- dst[7] = uni2cp_low[uni2cp_high[src[7] >> 8] + (src[7] & 0xff)];
- dst[8] = uni2cp_low[uni2cp_high[src[8] >> 8] + (src[8] & 0xff)];
- dst[9] = uni2cp_low[uni2cp_high[src[9] >> 8] + (src[9] & 0xff)];
- dst[10] = uni2cp_low[uni2cp_high[src[10] >> 8] + (src[10] & 0xff)];
- dst[11] = uni2cp_low[uni2cp_high[src[11] >> 8] + (src[11] & 0xff)];
- dst[12] = uni2cp_low[uni2cp_high[src[12] >> 8] + (src[12] & 0xff)];
- dst[13] = uni2cp_low[uni2cp_high[src[13] >> 8] + (src[13] & 0xff)];
- dst[14] = uni2cp_low[uni2cp_high[src[14] >> 8] + (src[14] & 0xff)];
- dst[15] = uni2cp_low[uni2cp_high[src[15] >> 8] + (src[15] & 0xff)];
- src += 16;
- dst += 16;
- srclen -= 16;
- }
- /* now handle remaining characters */
- src += srclen;
- dst += srclen;
- switch(srclen)
- {
- case 15: dst[-15] = uni2cp_low[uni2cp_high[src[-15] >> 8] + (src[-15] & 0xff)];
- case 14: dst[-14] = uni2cp_low[uni2cp_high[src[-14] >> 8] + (src[-14] & 0xff)];
- case 13: dst[-13] = uni2cp_low[uni2cp_high[src[-13] >> 8] + (src[-13] & 0xff)];
- case 12: dst[-12] = uni2cp_low[uni2cp_high[src[-12] >> 8] + (src[-12] & 0xff)];
- case 11: dst[-11] = uni2cp_low[uni2cp_high[src[-11] >> 8] + (src[-11] & 0xff)];
- case 10: dst[-10] = uni2cp_low[uni2cp_high[src[-10] >> 8] + (src[-10] & 0xff)];
- case 9: dst[-9] = uni2cp_low[uni2cp_high[src[-9] >> 8] + (src[-9] & 0xff)];
- case 8: dst[-8] = uni2cp_low[uni2cp_high[src[-8] >> 8] + (src[-8] & 0xff)];
- case 7: dst[-7] = uni2cp_low[uni2cp_high[src[-7] >> 8] + (src[-7] & 0xff)];
- case 6: dst[-6] = uni2cp_low[uni2cp_high[src[-6] >> 8] + (src[-6] & 0xff)];
- case 5: dst[-5] = uni2cp_low[uni2cp_high[src[-5] >> 8] + (src[-5] & 0xff)];
- case 4: dst[-4] = uni2cp_low[uni2cp_high[src[-4] >> 8] + (src[-4] & 0xff)];
- case 3: dst[-3] = uni2cp_low[uni2cp_high[src[-3] >> 8] + (src[-3] & 0xff)];
- case 2: dst[-2] = uni2cp_low[uni2cp_high[src[-2] >> 8] + (src[-2] & 0xff)];
- case 1: dst[-1] = uni2cp_low[uni2cp_high[src[-1] >> 8] + (src[-1] & 0xff)];
- case 0: break;
- }
- return ret;
- }
- /* slow version of wcstombs_sbcs that handles the various flags */
- static int wcstombs_sbcs_slow( const struct sbcs_table *table, int flags,
- const WCHAR *src, unsigned int srclen,
- char *dst, unsigned int dstlen,
- const char *defchar, int *used )
- {
- const unsigned char * const uni2cp_low = table->uni2cp_low;
- const unsigned short * const uni2cp_high = table->uni2cp_high;
- unsigned char def;
- unsigned int len;
- int tmp;
- WCHAR composed;
- if (!defchar)
- def = table->info.def_char & 0xff;
- else
- def = *defchar;
- if (!used) used = &tmp; /* avoid checking on every char */
- *used = 0;
- for (len = dstlen; srclen && len; dst++, len--, src++, srclen--)
- {
- WCHAR wch = *src;
- if ((flags & WC_COMPOSITECHECK) && (srclen > 1) && (composed = wine_compose(src)))
- {
- /* now check if we can use the composed char */
- *dst = uni2cp_low[uni2cp_high[composed >> 8] + (composed & 0xff)];
- if (is_valid_sbcs_mapping( table, flags, composed, *dst ))
- {
- /* we have a good mapping, use it */
- src++;
- srclen--;
- continue;
- }
- /* no mapping for the composed char, check the other flags */
- if (flags & WC_DEFAULTCHAR) /* use the default char instead */
- {
- *dst = def;
- *used = 1;
- src++; /* skip the non-spacing char */
- srclen--;
- continue;
- }
- if (flags & WC_DISCARDNS) /* skip the second char of the composition */
- {
- src++;
- srclen--;
- }
- /* WC_SEPCHARS is the default */
- }
- *dst = uni2cp_low[uni2cp_high[wch >> 8] + (wch & 0xff)];
- if (!is_valid_sbcs_mapping( table, flags, wch, *dst ))
- {
- *dst = def;
- *used = 1;
- }
- }
- if (srclen) return -1; /* overflow */
- return dstlen - len;
- }
- /****************************************************************/
- /* dbcs support */
- /* check if 'ch' is an acceptable dbcs mapping for 'wch' */
- static inline int is_valid_dbcs_mapping( const struct dbcs_table *table, int flags,
- WCHAR wch, unsigned short ch )
- {
- if ((flags & WC_NO_BEST_FIT_CHARS) || ch == table->info.def_char)
- {
- /* check if char maps back to the same Unicode value */
- if (ch & 0xff00)
- {
- unsigned char off = table->cp2uni_leadbytes[ch >> 8];
- return (table->cp2uni[(off << 8) + (ch & 0xff)] == wch);
- }
- return (table->cp2uni[ch & 0xff] == wch);
- }
- return 1;
- }
- /* compute the default char for the dbcs case */
- static inline WCHAR get_defchar_dbcs( const struct dbcs_table *table, const char *defchar )
- {
- if (!defchar) return table->info.def_char;
- if (!defchar[1]) return (unsigned char)defchar[0];
- return ((unsigned char)defchar[0] << 8) | (unsigned char)defchar[1];
- }
- /* query necessary dst length for src string */
- static int get_length_dbcs( const struct dbcs_table *table, int flags,
- const WCHAR *src, unsigned int srclen,
- const char *defchar, int *used )
- {
- const unsigned short * const uni2cp_low = table->uni2cp_low;
- const unsigned short * const uni2cp_high = table->uni2cp_high;
- WCHAR defchar_value, composed;
- int len, tmp;
- if (!defchar && !used && !(flags & WC_COMPOSITECHECK))
- {
- for (len = 0; srclen; srclen--, src++, len++)
- {
- if (uni2cp_low[uni2cp_high[*src >> 8] + (*src & 0xff)] & 0xff00) len++;
- }
- return len;
- }
- defchar_value = get_defchar_dbcs( table, defchar );
- if (!used) used = &tmp; /* avoid checking on every char */
- *used = 0;
- for (len = 0; srclen; len++, srclen--, src++)
- {
- unsigned short res;
- WCHAR wch = *src;
- if ((flags & WC_COMPOSITECHECK) && (srclen > 1) && (composed = wine_compose(src)))
- {
- /* now check if we can use the composed char */
- res = uni2cp_low[uni2cp_high[composed >> 8] + (composed & 0xff)];
- if (is_valid_dbcs_mapping( table, flags, composed, res ))
- {
- /* we have a good mapping for the composed char, use it */
- if (res & 0xff00) len++;
- src++;
- srclen--;
- continue;
- }
- /* no mapping for the composed char, check the other flags */
- if (flags & WC_DEFAULTCHAR) /* use the default char instead */
- {
- if (defchar_value & 0xff00) len++;
- *used = 1;
- src++; /* skip the non-spacing char */
- srclen--;
- continue;
- }
- if (flags & WC_DISCARDNS) /* skip the second char of the composition */
- {
- src++;
- srclen--;
- }
- /* WC_SEPCHARS is the default */
- }
- res = uni2cp_low[uni2cp_high[wch >> 8] + (wch & 0xff)];
- if (!is_valid_dbcs_mapping( table, flags, wch, res ))
- {
- res = defchar_value;
- *used = 1;
- }
- if (res & 0xff00) len++;
- }
- return len;
- }
- /* wcstombs for double-byte code page */
- static inline int wcstombs_dbcs( const struct dbcs_table *table,
- const WCHAR *src, unsigned int srclen,
- char *dst, unsigned int dstlen )
- {
- const unsigned short * const uni2cp_low = table->uni2cp_low;
- const unsigned short * const uni2cp_high = table->uni2cp_high;
- int len;
- for (len = dstlen; srclen && len; len--, srclen--, src++)
- {
- unsigned short res = uni2cp_low[uni2cp_high[*src >> 8] + (*src & 0xff)];
- if (res & 0xff00)
- {
- if (len == 1) break; /* do not output a partial char */
- len--;
- *dst++ = res >> 8;
- }
- *dst++ = (char)res;
- }
- if (srclen) return -1; /* overflow */
- return dstlen - len;
- }
- /* slow version of wcstombs_dbcs that handles the various flags */
- static int wcstombs_dbcs_slow( const struct dbcs_table *table, int flags,
- const WCHAR *src, unsigned int srclen,
- char *dst, unsigned int dstlen,
- const char *defchar, int *used )
- {
- const unsigned short * const uni2cp_low = table->uni2cp_low;
- const unsigned short * const uni2cp_high = table->uni2cp_high;
- WCHAR defchar_value = get_defchar_dbcs( table, defchar );
- WCHAR composed;
- int len, tmp;
- if (!used) used = &tmp; /* avoid checking on every char */
- *used = 0;
- for (len = dstlen; srclen && len; len--, srclen--, src++)
- {
- unsigned short res;
- WCHAR wch = *src;
- if ((flags & WC_COMPOSITECHECK) && (srclen > 1) && (composed = wine_compose(src)))
- {
- /* now check if we can use the composed char */
- res = uni2cp_low[uni2cp_high[composed >> 8] + (composed & 0xff)];
- if (is_valid_dbcs_mapping( table, flags, composed, res ))
- {
- /* we have a good mapping for the composed char, use it */
- src++;
- srclen--;
- goto output_char;
- }
- /* no mapping for the composed char, check the other flags */
- if (flags & WC_DEFAULTCHAR) /* use the default char instead */
- {
- res = defchar_value;
- *used = 1;
- src++; /* skip the non-spacing char */
- srclen--;
- goto output_char;
- }
- if (flags & WC_DISCARDNS) /* skip the second char of the composition */
- {
- src++;
- srclen--;
- }
- /* WC_SEPCHARS is the default */
- }
- res = uni2cp_low[uni2cp_high[wch >> 8] + (wch & 0xff)];
- if (!is_valid_dbcs_mapping( table, flags, wch, res ))
- {
- res = defchar_value;
- *used = 1;
- }
- output_char:
- if (res & 0xff00)
- {
- if (len == 1) break; /* do not output a partial char */
- len--;
- *dst++ = res >> 8;
- }
- *dst++ = (char)res;
- }
- if (srclen) return -1; /* overflow */
- return dstlen - len;
- }
- /* wide char to multi byte string conversion */
- /* return -1 on dst buffer overflow */
- int wine_cp_wcstombs_obsolete( const union cptable *table, int flags,
- const WCHAR *src, int srclen,
- char *dst, int dstlen, const char *defchar, int *used )
- {
- if (table->info.char_size == 1)
- {
- if (flags || defchar || used)
- {
- if (!dstlen) return get_length_sbcs( &table->sbcs, flags, src, srclen, used );
- return wcstombs_sbcs_slow( &table->sbcs, flags, src, srclen,
- dst, dstlen, defchar, used );
- }
- if (!dstlen) return srclen;
- return wcstombs_sbcs( &table->sbcs, src, srclen, dst, dstlen );
- }
- else /* mbcs */
- {
- if (!dstlen) return get_length_dbcs( &table->dbcs, flags, src, srclen, defchar, used );
- if (flags || defchar || used)
- return wcstombs_dbcs_slow( &table->dbcs, flags, src, srclen,
- dst, dstlen, defchar, used );
- return wcstombs_dbcs( &table->dbcs, src, srclen, dst, dstlen );
- }
- }
- __ASM_OBSOLETE(wine_cp_wcstombs);
- #endif /* __ASM_OBSOLETE */
|