/* cp950ext.h */
  /*
   * Copyright (C) 1999-2001 Free Software Foundation, Inc.
   * This file is part of the GNU LIBICONV Library.
   *
   * The GNU LIBICONV Library is free software; you can redistribute it
   * and/or modify it under the terms of the GNU Library General Public
   * License as published by the Free Software Foundation; either version 2
   * of the License, or (at your option) any later version.
   *
   * The GNU LIBICONV Library is distributed in the hope that it will be
   * useful, but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   * Library General Public License for more details.
   *
   * You should have received a copy of the GNU Library General Public
   * License along with the GNU LIBICONV Library; see the file COPYING.LIB.
   * If not, write to the Free Software Foundation, Inc., 51 Franklin Street,
   * Fifth Floor, Boston, MA 02110-1301, USA.
   */
  /*
   * CP950 extensions
   */
  /*
   * Decoding table for lead byte 0xf9.
   *
   * cp950ext_mbtowc indexes this table with (i - 13932), where i is the
   * linear index it computes from the two input bytes.  The 41 entries
   * therefore correspond to trail bytes 0xd6..0xfe, in that order, and hold
   * the Unicode code point for each of them.
   */
  static const unsigned short cp950ext_2uni_pagef9[157-116] = {
    /* 0xf9 */
    0x7881, 0x92b9, 0x88cf, 0x58bb,
    0x6052, 0x7ca7, 0x5afa, 0x2554, 0x2566, 0x2557, 0x2560, 0x256c,
    0x2563, 0x255a, 0x2569, 0x255d, 0x2552, 0x2564, 0x2555, 0x255e,
    0x256a, 0x2561, 0x2558, 0x2567, 0x255b, 0x2553, 0x2565, 0x2556,
    0x255f, 0x256b, 0x2562, 0x2559, 0x2568, 0x255c, 0x2551, 0x2550,
    0x256d, 0x256e, 0x2570, 0x256f, 0x2593,
  };
  32. static int
  33. cp950ext_mbtowc (conv_t conv, ucs4_t *pwc, const unsigned char *s, int n)
  34. {
  35. unsigned char c1 = s[0];
  36. if ((c1 == 0xf9)) {
  37. if (n >= 2) {
  38. unsigned char c2 = s[1];
  39. if ((c2 >= 0x40 && c2 < 0x7f) || (c2 >= 0xa1 && c2 < 0xff)) {
  40. unsigned int i = 157 * (c1 - 0xa1) + (c2 - (c2 >= 0xa1 ? 0x62 : 0x40));
  41. unsigned short wc = 0xfffd;
  42. {
  43. if (i >= 13932 && i < 13973)
  44. wc = cp950ext_2uni_pagef9[i-13932];
  45. }
  46. if (wc != 0xfffd) {
  47. *pwc = (ucs4_t) wc;
  48. return 2;
  49. }
  50. }
  51. return RET_ILSEQ;
  52. }
  53. return RET_TOOFEW(0);
  54. }
  55. return RET_ILSEQ;
  56. }
  /*
   * Encoding table: the CP950 two-byte codes produced by cp950ext_wctomb.
   *
   * Each entry stores the first output byte in its high 8 bits and the
   * second output byte in its low 8 bits.  Entries are selected through the
   * cp950ext_uni2indx_page* summaries as (indx + number of lower set bits
   * in the row's `used' mask).
   */
  static const unsigned short cp950ext_2charset[41] = {
    0xf9f9, 0xf9f8, 0xf9e6, 0xf9ef, 0xf9dd, 0xf9e8, 0xf9f1, 0xf9df,
    0xf9ec, 0xf9f5, 0xf9e3, 0xf9ee, 0xf9f7, 0xf9e5, 0xf9e9, 0xf9f2,
    0xf9e0, 0xf9eb, 0xf9f4, 0xf9e2, 0xf9e7, 0xf9f0, 0xf9de, 0xf9ed,
    0xf9f6, 0xf9e4, 0xf9ea, 0xf9f3, 0xf9e1, 0xf9fa, 0xf9fb, 0xf9fd,
    0xf9fc, 0xf9fe, 0xf9d9, 0xf9dc, 0xf9da, 0xf9d6, 0xf9db, 0xf9d8,
    0xf9d7,
  };
  65. static const Summary16 cp950ext_uni2indx_page25[10] = {
  66. /* 0x2500 */
  67. { 0, 0x0000 }, { 0, 0x0000 }, { 0, 0x0000 }, { 0, 0x0000 },
  68. { 0, 0x0000 }, { 0, 0xffff }, { 16, 0xffff }, { 32, 0x0001 },
  69. { 33, 0x0000 }, { 33, 0x0008 },
  70. };
  71. static const Summary16 cp950ext_uni2indx_page58[12] = {
  72. /* 0x5800 */
  73. { 34, 0x0000 }, { 34, 0x0000 }, { 34, 0x0000 }, { 34, 0x0000 },
  74. { 34, 0x0000 }, { 34, 0x0000 }, { 34, 0x0000 }, { 34, 0x0000 },
  75. { 34, 0x0000 }, { 34, 0x0000 }, { 34, 0x0000 }, { 34, 0x0800 },
  76. };
  77. static const Summary16 cp950ext_uni2indx_page5a[16] = {
  78. /* 0x5a00 */
  79. { 35, 0x0000 }, { 35, 0x0000 }, { 35, 0x0000 }, { 35, 0x0000 },
  80. { 35, 0x0000 }, { 35, 0x0000 }, { 35, 0x0000 }, { 35, 0x0000 },
  81. { 35, 0x0000 }, { 35, 0x0000 }, { 35, 0x0000 }, { 35, 0x0000 },
  82. { 35, 0x0000 }, { 35, 0x0000 }, { 35, 0x0000 }, { 35, 0x0400 },
  83. };
  84. static const Summary16 cp950ext_uni2indx_page60[6] = {
  85. /* 0x6000 */
  86. { 36, 0x0000 }, { 36, 0x0000 }, { 36, 0x0000 }, { 36, 0x0000 },
  87. { 36, 0x0000 }, { 36, 0x0004 },
  88. };
  89. static const Summary16 cp950ext_uni2indx_page78[9] = {
  90. /* 0x7800 */
  91. { 37, 0x0000 }, { 37, 0x0000 }, { 37, 0x0000 }, { 37, 0x0000 },
  92. { 37, 0x0000 }, { 37, 0x0000 }, { 37, 0x0000 }, { 37, 0x0000 },
  93. { 37, 0x0002 },
  94. };
  95. static const Summary16 cp950ext_uni2indx_page7c[11] = {
  96. /* 0x7c00 */
  97. { 38, 0x0000 }, { 38, 0x0000 }, { 38, 0x0000 }, { 38, 0x0000 },
  98. { 38, 0x0000 }, { 38, 0x0000 }, { 38, 0x0000 }, { 38, 0x0000 },
  99. { 38, 0x0000 }, { 38, 0x0000 }, { 38, 0x0080 },
  100. };
  101. static const Summary16 cp950ext_uni2indx_page88[13] = {
  102. /* 0x8800 */
  103. { 39, 0x0000 }, { 39, 0x0000 }, { 39, 0x0000 }, { 39, 0x0000 },
  104. { 39, 0x0000 }, { 39, 0x0000 }, { 39, 0x0000 }, { 39, 0x0000 },
  105. { 39, 0x0000 }, { 39, 0x0000 }, { 39, 0x0000 }, { 39, 0x0000 },
  106. { 39, 0x8000 },
  107. };
  108. static const Summary16 cp950ext_uni2indx_page92[12] = {
  109. /* 0x9200 */
  110. { 40, 0x0000 }, { 40, 0x0000 }, { 40, 0x0000 }, { 40, 0x0000 },
  111. { 40, 0x0000 }, { 40, 0x0000 }, { 40, 0x0000 }, { 40, 0x0000 },
  112. { 40, 0x0000 }, { 40, 0x0000 }, { 40, 0x0000 }, { 40, 0x0200 },
  113. };
  114. static int
  115. cp950ext_wctomb (conv_t conv, unsigned char *r, ucs4_t wc, int n)
  116. {
  117. if (n >= 2) {
  118. const Summary16 *summary = NULL;
  119. if (wc >= 0x2500 && wc < 0x25a0)
  120. summary = &cp950ext_uni2indx_page25[(wc>>4)-0x250];
  121. else if (wc >= 0x5800 && wc < 0x58c0)
  122. summary = &cp950ext_uni2indx_page58[(wc>>4)-0x580];
  123. else if (wc >= 0x5a00 && wc < 0x5b00)
  124. summary = &cp950ext_uni2indx_page5a[(wc>>4)-0x5a0];
  125. else if (wc >= 0x6000 && wc < 0x6060)
  126. summary = &cp950ext_uni2indx_page60[(wc>>4)-0x600];
  127. else if (wc >= 0x7800 && wc < 0x7890)
  128. summary = &cp950ext_uni2indx_page78[(wc>>4)-0x780];
  129. else if (wc >= 0x7c00 && wc < 0x7cb0)
  130. summary = &cp950ext_uni2indx_page7c[(wc>>4)-0x7c0];
  131. else if (wc >= 0x8800 && wc < 0x88d0)
  132. summary = &cp950ext_uni2indx_page88[(wc>>4)-0x880];
  133. else if (wc >= 0x9200 && wc < 0x92c0)
  134. summary = &cp950ext_uni2indx_page92[(wc>>4)-0x920];
  135. if (summary) {
  136. unsigned short used = summary->used;
  137. unsigned int i = wc & 0x0f;
  138. if (used & ((unsigned short) 1 << i)) {
  139. unsigned short c;
  140. /* Keep in `used' only the bits 0..i-1. */
  141. used &= ((unsigned short) 1 << i) - 1;
  142. /* Add `summary->indx' and the number of bits set in `used'. */
  143. used = (used & 0x5555) + ((used & 0xaaaa) >> 1);
  144. used = (used & 0x3333) + ((used & 0xcccc) >> 2);
  145. used = (used & 0x0f0f) + ((used & 0xf0f0) >> 4);
  146. used = (used & 0x00ff) + (used >> 8);
  147. c = cp950ext_2charset[summary->indx + used];
  148. r[0] = (c >> 8); r[1] = (c & 0xff);
  149. return 2;
  150. }
  151. }
  152. return RET_ILUNI;
  153. }
  154. return RET_TOOSMALL;
  155. }