18#ifndef MAGICKCORE_TOKEN_PRIVATE_H
19#define MAGICKCORE_TOKEN_PRIVATE_H
21#if defined(__cplusplus) || defined(c_plusplus)
29#define MaxMultibyteCodes 6
41 utf_info[MaxMultibyteCodes] =
43 { 0x80, 0x00, 0x000007f, 0x0000000 },
44 { 0xE0, 0xC0, 0x00007ff, 0x0000080 },
45 { 0xF0, 0xE0, 0x000ffff, 0x0000800 },
46 { 0xF8, 0xF0, 0x01fffff, 0x0010000 },
47 { 0xFC, 0xF8, 0x03fffff, 0x0200000 },
48 { 0xFE, 0xFC, 0x7ffffff, 0x4000000 },
51static inline unsigned char *ConvertLatin1ToUTF8(
52 const unsigned char *magick_restrict content)
68 for (p=content; *p !=
'\0'; p++)
69 length+=(*p & 0x80) != 0 ? 2 : 1;
70 utf8=(
unsigned char *) NULL;
72 utf8=(
unsigned char *) AcquireQuantumMemory(length+1UL,
sizeof(*utf8));
73 if (utf8 == (
unsigned char *) NULL)
74 return((
unsigned char *) NULL);
76 for (p=content; *p !=
'\0'; p++)
83 *q++=0xc0 | ((c >> 6) & 0x3f);
84 *q++=0x80 | (c & 0x3f);
91static inline unsigned char *ConvertMacRomanToUTF8(
92 const unsigned char *magick_restrict content)
94 static const uint16_t macroman_unicode[128] = {
95 0x00C4,0x00C5,0x00C7,0x00C9,0x00D1,0x00D6,0x00DC,0x00E1,
96 0x00E0,0x00E2,0x00E4,0x00E3,0x00E5,0x00E7,0x00E9,0x00E8,
97 0x00EA,0x00EB,0x00ED,0x00EC,0x00EE,0x00EF,0x00F1,0x00F3,
98 0x00F2,0x00F4,0x00F6,0x00F5,0x00FA,0x00F9,0x00FB,0x00FC,
99 0x2020,0x00B0,0x00A2,0x00A3,0x00A7,0x2022,0x00B6,0x00DF,
100 0x00AE,0x00A9,0x2122,0x00B4,0x00A8,0x2260,0x00C6,0x00D8,
101 0x221E,0x00B1,0x2264,0x2265,0x00A5,0x00B5,0x2202,0x2211,
102 0x220F,0x03C0,0x222B,0x00AA,0x00BA,0x03A9,0x00E6,0x00F8,
103 0x00BF,0x00A1,0x00AC,0x221A,0x0192,0x2248,0x2206,0x00AB,
104 0x00BB,0x2026,0x00A0,0x00C0,0x00C3,0x00D5,0x0152,0x0153,
105 0x2013,0x2014,0x201C,0x201D,0x2018,0x2019,0x00F7,0x25CA,
106 0x00FF,0x0178,0x2044,0x20AC,0x2039,0x203A,0xFB01,0xFB02,
107 0x2021,0x00B7,0x201A,0x201E,0x2030,0x00C2,0x00CA,0x00C1,
108 0x00CB,0x00C8,0x00CD,0x00CE,0x00CF,0x00CC,0x00D3,0x00D4,
109 0xF8FF,0x00D2,0x00DA,0x00DB,0x00D9,0x0131,0x02C6,0x02DC,
110 0x00AF,0x02D8,0x02D9,0x02DA,0x00B8,0x02DD,0x02DB,0x02C7
127 for (p=content; *p !=
'\0'; p++)
128 length+=(*p & 0x80) != 0 ? 4 : 1;
129 utf8=(
unsigned char *) NULL;
131 utf8=(
unsigned char *) AcquireQuantumMemory(length+1UL,
sizeof(*utf8));
132 if (utf8 == (
unsigned char *) NULL)
133 return((
unsigned char *) NULL);
135 for (p=content; *p !=
'\0'; p++)
139 c=macroman_unicode[c-128];
141 *q++=(
unsigned char) c;
145 *q++=(
unsigned char) (0xc0 | ((c >> 6) & 0x3f));
146 *q++=(
unsigned char) (0x80 | (c & 0x3f));
151 *q++=(
unsigned char) (0xe0 | (c >> 12));
152 *q++=(
unsigned char) (0x80 | ((c >> 6) & 0x3f));
153 *q++=(
unsigned char) (0x80 | (c & 0x3f));
157 *q++=(
unsigned char) (0xf0 | (c >> 18));
158 *q++=(
unsigned char) (0x80 | ((c >> 12) & 0x3f));
159 *q++=(
unsigned char) (0x80 | ((c >> 6) & 0x3f));
160 *q++=(
unsigned char) (0x80 | (c & 0x3f));
167static inline int GetNextUTFCode(
const char *magick_restrict text,
168 unsigned int *magick_restrict octets)
181 if (text == (
const char *) NULL)
186 code=(int) (*text++) & 0xff;
188 for (i=0; i < MaxMultibyteCodes; i++)
190 if ((code & utf_info[i].code_mask) == utf_info[i].code_value)
192 unicode&=utf_info[i].utf_mask;
193 if (unicode < utf_info[i].utf_value)
195 *octets=(
unsigned int) (i+1);
198 c=(int) (*text++ ^ 0x80) & 0xff;
201 if (unicode > 0x10FFFF)
203 unicode=(unicode << 6) | c;
209static inline int GetUTFCode(
const char *magick_restrict text)
214 return(GetNextUTFCode(text,&octets));
217static inline unsigned int GetUTFOctets(
const char *magick_restrict text)
222 (void) GetNextUTFCode(text,&octets);
226static inline MagickBooleanType IsNonBreakingUTFSpace(
const int code)
233static inline MagickBooleanType IsUTFSpace(
int code)
235 if (((code >= 0x0009) && (code <= 0x000d)) || (code == 0x0020) ||
236 (code == 0x0085) || (code == 0x00a0) || (code == 0x1680) ||
237 (code == 0x180e) || ((code >= 0x2000) && (code <= 0x200a)) ||
238 (code == 0x2028) || (code == 0x2029) || (code == 0x202f) ||
239 (code == 0x205f) || (code == 0x3000))
244static inline MagickBooleanType IsUTFValid(
const int code)
249 mask=(int) 0x7fffffff;
250 if (((code & ~mask) != 0) && ((code < 0xd800) || (code > 0xdfff)) &&
251 (code != 0xfffe) && (code != 0xffff))
256static inline MagickBooleanType IsUTFAscii(
int code)
262 if ((code & ~mask) != 0)
267#if defined(__cplusplus) || defined(c_plusplus)