#include "antlr3convertutf.h"
Functions | |
ConversionResult | ConvertUTF16toUTF32 (const UTF16 **sourceStart, const UTF16 *sourceEnd, UTF32 **targetStart, UTF32 *targetEnd, ConversionFlags flags) |
ConversionResult | ConvertUTF16toUTF8 (const UTF16 **sourceStart, const UTF16 *sourceEnd, UTF8 **targetStart, UTF8 *targetEnd, ConversionFlags flags) |
ConversionResult | ConvertUTF32toUTF16 (const UTF32 **sourceStart, const UTF32 *sourceEnd, UTF16 **targetStart, UTF16 *targetEnd, ConversionFlags flags) |
ConversionResult | ConvertUTF32toUTF8 (const UTF32 **sourceStart, const UTF32 *sourceEnd, UTF8 **targetStart, UTF8 *targetEnd, ConversionFlags flags) |
ConversionResult | ConvertUTF8toUTF16 (const UTF8 **sourceStart, const UTF8 *sourceEnd, UTF16 **targetStart, UTF16 *targetEnd, ConversionFlags flags) |
ConversionResult | ConvertUTF8toUTF32 (const UTF8 **sourceStart, const UTF8 *sourceEnd, UTF32 **targetStart, UTF32 *targetEnd, ConversionFlags flags) |
static ANTLR3_BOOLEAN | isLegalUTF8 (const UTF8 *source, int length) |
ANTLR3_BOOLEAN | isLegalUTF8Sequence (const UTF8 *source, const UTF8 *sourceEnd) |
Variables | |
static const UTF8 | firstByteMark [7] = { 0x00, 0x00, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC } |
static const UTF32 | offsetsFromUTF8 [6] |
static const char | trailingBytesForUTF8 [256] |
ConversionResult ConvertUTF16toUTF32 | ( | const UTF16 ** | sourceStart, | |
const UTF16 * | sourceEnd, | |||
UTF32 ** | targetStart, | |||
UTF32 * | targetEnd, | |||
ConversionFlags | flags | |||
) |
ConversionResult ConvertUTF16toUTF8 | ( | const UTF16 ** | sourceStart, | |
const UTF16 * | sourceEnd, | |||
UTF8 ** | targetStart, | |||
UTF8 * | targetEnd, | |||
ConversionFlags | flags | |||
) |
References conversionOK, firstByteMark, halfBase, halfShift, sourceExhausted, sourceIllegal, strictConversion, targetExhausted, UNI_REPLACEMENT_CHAR, UNI_SUR_HIGH_END, UNI_SUR_HIGH_START, UNI_SUR_LOW_END, and UNI_SUR_LOW_START.
Referenced by toUTF8_UTF16().
ConversionResult ConvertUTF32toUTF16 | ( | const UTF32 ** | sourceStart, | |
const UTF32 * | sourceEnd, | |||
UTF16 ** | targetStart, | |||
UTF16 * | targetEnd, | |||
ConversionFlags | flags | |||
) |
ConversionResult ConvertUTF32toUTF8 | ( | const UTF32 ** | sourceStart, | |
const UTF32 * | sourceEnd, | |||
UTF8 ** | targetStart, | |||
UTF8 * | targetEnd, | |||
ConversionFlags | flags | |||
) |
ConversionResult ConvertUTF8toUTF16 | ( | const UTF8 ** | sourceStart, | |
const UTF8 * | sourceEnd, | |||
UTF16 ** | targetStart, | |||
UTF16 * | targetEnd, | |||
ConversionFlags | flags | |||
) |
References conversionOK, halfBase, halfMask, halfShift, isLegalUTF8(), offsetsFromUTF8, sourceExhausted, sourceIllegal, strictConversion, targetExhausted, trailingBytesForUTF8, UNI_MAX_BMP, UNI_MAX_UTF16, UNI_REPLACEMENT_CHAR, UNI_SUR_HIGH_START, UNI_SUR_LOW_END, and UNI_SUR_LOW_START.
ConversionResult ConvertUTF8toUTF32 | ( | const UTF8 ** | sourceStart, | |
const UTF8 * | sourceEnd, | |||
UTF32 ** | targetStart, | |||
UTF32 * | targetEnd, | |||
ConversionFlags | flags | |||
) |
References conversionOK, isLegalUTF8(), offsetsFromUTF8, sourceExhausted, sourceIllegal, strictConversion, targetExhausted, trailingBytesForUTF8, UNI_MAX_LEGAL_UTF32, UNI_REPLACEMENT_CHAR, UNI_SUR_HIGH_START, and UNI_SUR_LOW_END.
static ANTLR3_BOOLEAN isLegalUTF8 | ( | const UTF8 * | source, | |
int | length | |||
) | [static] |
Referenced by ConvertUTF8toUTF16(), ConvertUTF8toUTF32(), and isLegalUTF8Sequence().
ANTLR3_BOOLEAN isLegalUTF8Sequence | ( | const UTF8 * | source, | |
const UTF8 * | sourceEnd | |||
) |
const UTF8 firstByteMark[7] = { 0x00, 0x00, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC } [static] |
Referenced by ConvertUTF16toUTF8(), and ConvertUTF32toUTF8().
const UTF32 offsetsFromUTF8[6] [static] |
Initial value:
{ 0x00000000UL, 0x00003080UL, 0x000E2080UL, 0x03C82080UL, 0xFA082080UL, 0x82082080UL }
Referenced by antlr3UTF8Consume(), antlr3UTF8LA(), ConvertUTF8toUTF16(), and ConvertUTF8toUTF32().
const char trailingBytesForUTF8[256] [static] |
Initial value:
{ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1, 2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2, 3,3,3,3,3,3,3,3,4,4,4,4,5,5,5,5 }
Referenced by antlr3UTF8Consume(), antlr3UTF8LA(), ConvertUTF8toUTF16(), ConvertUTF8toUTF32(), and isLegalUTF8Sequence().