2002-07-01 12:46:08 -04:00
|
|
|
const ENCODING *
|
|
|
|
NS(XmlGetUtf8InternalEncoding)(void)
|
1998-11-17 04:45:10 -05:00
|
|
|
{
|
|
|
|
return &ns(internal_utf8_encoding).enc;
|
|
|
|
}
|
|
|
|
|
2002-07-01 12:46:08 -04:00
|
|
|
const ENCODING *
|
|
|
|
NS(XmlGetUtf16InternalEncoding)(void)
|
1998-11-17 04:45:10 -05:00
|
|
|
{
|
2002-05-17 17:42:05 -04:00
|
|
|
#if BYTEORDER == 1234
|
1998-11-17 04:45:10 -05:00
|
|
|
return &ns(internal_little2_encoding).enc;
|
2002-05-17 17:42:05 -04:00
|
|
|
#elif BYTEORDER == 4321
|
1998-11-17 04:45:10 -05:00
|
|
|
return &ns(internal_big2_encoding).enc;
|
|
|
|
#else
|
|
|
|
const short n = 1;
|
2002-07-01 12:46:08 -04:00
|
|
|
return (*(const char *)&n
|
|
|
|
? &ns(internal_little2_encoding).enc
|
|
|
|
: &ns(internal_big2_encoding).enc);
|
1998-11-17 04:45:10 -05:00
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2002-07-01 12:46:08 -04:00
|
|
|
static const ENCODING *NS(encodings)[] = {
|
1998-11-17 07:42:16 -05:00
|
|
|
&ns(latin1_encoding).enc,
|
|
|
|
&ns(ascii_encoding).enc,
|
|
|
|
&ns(utf8_encoding).enc,
|
|
|
|
&ns(big2_encoding).enc,
|
|
|
|
&ns(big2_encoding).enc,
|
|
|
|
&ns(little2_encoding).enc,
|
|
|
|
&ns(utf8_encoding).enc /* NO_ENC */
|
|
|
|
};
|
1998-11-17 04:45:10 -05:00
|
|
|
|
2002-07-01 12:46:08 -04:00
|
|
|
static int
|
|
|
|
NS(initScanProlog)(const ENCODING *enc, const char *ptr, const char *end,
|
|
|
|
const char **nextTokPtr)
|
1998-11-17 04:45:10 -05:00
|
|
|
{
|
2002-07-01 12:46:08 -04:00
|
|
|
return initScan(NS(encodings), (const INIT_ENCODING *)enc,
|
|
|
|
XML_PROLOG_STATE, ptr, end, nextTokPtr);
|
1998-11-17 04:45:10 -05:00
|
|
|
}
|
|
|
|
|
2002-07-01 12:46:08 -04:00
|
|
|
static int
|
|
|
|
NS(initScanContent)(const ENCODING *enc, const char *ptr, const char *end,
|
|
|
|
const char **nextTokPtr)
|
1998-11-17 04:45:10 -05:00
|
|
|
{
|
2002-07-01 12:46:08 -04:00
|
|
|
return initScan(NS(encodings), (const INIT_ENCODING *)enc,
|
|
|
|
XML_CONTENT_STATE, ptr, end, nextTokPtr);
|
1998-11-17 04:45:10 -05:00
|
|
|
}
|
|
|
|
|
2002-07-01 12:46:08 -04:00
|
|
|
int
|
|
|
|
NS(XmlInitEncoding)(INIT_ENCODING *p, const ENCODING **encPtr,
|
|
|
|
const char *name)
|
1998-11-17 04:45:10 -05:00
|
|
|
{
|
1998-11-17 07:42:16 -05:00
|
|
|
int i = getEncodingIndex(name);
|
|
|
|
if (i == UNKNOWN_ENC)
|
|
|
|
return 0;
|
1999-06-02 07:20:06 -04:00
|
|
|
SET_INIT_ENC_INDEX(p, i);
|
1998-11-17 04:45:10 -05:00
|
|
|
p->initEnc.scanners[XML_PROLOG_STATE] = NS(initScanProlog);
|
|
|
|
p->initEnc.scanners[XML_CONTENT_STATE] = NS(initScanContent);
|
|
|
|
p->initEnc.updatePosition = initUpdatePosition;
|
|
|
|
p->encPtr = encPtr;
|
|
|
|
*encPtr = &(p->initEnc);
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2002-07-01 12:46:08 -04:00
|
|
|
static const ENCODING *
|
|
|
|
NS(findEncoding)(const ENCODING *enc, const char *ptr, const char *end)
|
1998-11-17 04:45:10 -05:00
|
|
|
{
|
|
|
|
#define ENCODING_MAX 128
|
|
|
|
char buf[ENCODING_MAX];
|
|
|
|
char *p = buf;
|
|
|
|
int i;
|
|
|
|
XmlUtf8Convert(enc, &ptr, end, &p, p + ENCODING_MAX - 1);
|
|
|
|
if (ptr != end)
|
|
|
|
return 0;
|
|
|
|
*p = 0;
|
1999-10-12 23:58:17 -04:00
|
|
|
if (streqci(buf, KW_UTF_16) && enc->minBytesPerChar == 2)
|
1998-11-17 07:42:16 -05:00
|
|
|
return enc;
|
|
|
|
i = getEncodingIndex(buf);
|
|
|
|
if (i == UNKNOWN_ENC)
|
|
|
|
return 0;
|
|
|
|
return NS(encodings)[i];
|
1998-11-17 04:45:10 -05:00
|
|
|
}
|
|
|
|
|
2002-07-01 12:46:08 -04:00
|
|
|
int
|
|
|
|
NS(XmlParseXmlDecl)(int isGeneralTextEntity,
|
|
|
|
const ENCODING *enc,
|
|
|
|
const char *ptr,
|
|
|
|
const char *end,
|
|
|
|
const char **badPtr,
|
|
|
|
const char **versionPtr,
|
|
|
|
const char **versionEndPtr,
|
|
|
|
const char **encodingName,
|
|
|
|
const ENCODING **encoding,
|
|
|
|
int *standalone)
|
1998-11-17 04:45:10 -05:00
|
|
|
{
|
|
|
|
return doParseXmlDecl(NS(findEncoding),
|
2002-07-01 12:46:08 -04:00
|
|
|
isGeneralTextEntity,
|
|
|
|
enc,
|
|
|
|
ptr,
|
|
|
|
end,
|
|
|
|
badPtr,
|
|
|
|
versionPtr,
|
|
|
|
versionEndPtr,
|
|
|
|
encodingName,
|
|
|
|
encoding,
|
|
|
|
standalone);
|
1998-11-17 04:45:10 -05:00
|
|
|
}
|