parseCommon.cxx revision 7c478bd95313f5f23a4c958a745db2134aa03244
// Copyright (c) 1994 James Clark
// See the file COPYING for copying permission.
#pragma ident "%Z%%M% %I% %E% SMI"
#include "splib.h"
#include "Parser.h"
#include "token.h"
#include "MessageArg.h"
#include "ParserMessages.h"
#include "constant.h"
#include "NumericCharRefOrigin.h"
#include "macros.h"
#ifdef SP_NAMESPACE
namespace SP_NAMESPACE {
#endif
{
currentInput()->startToken();
for (;;) {
break;
switch (token) {
case tokenEe:
return 0;
case tokenUnrecognized:
// fall through
case tokenChar:
return 0;
}
break;
}
}
if (options().warnPiMissingName) {
size_t i = 0;
break;
}
}
noteMarkup();
return 1;
}
const MessageType1 &tooLongMessage,
unsigned flags,
{
unsigned startLevel = inputLevel();
// If the literal gets to be longer than this, then we assume
// that the closing delimiter has been omitted if we're at the end
// of a line and at the starting input level.
? size_t(-1)
: maxLength * 2);
if (flags & literalDelimInfo)
for (;;) {
switch (token) {
case tokenEe:
if (inputLevel() == startLevel) {
return 0;
}
if (inputLevel() == startLevel)
break;
case tokenUnrecognized:
if (reportNonSgmlCharacter())
break;
break;
case tokenRs:
break;
case tokenRe:
#if 0
#endif
// guess that the closing delimiter has been omitted
return 0;
}
// fall through
case tokenSepchar:
if ((flags & literalSingleSpace)
else
currentChar()),
0));
break;
case tokenSpace:
if ((flags & literalSingleSpace)
else
break;
case tokenCroDigit:
case tokenHcroHexDigit:
{
Char c;
return 0;
if (!translateNumericCharRef(c, isSgmlChar))
break;
if (!isSgmlChar) {
if (flags & literalNonSgml)
else
NumberMessageArg(c));
break;
}
if (flags & literalDataTag) {
if (!syntax().isSgmlChar(c))
}
if ((flags & literalSingleSpace)
else
}
break;
case tokenCroNameStart:
if (!parseNamedCharRef())
return 0;
break;
case tokenEroGrpo:
break;
case tokenLit:
case tokenLita:
if (flags & literalDelimInfo)
goto done;
case tokenPeroNameStart:
&& inputLevel() == 1)
// fall through
case tokenEroNameStart:
{
return 0;
(flags & literalSingleSpace) != 0);
if (inputLevel() > startLevel)
}
break;
case tokenPeroGrpo:
break;
case tokenCharDelim:
currentInput()->currentTokenLength())));
// fall through
case tokenChar:
#if 0
#endif
// guess that the closing delimiter has been omitted
return 0;
}
break;
}
}
done:
if ((flags & literalSingleSpace)
switch (litMode) {
case alitMode:
case alitaMode:
case talitMode:
case talitaMode:
return 0;
default:
break;
}
}
return 1;
}
{
if (options().warnNamedCharRef)
in->discardInitial();
Char c;
valid = 0;
}
else {
valid = 1;
if (wantMarkup())
}
case tokenRefc:
break;
case tokenRe:
break;
default:
break;
}
in->startToken();
if (valid)
return 1;
}
{
in->discardInitial();
Char c = 0;
if (isHex) {
c += val;
else {
valid = 0;
break;
}
}
}
else {
c += val;
else {
valid = 0;
break;
}
}
}
valid = 0;
}
if (wantMarkup()) {
case tokenRefc:
break;
case tokenRe:
markupPtr->addRefEndRe();
break;
default:
break;
}
}
}
else
if (valid) {
ch = c;
currentLocation().index()
+ currentInput()->currentTokenLength()
- startLocation.index(),
0);
}
return valid;
}
// Translate a character number in the document character set
// into the internal character set.
// If it's a non-SGML char (ie described as UNUSED in SGML declaration),
// return 1 and set sgmlChar to 0.
{
if (sd().internalCharsetIsDocCharset()) {
isSgmlChar = 1;
return 1;
}
Number n;
if (options().warnNonSgmlCharRef)
isSgmlChar = 0;
return 1;
}
}
else
else
NumberMessageArg(n),
}
else {
resultChars)) {
case 1:
if (resultChar <= charMax) {
isSgmlChar = 1;
return 1;
}
// fall through
case 2:
break;
default:
break;
}
}
return 0;
}
// ignoreLevel: 0 means don't ignore;
// 1 means parse name group and ignore if inactive
// 2 means ignore
int ignoreLevel,
{
if (wantMarkup()) {
}
if (ignoreLevel == 1) {
if (savedCurrentMarkup)
if (markupPtr) {
}
return 0;
if (markupPtr)
if (savedCurrentMarkup)
if (!ignore)
ignoreLevel = 0;
in->startToken();
if (!syntax().isNameStartCharacter(c)) {
return 0;
}
}
in->discardInitial();
if (isParameter)
else
if (ignoreLevel)
: Entity::generalEntity);
else {
if (haveApplicableDtd()) {
if (!isParameter) {
}
else
}
else
}
}
if (markupPtr) {
case tokenRefc:
break;
case tokenRe:
markupPtr->addRefEndRe();
break;
default:
break;
}
}
}
else
currentLocation().index()
+ currentInput()->currentTokenLength()
- startLocation.index(),
else
origin = (EntityOrigin *)0;
return 1;
}
{
if (markup)
switch (token) {
case tokenUnrecognized:
if (!reportNonSgmlCharacter())
break;
case tokenEe:
return 0;
default:
if (markup)
break;
}
return 1;
}
const MessageType1 &tooLongMessage)
{
length++;
}
{
length++;
}
void Parser::extendHexNumber()
{
length++;
}
{
// In scanSuppress mode the non-SGML character will have been read.
if (!syntax().isSgmlChar(c)) {
return 1;
}
return 0;
}
{
length++;
}
#ifdef SP_NAMESPACE
}
#endif