536cd135cc
Former-commit-id: 5624ac747d633e885131e8349322922b6a59baaa
521 lines
21 KiB
C#
521 lines
21 KiB
C#
//------------------------------------------------------------------------------
|
|
// <copyright file="DtdValidator.cs" company="Microsoft">
|
|
// Copyright (c) Microsoft Corporation. All rights reserved.
|
|
// </copyright>
|
|
// <owner current="true" primary="true">Microsoft</owner>
|
|
//------------------------------------------------------------------------------
|
|
|
|
namespace System.Xml.Schema {
|
|
using System;
|
|
using System.Collections;
|
|
using System.Text;
|
|
using System.IO;
|
|
using System.Net;
|
|
using System.Diagnostics;
|
|
using System.Xml.Schema;
|
|
using System.Xml.XPath;
|
|
|
|
#pragma warning disable 618
|
|
|
|
internal sealed class DtdValidator : BaseValidator {
|
|
|
|
//required by ParseValue
|
|
class NamespaceManager : XmlNamespaceManager {
|
|
public override string LookupNamespace(string prefix) { return prefix; }
|
|
}
|
|
|
|
static NamespaceManager namespaceManager = new NamespaceManager();
|
|
const int STACK_INCREMENT = 10;
|
|
HWStack validationStack; // validaton contexts
|
|
Hashtable attPresence;
|
|
XmlQualifiedName name = XmlQualifiedName.Empty;
|
|
Hashtable IDs;
|
|
IdRefNode idRefListHead;
|
|
bool processIdentityConstraints;
|
|
|
|
internal DtdValidator(XmlValidatingReaderImpl reader, IValidationEventHandling eventHandling, bool processIdentityConstraints) : base(reader, null, eventHandling) {
|
|
this.processIdentityConstraints = processIdentityConstraints;
|
|
Init();
|
|
}
|
|
|
|
private void Init() {
|
|
Debug.Assert(reader != null);
|
|
validationStack = new HWStack(STACK_INCREMENT);
|
|
textValue = new StringBuilder();
|
|
name = XmlQualifiedName.Empty;
|
|
attPresence = new Hashtable();
|
|
schemaInfo = new SchemaInfo();
|
|
checkDatatype = false;
|
|
Push(name);
|
|
}
|
|
|
|
public override void Validate() {
|
|
if (schemaInfo.SchemaType == SchemaType.DTD) {
|
|
switch (reader.NodeType) {
|
|
case XmlNodeType.Element:
|
|
ValidateElement();
|
|
if (reader.IsEmptyElement) {
|
|
goto case XmlNodeType.EndElement;
|
|
}
|
|
break;
|
|
case XmlNodeType.Whitespace:
|
|
case XmlNodeType.SignificantWhitespace:
|
|
if (MeetsStandAloneConstraint()) {
|
|
ValidateWhitespace();
|
|
}
|
|
break;
|
|
case XmlNodeType.ProcessingInstruction:
|
|
case XmlNodeType.Comment:
|
|
ValidatePIComment();
|
|
break;
|
|
|
|
case XmlNodeType.Text: // text inside a node
|
|
case XmlNodeType.CDATA: // <![CDATA[...]]>
|
|
ValidateText();
|
|
break;
|
|
case XmlNodeType.EntityReference:
|
|
if (!GenEntity( new XmlQualifiedName(reader.LocalName, reader.Prefix) ) ){
|
|
ValidateText();
|
|
}
|
|
break;
|
|
case XmlNodeType.EndElement:
|
|
ValidateEndElement();
|
|
break;
|
|
}
|
|
}
|
|
else {
|
|
if(reader.Depth == 0 &&
|
|
reader.NodeType == XmlNodeType.Element) {
|
|
SendValidationEvent(Res.Xml_NoDTDPresent, this.name.ToString(), XmlSeverityType.Warning);
|
|
}
|
|
}
|
|
}
|
|
|
|
private bool MeetsStandAloneConstraint() {
|
|
if (reader.StandAlone && // VC 1 - iv
|
|
context.ElementDecl != null &&
|
|
context.ElementDecl.IsDeclaredInExternal &&
|
|
context.ElementDecl.ContentValidator.ContentType == XmlSchemaContentType.ElementOnly) {
|
|
SendValidationEvent(Res.Sch_StandAlone);
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
private void ValidatePIComment() {
|
|
// When validating with a dtd, empty elements should be lexically empty.
|
|
if (context.NeedValidateChildren ) {
|
|
if (context.ElementDecl.ContentValidator == ContentValidator.Empty) {
|
|
SendValidationEvent(Res.Sch_InvalidPIComment);
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
private void ValidateElement() {
|
|
elementName.Init(reader.LocalName, reader.Prefix);
|
|
if ( (reader.Depth == 0) &&
|
|
(!schemaInfo.DocTypeName.IsEmpty) &&
|
|
(!schemaInfo.DocTypeName.Equals(elementName)) ){ //VC 1
|
|
SendValidationEvent(Res.Sch_RootMatchDocType);
|
|
}
|
|
else {
|
|
ValidateChildElement();
|
|
}
|
|
ProcessElement();
|
|
}
|
|
|
|
private void ValidateChildElement() {
|
|
Debug.Assert(reader.NodeType == XmlNodeType.Element);
|
|
if (context.NeedValidateChildren) { //i think i can get away with removing this if cond since won't make this call for documentelement
|
|
int errorCode = 0;
|
|
context.ElementDecl.ContentValidator.ValidateElement(elementName, context, out errorCode);
|
|
if (errorCode < 0) {
|
|
XmlSchemaValidator.ElementValidationError(elementName, context, EventHandler, reader, reader.BaseURI, PositionInfo.LineNumber, PositionInfo.LinePosition, null);
|
|
}
|
|
}
|
|
}
|
|
|
|
private void ValidateStartElement() {
|
|
if (context.ElementDecl != null) {
|
|
Reader.SchemaTypeObject = context.ElementDecl.SchemaType;
|
|
|
|
if (Reader.IsEmptyElement && context.ElementDecl.DefaultValueTyped != null) {
|
|
Reader.TypedValueObject = context.ElementDecl.DefaultValueTyped;
|
|
context.IsNill = true; // reusing IsNill - what is this flag later used for??
|
|
}
|
|
if ( context.ElementDecl.HasRequiredAttribute ) {
|
|
attPresence.Clear();
|
|
}
|
|
}
|
|
|
|
if (Reader.MoveToFirstAttribute()) {
|
|
do {
|
|
try {
|
|
reader.SchemaTypeObject = null;
|
|
SchemaAttDef attnDef = context.ElementDecl.GetAttDef( new XmlQualifiedName( reader.LocalName, reader.Prefix) );
|
|
if (attnDef != null) {
|
|
if (context.ElementDecl != null && context.ElementDecl.HasRequiredAttribute) {
|
|
attPresence.Add(attnDef.Name, attnDef);
|
|
}
|
|
Reader.SchemaTypeObject = attnDef.SchemaType;
|
|
|
|
if (attnDef.Datatype != null && !reader.IsDefault) { //Since XmlTextReader adds default attributes, do not check again
|
|
// set typed value
|
|
CheckValue(Reader.Value, attnDef);
|
|
}
|
|
}
|
|
else {
|
|
SendValidationEvent(Res.Sch_UndeclaredAttribute, reader.Name);
|
|
}
|
|
}
|
|
catch (XmlSchemaException e) {
|
|
e.SetSource(Reader.BaseURI, PositionInfo.LineNumber, PositionInfo.LinePosition);
|
|
SendValidationEvent(e);
|
|
}
|
|
} while(Reader.MoveToNextAttribute());
|
|
Reader.MoveToElement();
|
|
}
|
|
|
|
}
|
|
|
|
private void ValidateEndStartElement() {
|
|
if (context.ElementDecl.HasRequiredAttribute) {
|
|
try {
|
|
context.ElementDecl.CheckAttributes(attPresence, Reader.StandAlone);
|
|
}
|
|
catch (XmlSchemaException e) {
|
|
e.SetSource(Reader.BaseURI, PositionInfo.LineNumber, PositionInfo.LinePosition);
|
|
SendValidationEvent(e);
|
|
}
|
|
}
|
|
|
|
if (context.ElementDecl.Datatype != null) {
|
|
checkDatatype = true;
|
|
hasSibling = false;
|
|
textString = string.Empty;
|
|
textValue.Length = 0;
|
|
}
|
|
}
|
|
|
|
private void ProcessElement() {
|
|
SchemaElementDecl elementDecl = schemaInfo.GetElementDecl(elementName);
|
|
Push(elementName);
|
|
if (elementDecl != null) {
|
|
context.ElementDecl = elementDecl;
|
|
ValidateStartElement();
|
|
ValidateEndStartElement();
|
|
context.NeedValidateChildren = true;
|
|
elementDecl.ContentValidator.InitValidation( context );
|
|
}
|
|
else {
|
|
SendValidationEvent(Res.Sch_UndeclaredElement, XmlSchemaValidator.QNameString(context.LocalName, context.Namespace));
|
|
context.ElementDecl = null;
|
|
}
|
|
}
|
|
|
|
public override void CompleteValidation() {
|
|
if (schemaInfo.SchemaType == SchemaType.DTD) {
|
|
do {
|
|
ValidateEndElement();
|
|
} while (Pop());
|
|
CheckForwardRefs();
|
|
}
|
|
}
|
|
|
|
private void ValidateEndElement() {
|
|
if (context.ElementDecl != null) {
|
|
if (context.NeedValidateChildren) {
|
|
if(!context.ElementDecl.ContentValidator.CompleteValidation(context)) {
|
|
XmlSchemaValidator.CompleteValidationError(context, EventHandler, reader, reader.BaseURI, PositionInfo.LineNumber, PositionInfo.LinePosition, null);
|
|
}
|
|
}
|
|
|
|
if (checkDatatype) {
|
|
string stringValue = !hasSibling ? textString : textValue.ToString(); // only for identity-constraint exception reporting
|
|
CheckValue(stringValue, null);
|
|
checkDatatype = false;
|
|
textValue.Length = 0; // cleanup
|
|
textString = string.Empty;
|
|
}
|
|
}
|
|
Pop();
|
|
|
|
}
|
|
|
|
public override bool PreserveWhitespace {
|
|
get { return context.ElementDecl != null ? context.ElementDecl.ContentValidator.PreserveWhitespace : false; }
|
|
}
|
|
|
|
|
|
void ProcessTokenizedType(
|
|
XmlTokenizedType ttype,
|
|
string name
|
|
) {
|
|
switch(ttype) {
|
|
case XmlTokenizedType.ID:
|
|
if (processIdentityConstraints) {
|
|
if (FindId(name) != null) {
|
|
SendValidationEvent(Res.Sch_DupId, name);
|
|
}
|
|
else {
|
|
AddID(name, context.LocalName);
|
|
}
|
|
}
|
|
break;
|
|
case XmlTokenizedType.IDREF:
|
|
if (processIdentityConstraints) {
|
|
object p = FindId(name);
|
|
if (p == null) { // add it to linked list to check it later
|
|
idRefListHead = new IdRefNode(idRefListHead, name, this.PositionInfo.LineNumber, this.PositionInfo.LinePosition);
|
|
}
|
|
}
|
|
|
|
break;
|
|
case XmlTokenizedType.ENTITY:
|
|
ProcessEntity(schemaInfo, name, this, EventHandler, Reader.BaseURI, PositionInfo.LineNumber, PositionInfo.LinePosition);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
//check the contents of this attribute to ensure it is valid according to the specified attribute type.
|
|
private void CheckValue(string value, SchemaAttDef attdef) {
|
|
try {
|
|
reader.TypedValueObject = null;
|
|
bool isAttn = attdef != null;
|
|
XmlSchemaDatatype dtype = isAttn ? attdef.Datatype : context.ElementDecl.Datatype;
|
|
if (dtype == null) {
|
|
return; // no reason to check
|
|
}
|
|
|
|
if (dtype.TokenizedType != XmlTokenizedType.CDATA) {
|
|
value = value.Trim();
|
|
}
|
|
|
|
object typedValue = dtype.ParseValue(value, NameTable, namespaceManager);
|
|
reader.TypedValueObject = typedValue;
|
|
// Check special types
|
|
XmlTokenizedType ttype = dtype.TokenizedType;
|
|
if (ttype == XmlTokenizedType.ENTITY || ttype == XmlTokenizedType.ID || ttype == XmlTokenizedType.IDREF) {
|
|
if (dtype.Variety == XmlSchemaDatatypeVariety.List) {
|
|
string[] ss = (string[])typedValue;
|
|
for (int i = 0; i < ss.Length; ++i) {
|
|
ProcessTokenizedType(dtype.TokenizedType, ss[i]);
|
|
}
|
|
}
|
|
else {
|
|
ProcessTokenizedType(dtype.TokenizedType, (string)typedValue);
|
|
}
|
|
}
|
|
|
|
SchemaDeclBase decl = isAttn ? (SchemaDeclBase)attdef : (SchemaDeclBase)context.ElementDecl;
|
|
if (decl.Values != null && !decl.CheckEnumeration(typedValue)) {
|
|
if (dtype.TokenizedType == XmlTokenizedType.NOTATION) {
|
|
SendValidationEvent(Res.Sch_NotationValue, typedValue.ToString());
|
|
}
|
|
else {
|
|
SendValidationEvent(Res.Sch_EnumerationValue, typedValue.ToString());
|
|
}
|
|
|
|
}
|
|
if (!decl.CheckValue(typedValue)) {
|
|
if (isAttn) {
|
|
SendValidationEvent(Res.Sch_FixedAttributeValue, attdef.Name.ToString());
|
|
}
|
|
else {
|
|
SendValidationEvent(Res.Sch_FixedElementValue, XmlSchemaValidator.QNameString(context.LocalName, context.Namespace));
|
|
}
|
|
}
|
|
}
|
|
catch (XmlSchemaException) {
|
|
if (attdef != null) {
|
|
SendValidationEvent(Res.Sch_AttributeValueDataType, attdef.Name.ToString());
|
|
}
|
|
else {
|
|
SendValidationEvent(Res.Sch_ElementValueDataType, XmlSchemaValidator.QNameString(context.LocalName, context.Namespace));
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
internal void AddID(string name, object node) {
|
|
// Note: It used to be true that we only called this if _fValidate was true,
|
|
// but due to the fact that you can now dynamically type somethign as an ID
|
|
// that is no longer true.
|
|
if (IDs == null) {
|
|
IDs = new Hashtable();
|
|
}
|
|
|
|
IDs.Add(name, node);
|
|
}
|
|
|
|
public override object FindId(string name) {
|
|
return IDs == null ? null : IDs[name];
|
|
}
|
|
|
|
private bool GenEntity(XmlQualifiedName qname) {
|
|
string n = qname.Name;
|
|
if (n[0] == '#') { // char entity reference
|
|
return false;
|
|
}
|
|
else if (SchemaEntity.IsPredefinedEntity(n)) {
|
|
return false;
|
|
}
|
|
else {
|
|
SchemaEntity en = GetEntity(qname, false);
|
|
if (en == null) {
|
|
// well-formness error, see xml spec [68]
|
|
throw new XmlException(Res.Xml_UndeclaredEntity, n);
|
|
}
|
|
if (!en.NData.IsEmpty) {
|
|
// well-formness error, see xml spec [68]
|
|
throw new XmlException(Res.Xml_UnparsedEntityRef, n);
|
|
}
|
|
|
|
if (reader.StandAlone && en.DeclaredInExternal) {
|
|
SendValidationEvent(Res.Sch_StandAlone);
|
|
}
|
|
return true;
|
|
}
|
|
}
|
|
|
|
|
|
private SchemaEntity GetEntity(XmlQualifiedName qname, bool fParameterEntity) {
|
|
SchemaEntity entity;
|
|
if (fParameterEntity) {
|
|
if (schemaInfo.ParameterEntities.TryGetValue(qname, out entity)) {
|
|
return entity;
|
|
}
|
|
}
|
|
else {
|
|
if (schemaInfo.GeneralEntities.TryGetValue(qname, out entity)) {
|
|
return entity;
|
|
}
|
|
}
|
|
return null;
|
|
}
|
|
|
|
private void CheckForwardRefs() {
|
|
IdRefNode next = idRefListHead;
|
|
while (next != null) {
|
|
if(FindId(next.Id) == null) {
|
|
SendValidationEvent(new XmlSchemaException(Res.Sch_UndeclaredId, next.Id, reader.BaseURI, next.LineNo, next.LinePos));
|
|
}
|
|
IdRefNode ptr = next.Next;
|
|
next.Next = null; // unhook each object so it is cleaned up by Garbage Collector
|
|
next = ptr;
|
|
}
|
|
// not needed any more.
|
|
idRefListHead = null;
|
|
}
|
|
|
|
private void Push(XmlQualifiedName elementName) {
|
|
context = (ValidationState)validationStack.Push();
|
|
if (context == null) {
|
|
context = new ValidationState();
|
|
validationStack.AddToTop(context);
|
|
}
|
|
context.LocalName = elementName.Name;
|
|
context.Namespace = elementName.Namespace;
|
|
context.HasMatched = false;
|
|
context.IsNill = false;
|
|
context.NeedValidateChildren = false;
|
|
}
|
|
|
|
private bool Pop() {
|
|
if (validationStack.Length > 1) {
|
|
validationStack.Pop();
|
|
context = (ValidationState)validationStack.Peek();
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
public static void SetDefaultTypedValue(
|
|
SchemaAttDef attdef,
|
|
IDtdParserAdapter readerAdapter
|
|
) {
|
|
try {
|
|
string value = attdef.DefaultValueExpanded;
|
|
XmlSchemaDatatype dtype = attdef.Datatype;
|
|
if (dtype == null) {
|
|
return; // no reason to check
|
|
}
|
|
if (dtype.TokenizedType != XmlTokenizedType.CDATA) {
|
|
value = value.Trim();
|
|
}
|
|
attdef.DefaultValueTyped = dtype.ParseValue(value, readerAdapter.NameTable, readerAdapter.NamespaceResolver);
|
|
}
|
|
#if DEBUG
|
|
catch (XmlSchemaException ex) {
|
|
Debug.WriteLineIf(DiagnosticsSwitches.XmlSchema.TraceError, ex.Message);
|
|
#else
|
|
catch (Exception) {
|
|
#endif
|
|
IValidationEventHandling eventHandling = ((IDtdParserAdapterWithValidation)readerAdapter).ValidationEventHandling;
|
|
if (eventHandling != null) {
|
|
XmlSchemaException e = new XmlSchemaException(Res.Sch_AttributeDefaultDataType, attdef.Name.ToString());
|
|
eventHandling.SendEvent(e, XmlSeverityType.Error);
|
|
}
|
|
}
|
|
}
|
|
|
|
public static void CheckDefaultValue(
|
|
SchemaAttDef attdef,
|
|
SchemaInfo sinfo,
|
|
IValidationEventHandling eventHandling,
|
|
string baseUriStr
|
|
) {
|
|
try {
|
|
if (baseUriStr == null) {
|
|
baseUriStr = string.Empty;
|
|
}
|
|
XmlSchemaDatatype dtype = attdef.Datatype;
|
|
if (dtype == null) {
|
|
return; // no reason to check
|
|
}
|
|
object typedValue = attdef.DefaultValueTyped;
|
|
|
|
// Check special types
|
|
XmlTokenizedType ttype = dtype.TokenizedType;
|
|
if (ttype == XmlTokenizedType.ENTITY) {
|
|
if (dtype.Variety == XmlSchemaDatatypeVariety.List) {
|
|
string[] ss = (string[])typedValue;
|
|
for (int i = 0; i < ss.Length; ++i) {
|
|
ProcessEntity(sinfo, ss[i], eventHandling, baseUriStr, attdef.ValueLineNumber, attdef.ValueLinePosition);
|
|
}
|
|
}
|
|
else {
|
|
ProcessEntity(sinfo, (string)typedValue, eventHandling, baseUriStr, attdef.ValueLineNumber, attdef.ValueLinePosition);
|
|
}
|
|
}
|
|
else if (ttype == XmlTokenizedType.ENUMERATION) {
|
|
if (!attdef.CheckEnumeration(typedValue)) {
|
|
if (eventHandling != null) {
|
|
XmlSchemaException e = new XmlSchemaException(Res.Sch_EnumerationValue, typedValue.ToString(), baseUriStr, attdef.ValueLineNumber, attdef.ValueLinePosition);
|
|
eventHandling.SendEvent(e, XmlSeverityType.Error);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
#if DEBUG
|
|
catch (XmlSchemaException ex) {
|
|
Debug.WriteLineIf(DiagnosticsSwitches.XmlSchema.TraceError, ex.Message);
|
|
#else
|
|
catch (Exception) {
|
|
#endif
|
|
|
|
if (eventHandling != null) {
|
|
XmlSchemaException e = new XmlSchemaException(Res.Sch_AttributeDefaultDataType, attdef.Name.ToString());
|
|
eventHandling.SendEvent(e, XmlSeverityType.Error);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
#pragma warning restore 618
|
|
|
|
}
|
|
|