This is second part of the post. Find first part here. So what is a better way of creating custom XmlReader/XmlWriter in .NET 2.0? Here is the idea - have an utility wrapper class, which wraps XmlReader/XmlWriter and does nothing else. Then derive from this class and override methods you
...
Btw, most likely the Mvp.Xml project will be rehosted to the CodePlex. SourceForge is ok, but the idea is that more Microsoft-friendly environment will induce more contributors both XML MVPs and others.
+
XmlWrappingReader class.
using System;
using System.Xml;
using System.Xml.Schema;
namespace Mvp.Xml.Common
{
public class XmlWrappingReader : XmlReader, IXmlLineInfo
{
protected XmlReader reader;
protected IXmlLineInfo readerAsIXmlLineInfo;
public XmlWrappingReader(XmlReader baseReader)
{
this.Reader = baseReader;
}
public override void Close()
{
this.reader.Close();
}
protected override void Dispose(bool disposing)
{
((IDisposable) this.reader).Dispose();
}
public override string GetAttribute(int i)
{
return this.reader.GetAttribute(i);
}
public override string GetAttribute(string name)
{
return this.reader.GetAttribute(name);
}
public override string GetAttribute(string name, string namespaceURI)
{
return this.reader.GetAttribute(name, namespaceURI);
}
public virtual bool HasLineInfo()
{
if (this.readerAsIXmlLineInfo != null)
{
return this.readerAsIXmlLineInfo.HasLineInfo();
}
return false;
}
public override string LookupNamespace(string prefix)
{
return this.reader.LookupNamespace(prefix);
}
public override void MoveToAttribute(int i)
{
this.reader.MoveToAttribute(i);
}
public override bool MoveToAttribute(string name)
{
return this.reader.MoveToAttribute(name);
}
public override bool MoveToAttribute(string name, string ns)
{
return this.reader.MoveToAttribute(name, ns);
}
public override bool MoveToElement()
{
return this.reader.MoveToElement();
}
public override bool MoveToFirstAttribute()
{
return this.reader.MoveToFirstAttribute();
}
public override bool MoveToNextAttribute()
{
return this.reader.MoveToNextAttribute();
}
public override bool Read()
{
return this.reader.Read();
}
public override bool ReadAttributeValue()
{
return this.reader.ReadAttributeValue();
}
public override void ResolveEntity()
{
this.reader.ResolveEntity();
}
public override void Skip()
{
this.reader.Skip();
}
public override int AttributeCount
{
get
{
return this.reader.AttributeCount;
}
}
public override string BaseURI
{
get
{
return this.reader.BaseURI;
}
}
public override bool CanResolveEntity
{
get
{
return this.reader.CanResolveEntity;
}
}
public override int Depth
{
get
{
return this.reader.Depth;
}
}
public override bool EOF
{
get
{
return this.reader.EOF;
}
}
public override bool HasAttributes
{
get
{
return this.reader.HasAttributes;
}
}
public override bool HasValue
{
get
{
return this.reader.HasValue;
}
}
public override bool IsDefault
{
get
{
return this.reader.IsDefault;
}
}
public override bool IsEmptyElement
{
get
{
return this.reader.IsEmptyElement;
}
}
public virtual int LineNumber
{
get
{
if (this.readerAsIXmlLineInfo != null)
{
return this.readerAsIXmlLineInfo.LineNumber;
}
return 0;
}
}
public virtual int LinePosition
{
get
{
if (this.readerAsIXmlLineInfo != null)
{
return this.readerAsIXmlLineInfo.LinePosition;
}
return 0;
}
}
public override string LocalName
{
get
{
return this.reader.LocalName;
}
}
public override string Name
{
get
{
return this.reader.Name;
}
}
public override string NamespaceURI
{
get
{
return this.reader.NamespaceURI;
}
}
public override XmlNameTable NameTable
{
get
{
return this.reader.NameTable;
}
}
public override XmlNodeType NodeType
{
get
{
return this.reader.NodeType;
}
}
public override string Prefix
{
get
{
return this.reader.Prefix;
}
}
public override char QuoteChar
{
get
{
return this.reader.QuoteChar;
}
}
protected XmlReader Reader
{
get
{
return this.reader;
}
set
{
this.reader = value;
this.readerAsIXmlLineInfo = value as IXmlLineInfo;
}
}
public override System.Xml.ReadState ReadState
{
get
{
return this.reader.ReadState;
}
}
public override IXmlSchemaInfo SchemaInfo
{
get
{
return this.reader.SchemaInfo;
}
}
public override XmlReaderSettings Settings
{
get
{
return this.reader.Settings;
}
}
public override string Value
{
get
{
return this.reader.Value;
}
}
public override Type ValueType
{
get
{
return this.reader.ValueType;
}
}
public override string XmlLang
{
get
{
return this.reader.XmlLang;
}
}
public override System.Xml.XmlSpace XmlSpace
{
get
{
return this.reader.XmlSpace;
}
}
}
}
+
XmlWrappingWriter class.
using System;
using System.Xml;
namespace Mvp.Xml.Common
{
public class XmlWrappingWriter : XmlWriter
{
protected XmlWriter writer;
public XmlWrappingWriter(XmlWriter baseWriter)
{
this.Writer = baseWriter;
}
public override void Close()
{
this.writer.Close();
}
protected override void Dispose(bool disposing)
{
((IDisposable) this.writer).Dispose();
}
public override void Flush()
{
this.writer.Flush();
}
public override string LookupPrefix(string ns)
{
return this.writer.LookupPrefix(ns);
}
public override void WriteBase64(byte[] buffer, int index, int count)
{
this.writer.WriteBase64(buffer, index, count);
}
public override void WriteCData(string text)
{
this.writer.WriteCData(text);
}
public override void WriteCharEntity(char ch)
{
this.writer.WriteCharEntity(ch);
}
public override void WriteChars(char[] buffer, int index, int count)
{
this.writer.WriteChars(buffer, index, count);
}
public override void WriteComment(string text)
{
this.writer.WriteComment(text);
}
public override void WriteDocType(string name, string pubid, string sysid, string subset)
{
this.writer.WriteDocType(name, pubid, sysid, subset);
}
public override void WriteEndAttribute()
{
this.writer.WriteEndAttribute();
}
public override void WriteEndDocument()
{
this.writer.WriteEndDocument();
}
public override void WriteEndElement()
{
this.writer.WriteEndElement();
}
public override void WriteEntityRef(string name)
{
this.writer.WriteEntityRef(name);
}
public override void WriteFullEndElement()
{
this.writer.WriteFullEndElement();
}
public override void WriteProcessingInstruction(string name, string text)
{
this.writer.WriteProcessingInstruction(name, text);
}
public override void WriteRaw(string data)
{
this.writer.WriteRaw(data);
}
public override void WriteRaw(char[] buffer, int index, int count)
{
this.writer.WriteRaw(buffer, index, count);
}
public override void WriteStartAttribute(string prefix, string localName, string ns)
{
this.writer.WriteStartAttribute(prefix, localName, ns);
}
public override void WriteStartDocument()
{
this.writer.WriteStartDocument();
}
public override void WriteStartDocument(bool standalone)
{
this.writer.WriteStartDocument(standalone);
}
public override void WriteStartElement(string prefix, string localName, string ns)
{
this.writer.WriteStartElement(prefix, localName, ns);
}
public override void WriteString(string text)
{
this.writer.WriteString(text);
}
public override void WriteSurrogateCharEntity(char lowChar, char highChar)
{
this.writer.WriteSurrogateCharEntity(lowChar, highChar);
}
public override void WriteValue(bool value)
{
this.writer.WriteValue(value);
}
public override void WriteValue(DateTime value)
{
this.writer.WriteValue(value);
}
public override void WriteValue(decimal value)
{
this.writer.WriteValue(value);
}
public override void WriteValue(double value)
{
this.writer.WriteValue(value);
}
public override void WriteValue(int value)
{
this.writer.WriteValue(value);
}
public override void WriteValue(long value)
{
this.writer.WriteValue(value);
}
public override void WriteValue(object value)
{
this.writer.WriteValue(value);
}
public override void WriteValue(float value)
{
this.writer.WriteValue(value);
}
public override void WriteValue(string value)
{
this.writer.WriteValue(value);
}
public override void WriteWhitespace(string ws)
{
this.writer.WriteWhitespace(ws);
}
public override XmlWriterSettings Settings
{
get
{
return this.writer.Settings;
}
}
protected XmlWriter Writer
{
get
{
return this.writer;
}
set
{
this.writer = value;
}
}
public override System.Xml.WriteState WriteState
{
get
{
return this.writer.WriteState;
}
}
public override string XmlLang
{
get
{
return this.writer.XmlLang;
}
}
public override System.Xml.XmlSpace XmlSpace
{
get
{
return this.writer.XmlSpace;
}
}
}
}
Now instead of deriving from legacy XmlTextReader/XmlTextWriter you derive from XmlWrappingReader/XmlWrappingWriter passing to their constructors XmlReader/XmlWriter created via Create() factory method:
public class RenamingXmlReader : XmlWrappingReader
{
//Provide as many contructors as you need
public RenamingXmlReader(string file)
: base(XmlReader.Create(file)) { }
public override string Name
{
get
{
return (NodeType == XmlNodeType.Element &&
base.Name == "value") ?
"price" : base.Name;
}
}
public override string LocalName
{
get
{
return (NodeType == XmlNodeType.Element &&
base.LocalName == "value") ?
"price" : base.LocalName;
}
}
}
public class RenamingXmlWriter : XmlWrappingWriter
{
//Provide as many contructors as you need
public RenamingXmlWriter(TextWriter output)
: base(XmlWriter.Create(output)) { }
public override void WriteStartElement(string prefix, string localName, string ns)
{
if (string.IsNullOrEmpty(prefix) && localName == "price")
{
localName = "value";
}
base.WriteStartElement(prefix, localName, ns);
}
}
That's it. Not much different from previous option in terms of coding, but free of weird XmlTextReader/XmlTextWriter legacy.
AFAIK there is still one problem with this approach though, which is DTD validation. I mean cascading validating XmlReader on top of custom XmlReader scenario. E.g. if you need to resolve XInclude or rename couple of elements and validate resulting XML against DTD in one shot. In .NET 2.0 if you want to DTD validate XML that comes from another XmlReader that reader must be an instance of XmlTextReader. That's undocumented limitation and it was left sort of deliberatly - after all who cares about DTD nowadays? XML Schema validation is not affected by this limitation.
When developing custom XmlReader or XmlWriter in .NET 2.0 there is at least three options:
implement XmlReader/XmlWriter
extend one of concrete XmlReader/XmlWriter implementations and override only methods you need
implement XmlReader/XmlWriter by wrapping one of concrete XmlReader/XmlWriter implementations and overriding only methods you need
...
First way is a for full-blown XmlReader/XmlWriters, which need to implement each aspects of XML reading/writing in a different way, e.g. XmlCsvReader, which reads CSV as XML or XslReader, which streamlines XSLT output. This is the most clean while the hardest way - XmlReader has 26 (and XmlWriter - 24) abstract members you would have to implement. Second and third options are for override-style custom readers/writers. When you only need to partially modify XmlReader/XmlWriter behavior it's an overkill to reimplement it from scratch. As this is the most usual scenario I'll concentrate on these two options.
OOP taught us - inherit the class whose behaviour you want to modify and override its virtual members. That's the easiest and most popular way of writing custom XmlReader/XmlWriter. For example let's say you are receiving XML documents from your business partners and one particularly annoying one keeps sending element <value>, while according to the schema you expect it to be <price>. So you need renaming plumbing - XmlReader that reads <value> as <price> and XmlWriter that writes <price> as <value>. Here are implementations extending standard XmlTextReader and XmlTextWriter classes:
public class RenamingXmlReader : XmlTextReader
{
//Provide as many constructors as you need
public RenamingXmlReader(string file)
: base(file) { }
public override string Name
{
get
{
return (NodeType == XmlNodeType.Element &&
base.Name == "value") ?
"price" : base.Name;
}
}
public override string LocalName
{
get
{
return (NodeType == XmlNodeType.Element &&
base.LocalName == "value") ?
"price" : base.LocalName;
}
}
}
public class RenamingXmlWriter : XmlTextWriter
{
//Provide as many constructors as you need
public RenamingXmlWriter(TextWriter output)
: base(output) { }
public override void WriteStartElement(string prefix,
string localName, string ns)
{
if (string.IsNullOrEmpty(prefix) && localName == "price")
{
localName = "value";
}
base.WriteStartElement(prefix, localName, ns);
}
}
Looks nice, but there is a couple of serious drawbacks in this approach though:
- XmlTextReader and XmlTextWriter are kinda legacy classes. They were introduced in .NET 1.0 with some deviations from the XML standard and as it usually happens now Microsoft have to support those deviations for the sake of backwards compatibility. That means that there some aspects where XmlTextReader/XmlTextWriter and XmlReader/XmlWriter created via Create() method behave differently, in short - Create() method creates more conformant XmlReader/XmlWriter instances than XmlTextReader/XmlTextWriter, e.g. XmlTextWriter does not check for the following:
- Invalid characters in attribute and element names.
- Unicode characters that do not fit the specified encoding. If the Unicode characters do not fit the specified encoding, the XmlTextWriter does not escape the Unicode characters into character entities.
- Duplicate attributes.
- Characters in the DOCTYPE public identifier or system identifier.
And XmlTextReader doesn't check character range for numeric entities and so allows unless Normalization property (off by default) is turned on etc.
So beware that when deriving from XmlTextReader/XmlTextWriter you are gonna inherit all their crappy legacy weirdnesses too.
- Since .NET 1.1 XmlTextReader has FullTrust inheritance demand, i.e. only fully trusted classes can derive from XmlTextReader. That means that above RenaminXmlReader won't work in partially trusted environment such as ASP.NET or ClickOnce. I run into this unpleasant issue with my free eXml Web server control - since XmlBaseAwareXmlTextReader derives from XmlTextReader (just because I was too lazy when creating it) eXml control cannot do XInclude unless working under FullTrust.
So actually I wouldn't recommend deriving from XmlTextReader/XmlTextWriter.
A third approach is to wrap XmlReader/XmlWriter created via Create() method and override methods you need. This approach is used by .NET itself. This requires a little bit more code, but as a result you get clean design and easily composable implementation. I'll cover it tomorrow 'cause Tel-Aviv traffic jams are waiting for me now.
From .NET 1.X experience Microsoft seems finally figured out that providing a set of concrete poorly composable XmlReader and XmlWriter implementations (XmlTextReader, XmlTextWriter, XmlValidatingReader, XmlNodeReader) and emphasizing on programming with concrete classes instead of anstract XmlReader/Xmlwriter was really bad idea. One notorious horrible sample was XmlValidatingReader accepting abstract XmlReader instance
...
Well, unfortunately when you do something wrong for years you can't fix things "in a one swift stroke". Sadly, but MSDN documentation itself (even System.Xml namespace documentation!) is still full of samples using "not recommended" XmlTextReader and XmlTextWriters. And if you don't follow you words youself why would others do? Reality is that .NET developers didn't notice that shy recommendation and keep programming into concrete XML reader/writer classes.
So it wasn't a surprise for me to see fresh MSDN Magazine (06/2006) article "Five Ways to Emit Test Results as XML" promoting using XmlTextWriter class once again and not even mentioning XmlWriter.Create() pattern. Hey, I thought it's a requirement for MSDN authors to read MSDN documentation on a subject? Apparently it's not.
Another thing that bothers me is that XmlReader/XmlWriter factory has no extensibility points whatsoever. So that's not an option for non-Microsoft XML parsers and writers like XIncludingReader or MultiXmlTextWriter to be created in that factory. There is no way to plug in support for XML Base into a system without writing actual code that instantiates XmlBaseAwareXmlTextReader. Microsoft still considers providing abstract factory for XML readers/writers too geeky and similar (in terms or weirdness) to providing abstract factory for string class. Well, it probably would take another couple of .NET versions to grow up before .NET would come to extensibility Java already has for years.