/// <summary>
/// Lazily reads articles from a Wikipedia XML dump. The file must already be
/// decompressed (bunzip2'ed); compressed dumps are not supported. The XML is
/// assumed to be valid and is not validated.
/// </summary>
/// <param name="filename">Path to a decompressed Wikipedia XML dump.</param>
/// <returns>
/// A lazily evaluated sequence producing one article for each <c>page</c>
/// element the reader stops on.
/// </returns>
/// <remarks>
/// This is an iterator: the file is not opened until enumeration starts, and it
/// is closed when enumeration completes or the enumerator is disposed (for
/// example when a <c>foreach</c> loop exits early).
/// </remarks>
public static IEnumerable<WikipediaArticle> ReadArticlesFromXmlDump(string filename)
{
    var settings = new XmlReaderSettings
    {
        ValidationType = ValidationType.None,
        ConformanceLevel = ConformanceLevel.Fragment
    };

    // Both readers are wrapped in using statements so the underlying file
    // handle is released even if the caller abandons the enumeration early.
    using (var file = new StreamReader(filename))
    using (XmlReader x = XmlReader.Create(file, settings))
    {
        while (x.ReadToFollowing("page"))
        {
            // Defensive check kept from the original: only hand element
            // nodes to ReadArticle.
            if (x.NodeType == XmlNodeType.Element)
            {
                var article = ReadArticle(x);
                yield return article;
            }
        }
    }
}
