正在将XML解析为列表
本文关键字:列表 XML | 更新日期: 2023-09-27 18:28:12
我有一个非常复杂的XML,我已经能够解析其中的大部分内容,但我遇到了一棵树,它让我很困惑,我担心我会让它变得更难。这是我所指的XML。
<Codes>
<CustomFieldValueSet name="Account" label="Account" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>7200</Value>
<Description>General Supplies</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>7200</Value>
<Description>General Supplies</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>7200</Value>
<Description>General Supplies</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Activity" label="Activity" distributionType="PercentOfPrice" />
<CustomFieldValueSet name="Chart" label="Chart" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>T</Value>
<Description>University</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>T</Value>
<Description>University</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>T</Value>
<Description>University</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Fund" label="Fund" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>360806</Value>
<Description>National Institutes of Health</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>360903</Value>
<Description>National Institutes of Health</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>360957</Value>
<Description>National Institutes of Health</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Program" label="Program" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>02</Value>
<Description>Research</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>02</Value>
<Description>Research</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>02</Value>
<Description>Research</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Location" label="Location" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>015</Value>
<Description>Biology - Life Science</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>015</Value>
<Description>Biology - Life Science</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>015</Value>
<Description>Biology - Life Science</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Organization" label="Organization" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>04400</Value>
<Description>TUSM:Neuroscience</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>04400</Value>
<Description>TUSM:Neuroscience</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>04400</Value>
<Description>TUSM:Neuroscience</Description>
</CustomFieldValue>
</CustomFieldValueSet>
</Codes>
我想最后列出一个看起来像这样的清单。
Account distributionType Activity distributionValue Fund
7200 PercentOfPrice "" 10 360806
7200 PercentOfPrice "" 45 360903
7200 PercentOfPrice "" 45 360957
等等。。。
我写的代码看起来像这样。这是一个片段。请注意,我想我把这件事搞得太复杂了。
if (tagName == "Codes")
{
// Create another reader that contains just the accounting elements.
XmlReader inner = reader.ReadSubtree();
//inner.ReadToDescendant("Codes");
//printOutXML(inner);
while (inner.Read())
{
switch (inner.NodeType)
{
//walk down the xml hiearchy then simply fill in the values.
case XmlNodeType.Element:
switch (reader.Name)
{
case "CustomFieldValueSet":
//get the attribute that we are currently working with such as account and
innerTagName=inner.GetAttribute("name");
// activity and location can potentially be blank therefore i will check here if it is
//and if it is i will immediate assign the activity list a set of empty quotes.
if (innerTagName == "Activity")
{
if (inner.IsEmptyElement)
{ //quickly put fillers in .
for (int i = 0; i < thisInvoice.account.Count; i++)
{
thisInvoice.activity.Add("");
}
}
}
if (innerTagName == "Location")
{
if (inner.IsEmptyElement)
{ //quickly put fillers in .
for (int i = 0; i < thisInvoice.account.Count; i++)
{
thisInvoice.location.Add("");
}
//thisInvoice.activity.Add("");
}
}
if (null == inner.GetAttribute("distributionType"))
{
distType = null;
}
else if
(distributionSwitch == false)
{
thisInvoice.distributionType.Add(inner.GetAttribute("distributionType") ?? "");
distType = inner.GetAttribute("distributionType") ?? "";
}
//Console.WriteLine(inner.Value);
//Console.WriteLine(inner.Name);
break;
case "CustomFieldValue":
if(null == inner.GetAttribute("distributionValue"))
//thisInvoice.distributionValue.Add(inner.GetAttribute("distributionValue") ?? "");
{/*do nothing*/}
else if
(distributionSwitch == false)
{
thisInvoice.distributionValue.Add(inner.GetAttribute("distributionValue") ?? "");
}
//check the length of the current distribution if the lenght is less than the curren distribution value
// then we must then add the values to the new location.
if (thisInvoice.distributionValue.Count > thisInvoice.distributionType.Count)
{
for (int i = 0; i < thisInvoice.distributionValue.Count - thisInvoice.distributionType.Count; i++)
{
thisInvoice.distributionType.Add(distType);
}
}
break;
case "Value":
// XmlNodeType.Text
if (innerTagName == "Account"/*&& inner.NodeType ==XmlNodeType.Text*/)
{
inner.MoveToContent();// move to the text
inner.Read();
thisInvoice.account.Add(inner.Value);
}
if (innerTagName == "Activity")
{
// activitiy is not a mandartory field so it could be empty therefore we need
// to check if its a self closing tag and if it is then we need to assign and
if (inner.IsEmptyElement)
{
thisInvoice.activity.Add("");
}
else
{
inner.MoveToContent();// move to the text
inner.Read();
thisInvoice.activity.Add(inner.Value);
}
}
if (innerTagName == "Location")
{
if (inner.IsEmptyElement)
{
thisInvoice.location.Add("");
}
else
{
inner.MoveToContent();// move to the text
inner.Read();
thisInvoice.location.Add(inner.Value);
}
}
if (innerTagName == "Fund")
{
inner.MoveToContent();// move to the text
inner.Read();
thisInvoice.fund.Add(inner.Value);
}
if (innerTagName == "Organization")
{
inner.MoveToContent();// move to the text
inner.Read();
thisInvoice.org.Add(inner.Value);
}
if (innerTagName == "Program")
{
inner.MoveToContent();// move to the text
inner.Read();
thisInvoice.prog.Add(inner.Value);
}
break;
}//end switch
break;//brake the outside case.
case XmlNodeType.EndElement:
if (inner.Name == "CustomFieldValueSet" || inner.Value == "CustomFieldValueSet")
{
distributionSwitch = true;
Console.WriteLine(reader.Value);
Console.WriteLine(reader.Name);
}
if (inner.Name == "Codes")
{
distributionSwitch = false;
distType = null;
inner.Close();
}
break;
}//end switch
}//end while
}//end the if;
在标记distributionType的情况下,我需要使列表长度与account的列表一样长,换句话说,一旦我在变量上有了它,我就需要将其用作填充符,以使分发类型列表与account列表一样大。我无法想象没有更简单的方法可以做到这一点——我一直在研究linq-to-xml,但它没有多大意义。我很想听听你们中的一些专家会如何处理这个问题。我正在尝试用更少的代码构建一个优雅的解决方案。如有任何帮助,我们将不胜感激。
如注释部分所述,作为Mihai使用LINQ to XML
的解决方案的替代方案,您还可以使用预定义的类结构将XML反序列化为类型化的类和属性。
这样做的好处是,您将拥有一个表示XML的对象(希望如此),并允许您更轻松地处理XML 中的数据
使用提供的XML示例,并使用Visual Studio中的编辑->Paste Special->将XML粘贴为类 有了这个类结构,您就可以用下面的行反序列化XML了 注意: 更好的方法是控制XML的结构,并以更好的方式对其进行结构化,使其比当前更易于解释,因为似乎每个 关于XML序列化的进一步阅读:using System.Xml.Serialization;
[XmlTypeAttribute(AnonymousType = true)]
[XmlRootAttribute(Namespace = "", IsNullable = false)]
public partial class Codes
{
[XmlElementAttribute("CustomFieldValueSet")]
public List<CodesCustomFieldValueSet> CustomFieldValueSet { get; set; }
}
[XmlTypeAttribute(AnonymousType = true)]
public partial class CodesCustomFieldValueSet
{
[XmlElementAttribute("CustomFieldValue")]
public List<CodesCustomFieldValueSetCustomFieldValue> CustomFieldValue { get; set; }
[XmlAttributeAttribute(AttributeName="name")]
public string Name { get; set; }
[XmlAttributeAttribute(AttributeName = "label")]
public string Label { get; set; }
[XmlAttributeAttribute(AttributeName = "distributionType")]
public string DistributionType { get; set; }
}
[XmlTypeAttribute(AnonymousType = true)]
public partial class CodesCustomFieldValueSetCustomFieldValue
{
public string Value { get; set; }
public string Description { get; set; }
[XmlAttributeAttribute(AttributeName = "distributionValue")]
public decimal DistributionValue { get; set; }
[XmlAttributeAttribute(AttributeName = "splitindex")]
public byte SplitIndex { get; set; }
}
(其中txtInput.Text
是用于保存示例XML数据的TextBox)XmlSerializer serializer = new XmlSerializer(typeof(Codes));
Codes codesInput = serializer.Deserialize(new StringReader(txtInput.Text)) as Codes;
if (codesInput != null)
{
// Do something with the data
}
根据您所需的输出和您提供的示例XML的结构,将需要将反序列化对象中的信息转换为您想要的内容/方式,为此,我建议创建一个附加的类结构,结合List<T>
,以保存您所需输出中显示的所有信息。CustomFieldValueSet
之间的链接都是splitindex
,这是子节点的一个属性,这使它变得非常复杂。
MSDN:介绍XML序列化
XmlSerializer类
您可以使用Linq到XML来实现这一点。
using System.Xml;
using System.Xml.Linq;
static void Main(string[] args) {
// This txt file contains your xml.
var xml_sample = File.ReadAllText("xml_sample.txt");
var doc = XDocument.Parse(xml_sample);
// Get all <CustomFieldValueSet> that have the label attribute `Account`
var accounts = from item in doc.Descendants("Codes").Descendants("CustomFieldValueSet")
where (item.HasAttributes) &&
(item.Attribute("label").Value == "Account")
select item;
// Create an anonymous type containing the value of the
// distributionValue attribute and the <Value> node.
var accountValue = from el in accounts.Descendants("CustomFieldValue")
let distAttribute = el.Attribute("distributionValue")
select new
{
distValue = distAttribute != null ? distAttribute.Value : "0",
value = el.Descendants("Value").First().Value,
};
// Display stuff here just to make sure we got it right.
accounts.ToList().ForEach(el =>
Console.WriteLine(el.Name + " " + el.Attribute("distributionType").Value));
accountValue.ToList().ForEach(el =>
Console.WriteLine(el.distValue + ":"+ el.value));
}
您应该能够根据需要使用这些思想来解析XML文件。