【发布时间】:2014-12-25 04:53:37
【问题描述】:
我有一个结构相当复杂的 XML,其中大部分内容我已经能够解析,但有一个子树把我难住了,我担心自己会把问题弄得越来越复杂。下面是我所说的 XML。
<Codes>
<CustomFieldValueSet name="Account" label="Account" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>7200</Value>
<Description>General Supplies</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>7200</Value>
<Description>General Supplies</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>7200</Value>
<Description>General Supplies</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Activity" label="Activity" distributionType="PercentOfPrice" />
<CustomFieldValueSet name="Chart" label="Chart" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>T</Value>
<Description>University</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>T</Value>
<Description>University</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>T</Value>
<Description>University</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Fund" label="Fund" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>360806</Value>
<Description>National Institutes of Health</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>360903</Value>
<Description>National Institutes of Health</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>360957</Value>
<Description>National Institutes of Health</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Program" label="Program" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>02</Value>
<Description>Research</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>02</Value>
<Description>Research</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>02</Value>
<Description>Research</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Location" label="Location" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>015</Value>
<Description>Biology - Life Science</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>015</Value>
<Description>Biology - Life Science</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>015</Value>
<Description>Biology - Life Science</Description>
</CustomFieldValue>
</CustomFieldValueSet>
<CustomFieldValueSet name="Organization" label="Organization" distributionType="PercentOfPrice">
<CustomFieldValue distributionValue="10.00" splitindex="0">
<Value>04400</Value>
<Description>TUSM:Neuroscience</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="1">
<Value>04400</Value>
<Description>TUSM:Neuroscience</Description>
</CustomFieldValue>
<CustomFieldValue distributionValue="45.00" splitindex="2">
<Value>04400</Value>
<Description>TUSM:Neuroscience</Description>
</CustomFieldValue>
</CustomFieldValueSet>
</Codes>
我试图最终得到一个看起来像这样的列表。
Account distributionType Activity distributionValue Fund
7200 PercentOfPrice "" 10 360806
7200 PercentOfPrice "" 45 360903
7200 PercentOfPrice "" 45 360957
等等……
我编写的代码如下,这只是一个代码片段(snippet)。请注意,我觉得我把这件事弄得过于复杂了。
if (tagName == "Codes")
{
    // Parse the <Codes> subtree into the parallel lists on thisInvoice.
    //
    // Each <CustomFieldValueSet name="..."> holds zero or more <CustomFieldValue>
    // children whose <Value> text is appended to the list selected by the set's
    // name (Account, Activity, Location, Fund, Organization, Program).
    // distributionType / distributionValue are captured only until the first
    // </CustomFieldValueSet> is seen (distributionSwitch == false); later sets
    // do not add to them again.
    //
    // The subtree reader is wrapped in `using` so it is always closed, including
    // for a self-closing <Codes/> that never produces an end tag. Only `inner`
    // is queried while it is open; the outer `reader` is not touched until the
    // sub-reader has been disposed.
    using (XmlReader inner = reader.ReadSubtree())
    {
        while (inner.Read())
        {
            switch (inner.NodeType)
            {
                case XmlNodeType.Element:
                    switch (inner.Name)
                    {
                        case "CustomFieldValueSet":
                        {
                            // Remember which field set we are in; the "Value" case
                            // below routes text by this name.
                            innerTagName = inner.GetAttribute("name");

                            // Activity and Location may be self-closing (no values).
                            // Pad them with one empty string per account collected so far.
                            // NOTE(review): this relies on the Account set having been
                            // read before these sets - confirm against real documents.
                            if (innerTagName == "Activity" && inner.IsEmptyElement)
                            {
                                for (int i = 0; i < thisInvoice.account.Count; i++)
                                {
                                    thisInvoice.activity.Add("");
                                }
                            }
                            if (innerTagName == "Location" && inner.IsEmptyElement)
                            {
                                for (int i = 0; i < thisInvoice.account.Count; i++)
                                {
                                    thisInvoice.location.Add("");
                                }
                            }

                            string setDistributionType = inner.GetAttribute("distributionType");
                            if (setDistributionType == null)
                            {
                                distType = null;
                            }
                            else if (!distributionSwitch)
                            {
                                thisInvoice.distributionType.Add(setDistributionType);
                                distType = setDistributionType;
                            }
                            break;
                        }

                        case "CustomFieldValue":
                        {
                            string splitDistributionValue = inner.GetAttribute("distributionValue");
                            if (splitDistributionValue != null && !distributionSwitch)
                            {
                                thisInvoice.distributionValue.Add(splitDistributionValue);
                            }

                            // Keep distributionType as long as distributionValue by repeating
                            // the current set's type. The gap is computed once up front:
                            // re-evaluating it in the loop condition would shrink the bound
                            // as items are added and stop early.
                            int missingTypes = thisInvoice.distributionValue.Count - thisInvoice.distributionType.Count;
                            for (int i = 0; i < missingTypes; i++)
                            {
                                thisInvoice.distributionType.Add(distType);
                            }
                            break;
                        }

                        case "Value":
                        {
                            // A self-closing <Value/> has no text node; reading past it would
                            // consume the following node, so treat it as an empty string.
                            string valueText;
                            if (inner.IsEmptyElement)
                            {
                                valueText = "";
                            }
                            else
                            {
                                inner.Read(); // step from <Value> onto its text node
                                valueText = inner.Value;
                            }

                            // Route the text to the list that matches the enclosing set.
                            switch (innerTagName)
                            {
                                case "Account":
                                    thisInvoice.account.Add(valueText);
                                    break;
                                case "Activity":
                                    thisInvoice.activity.Add(valueText);
                                    break;
                                case "Location":
                                    thisInvoice.location.Add(valueText);
                                    break;
                                case "Fund":
                                    thisInvoice.fund.Add(valueText);
                                    break;
                                case "Organization":
                                    thisInvoice.org.Add(valueText);
                                    break;
                                case "Program":
                                    thisInvoice.prog.Add(valueText);
                                    break;
                            }
                            break;
                        }
                    }
                    break;

                case XmlNodeType.EndElement:
                    if (inner.Name == "CustomFieldValueSet")
                    {
                        // After the first complete set, stop collecting distribution data.
                        distributionSwitch = true;
                        // Diagnostic output kept from the original code.
                        Console.WriteLine(inner.Value);
                        Console.WriteLine(inner.Name);
                    }
                    break;
            }
        }
    }

    // Reset per-<Codes> state so the next <Codes> element starts clean.
    distributionSwitch = false;
    distType = null;
}
对于 distributionType 属性,我需要让它的列表与帐户列表一样长;换句话说,一旦把它的值保存到变量中,我就需要用这个值作为填充,使 distributionType 列表与帐户列表一样大。我不相信没有更简单的方法可以做到这一点。我一直在研究 LINQ to XML,但还没怎么看懂。我很想听听各位专家会如何解决这个问题。我希望用更少的代码实现一个优雅的解决方案。任何帮助都将不胜感激。
【问题讨论】:
-
作为第一个问题,你为什么不走反序列化XML成类的路线,而是自己解析XML?
-
bernd,我在 XML 方面还是个新手。我拿到一个 XML 文件,然后打开并处理它。最终我必须生成一个数组列表,以便插入到数据库表中。反序列化 XML 可能是最好的选择,但目前我还不了解更好的做法。
-
给我一点时间,我会为你写点东西。同时请查看这篇帖子(this post)中的答案和链接。
-
谢谢 Bernd 我会仔细查看帖子的。
-
我可能错了(因此只是将其作为评论发布),但我看到您的 XML 具有以下结构:
CustomFieldValueSet 带有 name 属性,其 CustomFieldValue 子元素各有一个唯一的 splitindex 以及需要提取的数据。为什么不以相同的方式解析每个 CustomFieldValueSet,并根据子元素的 splitindex 值把提取到的数据添加到对象列表中?这样每个对象会自动关联一个帐户,并得到所有其他相应的信息……简单地说,Account 不应该是你的“主键”,splitindex 才应该是……
标签: c# xml-parsing