XML 到文本转换

本文关键字:转换 文本 XML | 更新日期: 2023-09-27 18:36:51

我想用C#写一些东西,它采用XML并将其转换为纯文本。

<note>
    <to>Tove</to>
    <from>Jani</from>
    <heading>Reminder</heading>
    <body>Don't forget me this weekend!</body>
</note>

会变成:

To Tove
From Jani
Heading Reminder
Body don't forget me this weekend!

有没有这样的事情?我该怎么做呢?

这只是我想要的想法仍然需要大量工作:

private void dataGridViewResult_SelectionChanged(object sender, EventArgs e)
        {
            if (this.dataGridViewResult.SelectedRows.Count > 0)
            {
                XslCompiledTransform xslt = new XslCompiledTransform();
                xslt.Load("SQL"); //.xml
                xslt.Transform("SQL","SQL"); //.xml, .html
                this.richTextBoxSQL.Text = this.dataGridViewResult.SelectedRows[0].Cells["SQL"].Value.ToString();
            }
        }

XML 到文本转换

以下 XSLT 脚本将执行所需的操作:

<?xml version="1.0" encoding="utf-8"?>
<xsl:stylesheet version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
    <xsl:output method="text"/>
    <xsl:template match="*">
        <xsl:for-each select="*">
            <xsl:value-of select="local-name()"/>
            <xsl:text> </xsl:text>
            <xsl:value-of  select="."/>
            <xsl:text>
</xsl:text>
        </xsl:for-each>
    </xsl:template>
</xsl:stylesheet>

然后,您可以使用 XslCompiledTransform 类应用脚本,如下所示:

private string transformXml(string sourceXmlText, string xsltText)
{
    XmlDocument sourceXmlDocument = new XmlDocument();
    sourceXmlDocument.LoadXml(sourceXmlText);
    XslCompiledTransform transformer = new XslCompiledTransform();
    XmlTextReader xsltReader = new XmlTextReader(new StringReader(xsltText));
    transformer.Load(xsltReader);
    MemoryStream outputStream = new MemoryStream();
    XmlWriter xmlWriter = XmlWriter.Create(outputStream, transformer.OutputSettings);
    transformer.Transform(sourceXmlDocument, null, xmlWriter);
    outputStream.Position = 0;
    StreamReader streamReader = new StreamReader(outputStream);
    return streamReader.ReadToEnd();
}

它显然比人们发布的其他解决方案更复杂,但它的主要优点是如果您需要更改格式,可以轻松更改脚本。

像这样:

    XmlDocument doc = new XmlDocument();
    doc.LoadXml(your text string);
    StringBuilder sb = new StringBuilder();
    foreach (XmlNode node in doc.DocumentElement.ChildNodes)
    {
        sb.Append(char.ToUpper(node.Name[0]));
        sb.Append(node.Name.Substring(1));
        sb.Append(' ');
        sb.AppendLine(node.InnerText);
    }
    Console.WriteLine(sb);
你可以

做类似的事情

    string xml = @"<note>
                    <to>Tove</to>
                    <from>Jani</from>
                    <heading>Reminder</heading>
                    <body>Don't forget me this weekend!</body>
                </note>";
    StringBuilder sb = new StringBuilder();
    foreach (XElement element in XDocument.Parse(XML-STRING).Descendants("note"))
    {
        sb.AppendLine(string.Format("{0} {1}", element.Name, element.Value));
    }

这里给出的答案非常适合没有任何属性的简单XML文件。为了处理节点中可能包含属性和值的 XML,您需要更多...复杂。更不用说"列表项"(在同一组下具有相同节点名称但不同属性的项目,例如<书籍><书籍ID 作者="我" /><书籍ID 作者="您" />)。我需要将 XML 文件转换为 TAB 分隔的文本,并且必须包括所有情况。该代码已在具有数千个节点的几个 xml 文件上进行了测试,并且正在工作。"列表项"是通过使用"|"作为分隔符将每个属性或元素的"列表"值附加到现有列来处理的。我希望它可以帮助其他想要做类似事情并需要一个起点的人。如果有人正在阅读本文并知道更好的方法,我真的很想听听。

using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.IO;
using System.Xml;
public class FileProcessing
{
    static public void ConvertXmlFile(String theFile)
    {
        string theExportFile = theFile.Replace(".xml", ".txt");
        List<List<String>> theColumns = new List<List<string>>();
        List<String> theHeader = new List<string>();
        List<String> CurrentDepth = new List<string>();
        XmlDocument theXml = new XmlDocument();
        try
        {
            theXml.Load(theFile);
        }
        catch (Exception ex)
        {
            //handle as you seem fit. I use an error reporting system that is called here.
            return;
        }
        XmlElement theElement = theXml.DocumentElement;
        CurrentDepth.Add(theElement.ParentNode.Name);//Start at document level
        String ItemGroupTag = "";//this stores the element that groups all items(This element represents the complete line)
        String LastTagName = "";//detect if there is a listitem case(item with same tag appearing in a grouptag having different attribute values).
        int GroupItemDepth = 0;
        do
        {
            //null can occure on various errors. When it falls bellow the GroupItemDepth, the search is over
            if (theElement == null || CurrentDepth.Count <= GroupItemDepth) break;
            String CurrentTagName = theElement.ParentNode.Name + "." + theElement.Name;
            //only advance if this is not a listitem or the ItemGroupTag
            if (CurrentDepth[CurrentDepth.Count - 1] == CurrentTagName && LastTagName != CurrentTagName)
            {
                LastTagName = CurrentTagName;
                if (theElement.NextSibling != null)
                {
                    theElement = (XmlElement)theElement.NextSibling;
                    CurrentDepth[CurrentDepth.Count - 1] = LastTagName;
                    continue;
                }
                theElement = (XmlElement)theElement.ParentNode;
                CurrentDepth.RemoveAt(CurrentDepth.Count - 1);//I stepped one level up
                continue;
            }
            //only check the list until I get the group tag
            if (ItemGroupTag == "")
            {
                XmlNodeList theList = theXml.GetElementsByTagName(theElement.Name);
                if (theList.Count > 1)
                {
                    ItemGroupTag = CurrentTagName;
                    GroupItemDepth = CurrentDepth.Count;
                }
                else
                {
                    LastTagName = theElement.ParentNode.Name + "." + theElement.Name;
                    CurrentDepth.Add(LastTagName);//Stepped one level down
                    theElement = (XmlElement)theElement.FirstChild;
                    continue;
                }
            }
            //At this point I am in the GroupItem's entries
            //Check if the "line" has changed
            if (CurrentTagName == LastTagName && CurrentTagName == ItemGroupTag)
            {
                //It has changed. Make sure all columns have equal number of elements. If not, fill them with empty strings
                int MaxCount = 0;
                //First pass, find the number of items that should be in every column. Second pass, only one element apart in all occasions that
                //the count is not equal. Take in account that a column may appear out of nowhere, as an attribute, and fill it up to date
                for (int loop = 0; loop < theColumns.Count; loop++) if (theColumns[loop].Count > MaxCount) MaxCount = theColumns[loop].Count;
                for (int loop = 0; loop < theColumns.Count; loop++)
                {
                    //A problem will appear in cases that the second entry is a new attribute.
                    if (MaxCount > 2 && theColumns[loop].Count == 1)
                    {
                        while (theColumns[loop].Count != MaxCount) theColumns[loop].Insert(0, "");
                    }
                    else if (theColumns[loop].Count != MaxCount) theColumns[loop].Add("");
                }
                CurrentDepth.RemoveAt(CurrentDepth.Count - 1);//Remove the last entry of the group item
            }
            //Add a column for the tag, if there is none, or find its index, IF, this tag does not have child nodes
            int theColumnIndex = theHeader.IndexOf(CurrentTagName);
            if (theColumnIndex == -1 && !theElement.HasChildNodes)
            {
                theHeader.Add(CurrentTagName);
                theColumns.Add(new List<string>());
                theColumnIndex = theHeader.Count - 1;
            }
            if (theElement.HasAttributes)
            {
                XmlAttributeCollection theAttributes = theElement.Attributes;
                for (int loop = 0; loop < theAttributes.Count; loop++)
                {
                    theColumnIndex = theHeader.IndexOf(theElement.Name + "." + theAttributes[loop].Name);
                    if (theColumnIndex == -1)
                    {
                        theColumns.Add(new List<String>());
                        theHeader.Add(theElement.Name + "." + theAttributes[loop].Name);
                        theColumnIndex = theHeader.Count - 1;
                    }
                    if (theAttributes[loop].Value == null)
                    {
                        if (CurrentTagName == LastTagName && CurrentTagName != ItemGroupTag)
                            theColumns[theColumnIndex][theColumns[theColumnIndex].Count - 1] += "|";
                        else theColumns[theColumnIndex].Add("");
                    }
                    else
                    {
                        if (CurrentTagName == LastTagName && CurrentTagName != ItemGroupTag)
                            theColumns[theColumnIndex][theColumns[theColumnIndex].Count - 1] += "|" + theAttributes[loop].Value.ToString();
                        else theColumns[theColumnIndex].Add(theAttributes[loop].Value.ToString());
                    }
                }
            }
            else if (!theElement.HasChildNodes)
            {
                if (theElement.Value == null)
                {
                    if (CurrentTagName == LastTagName && CurrentTagName != ItemGroupTag) theColumns[theColumnIndex][theColumns[theColumnIndex].Count - 1] += "|";
                    else theColumns[theColumnIndex].Add("");//empty string for a null value
                }
                else
                {
                    if (CurrentTagName == LastTagName && CurrentTagName != ItemGroupTag) theColumns[theColumnIndex][theColumns[theColumnIndex].Count - 1] += "|" +
                        theElement.Value.ToString();
                    else theColumns[theColumnIndex].Add(theElement.Value.ToString());
                }
            }
            LastTagName = CurrentTagName;
            if (theElement.HasChildNodes)
            {
                theElement = (XmlElement)theElement.FirstChild;
                CurrentDepth.Add(LastTagName);//Went down a level
            }
            else if (theElement.NextSibling != null)
            {
                theElement = (XmlElement)theElement.NextSibling;
                //Prevent overwriting a previous group level when a list item occurs
                if (theElement.ParentNode.Name + "." + theElement.Name == LastTagName && CurrentDepth[CurrentDepth.Count - 1] != LastTagName)
                    CurrentDepth.Add(LastTagName);
                else CurrentDepth[CurrentDepth.Count - 1] = LastTagName;
            }
            else
            {
                theElement = (XmlElement)theElement.ParentNode;
                CurrentDepth.RemoveAt(CurrentDepth.Count - 1);//Went up a Level
            }
        } while (theElement != theXml.DocumentElement);
        //Put Everything together and write them to a file
        List<String> theLines = new List<string>();
        String theLine = "";
        for (int loop = 0; loop < theHeader.Count; loop++) theLine += "'t" + theHeader[loop];
        if (theLine != "") theLines.Add(theLine.Substring(1));
        int aMaxCount = 0;
        //Do a last check for row count consistency in columns
        for (int loop = 0; loop < theColumns.Count; loop++) if (theColumns[loop].Count > aMaxCount) aMaxCount = theColumns[loop].Count;
        for (int loop = 0; loop < theColumns.Count; loop++)
        {
            if (aMaxCount > 2 && theColumns[loop].Count == 1)
            {
                while (theColumns[loop].Count != aMaxCount) theColumns[loop].Insert(0, "");
            }
            else if (theColumns[loop].Count != aMaxCount) theColumns[loop].Add("");
        }
        for (int loop = 0; loop < theColumns[0].Count; loop++)
        {
            theLine = "";
            for (int loop1 = 0; loop1 < theColumns.Count; loop1++) theLine += "'t" + theColumns[loop1][loop].Replace(''t', ' ');
            if (theLine != "") theLines.Add(theLine.Substring(1));
        }
        File.WriteAllLines(theExportFile, theLines.ToArray(), Encoding.UTF8);
    }
}