获取System.Xml.XmlException:名称不能以''字符,十六进制值0x20开头。第42行,第36位

时间:2012-09-19 15:18:42

标签: c# asp.net

我收到了这个错误,到目前为止我发现的只是“移除空间”,但没有空间。这是一个我发现的脚本,它将从任何文件格式中获取一个简历并提取数据(解析它),以便将它放入SQL数据库......还没有那么远

ASP.net代码:

<%@ Page Language="C#" AutoEventWireup="true" CodeFile="ResumeParser.aspx.cs"       Inherits="CsharpSamCodeResumeParser_USAResume" Debug="true" ValidateRequest="false" %>

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">

<html xmlns="http://www.w3.org/1999/xhtml" >
<head runat="server">
<title>Untitled Page</title>
</head>
<body>
<form id="form1" runat="server">
<div>
    <table style="width: 574px; height: 95px">
        <tr>
            <td style="width: 507px">
                Resume
                URL</td>
            <td style="width: 737px">
                <asp:TextBox ID="TxtUrl" runat="server" Width="424px"></asp:TextBox>
            </td>
        </tr>            
        <tr>
           <td colspan="2" align="center">                  
                    <asp:Button ID="Button1" runat="server" OnClick="Button1_Click" Text="Resume parser" /></td>
            </tr>
        </table>

    <table>
        <tr>
            <td style="width: 247px; height: 287px">
                PARSING RESULTS</td>
            <td style="width: 568px; height: 287px">
                <asp:TextBox ID="TxtOutput" runat="server" Height="276px" TextMode="MultiLine" Width="565px"></asp:TextBox></td>
        </tr>
    </table>

</div>
</form>

C#:

public partial class CsharpSamCodeResumeParser_USAResume : System.Web.UI.Page
{
//////////Configuration Setting/////////////////// 
string ServiceUrl = (string)ConfigurationSettings.AppSettings["webServiceUrl"];
protected void Page_Load(object sender, EventArgs e)
{

}

protected void Button1_Click(object sender, EventArgs e)
{
    ///////////////////Variable Start///////////////
    string url = TxtUrl.Text;        
    StringBuilder  strRequest =new StringBuilder();
    string userkey = (string)ConfigurationSettings.AppSettings["userKey"];
    string version = (string)ConfigurationSettings.AppSettings["Version"];
    string countryKey=(string)ConfigurationSettings.AppSettings["CountryKey"];
    /////////////////Variable End///////////////////


    strRequest.Append("<?xml version='1.0' encoding='utf-8'?>");
    strRequest.Append("<soap:Envelope xmlns:xsi='http://www.w3.org/2001/XMLSchema-instance' xmlns:xsd='http://www.w3.org/2001/XMLSchema' xmlns:soap='http://schemas.xmlsoap.org/soap/envelope/'>");
    strRequest.Append("<soap:Body>");
    strRequest.Append("<ParseResume xmlns='http://tempuri.org/'>");
    strRequest.Append("<url>" + url + "</url>");
    strRequest.Append("<key>" + userkey + "</key>");
    strRequest.Append("<version>" + version + "</version>");
    strRequest.Append("<countryKey>" + countryKey + "</countryKey>");
    strRequest.Append("</ParseResume>");
    strRequest.Append("</soap:Body>");
    strRequest.Append("</soap:Envelope>");
    ///////////////SOAP XML END///////////////////


    /////////////////XML PROCESSED//////////////////////
    byte[] byteArray = Encoding.ASCII.GetBytes(strRequest.ToString());
    HttpWebRequest httpRequest = (HttpWebRequest)WebRequest.Create(ServiceUrl);
    httpRequest.Credentials = CredentialCache.DefaultCredentials;
    httpRequest.Method = "POST";
    httpRequest.ContentType = "text/xml";
    httpRequest.ContentLength = byteArray.Length;
    Stream dataStream = httpRequest.GetRequestStream();
    dataStream.Write(byteArray, 0, byteArray.Length);
    dataStream.Close();
    /////////////////////PROCESS END////////////////

    //////////////////RESPONSE RECEIVED///////////////////////
    HttpWebResponse httpResponse = (HttpWebResponse)httpRequest.GetResponse();
    StreamReader streamReader = new StreamReader(httpResponse.GetResponseStream(), System.Text.Encoding.UTF8);
    string ack = string.Empty;
    //ack = streamReader.ReadToEnd().ToString();
    ////////////////////GET NODE VALUE FROM RESPONSE XML/////////////
    using (XmlReader reader = XmlReader.Create(streamReader))
    {
        while (reader.Read())
        {

            if (reader.NodeType == XmlNodeType.Element)
            {

                for (int count = 1; count <= reader.Depth; count++)
                {
                    if (reader.Name == "ParseResumeResult")
                    {
                        ack = reader.ReadElementContentAsString();
                    }

                }

            }
        }

        TxtOutput.Text = ack;
    }
    /////////////////API CALL PROCESS END///////////////////

}

}

2 个答案:

答案 0 :(得分:6)

我怀疑因为你是通过字符串连接创建xml文档,所以你无意中从一个变量中添加了格式错误的xml。也许其中一个有一个小于号,这导致Xml解析器炸弹。您应该尝试通过DOM创建文档,或者使用CDATA部分来创建可配置值。

string url = TxtUrl.Text;        
string userkey = (string)ConfigurationSettings.AppSettings["userKey"];
string version = (string)ConfigurationSettings.AppSettings["Version"];
string countryKey=(string)ConfigurationSettings.AppSettings["CountryKey"];    

strRequest.Append("<url>" + url + "</url>");
strRequest.Append("<key>" + userkey + "</key>");
strRequest.Append("<version>" + version + "</version>");
strRequest.Append("<countryKey>" + countryKey + "</countryKey>");

我会尝试将strRequest StringBuilder写入文件,然后在xml编辑器中打开它,并找出问题所在。

答案 1 :(得分:0)

你在这里有相互矛盾的陈述:

strRequest.Append("<?xml version='1.0' encoding='utf-8'?>");

VS

byte[] byteArray = Encoding.ASCII.GetBytes(strRequest.ToString());

你可能搞乱编码并最终得到不需要的字符。

您应该Encoding.ASCII替换Encoding.UTF8