解決libxml2不支援中文的問題

來源:互聯網
上載者:User

使用libxml2處理xml檔案時,預設載入是使用utf-8編碼,所以在修改和儲存為GB2312編碼時,需要將資料轉換為utf-8編碼,然後再進行修改和儲存!

轉換使用iconv,以下是轉碼

char * ConvertEnc( char *encFrom, char *encTo, const char * in)
{
 
 static char bufin[1024], bufout[1024], *sin, *sout;
 int mode, lenin, lenout, ret, nline;
 iconv_t c_pt;
 
 if ((c_pt = iconv_open(encTo, encFrom)) == (iconv_t)-1)
 {
  printf("iconv_open false: %s ==> %s/n", encFrom, encTo);
  return NULL;
 }
 iconv(c_pt, NULL, NULL, NULL, NULL);
 
 lenin  = strlen(in) + 1;
 lenout = 1024;
 sin    = (char *)in;
 sout   = bufout;
 ret = iconv(c_pt, &sin, (size_t *)&lenin, &sout, (size_t *)&lenout);
               
 if (ret == -1)
 {
  return NULL;

 }

 iconv_close(c_pt);
 
 return bufout;
}

以下是執行個體

test.xml

<?xml version="1.0" encoding="gb2312"?>
<parent>測試</parent>

讀取代碼

int main(void)
{
        xmlDocPtr doc = NULL;
        xmlNodePtr cur = NULL;

        doc = xmlParseFile("test.xml");
        cur = xmlDocGetRootElement(doc);
        printf("%s/n", Convert("utf-8", "gb2312", (char *)xmlNodeGetContent(cur)));
}
修改、儲存代碼

test2.xml

<?xml version="1.0" encoding="gb2312"?>
<story>
  <storyinfo>
    <author>John Fleck</author>
    <datewritten>June 2, 2002</datewritten>
    <keyword>我來也 example keyword</keyword>
    <書目> C++ </書目>
    <測試> test </測試>
  </storyinfo>
  <body>
    <headline>This is the headline</headline>
    <para>This is the body text.</para>
  </body>
</story>

xmlDocPtr
parseDoc(char *docname, char *uri) {

 xmlDocPtr doc;
 xmlNodePtr cur;
 xmlNodePtr newnode;
 xmlAttrPtr newattr;

 doc = xmlParseFile(docname);
 
 if (doc == NULL ) {
  fprintf(stderr,"Document not parsed successfully. /n");
  return (NULL);
 }
 
 cur = xmlDocGetRootElement(doc);
 
 if (cur == NULL) {
  fprintf(stderr,"empty document/n");
  xmlFreeDoc(doc);
  return (NULL);
 }
 
 if (xmlStrcmp(cur->name, (const xmlChar *) "story")) {
  fprintf(stderr,"document of the wrong type, root node != story");
  xmlFreeDoc(doc);
  return (NULL);
 }
 
 newnode = xmlNewTextChild (cur, NULL, (xmlChar *)"reference", NULL);
 newattr = xmlNewProp (newnode, (xmlChar *)"uri", (xmlChar *)uri);
 return(doc);
}

int main(int argc, char ** argv )
{
    int options = 0;
    xmlDocPtr doc = NULL;
    char * output = NULL;
    char * szNode = NULL;
    int ret = 0;
   
    xmlAddEncodingAlias("UTF-8", "DVEnc");
    xmlKeepBlanksDefault(0);
 defaultEntityLoader = xmlGetExternalEntityLoader();
 xmlSetExternalEntityLoader(xmllintExternalEntityLoader);
 xmlLineNumbersDefault(1);
 
 szNode = Convert("gb2312", "utf-8", "測試" );
 doc = parseDoc( argv[2], szNode);
 
 ret = xmlSaveFormatFileEnc(output ? output : "-", doc, argv[1], 1);
 if (ret < 0)
 {
      fprintf(stderr, "failed save to %s/n",
              output ? output : "-");
 }
 return 0;
}

執行

xmlout gb2312 test2.xml

結果

<?xml version="1.0" encoding="gb2312"?>
<story>
  <storyinfo>
    <author>John Fleck</author>
    <datewritten>June 2, 2002</datewritten>
    <keyword>我來也 example keyword</keyword>
    <書目> C++ </書目>
    <測試> test </測試>
  </storyinfo>
  <body>
    <headline>This is the headline</headline>
    <para>This is the body text.</para>
  </body>
  <reference uri="測試"/>
</story>

聯繫我們

該頁面正文內容均來源於網絡整理,並不代表阿里雲官方的觀點,該頁面所提到的產品和服務也與阿里云無關,如果該頁面內容對您造成了困擾,歡迎寫郵件給我們,收到郵件我們將在5個工作日內處理。

如果您發現本社區中有涉嫌抄襲的內容,歡迎發送郵件至: info-contact@alibabacloud.com 進行舉報並提供相關證據,工作人員會在 5 個工作天內聯絡您,一經查實,本站將立刻刪除涉嫌侵權內容。

A Free Trial That Lets You Build Big!

Start building with 50+ products and up to 12 months usage for Elastic Compute Service

  • Sales Support

    1 on 1 presale consultation

  • After-Sales Support

    24/7 Technical Support 6 Free Tickets per Quarter Faster Response

  • Alibaba Cloud offers highly flexible support services tailored to meet your exact needs.