The exercise files used in this article (such as localhtml.html)
can be downloaded here: http://download.csdn.net/detail/jadyer/5127317
package com.jadyer.httpclient;

import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.util.List;

import org.apache.commons.io.IOUtils;
import org.apache.http.HttpEntity;
import org.apache.http.HttpResponse;
import org.apache.http.client.HttpClient;
import org.apache.http.client.methods.HttpGet;
import org.apache.http.impl.client.DefaultHttpClient;
import org.apache.http.util.EntityUtils;
import org.htmlparser.Node;
import org.htmlparser.NodeFilter;
import org.htmlparser.Parser;
import org.htmlparser.tags.Div;
import org.htmlparser.tags.LinkTag;
import org.htmlparser.tags.MetaTag;
import org.htmlparser.util.NodeList;

/**
 * HtmlParser introduction 02 - web crawler prototype: parse the topic, author, keywords, and other information of an article
 * @see references
 * @see the jar files used in this article are listed below
 * @see commons-io-2.3.jar
 * @see commons-logging-1.1.1.jar
 * @see fluent-hc-4.2.1.jar
 * @see httpclient-4.2.1.jar
 * @see httpclient-cache-4.2.1.jar
 * @see httpcore-4.2.1.jar
 * @see httpmime-4.2.1.jar
 * @see )
 * @see htmllexer.jar
 * @see htmlparser.jar
 * @see sitecapturer.jar
 * @see thumbelina.jar
 * @see examples
 * @see for the HtmlParser utility class used in this article, see my article below
 * @see http://blog.csdn.net/jadyer/article/details/8656479
 * @see examples
 * @create Mar 10, 2013 5:05:55
 * @author Xuan Yu