ImportJava.io.File;Importjava.io.FileNotFoundException;ImportJava.io.FileOutputStream;Importjava.io.IOException;ImportJava.io.PrintWriter;ImportOrg.jsoup.Jsoup;Importorg.jsoup.nodes.Document;Importorg.jsoup.nodes.Element;Importorg.jsoup.select.Elements; Public classHreftest {/*** Output File Method *@paramFilePath *@paramSB *@throwsIOException*/ Public Static voidOuthref (String filepath,stringbuffer SB)throwsioexception{Try{File File=NewFile (FilePath); PrintWriter writer=NewPrintWriter (Newfileoutputstream (file)); Writer.write (Sb.tostring ()); Writer.close (); } Catch(FileNotFoundException e) {e.printstacktrace (); } } /*** Positioning elements *@paramargs*/ Public Static voidMain (string[] args) {String FilePath= "/users/liuqi/desktop/result.log"; FinalString url= "http://www.baidu.com/"; String Str=""; StringBuffer SB=NewStringBuffer (); Try{Document doc=jsoup.connect (URL). get (); Elements links=doc.getelementsbytag ("a"); for(Element link:links) {if(Link.attr ("href"). Contains ("Baidu"))) Str=link.attr ("href"). toString (); Sb.append (str+ "\ n"); System.out.println (Link.attr ("href")); Outhref (FilePath, SB); } } Catch(IOException e) {e.printstacktrace (); } } }
Requires the jsoup library (jsoup-1.10.1.jar) on the classpath.
Finds elements on a web page and writes them to a specified file.