Asp.Net、asp實現的搜尋引擎網址收錄檢查程式_實用技巧

來源:互聯網
上載者:User

使用asp.net或者asp檢查某個url地址,某篇文章是否被搜尋引擎,如百度,Google,搜狗收錄。

實現原理:直接搜尋你那篇文章的url地址(不帶協議,但帶上協議也行,代碼會自動去掉協議內容),如果被索引會返回搜尋結果,否則會提示找不到資訊。

Asp.Net檢查百度,Google,搜狗搜尋引擎是否收錄文章網址原始碼:

using System;
using System.IO;
using System.Net;
using System.Text;
using System.Web;

/// <summary>
/// Checks whether a URL appears to be indexed by a search engine by searching for the URL itself
/// and looking for the engine's "no results" marker text in the returned HTML.
/// </summary>
public class SearchEngineIndex
{
    /// <summary>
    /// Search URL prefixes, indexed by engine number: 0 = Baidu, 1 = Google, 2 = Sogou.
    /// The URL-encoded address to look up is appended to the selected prefix.
    /// </summary>
    public static string[] urls =
    {
        "http://www.baidu.com/s?ie=utf-8&wd=",      // Baidu
        "https://www.google.com.hk/search?q=",      // Google
        "http://www.sogou.com/web?ie=utf8&query="   // Sogou
    };

    /// <summary>
    /// Marker text, per engine (same order as <see cref="urls"/>), whose presence in the result page
    /// is treated as "this URL is not indexed".
    /// </summary>
    // NOTE(review): these markers look like Traditional Chinese renderings; verify that they match
    // the exact text each engine currently returns, otherwise every lookup reports "indexed".
    public static string[] noFindKeyword = { "抱歉,沒有找到與", "找不到和您的查詢", "未收錄?" };

    /// <summary>
    /// Picks the text encoding for a response from its Content-Type header value.
    /// </summary>
    /// <param name="contenttype">Content-Type header value; may be null or empty.</param>
    /// <returns>
    /// Code page 936 when the header mentions gb2312 or gbk, code page 950 when it mentions big5,
    /// otherwise UTF-8.
    /// </returns>
    private static Encoding GetEncoding(string contenttype)
    {
        if (string.IsNullOrEmpty(contenttype))
        {
            return Encoding.UTF8;
        }

        // Ordinal, case-insensitive matching avoids culture-dependent lower-casing of the header.
        if (contenttype.IndexOf("gb2312", StringComparison.OrdinalIgnoreCase) != -1
            || contenttype.IndexOf("gbk", StringComparison.OrdinalIgnoreCase) != -1)
        {
            return Encoding.GetEncoding(936);
        }

        if (contenttype.IndexOf("big5", StringComparison.OrdinalIgnoreCase) != -1)
        {
            return Encoding.GetEncoding(950);
        }

        return Encoding.UTF8;
    }

    /// <summary>
    /// Downloads a page with <see cref="HttpWebRequest"/> and decodes it using the character set
    /// announced in the response's Content-Type header.
    /// </summary>
    /// <param name="url">Absolute address to fetch.</param>
    /// <param name="addUseragent">When true, sends a crawler-style User-Agent header with the request.</param>
    /// <returns>The response body as text, or null when the request or the read fails.</returns>
    public static string GetHtml(string url, bool addUseragent)
    {
        HttpWebRequest request = (HttpWebRequest)WebRequest.Create(url);
        if (addUseragent)
        {
            request.UserAgent = "Googlebot|Feedfetcher-Google|Baiduspider";
        }

        try
        {
            // using blocks release the connection and the reader even if reading throws.
            using (HttpWebResponse response = (HttpWebResponse)request.GetResponse())
            using (Stream body = response.GetResponseStream())
            using (StreamReader reader = new StreamReader(body, GetEncoding(response.ContentType)))
            {
                return reader.ReadToEnd();
            }
        }
        catch (WebException)
        {
            // Best effort: a failed request is reported to the caller as "no content".
            return null;
        }
        catch (IOException)
        {
            // The connection dropped while the body was being read.
            return null;
        }
    }

    /// <summary>
    /// Removes a leading "http://" or "https://" (any letter case) from an address.
    /// </summary>
    private static string StripScheme(string url)
    {
        string[] schemes = { "http://", "https://" };
        foreach (string scheme in schemes)
        {
            if (url.StartsWith(scheme, StringComparison.OrdinalIgnoreCase))
            {
                return url.Substring(scheme.Length);
            }
        }

        return url;
    }

    /// <summary>
    /// Checks whether a URL is indexed by the selected search engine.
    /// </summary>
    /// <param name="url">Address to look up; a leading http:// or https:// is removed before searching.</param>
    /// <param name="engin">0 = Baidu, 1 = Google, 2 = Sogou. Any other value falls back to 0.</param>
    /// <returns>
    /// false when <paramref name="url"/> is null, empty or only a scheme, when the result page could not
    /// be downloaded, or when the page contains the engine's "not found" marker; otherwise true.
    /// </returns>
    public static bool CheckIndex(string url, int engin)
    {
        if (string.IsNullOrEmpty(url))
        {
            return false;
        }

        if (engin < 0 || engin > 2)
        {
            engin = 0;
        }

        // Only the leading scheme is removed; the rest of the address keeps its original case
        // because URL paths can be case-sensitive.
        string target = StripScheme(url);
        if (target.Length == 0)
        {
            // Nothing left to search for (input was just "http://" or "https://").
            return false;
        }

        string html = GetHtml(urls[engin] + HttpUtility.UrlEncode(target), true);
        if (html == null)
        {
            return false;
        }

        return html.IndexOf(noFindKeyword[engin], StringComparison.Ordinal) == -1;
    }
}

// Usage example:
//   SearchEngineIndex.CheckIndex("www.jb51.net/article/20101014/2902.aspx", 0); // check the Baidu index
//   SearchEngineIndex.CheckIndex("www.jb51.net/article/20101014/2902.aspx", 1); // check the Google index
//   SearchEngineIndex.CheckIndex("www.jb51.net/article/20101014/2902.aspx", 2); // check the Sogou index

Asp檢查百度,Google,搜狗搜尋引擎是否收錄文章網址原始碼:

<%
' SearchEnginIndex: checks whether a URL appears to be indexed by Baidu, Google or Sogou by
' searching for the URL itself and looking for the engine's "not found" marker in the result page.
class SearchEnginIndex
    ' urls: search URL prefixes, indexed by engine number (0 = Baidu, 1 = Google, 2 = Sogou).
    ' noFindKeyword: per-engine marker text that is treated as "this URL is not indexed".
    dim urls, noFindKeyword

    private sub Class_Initialize
        ' Index-lookup addresses for Baidu, Google and Sogou.
        urls = array("http://www.baidu.com/s?ie=utf-8&wd=", "https://www.google.com.hk/search?q=", "http://www.sogou.com/web?ie=utf8&query=")
        ' Marker text shown by each engine when the URL is not indexed.
        ' NOTE(review): these markers look like Traditional Chinese renderings; verify that they
        ' match the exact text each engine currently returns.
        noFindKeyword = array("抱歉,沒有找到與", "找不到和您的查詢", "未收錄?")
    end sub

    ' Maps a Content-Type header value to a charset name: "gb2312" when the header mentions
    ' gb2312 or gbk, "big5" when it mentions big5, otherwise "utf-8".
    private function GetEncoding(contenttype)
        dim ct
        ' Work on a local copy; appending "" also turns a Null header into an empty string.
        ct = lcase(contenttype & "")
        ' Either name selects the GB charset (the original required both at once, so it never matched
        ' a plain gb2312 or gbk header).
        if instr(ct, "gb2312") <> 0 or instr(ct, "gbk") <> 0 then
            GetEncoding = "gb2312"
        elseif instr(ct, "big5") <> 0 then
            GetEncoding = "big5"
        else
            GetEncoding = "utf-8"
        end if
    end function

    ' Converts binary stream data to text using the given charset.
    private function BinToString(bin, encoding)
        dim obj
        set obj = Server.CreateObject("Adodb.Stream")
        ' Open as a binary (Type=1), read/write (Mode=3) stream and load the bytes.
        obj.Type = 1 : obj.Mode = 3 : obj.Open
        obj.Write bin
        ' Rewind, switch to text mode (Type=2) and decode with the requested charset.
        obj.Position = 0 : obj.Type = 2 : obj.Charset = encoding
        BinToString = obj.ReadText
        obj.Close : set obj = nothing
    end function

    ' Downloads url synchronously and returns the body decoded with the charset announced in the
    ' response's content-type header. Side effect: also sets Response.CharSet to that charset.
    public function GetHtml(url)
        dim xhr, encoding
        set xhr = server.CreateObject("microsoft.xmlhttp")
        xhr.open "get", url, false
        xhr.send
        encoding = GetEncoding(xhr.getResponseHeader("content-type"))
        response.CharSet = encoding
        GetHtml = BinToString(xhr.responsebody, encoding)
        set xhr = nothing
    end function

    ' Returns True when url appears to be indexed by the chosen engine, False otherwise.
    '   url   - address to look up; a leading http:// or https:// is removed before searching.
    '   engin - 0 = Baidu, 1 = Google, 2 = Sogou; any other value falls back to 0 (Baidu),
    '           matching the Asp.Net version of this class.
    ' Arguments are passed ByRef by default in VBScript, so the function works on local copies
    ' and never overwrites the caller's variables.
    public function CheckIndex(url, engin)
        dim target, idx, html
        ' Explicit default so an empty url yields False rather than Empty.
        CheckIndex = false

        target = url & ""
        if lcase(left(target, 7)) = "http://" then
            target = mid(target, 8)
        elseif lcase(left(target, 8)) = "https://" then
            target = mid(target, 9)
        end if
        if len(target) = 0 then exit function

        idx = engin
        if idx < 0 or idx > 2 then idx = 0

        html = GetHtml(urls(idx) & server.URLEncode(target))
        ' Indexed means the "not found" marker is absent from the result page.
        CheckIndex = (instr(html, noFindKeyword(idx)) = 0)
    end function
end class

set sei = new SearchEnginIndex
response.Write sei.CheckIndex("www.jb51.net/article/20101014/2902.aspx", 0) ' Baidu index
response.Write sei.CheckIndex("www.jb51.net/article/20101014/2902.aspx", 1) ' Google index
response.Write sei.CheckIndex("www.jb51.net/article/20101014/2902.aspx", 2) ' Sogou index
set sei = nothing
%>

相關文章

聯繫我們

該頁面正文內容均來源於網絡整理,並不代表阿里雲官方的觀點,該頁面所提到的產品和服務也與阿里雲無關,如果該頁面內容對您造成了困擾,歡迎寫郵件給我們,收到郵件我們將在5個工作日內處理。

如果您發現本社區中有涉嫌抄襲的內容,歡迎發送郵件至: info-contact@alibabacloud.com 進行舉報並提供相關證據,工作人員會在 5 個工作天內聯絡您,一經查實,本站將立刻刪除涉嫌侵權內容。

A Free Trial That Lets You Build Big!

Start building with 50+ products and up to 12 months usage for Elastic Compute Service

  • Sales Support

    1 on 1 presale consultation

  • After-Sales Support

    24/7 Technical Support · 6 Free Tickets per Quarter · Faster Response

  • Alibaba Cloud offers highly flexible support services tailored to meet your exact needs.