您现在的位置:首页 >> 前端 >> 内容

页面爬虫(获取其他页面HTML)加载到自己页面

时间:2013/6/22 10:13:13 点击:

  核心提示:前台通过 jQuery 的 $.ajax 以 POST 方式请求 Catalog 控制器的 GetPageHtml 动作;后台使用 HttpWebRequest 抓取目标 URL 的整页 HTML 并以 JSON 返回,前台再将返回内容追加到 id 为 showIframe 的元素中。

//前台

 <p id="showIframe"></p>

$(document).ready(function() {

        var url = "@Url.Action("GetPageHtml","Catalog")";
       
        $.ajax({
            url: url,
            type: "POST",
            dataType:"json",
            data: { url: "https://www.baidu.com" },
            error: function () {
                alert("bbb");
            },
            success: function (data) {
                $("#showIframe").append(data);
                //$("#showIframe p").hide();
                //$("#showIframe>#container").show();
                //$("#showIframe>#container>#content").show();
                //$("#showIframe>#container>#content>.cmsPage").show();
            }
        });

 });

 


//后台

//爬虫本质,发送URL请求,返回整个页面HTML

/// <summary>
        /// Downloads the page at <paramref name="url"/> and returns its markup as a JSON string.
        /// </summary>
        /// <param name="url">Absolute HTTP(S) address of the page to fetch.</param>
        /// <returns>
        /// A JSON result wrapping the downloaded text, or an empty string when the
        /// request could not be completed for any reason.
        /// </returns>
        [HttpPost]
        public JsonResult GetPageHtml(string url)
        {
            // NOTE(review): url is supplied by the client and fetched as-is, so this action
            // can be used to reach hosts visible only to the server (SSRF). Consider
            // restricting it to an allow-list of hosts before exposing it publicly.
            string pageHtml;
            try
            {
                HttpWebRequest request = (HttpWebRequest)WebRequest.Create(url);
                request.Accept = "image/gif, image/x-xbitmap, image/jpeg, image/pjpeg, application/x-shockwave-flash, application/vnd.ms-excel, application/vnd.ms-powerpoint, application/msword, */*";
                request.UserAgent = "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; .NET CLR 2.0.50727)";

                // Dispose the response, its stream and the reader deterministically so the
                // underlying connection is released even when reading fails part-way.
                using (HttpWebResponse response = (HttpWebResponse)request.GetResponse())
                using (Stream body = response.GetResponseStream())
                using (StreamReader reader = new StreamReader(body, ResolveResponseEncoding(response)))
                {
                    pageHtml = reader.ReadToEnd();
                }
            }
            catch
            {
                // Deliberate best-effort: any failure (bad URL, non-HTTP scheme, network or
                // protocol error) is reported to the caller as an empty page.
                pageHtml = "";
            }
            return Json(pageHtml);
        }

        /// <summary>
        /// Picks the text encoding for a response: the charset declared in its Content-Type
        /// header when one is present and recognised, otherwise the system default encoding.
        /// </summary>
        private static Encoding ResolveResponseEncoding(HttpWebResponse response)
        {
            string contentType = response.ContentType;
            bool declaresCharset = contentType != null
                && contentType.IndexOf("charset", System.StringComparison.OrdinalIgnoreCase) >= 0;

            // Only trust CharacterSet when the header really carries a charset; otherwise
            // the property may just report a protocol default rather than the page's encoding.
            if (declaresCharset && !string.IsNullOrEmpty(response.CharacterSet))
            {
                try
                {
                    return Encoding.GetEncoding(response.CharacterSet.Trim('"', '\'', ' '));
                }
                catch (System.ArgumentException)
                {
                    // Unknown or malformed charset name: fall through to the default.
                }
            }
            return Encoding.Default;
        }


 

作者:网络 来源:不详