获取URL网页信息

Posted 倪子

tags:

篇首语:本文由小常识网(cha138.com)小编为大家整理,主要介绍了获取URL网页信息相关的知识,希望对你有一定的参考价值。

 

 

        static string Gethtml(string url)
        {string strHTML = "";
            WebClient myWebClient = new WebClient();
            Stream myStream = myWebClient.OpenRead(url);
            StreamReader sr = new StreamReader(myStream, System.Text.Encoding.GetEncoding("utf-8"));
            strHTML = sr.ReadToEnd();
            myStream.Close();
            return strHTML;
        }


        static bool GetHtml(string url)
      {
    
            HttpWebRequest myHttpWebRequest = (HttpWebRequest)WebRequest.Create(url);
            myHttpWebRequest.Timeout = 20 * 1000; //连接超时
            myHttpWebRequest.Accept = "*/*";
            myHttpWebRequest.UserAgent = "Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 5.1; Trident/4.0;)";
            HttpWebResponse myHttpWebResponse = (HttpWebResponse)myHttpWebRequest.GetResponse();
            Stream stream = myHttpWebResponse.GetResponseStream();
            StreamReader sr =
               new StreamReader(stream, Encoding.GetEncoding("utf-8"));
            var html = sr.ReadToEnd();
           
}

 

 

获取当前Cookies保存后获取整站信息

static void Main(string[] args)
        {
           

            Console.WriteLine("确保挂载VPN后。。。回车键继续!");
            Console.ReadKey();

            string url = "http://www.sciencedirect.com/science/journal/00118486/61/6";

            string indata = "aa=zhuye";
            CookieContainer myCookieContainer =
                new CookieContainer();
            //新建一个cookiecontainer来存放cookie集合
            HttpWebRequest myHttpWebRequest =
                (HttpWebRequest)WebRequest.Create(url);
            //新建一个httpwebrequest
            myHttpWebRequest.ContentType = "application/x-www-form-urlencoded";
            myHttpWebRequest.ContentLength = indata.Length;
            myHttpWebRequest.Method = "post";
            myHttpWebRequest.CookieContainer = myCookieContainer;
            //设置httpwebrequest的cookiecontainer为
            //刚才建立的那个mycookiecontainer
            Stream myRequestStream = myHttpWebRequest.GetRequestStream();
            StreamWriter myStreamWriter = new StreamWriter(myRequestStream, Encoding.GetEncoding("gb2312"));
            myStreamWriter.Write(indata);
            //把数据写入httpwebrequest的request流
            myStreamWriter.Close();
            myRequestStream.Close();
            //关闭打开对象
            HttpWebResponse myHttpWebResponse =
                (HttpWebResponse)myHttpWebRequest.GetResponse();
            //新建一个httpwebresponse
            myHttpWebResponse.Cookies = myCookieContainer.GetCookies(myHttpWebRequest.RequestUri);
          
            Console.WriteLine("获取cookies成功!。。。关闭VPN后任意键继续");
            Console.ReadKey();

            var htmlData = SaveCook(myHttpWebRequest, prevUrl, myCookieContainer, myHttpWebResponse);
                               
            }
        }

 

 public static string SaveCook(HttpWebRequest myHttpWebRequest, string url, CookieContainer myCookieContainer, HttpWebResponse myHttpWebResponse)
        {
            //拿到了cookie,再进行请求就能直接读取到登录后的内容了
            myHttpWebRequest = (HttpWebRequest)WebRequest.Create(url);
            myHttpWebRequest.CookieContainer = myCookieContainer;//*
                                                                 //刚才那个cookiecontainer已经存有了cookie,把它附加到
 
            myHttpWebResponse = (HttpWebResponse)myHttpWebRequest.GetResponse();
            myHttpWebResponse.Cookies =
                myCookieContainer.GetCookies(myHttpWebRequest.RequestUri);


            Stream myresponsestream = myHttpWebResponse.GetResponseStream();
            StreamReader mystreamreader =
               new StreamReader(myresponsestream, Encoding.GetEncoding("gb2312"));

            var html = mystreamreader.ReadToEnd();
            //把数据从httpwebresponse的response流中读出
            mystreamreader.Close();
            myresponsestream.Close();
            return html;

        }

 

以上是关于获取URL网页信息的主要内容,如果未能解决你的问题,请参考以下文章

python如何批量抓取很多url的信息 求大佬 代码

Unity实战项目 ☀️| 教你如何在Unity中通过 代码获取 URL链接网页 的 标题 等各种信息✨

获取URL网页信息

如何获取网页的header格式

急!加分!如何获取网页视频中的URL地址?如优酷、腾讯这些在线的URL格式。

PHP抓取网页获取特定信息