内容显示页
 
类别:.Net + C# | 浏览(361) | 2008-5-4 17:47:15 | 关闭广告

 

using System;
using System.Collections.Generic;
using System.Text;
using System.Diagnostics;
using System.Text.RegularExpressions;
using System.IO;
using System.Net;

namespace 采集测试
{
    /// <summary>
    /// Console demo that exercises every <c>CaiJi.GetHtmlSource</c> overload
    /// and prints each downloaded page, pausing for a key press in between.
    /// </summary>
    class Program
    {
        /// <summary>
        /// Writes the given page source to the console, then blocks until a key is pressed.
        /// </summary>
        /// <param name="pageSource">Text to print.</param>
        private static void ShowAndPause(string pageSource)
        {
            Console.Write(pageSource);
            Console.ReadKey();
        }

        /// <summary>
        /// Entry point: fetches a few fixed pages with each overload, then walks the site list.
        /// </summary>
        /// <param name="args">Command-line arguments (not used).</param>
        static void Main(string[] args)
        {
            string[] sites = new string[]
            {
                "http://www.yongfa365.com",
                "http://www.cbdcn.com",
                "http://www.csdn.net",
                "http://www.sina.com",
                "http://www.tom.com",
            };

            // Overload taking an Encoding instance.
            ShowAndPause(CaiJi.GetHtmlSource("http://www.yongfa365.com", Encoding.Default));

            // Overload taking only the address.
            ShowAndPause(CaiJi.GetHtmlSource("http://www.baidu.com/"));

            // Overload taking an encoding name.
            ShowAndPause(CaiJi.GetHtmlSource("http://www.tom.com", "utf-8"));

            // Finally fetch every listed site with the address-only overload.
            for (int i = 0; i < sites.Length; i++)
            {
                ShowAndPause(CaiJi.GetHtmlSource(sites[i]));
            }
        }
    }
}


/// <summary>
/// Web page scraping helper ("CaiJi") by Liu Yongfa.
/// Every overload is best-effort: a failed download is reported through
/// <see cref="System.Diagnostics.Trace"/> and yields an empty string instead of an exception.
/// </summary>
class CaiJi
{
    /// <summary>
    /// Downloads the source of a web page and decodes it with the named character set.
    /// </summary>
    /// <param name="url">Absolute page address, e.g. "http://www.yongfa365.com/".</param>
    /// <param name="charset">
    /// Encoding name, e.g. "utf-8". Null or empty selects <see cref="Encoding.Default"/>.
    /// </param>
    /// <returns>The page source, or an empty string when the page could not be fetched.</returns>
    /// <exception cref="ArgumentException">
    /// <paramref name="charset"/> is not a valid or supported encoding name.
    /// </exception>
    public static string GetHtmlSource(string url, string charset)
    {
        // Resolved outside the fetch so that a bad encoding name is reported to the
        // caller rather than being mistaken for a download failure.
        Encoding encoding = string.IsNullOrEmpty(charset)
            ? Encoding.Default
            : Encoding.GetEncoding(charset);

        return GetHtmlSource(url, encoding);
    }

    /// <summary>
    /// Downloads the source of a web page and decodes it with the given encoding.
    /// </summary>
    /// <param name="url">Absolute page address, e.g. "http://www.yongfa365.com/".</param>
    /// <param name="charset">
    /// Encoding used to decode the response, e.g. <see cref="Encoding.UTF8"/>.
    /// Null selects <see cref="Encoding.Default"/>, matching the string overload.
    /// </param>
    /// <returns>The page source, or an empty string when the page could not be fetched.</returns>
    public static string GetHtmlSource(string url, Encoding charset)
    {
        try
        {
            // The cast deliberately limits this helper to HTTP(S) addresses: any other
            // scheme fails here and is reported as a failed fetch.
            HttpWebRequest request = (HttpWebRequest)WebRequest.Create(url);

            // The using blocks release the connection, stream and reader even when
            // reading fails part-way through.
            using (HttpWebResponse response = (HttpWebResponse)request.GetResponse())
            using (Stream stream = response.GetResponseStream())
            using (StreamReader reader = new StreamReader(stream, charset ?? Encoding.Default))
            {
                return reader.ReadToEnd();
            }
        }
        catch (Exception ex)
        {
            // Best-effort contract: callers rely on "" for any failure (bad address,
            // network error, unreadable body), so report the cause and carry on.
            Trace.TraceWarning("CaiJi.GetHtmlSource failed for '{0}': {1}", url, ex);
            return "";
        }
    }

    /// <summary>
    /// Downloads the source of a web page using <see cref="Encoding.Default"/>.
    /// Works well for pages that start with a byte order mark, because the reader
    /// switches to the encoding indicated by the mark.
    /// </summary>
    /// <param name="url">Absolute page address, e.g. "http://www.yongfa365.com/".</param>
    /// <returns>The page source, or an empty string when the page could not be fetched.</returns>
    public static string GetHtmlSource(string url)
    {
        return GetHtmlSource(url, Encoding.Default);
    }
}

 

 


引用本页地址:http://www.yongfa365.com/item/C.netCaiJiLei.html
 
 
相关链接
 
网友评论:
姓名: 记住我
网址:
邮箱:
内容:
验证码:  验证码图片看不清? 换张图试试
 
   
 
 
文章分类
 
   

Powered by :柳永法(yongfa365)'Blog | Model by :hibaidu | CSS by:众网友 | 京ICP备07011491号  QQ:64049027  E-mail:64049027@qq.com

本空间赞助商:北京中科兴联信息技术有限公司