天天看點

TPL使用異步程式設計模型(APM)實作簡單網頁抓取

using System;
using System.Collections.Generic;
using System.Linq;
using System.Net;
using System.Threading;
using System.Threading.Tasks;

namespace fofo.NetSpider
{
    public class SimpleNetSpider
    {
        public void Start()
        {
            string[] urls = InitUrls();

            Task<WebResponse>[] tasks = urls.Select(url => GetResponseAsync(url)).ToArray();

            Task.WaitAll(tasks);
        }

        private string[] InitUrls()
        {
            string[] urls = 
            {
                "http://www.baidu.com/",
                "http://www.cnblogs.com",
                "http://www.csdn.com"
            };

            return urls;
        }

        // 啟動任務
        private Task<WebResponse> GetResponseAsync(string strUrl)
        {
            WebRequest webRequest = WebRequest.Create(strUrl);
            Task<WebResponse> task = Task<WebResponse>.Factory.FromAsync(webRequest.BeginGetResponse, GetResponseAsyncCompleted, webRequest);

            return task;
        }

        // 抓取結束回調函數
        private WebResponse GetResponseAsyncCompleted(IAsyncResult result)
        {
            WebRequest webRequest = (WebRequest)result.AsyncState;
            WebResponse response = webRequest.EndGetResponse(result);

            using (System.IO.StreamReader reader = new System.IO.StreamReader(response.GetResponseStream()))
            {
                // 具體處理            
            }

            return response;
        }   
    }
}