网页抓取邮箱

using System;
using System.Collections.Generic;
using System.ComponentModel;
using System.Data;
using System.Drawing;
using System.IO;
using System.Net;
using System.Text;
using System.Text.RegularExpressions;
using System.Windows.Forms;


namespace WindowsFormsApplication5
{
    /// <summary>
    /// Main form: downloads the web page whose URL is typed into <c>textBox1</c>,
    /// extracts every e-mail address matched by <see cref="EmailPattern"/>, shows
    /// them in <c>textBox2</c> and appends them to <see cref="OutputPath"/>.
    /// </summary>
    public partial class Form1 : Form
    {
        /// <summary>File that receives the extracted addresses (opened in append mode).</summary>
        private const string OutputPath = @"E:\1.txt";

        /// <summary>
        /// Pattern used to recognise e-mail addresses. Cached in a static field so the
        /// expression is parsed once instead of on every button click.
        /// </summary>
        private static readonly Regex EmailPattern = new Regex(@"[a-zA-Z0-9_\-\.]+@\w+(\.\w+)+");

        /// <summary>Creates the form and its designer-generated controls.</summary>
        public Form1()
        {
            InitializeComponent();
        }

        /// <summary>
        /// Click handler: fetches the page at the URL in <c>textBox1</c>, lists the
        /// e-mail addresses found in it in <c>textBox2</c> and appends the same list
        /// to <see cref="OutputPath"/>. Does nothing when the URL box is empty.
        /// Download and file errors are reported in a message box instead of
        /// escaping the event handler.
        /// </summary>
        /// <param name="sender">Control that raised the event (unused).</param>
        /// <param name="e">Event data (unused).</param>
        private void button1_Click(object sender, EventArgs e)
        {
            // Trim surrounding whitespace; an empty URL means there is nothing to do.
            string url = textBox1.Text.Trim();
            if (string.IsNullOrEmpty(url))
            {
                return;
            }

            string html;
            try
            {
                // WebClient is IDisposable; release it as soon as the download is done.
                using (WebClient web = new WebClient())
                {
                    // Decode the response with the system default encoding (as before).
                    web.Encoding = Encoding.Default;
                    html = web.DownloadString(url);
                }
            }
            catch (WebException ex)
            {
                // Covers both network failures and URLs that cannot be resolved.
                MessageBox.Show("Failed to download the page: " + ex.Message);
                return;
            }

            string emails = ExtractEmails(html);
            textBox2.Text = emails;

            try
            {
                // The using block flushes and closes the writer. Without it the
                // buffered text may never reach the file and the handle stays open.
                using (StreamWriter sw = new StreamWriter(OutputPath, true))
                {
                    sw.WriteLine(emails);
                }
            }
            catch (IOException ex)
            {
                MessageBox.Show("Failed to write " + OutputPath + ": " + ex.Message);
            }
            catch (UnauthorizedAccessException ex)
            {
                MessageBox.Show("Failed to write " + OutputPath + ": " + ex.Message);
            }
        }

        /// <summary>
        /// Returns every match of <see cref="EmailPattern"/> in <paramref name="html"/>,
        /// one per line, in the order they occur (duplicates are kept).
        /// </summary>
        /// <param name="html">Text to scan.</param>
        /// <returns>The matched addresses, each followed by a line break; empty if none.</returns>
        private static string ExtractEmails(string html)
        {
            StringBuilder sb = new StringBuilder();
            foreach (Match m in EmailPattern.Matches(html))
            {
                sb.AppendLine(m.Value);
            }
            return sb.ToString();
        }
    }
}

 

posted @ 2015-06-14 20:46  九省巡按  阅读(430)  评论(0)  编辑  收藏  举报