实例介绍
【实例简介】邮箱蜘蛛采集
【实例截图】
【核心代码】
using System;
using System.Collections.Generic;
using System.ComponentModel;
using System.Data;
using System.Drawing;
using System.Linq;
using System.Text;
using System.Windows.Forms;
using System.Diagnostics;
using FireCrawler.Lib;
namespace FireCrawler
{
public partial class MainForm : Form
{
#region Fields
// Crawl engine for this form: created in the constructor, started and aborted by the
// button handlers, and read by the grid and status-bar refresh methods.
private WebSiteDetector _detector;
#endregion
#region Properties
// Number of bytes downloaded (backing field for ByteCount).
private int nByteCount;
/// <summary>
/// Gets or sets the downloaded byte count; setting it also refreshes the
/// kilobyte read-out text.
/// </summary>
private int ByteCount
{
    get { return nByteCount; }
    set
    {
        nByteCount = value;
        // Integer division truncates, so 1 is added to avoid showing "0 KB"
        // for a partially filled kilobyte.
        this.statusStrip.Text = Commas(nByteCount / 1024 + 1) + " KB";
    }
}
// Number of URIs found (backing field for URLCount).
private int nURLCount;
/// <summary>
/// Gets or sets the number of URLs found; setting it also refreshes the
/// URL status-bar panel text.
/// </summary>
private int URLCount
{
    get { return nURLCount; }
    set
    {
        nURLCount = value;
        this.statusBarPanelURLs.Text = Commas(nURLCount) + " URL found";
    }
}
// Number of files downloaded (backing field for FileCount).
private int nFileCount;
/// <summary>
/// Gets or sets the number of files downloaded; setting it also refreshes the
/// files status-bar panel text.
/// </summary>
private int FileCount
{
    get { return nFileCount; }
    set
    {
        nFileCount = value;
        this.statusBarPanelFiles.Text = Commas(nFileCount) + " file(s) downloaded";
    }
}
#endregion
/// <summary>
/// Builds the form, turns off automatic column generation on both grids, and
/// creates the detector with this form's handlers attached.
/// </summary>
public MainForm()
{
    InitializeComponent();
    dataGridThreads.AutoGenerateColumns = false;
    dataGridContacts.AutoGenerateColumns = false;
    _detector = new WebSiteDetector();
    // Subscribe with += so existing subscribers are kept; plain assignment to an
    // event from outside its declaring type does not compile.
    _detector.StatusChanged += new DetectorStatusChangedEventHandler(DetectorStatusChanged);
    _detector.ContactsFound += new DetectorContactsFoundEventHandler(DetectorContactsFound);
}
#region Helpers
/// <summary>
/// Formats an integer with a comma between every group of three digits,
/// e.g. 1234567 becomes "1,234,567" and -1234 becomes "-1,234".
/// </summary>
/// <param name="nNum">The value to format; may be negative.</param>
/// <returns>The decimal digits of <paramref name="nNum"/> with comma separators.</returns>
string Commas(int nNum)
{
    // Invariant culture guarantees plain ASCII digits and a one-character "-" sign,
    // so the index arithmetic below is valid on every machine.
    string text = nNum.ToString(System.Globalization.CultureInfo.InvariantCulture);
    // Never insert a separator at or before the first digit; for negative numbers
    // the first digit sits at index 1, which prevents output such as "-,123".
    int firstDigit = nNum < 0 ? 1 : 0;
    for (int pos = text.Length - 3; pos > firstDigit; pos -= 3)
    {
        text = text.Insert(pos, ",");
    }
    return text;
}
/// <summary>
/// Shows the settings dialog modally and releases it once it is closed.
/// </summary>
void ShowSettingsDialog()
{
    // A form shown with ShowDialog is not disposed when it closes, so dispose it here.
    using (SettingsForm dialog = new SettingsForm())
    {
        // The dialog result is not acted on by this form.
        dialog.ShowDialog();
    }
}
#endregion
#region UI Events
/// <summary>
/// "Exit" menu handler: closes the main form.
/// </summary>
private void exitToolStripMenuItem_Click(object sender, EventArgs e)
{
    Close();
}
/// <summary>
/// "Settings" menu handler: opens the settings dialog.
/// </summary>
private void settingsToolStripMenuItem_Click(object sender, EventArgs e)
{
    this.ShowSettingsDialog();
}
#endregion
/// <summary>
/// "Go" button handler: reads the seed URLs from the text box (one per line),
/// asks for confirmation, then initialises and starts the detector.
/// </summary>
private void buttonGo_Click(object sender, EventArgs e)
{
    // Split on either line-ending character so pasted text with bare "\n" works,
    // and drop lines that are empty once trimmed.
    var seeds = txtSeeds.Text
        .Split(new[] { '\r', '\n' }, StringSplitOptions.RemoveEmptyEntries)
        .Select(line => line.Trim())
        .Where(line => line.Length > 0)
        .ToArray();
    if (seeds.Length == 0)
    {
        MessageBox.Show(this, "请输入搜索网址","提示");
        return;
    }
    if (_detector.Status == DetectorStatus.Start)
    {
        MessageBox.Show(this, "当前正在搜索中.....","提示");
        return;
    }
    var d = MessageBox.Show(this, "是否开启搜索任务?","启动提示", MessageBoxButtons.OKCancel);
    if (d == System.Windows.Forms.DialogResult.Cancel)
        return;
    for (int i = 0; i < seeds.Length; i++)
    {
        // Only add a scheme when none is present; https seeds must not be
        // turned into "http://https://...".
        if (!HasHttpScheme(seeds[i]))
            seeds[i] = "http://" + seeds[i];
    }
    int layers = (int)Settings.Layers;
    _detector.InitSeeds(seeds,layers);
    _detector.Start();
    tabcontrol.SelectedIndex = 2;
}

// Returns true when the text already starts with an http: or https: scheme (case-insensitive).
private static bool HasHttpScheme(string url)
{
    return url.StartsWith("http:", StringComparison.OrdinalIgnoreCase)
        || url.StartsWith("https:", StringComparison.OrdinalIgnoreCase);
}
/// <summary>
/// "Stop" button handler: when the detector is in the Start state, asks for
/// confirmation and aborts it unless the user cancels.
/// </summary>
private void buttonStop_Click(object sender, EventArgs e)
{
    bool isRunning = _detector.Status == DetectorStatus.Start;
    if (isRunning)
    {
        var answer = MessageBox.Show(this, "是否关闭当前任务?", "关闭提示", MessageBoxButtons.OKCancel);
        if (answer != System.Windows.Forms.DialogResult.Cancel)
        {
            _detector.Abort();
        }
    }
}
// Signature of the grid-refresh methods, used to re-dispatch them through Invoke.
delegate void UpdateDataGridCallback(WebSiteDetector d);
/// <summary>
/// Rebinds the threads grid to the detector's crawlers. When the grid reports
/// InvokeRequired, the call is re-dispatched through the form's Invoke.
/// </summary>
/// <param name="d">Detector whose Crawlers are shown.</param>
private void UpdateDataGrid(WebSiteDetector d)
{
    try
    {
        if (!this.dataGridThreads.InvokeRequired)
        {
            // Assign the element type first, then the data, as a two-step rebind.
            dataGridThreads.DataSource = typeof(CrawlerThread[]);
            dataGridThreads.DataSource = d.Crawlers;
            return;
        }

        UpdateDataGridCallback rerun = new UpdateDataGridCallback(UpdateDataGrid);
        this.Invoke(rerun, new object[] { d });
    }
    catch (ObjectDisposedException)
    {
        // Deliberately ignored: nothing to refresh once the control is disposed.
    }
}
/// <summary>
/// Rebinds the contacts grid to a snapshot array of the detector's output items.
/// When the grid reports InvokeRequired, the call is re-dispatched through the
/// form's Invoke.
/// </summary>
/// <param name="d">Detector whose OutputItems are shown.</param>
private void UpdateDataGridContactOutput(WebSiteDetector d)
{
    try
    {
        if (!this.dataGridContacts.InvokeRequired)
        {
            // Assign the element type first, then the data, as a two-step rebind.
            dataGridContacts.DataSource = typeof(ContactOutputItem[]);
            dataGridContacts.DataSource = d.OutputItems.ToArray();
            return;
        }

        UpdateDataGridCallback rerun = new UpdateDataGridCallback(UpdateDataGridContactOutput);
        this.Invoke(rerun, new object[] { d });
    }
    catch (ObjectDisposedException)
    {
        // Deliberately ignored: nothing to refresh once the control is disposed.
    }
}
// Parameterless signature used to re-dispatch UpdateStatusStrip through Invoke.
delegate void UpdateStatusStripCallback();
/// <summary>
/// Refreshes the four status-bar panels (pending URLs, checked URLs, speed,
/// traffic) from the detector. When the status strip reports InvokeRequired,
/// the call is re-dispatched through the form's Invoke.
/// </summary>
private void UpdateStatusStrip()
{
    if (!this.statusStrip.InvokeRequired)
    {
        statusBarPanelURLs.Text = string.Format("待检测URL: {0}", _detector.UrlsQueueFrontier.Count.ToString());
        statusBarPanelFiles.Text = string.Format("已检测URL: {0}", _detector.CrawleHistroy.Count.ToString());
        statusBarPanelSpeed.Text = string.Format("速度: {0:0.00}KB/sec", _detector.GetDetectSpeed());
        // Multiplying by 1.0 first forces floating-point division.
        statusBarPanelByteCount.Text = string.Format("流量: {0:0.00}MB", 1.0 * _detector.TotalSize / 1024 / 1024);
        return;
    }

    UpdateStatusStripCallback rerun = new UpdateStatusStripCallback(UpdateStatusStrip);
    this.Invoke(rerun, new object[] { });
}
/// <summary>
/// Detector StatusChanged handler: refreshes the threads grid from the sender.
/// </summary>
private void DetectorStatusChanged(object sender, DetectorStatusChangedEventArgs e)
{
    UpdateDataGrid((WebSiteDetector)sender);
}
/// <summary>
/// Detector ContactsFound handler: refreshes the contacts grid from the sender.
/// </summary>
void DetectorContactsFound(object sender, DetectorContactsFoundEventArgs e)
{
    UpdateDataGridContactOutput((WebSiteDetector)sender);
}
/// <summary>
/// Timer tick handler: refreshes the status-bar panels.
/// </summary>
private void timer_Tick(object sender, EventArgs e)
{
    this.UpdateStatusStrip();
}
/// <summary>
/// Form-closing handler: aborts the detector, then asks it to dump to "dump.txt".
/// </summary>
private void MainForm_FormClosing(object sender, FormClosingEventArgs e)
{
    const string dumpFile = "dump.txt";

    _detector.Abort();
    _detector.Dump(dumpFile);
}
/// <summary>
/// "About" menu handler: shows the about box modally, owned by this form.
/// </summary>
private void aboutToolStripMenuItem_Click(object sender, EventArgs e)
{
    // A form shown with ShowDialog is not disposed when it closes, so dispose it here.
    using (AboutForm form = new AboutForm())
    {
        form.ShowDialog(this);
    }
}
/// <summary>
/// "Baidu" button handler: shows the Baidu search dialog modally and, if it is
/// confirmed with OK, triggers the Go button.
/// </summary>
private void btnBaidu_Click(object sender, EventArgs e)
{
    bool accepted;
    // A form shown with ShowDialog is not disposed when it closes, so dispose it here.
    using (BaiduForm baiduForm = new BaiduForm(this))
    {
        accepted = baiduForm.ShowDialog(this) == System.Windows.Forms.DialogResult.OK;
    }
    if (accepted)
    {
        buttonGo.PerformClick();
    }
}
/// <summary>
/// Writes the given seed URLs into the seeds text box, one per line, replacing
/// its previous content.
/// </summary>
/// <param name="seeds">Seed URLs to show; null is treated as an empty list.</param>
public void AcceptBaiduResult(string[] seeds)
{
    StringBuilder searchText = new StringBuilder();
    if (seeds != null)
    {
        foreach (var seed in seeds)
        {
            // Append rather than overwrite, so every seed ends up on its own line.
            searchText.Append(seed).Append("\r\n");
        }
    }
    txtSeeds.Text = searchText.ToString();
}
/// <summary>
/// "Start" button handler: forwards to the Go button's click logic.
/// </summary>
private void btnStart_Click(object sender, EventArgs e)
{
    this.buttonGo.PerformClick();
}
/// <summary>
/// "Excel" button handler: passes the contacts grid to
/// ExcelUtil.ExportDataGridViewToExcel.
/// </summary>
private void btnExcel_Click(object sender, EventArgs e)
{
    var contactsGrid = dataGridContacts;
    FireCrawler.Common.ExcelUtil.ExportDataGridViewToExcel(contactsGrid);
}
}
}
好例子网口号:伸出你的我的手 — 分享!
相关软件
网友评论
小贴士
感谢您为本站写下的评论,您的评论对其它用户来说具有重要的参考价值,所以请认真填写。
- 类似“顶”、“沙发”之类没有营养的文字,对勤劳贡献的楼主来说是令人沮丧的反馈信息。
- 相信您也不想看到一排文字/表情墙,所以请不要反馈意义不大的重复字符,也请尽量不要纯表情的回复。
- 提问之前请再仔细看一遍楼主的说明,或许是您遗漏了。
- 请勿到处挖坑绊人、招贴广告。既占空间让人厌烦,又没人会搭理,于人于己都无利。
关于好例子网
本站旨在为广大IT学习爱好者提供一个非营利性互相学习交流分享平台。本站所有资源都可以被免费获取学习研究。本站资源来自网友分享,对搜索内容的合法性不具有预见性、识别性、控制性,仅供学习研究,请务必在下载后24小时内给予删除,不得用于其他任何用途,否则后果自负。基于互联网的特殊性,平台无法对用户传输的作品、信息、内容的权属或合法性、安全性、合规性、真实性、科学性、完整性、有效性等进行实质审查;无论平台是否已进行审查,用户均应自行承担因其传输的作品、信息、内容而可能或已经产生的侵权或权属纠纷等法律责任。本站所有资源不代表本站的观点或立场,基于网友分享,根据中国法律《信息网络传播权保护条例》第二十二与二十三条之规定,若资源存在侵权或相关问题请联系本站客服人员,点此联系我们。关于更多版权及免责申明参见 版权及免责申明


支持(0) 盖楼(回复)