实例介绍
【实例简介】邮箱蜘蛛采集
【实例截图】
【核心代码】
using System;
using System.Collections.Generic;
using System.ComponentModel;
using System.Data;
using System.Drawing;
using System.Linq;
using System.Text;
using System.Windows.Forms;
using System.Diagnostics;
using FireCrawler.Lib;

namespace FireCrawler
{
    /// <summary>
    /// Main window of the crawler. Starts and stops a <see cref="WebSiteDetector"/>
    /// and displays its crawler threads, the contacts it reports and a few
    /// running statistics in the status bar.
    /// </summary>
    public partial class MainForm : Form
    {
        #region Fields

        // Detector driven by this form; created once in the constructor.
        private WebSiteDetector _detector;

        #endregion

        #region Properties

        // number of bytes downloaded
        private int nByteCount;

        /// <summary>
        /// Byte counter. Setting it also writes the value, converted to KB
        /// (integer division by 1024, plus one), to the status strip text.
        /// </summary>
        private int ByteCount
        {
            get { return nByteCount; }
            set
            {
                nByteCount = value;
                this.statusStrip.Text = Commas(nByteCount / 1024 + 1) + " KB";
            }
        }

        // number of Uri's found
        private int nURLCount;

        /// <summary>
        /// URL counter. Setting it also refreshes the URL status bar panel.
        /// </summary>
        private int URLCount
        {
            get { return nURLCount; }
            set
            {
                nURLCount = value;
                this.statusBarPanelURLs.Text = Commas(nURLCount) + " URL found";
            }
        }

        // number of files downloaded
        private int nFileCount;

        /// <summary>
        /// File counter. Setting it also refreshes the files status bar panel.
        /// </summary>
        private int FileCount
        {
            get { return nFileCount; }
            set
            {
                nFileCount = value;
                this.statusBarPanelFiles.Text = Commas(nFileCount) + " file(s) downloaded";
            }
        }

        #endregion

        /// <summary>
        /// Builds the form, turns off column auto-generation on both grids and
        /// subscribes to the detector's status and contact notifications.
        /// </summary>
        public MainForm()
        {
            InitializeComponent();

            dataGridThreads.AutoGenerateColumns = false;
            dataGridContacts.AutoGenerateColumns = false;

            _detector = new WebSiteDetector();
            // Subscribe with += so handlers attached elsewhere are not replaced.
            _detector.StatusChanged += new DetectorStatusChangedEventHandler(DetectorStatusChanged);
            _detector.ContactsFound += new DetectorContactsFoundEventHandler(DetectorContactsFound);
        }

        #region Helpers

        /// <summary>
        /// Formats an integer with a comma between each group of three digits,
        /// e.g. 1234567 becomes "1,234,567".
        /// </summary>
        /// <param name="nNum">Number to format.</param>
        /// <returns>The grouped decimal representation of <paramref name="nNum"/>.</returns>
        string Commas(int nNum)
        {
            // Invariant culture pins the separator to ',' and the group size to 3,
            // and keeps the sign in front of negative values.
            return nNum.ToString("N0", System.Globalization.CultureInfo.InvariantCulture);
        }

        /// <summary>
        /// Shows the settings dialog modally and disposes it afterwards.
        /// </summary>
        void ShowSettingsDialog()
        {
            // A form shown with ShowDialog is not disposed when it closes.
            using (SettingsForm dialog = new SettingsForm())
            {
                if (dialog.ShowDialog() == DialogResult.OK)
                {
                    // Nothing to do here; the dialog result is not used by this form.
                }
            }
        }

        /// <summary>
        /// Returns true when <paramref name="seed"/> already starts with
        /// "http:" or "https:" (case-insensitive).
        /// </summary>
        private static bool HasHttpScheme(string seed)
        {
            return seed.StartsWith("http:", StringComparison.OrdinalIgnoreCase)
                || seed.StartsWith("https:", StringComparison.OrdinalIgnoreCase);
        }

        /// <summary>
        /// Splits the seed text into one URL per line, dropping blank lines and
        /// surrounding whitespace, and prefixes "http://" to every entry that
        /// has no http/https scheme.
        /// </summary>
        /// <param name="text">Raw multi-line text from the seed box.</param>
        /// <returns>The normalized seeds; empty when no usable line exists.</returns>
        private static string[] ParseSeeds(string text)
        {
            var seeds = new List<string>();
            if (string.IsNullOrEmpty(text))
            {
                return seeds.ToArray();
            }

            // Accept both Windows and Unix line endings (pasted text may use either).
            var lines = text.Split(new[] { "\r\n", "\n" }, StringSplitOptions.RemoveEmptyEntries);
            foreach (var line in lines)
            {
                var seed = line.Trim();
                if (seed.Length == 0)
                {
                    continue;
                }

                if (!HasHttpScheme(seed))
                {
                    seed = "http://" + seed;
                }

                seeds.Add(seed);
            }

            return seeds.ToArray();
        }

        #endregion

        #region UI Events

        /// <summary>Closes the main window.</summary>
        private void exitToolStripMenuItem_Click(object sender, EventArgs e)
        {
            this.Close();
        }

        /// <summary>Opens the settings dialog.</summary>
        private void settingsToolStripMenuItem_Click(object sender, EventArgs e)
        {
            ShowSettingsDialog();
        }

        #endregion

        /// <summary>
        /// Validates the seed list, asks the user for confirmation, then
        /// initializes and starts the detector and switches to the third tab.
        /// </summary>
        private void buttonGo_Click(object sender, EventArgs e)
        {
            var seeds = ParseSeeds(txtSeeds.Text);
            if (seeds.Length == 0)
            {
                MessageBox.Show(this, "请输入搜索网址","提示");
                return;
            }

            if (_detector.Status == DetectorStatus.Start)
            {
                MessageBox.Show(this, "当前正在搜索中.....","提示");
                return;
            }

            var d = MessageBox.Show(this, "是否开启搜索任务?","启动提示", MessageBoxButtons.OKCancel);
            if (d == System.Windows.Forms.DialogResult.Cancel)
            {
                return;
            }

            int layers = (int)Settings.Layers;
            _detector.InitSeeds(seeds, layers);
            _detector.Start();

            tabcontrol.SelectedIndex = 2;
        }

        /// <summary>
        /// Asks for confirmation and aborts the detector. Does nothing unless
        /// the detector status is <c>DetectorStatus.Start</c>.
        /// </summary>
        private void buttonStop_Click(object sender, EventArgs e)
        {
            if (_detector.Status != DetectorStatus.Start)
            {
                return;
            }

            var d = MessageBox.Show(this, "是否关闭当前任务?", "关闭提示", MessageBoxButtons.OKCancel);
            if (d == System.Windows.Forms.DialogResult.Cancel)
            {
                return;
            }

            _detector.Abort();
        }

        delegate void UpdateDataGridCallback(WebSiteDetector d);

        /// <summary>
        /// Rebinds the thread grid to the detector's crawlers, marshalling the
        /// call to the grid's thread when required.
        /// </summary>
        /// <param name="d">Detector whose <c>Crawlers</c> are displayed.</param>
        private void UpdateDataGrid(WebSiteDetector d)
        {
            try
            {
                if (this.dataGridThreads.InvokeRequired)
                {
                    UpdateDataGridCallback callback = new UpdateDataGridCallback(UpdateDataGrid);
                    this.Invoke(callback, new object[] { d });
                }
                else
                {
                    // NOTE(review): assigning the element type first presumably forces
                    // the grid to drop the old binding before the real data is set.
                    dataGridThreads.DataSource = typeof(CrawlerThread[]);
                    dataGridThreads.DataSource = d.Crawlers;
                }
            }
            catch (ObjectDisposedException)
            {
                // Deliberately ignored: the form or grid was already disposed.
            }
        }

        /// <summary>
        /// Rebinds the contacts grid to a snapshot of the detector's output
        /// items, marshalling the call to the grid's thread when required.
        /// </summary>
        /// <param name="d">Detector whose <c>OutputItems</c> are displayed.</param>
        private void UpdateDataGridContactOutput(WebSiteDetector d)
        {
            try
            {
                if (this.dataGridContacts.InvokeRequired)
                {
                    UpdateDataGridCallback callback = new UpdateDataGridCallback(UpdateDataGridContactOutput);
                    this.Invoke(callback, new object[] { d });
                }
                else
                {
                    // NOTE(review): same rebind pattern as the thread grid — confirm intent.
                    dataGridContacts.DataSource = typeof(ContactOutputItem[]);
                    dataGridContacts.DataSource = d.OutputItems.ToArray();
                }
            }
            catch (ObjectDisposedException)
            {
                // Deliberately ignored: the form or grid was already disposed.
            }
        }

        delegate void UpdateStatusStripCallback();

        /// <summary>
        /// Refreshes the four status bar panels (pending URLs, visited URLs,
        /// speed, traffic) from the detector, marshalling the call to the status
        /// strip's thread when required.
        /// </summary>
        private void UpdateStatusStrip()
        {
            if (this.statusStrip.InvokeRequired)
            {
                UpdateStatusStripCallback callback = new UpdateStatusStripCallback(UpdateStatusStrip);
                this.Invoke(callback);
                return;
            }

            statusBarPanelURLs.Text = string.Format("待检测URL: {0}", _detector.UrlsQueueFrontier.Count.ToString());
            statusBarPanelFiles.Text = string.Format("已检测URL: {0}", _detector.CrawleHistroy.Count.ToString());
            statusBarPanelSpeed.Text = string.Format("速度: {0:0.00}KB/sec", _detector.GetDetectSpeed());
            // Multiply by 1.0 first so the divisions are done in floating point.
            statusBarPanelByteCount.Text = string.Format("流量: {0:0.00}MB", 1.0 * _detector.TotalSize / 1024 / 1024);
        }

        /// <summary>Detector status notification: refreshes the thread grid.</summary>
        private void DetectorStatusChanged(object sender, DetectorStatusChangedEventArgs e)
        {
            WebSiteDetector d = (WebSiteDetector)sender;
            UpdateDataGrid(d);
        }

        /// <summary>Detector contact notification: refreshes the contacts grid.</summary>
        void DetectorContactsFound(object sender, DetectorContactsFoundEventArgs e)
        {
            WebSiteDetector d = (WebSiteDetector)sender;
            UpdateDataGridContactOutput(d);
        }

        /// <summary>Timer tick: refreshes the status bar.</summary>
        private void timer_Tick(object sender, EventArgs e)
        {
            UpdateStatusStrip();
        }

        /// <summary>
        /// On close, aborts the detector and then calls its <c>Dump</c> with
        /// "dump.txt".
        /// </summary>
        private void MainForm_FormClosing(object sender, FormClosingEventArgs e)
        {
            _detector.Abort();
            _detector.Dump("dump.txt");
        }

        /// <summary>Shows the About dialog modally and disposes it afterwards.</summary>
        private void aboutToolStripMenuItem_Click(object sender, EventArgs e)
        {
            using (AboutForm form = new AboutForm())
            {
                form.ShowDialog(this);
            }
        }

        /// <summary>
        /// Shows the Baidu dialog; when it is confirmed, triggers the same action
        /// as the Go button.
        /// </summary>
        private void btnBaidu_Click(object sender, EventArgs e)
        {
            DialogResult d;
            using (BaiduForm baiduForm = new BaiduForm(this))
            {
                d = baiduForm.ShowDialog(this);
            }

            if (d == System.Windows.Forms.DialogResult.OK)
            {
                buttonGo.PerformClick();
            }
        }

        /// <summary>
        /// Replaces the seed box content with the given seeds, one per line
        /// (each followed by "\r\n").
        /// </summary>
        /// <param name="seeds">Seed URLs to show; null is treated as empty.</param>
        public void AcceptBaiduResult(string[] seeds)
        {
            var searchText = new StringBuilder();
            if (seeds != null)
            {
                foreach (var seed in seeds)
                {
                    searchText.Append(seed);
                    searchText.Append("\r\n");
                }
            }

            txtSeeds.Text = searchText.ToString();
        }

        /// <summary>Start button: triggers the same action as the Go button.</summary>
        private void btnStart_Click(object sender, EventArgs e)
        {
            buttonGo.PerformClick();
        }

        /// <summary>Exports the contacts grid to Excel through <c>ExcelUtil</c>.</summary>
        private void btnExcel_Click(object sender, EventArgs e)
        {
            FireCrawler.Common.ExcelUtil.ExportDataGridViewToExcel(dataGridContacts);
        }
    }
}
好例子网口号:伸出你的我的手 — 分享!
网友评论
小贴士
感谢您为本站写下的评论,您的评论对其它用户来说具有重要的参考价值,所以请认真填写。
- 类似“顶”、“沙发”之类没有营养的文字,对勤劳贡献的楼主来说是令人沮丧的反馈信息。
- 相信您也不想看到一排文字/表情墙,所以请不要反馈意义不大的重复字符,也请尽量不要纯表情的回复。
- 提问之前请再仔细看一遍楼主的说明,或许是您遗漏了。
- 请勿到处挖坑绊人、招贴广告。既占空间让人厌烦,又没人会搭理,于人于己都无利。
关于好例子网
本站旨在为广大IT学习爱好者提供一个非营利性互相学习交流分享平台。本站所有资源都可以被免费获取学习研究。本站资源来自网友分享,对搜索内容的合法性不具有预见性、识别性、控制性,仅供学习研究,请务必在下载后24小时内给予删除,不得用于其他任何用途,否则后果自负。基于互联网的特殊性,平台无法对用户传输的作品、信息、内容的权属或合法性、安全性、合规性、真实性、科学性、完整性、有效性等进行实质审查;无论平台是否已进行审查,用户均应自行承担因其传输的作品、信息、内容而可能或已经产生的侵权或权属纠纷等法律责任。本站所有资源不代表本站的观点或立场,基于网友分享,根据中国法律《信息网络传播权保护条例》第二十二条与第二十三条之规定,若资源存在侵权或相关问题请联系本站客服人员,点此联系我们。关于更多版权及免责声明参见 版权及免责声明
支持(0) 盖楼(回复)