关于多个frame页面的抓取

来源:互联网 发布:java 可变参数 编辑:程序博客网 时间:2024/05/09 21:54

using System;

using System.Collections.Generic;

using System.ComponentModel;

using System.Data;

using System.Drawing;

using System.Linq;

using System.Text;

using System.Windows.Forms;

using mshtml;

 

namespace WindowsFormsApplication3

{

    public partial class Form1 : Form

    {

        public Form1()

        {

            InitializeComponent();

        }

 

        private void webBrowser1_DocumentCompleted(object sender, WebBrowserDocumentCompletedEventArgs e)

        {

            IHTMLDocument2 doc = (IHTMLDocument2)webBrowser1.Document.DomDocument;

 

            foreach (IHTMLElement LV0 in doc.all)

            {

                if (LV0.tagName.ToUpper() == "FRAME")

                {

                    IHTMLFrameBase2 LV0_FRAME = (IHTMLFrameBase2)LV0;

                    if (LV0_FRAME.contentWindow.name == "frm4")

                    {

                        foreach (IHTMLElement LV1 in LV0_FRAME.contentWindow.document.all)

                        {

                            if (LV1.tagName.ToUpper() == "FRAME")

                            {

                                IHTMLFrameBase2 LV1_FRAME = (IHTMLFrameBase2)LV1;

                                if (LV1_FRAME.contentWindow.name == "frm002")

                                {

                                    foreach (IHTMLElement LV2 in LV1_FRAME.contentWindow.document.all)

                                    {

                                        if (LV2.tagName.ToUpper() == "TABLE")

                                        {

                                           // MessageBox.Show(LV2.innerHTML);

                                            HTMLTable table = (HTMLTable)LV2;

                                            HTMLTableCell cell=null;

                                            HTMLTableRow row= null;

                                            object index=1;

                                            string text = "";

                                            row= (HTMLTableRow)table.rows.item(index,index);

                                            for (int i = 0; i < row.cells.length; i++)

                                            {

                                                object indexcell = i;

                                                string str = ",";

                                                cell = (HTMLTableCell)row.cells.item(indexcell, indexcell);

                                                if (i == 1)

                                                {

                                                   str = cell.innerHTML;

                                                   str = str.Replace("<EM>", ",");

                                                   str = str.Replace("</EM>", ",");                                                  

                                                   text = text + str;

                                                }

                                                else

                                                text = text + cell.innerText+str;

                                            }

                                           MessageBox.Show(text);

                                           HTMLDocument doc1 = (HTMLDocument)LV2.document;

                                           HTMLButtonElement button = (HTMLButtonElement)doc1.getElementById("showme");

                                           button.click();

                                        }

                                    }

                                }  

                            }

                        }

                    }

 

                }

            }

        }

 

 

     

 

        private void button1_Click(object sender, EventArgs e)

        {

            webBrowser1.Navigate(textBox1.Text);

        }

    }

}

 

 

原创粉丝点击