项目实例的按钮代码如下:
' Button handler: scrapes the article list of the site whose URL is entered in
' ComboBox2 and stores one row per article in the "文章列表" table.
'
' Steps:
'   1. Load the base URL and read the highest page number from the "pagebar" links.
'   2. Clear the target table.
'   3. Load every page (<base>/p1 .. <base>/pN) and add a row for each
'      <div class="pin"> block found inside "ColumnContainer".
'
' Blocks whose HTML does not match the expected layout are skipped instead of
' aborting the whole run with an exception.
' Example base URL: http://toutiao.com/m6114233861/
Dim ad As WinForm.ComboBox = e.Form.Controls("ComboBox2")

' Read the URL once so the first request and the paged requests use the same address.
Dim baseUrl As String = ad.Text
If baseUrl Is Nothing OrElse baseUrl.Trim() = "" Then
    Return ' nothing to scrape without a URL
End If
baseUrl = baseUrl.Trim()
' Strip trailing slashes so "<base>/" does not turn into "<base>//p1".
Dim pageRoot As String = baseUrl.TrimEnd("/"c)

Dim web As New System.Windows.Forms.WebBrowser
Try
    web.ScriptErrorsSuppressed = True

    ' Load the first page; keep the UI responsive while waiting for completion.
    web.Navigate(baseUrl)
    Do Until web.ReadyState = System.Windows.Forms.WebBrowserReadyState.Complete
        Application.DoEvents()
    Loop

    ' The second-to-last link of the page bar holds the last page number
    ' (the last link is presumably "next page" - confirm against the site).
    ' A missing page bar or non-numeric text means a single page.
    Dim mpg As Integer = 1
    Dim pageBar As System.Windows.Forms.HtmlElement = web.Document.GetElementById("pagebar")
    If pageBar IsNot Nothing Then
        Dim pg = pageBar.GetElementsByTagName("a")
        If pg.Count > 1 Then
            Dim lastPageText As String = pg(pg.Count - 2).InnerText
            Dim lastPage As Integer
            If Integer.TryParse(lastPageText, lastPage) Then
                mpg = lastPage
            End If
        End If
    End If

    DataTables("文章列表").DataRows.Clear()

    For i As Integer = 1 To mpg
        web.Navigate(pageRoot & "/p" & i)
        Do Until web.ReadyState = System.Windows.Forms.WebBrowserReadyState.Complete
            Application.DoEvents()
        Loop

        Dim container As System.Windows.Forms.HtmlElement = web.Document.GetElementById("ColumnContainer")
        If container Is Nothing Then
            Continue For ' page has no article list
        End If

        ' The "keywords" element is the same for every article on the page,
        ' so look it up once per page instead of once per article.
        Dim unitName As String = ""
        Dim bt As System.Windows.Forms.HtmlElement = web.Document.GetElementById("keywords")
        If bt IsNot Nothing Then
            unitName = bt.InnerText & " " & bt.GetAttribute("content")
        End If

        For Each div As Object In container.GetElementsByTagName("div")
            If div.GetAttribute("ClassName") <> "pin" Then
                Continue For ' only "pin" blocks are articles
            End If

            ' Expected layout of a "pin" block: its first table has
            '   row 0: <h3> title and <a> link
            '   row 1: body text in the second <div>
            '   row 2: cells 1..3 = read count, comment count, publish time
            Dim tbs = div.GetElementsByTagName("table")
            If tbs.Count < 1 Then Continue For
            Dim trs = tbs(0).GetElementsByTagName("tr")
            If trs.Count < 3 Then Continue For
            Dim tds = trs(2).GetElementsByTagName("td")
            If tds.Count < 4 Then Continue For

            Dim titleNodes = trs(0).GetElementsByTagName("h3")
            Dim linkNodes = trs(0).GetElementsByTagName("a")
            Dim bodyNodes = trs(1).GetElementsByTagName("div")
            If titleNodes.Count < 1 OrElse linkNodes.Count < 1 OrElse bodyNodes.Count < 2 Then
                Continue For
            End If

            ' Counts are rendered as "<label>:<number>"; keep the part after the
            ' colon, or the whole text when no colon is present.
            Dim readText As String = tds(1).InnerText
            If readText Is Nothing Then readText = ""
            Dim readParts() As String = readText.Split(":"c)

            Dim commentText As String = tds(2).InnerText
            If commentText Is Nothing Then commentText = ""
            Dim commentParts() As String = commentText.Split(":"c)

            ' Create the row only after the block is known to be well-formed,
            ' so a malformed block never leaves a half-filled row behind.
            Dim dr As DataRow = DataTables("文章列表").AddNew()
            dr("单位") = unitName
            dr("文章标题") = titleNodes(0).InnerText
            dr("发布时间") = tds(3).InnerText
            dr("阅读数") = If(readParts.Length > 1, readParts(1), readText)
            dr("评论数") = If(commentParts.Length > 1, commentParts(1), commentText)
            dr("正文") = bodyNodes(1).InnerText
            dr("网址") = linkNodes(0).GetAttribute("href")
        Next
    Next
Finally
    ' The browser control wraps native resources; release them deterministically.
    web.Dispose()
End Try