Foxtable(狐表) → 用户栏目 → 专家坐堂 → html 采集的问题


  共有2242人关注过本帖 | 树形 | 打印 | 复制链接

主题:html 采集的问题

帅哥哟,离线,有人找我吗?
有点甜
  1楼 | 信息 | 搜索 | 邮箱 | 主页 | UC


加好友 发短信
等级:版主 帖子:85326 积分:427815 威望:0 精华:5 注册:2012/10/18 22:13:00
  发帖心情 Post By:2017/8/10 9:36:00 [显示全部帖子]

' Scrape table rows out of the HTML saved in d:\test.txt and print, for each row:
'   1. the raw first "<td ...>text<" fragment,
'   2. the first match of the cell-text pattern (text that follows a <td ...> tag, up to the next "<"),
'   3. the first title="..." attribute value, when the row has one.
' Each item is printed only when the row actually contains it, so rows without
' any <td> (e.g. header rows built from <th>) are skipped instead of raising an
' index-out-of-range error.

' Strip every line-break flavour (CRLF, lone CR, lone LF) and tabs up front:
' "." in the patterns below does not match a line feed, so a row that spans
' several lines would otherwise never be matched.
Dim data As String = FileSys.ReadAllText("d:\test.txt").Replace(vbCr, "").Replace(vbLf, "").Replace(Chr(9), "")

' One whole <tr ...> ... </tr> row.
Dim rowRegex As New System.Text.RegularExpressions.Regex("(?><tr.*?>).*?</tr>")
' A <td ...> opening tag plus its text, including the "<" that ends the text.
Dim rawCellRegex As New System.Text.RegularExpressions.Regex("<td.*?>.*?<")
' Only the text between a <td ...> tag and the next "<" (tag itself excluded via lookaround).
Dim cellTextRegex As New System.Text.RegularExpressions.Regex("(?<=<td.*?>).*?(?=<)")
' The value of a title="..." attribute.
Dim titleRegex As New System.Text.RegularExpressions.Regex("(?<=title="").*?(?="")")

For Each row As System.Text.RegularExpressions.Match In rowRegex.Matches(data)
    'Output.Show(row.Value)   ' debug: dump the whole row

    ' Regex.Match returns the first match (same item the collection's index 0 would give);
    ' Success tells us whether there was one at all.
    Dim rawCell As System.Text.RegularExpressions.Match = rawCellRegex.Match(row.Value)
    If rawCell.Success Then
        Output.Show(rawCell.Value)
    End If

    Dim cellText As System.Text.RegularExpressions.Match = cellTextRegex.Match(row.Value)
    If cellText.Success Then
        Output.Show(cellText.Value)
    End If

    Dim title As System.Text.RegularExpressions.Match = titleRegex.Match(row.Value)
    If title.Success Then
        Output.Show(title.Value)
    End If
Next

 回到顶部