zoukankan      html  css  js  c++  java
  • 抓取网页萃取网页内容的代码 选择自 liujien 的 Blog

    ' Address of the page that this script downloads.
    Dim sUrl : sUrl = "http://travel.state.gov/visa/frvi_bulletincurrent.html"
     Function streamtochar(StrStream)
     set stream=CreateObject("ADODB.Stream")
     stream.type=1
     stream.Mode=3
     stream.Open
     stream.Write Strstream
     stream.Position= 0
     stream.Type= 2
     stream.Charset="gb2312"
     streamtochar= stream.ReadText
     stream.Close
     set stream=nothing
     End Function
     ' NOTE(review): i is not referenced anywhere else in the visible code; this looks like a stray statement - confirm before removing.
     i = i + 1
     function getContentByUrl(url)
     set XmlHttp = CreateObject("MSXML2.XMLHTTP")
     XmlHttp.open "GET",url,false
     XmlHttp.send
     getContentByUrl = streamtochar(oXmlHttp.responseBody)
     set XmlHttp=nothing
     end function
    
     function getRealContent(url)
     sContent = getContentByUrl(url)
     getRealContent=sContent
     end function
    
    ' Downloads the page at sUrl, then cuts a URL and a date string out of the
    ' returned text by locating fixed marker strings with InStr and slicing with Mid.
    html= getContentByUrl(surl)
     ' NOTE(review): two assignments share the next line with no ":" separator, and both
     ' search for the same " " literal - the original marker strings appear to have been
     ' lost; TODO restore them from the original post.
     url_start=inStr(html," " )  url_end=inStr(html," ")
     url=Mid(html,url_start,url_end-url_start)
     ' NOTE(review): the string literal on the next line is never closed and the Replace
     ' call is incomplete - presumably damaged the same way; TODO restore.
     url=replace(url,"“) 
     ' The date text starts 57 characters after the position of "Washington, D.C. "
     ' and ends 14 characters before the position of " A. STATUTORY".
     Date_start=inStr(html,"Washington, D.C. ")+57
     Date_end=inStr(html," A. STATUTORY")-14
     Date_T=Mid(html,Date_start,Date_end-Date_start)
  • 相关阅读:
    使用 pandas 导出数据
    Vue -- 基础语法和使用
    Django-用户模块与权限系统相关
    rest-framework之权限组件
    rest-framework之认证组件
    rest-framework之解析器
    Markdown -语法说明
    rest-framework之APIView 序列化组件
    eggjs-对接微信公众号
    常用站点
  • 原文地址:https://www.cnblogs.com/guola/p/400867.html
Copyright © 2011-2022 走看看