您现在的位置是：网站首页 > 编程资料 > 编程资料

百度小偷_小偷/采集_

2023-05-25 322人已围观

简介 百度小偷_小偷/采集_

<%
' Converts a raw byte string (such as XMLHTTP.responseBody) into a VBScript
' string, then passes the decoded text through ubb() and returns that result.
'
' Bytes below &H80 are emitted as single characters. Any other byte is
' treated as the lead byte of a two-byte character and combined with the
' byte that follows it.
'
' vIn     - byte data to decode.
' Returns - whatever ubb() returns for the decoded text.
'
' NOTE(review): Chr() with a two-byte code presumably relies on the server
' running under a DBCS ANSI code page (e.g. GBK) - confirm for the target host.
Function bytes2BSTR(vIn)
    ' Locals are declared so they no longer leak into the page's global scope.
    Dim strReturn, i, byteCount, ThisCharCode, NextCharCode

    strReturn = ""
    byteCount = LenB(vIn)
    i = 1

    Do While i <= byteCount
        ThisCharCode = AscB(MidB(vIn, i, 1))

        If ThisCharCode < &H80 Then
            ' Single-byte character.
            strReturn = strReturn & Chr(ThisCharCode)
            i = i + 1
        ElseIf i < byteCount Then
            ' Lead byte followed by a trail byte: combine into one character.
            NextCharCode = AscB(MidB(vIn, i + 1, 1))
            strReturn = strReturn & Chr(CLng(ThisCharCode) * &H100 + CInt(NextCharCode))
            i = i + 2
        Else
            ' Lead byte with no trail byte (truncated input). The original
            ' code called AscB on an empty string here and raised a runtime
            ' error; drop the dangling byte instead.
            i = i + 1
        End If
    Loop

    bytes2BSTR = ubb(strReturn)
End Function

' Fetches a Baidu search result page for the given keyword and returns the
' result of running the response body through bytes2BSTR().
'
' key     - search keyword (untrusted user input).
' Returns - the value produced by bytes2BSTR() for the response body.
'
' The page offset is read from request("pn"). Both values are URL-encoded
' before being placed in the query string so that characters such as
' spaces, "&" or "#" cannot truncate the query or inject extra parameters.
'
' NOTE(review): Server.URLEncode encodes according to the page/session code
' page; confirm it matches the encoding the remote site expects for "wd".
Function dq(key)
    Dim XmlHttp, targetUrl

    ' & "" forces a string so a missing parameter encodes as an empty value.
    targetUrl = "http://www.baidu.com/s?wd=" & Server.URLEncode(key & "") & _
                "&pn=" & Server.URLEncode(request("pn") & "")

    Set XmlHttp = CreateObject("Microsoft.XMLHTTP")
    XmlHttp.Open "GET", targetUrl, False   ' False = synchronous request
    XmlHttp.setRequestHeader "Content-Type", "text/XML"
    XmlHttp.Send

    dq = bytes2BSTR(XmlHttp.responseBody)

    ' Release the COM object explicitly once the body has been consumed.
    Set XmlHttp = Nothing
End Function

' Rewrites line-break markers in Str and returns the resulting string.
'
' Steps, in order:
'   1. every "{br}" placeholder is replaced with a fixed literal;
'   2. every vbCrLf is replaced with the same literal;
'   3. three further Replace passes each substitute a longer literal with a
'      shorter one.
'
' Str is reassigned in place; VBScript passes arguments ByRef by default, so
' a variable passed by the caller is modified as well.
'
' NOTE(review): the string literals below now contain raw line breaks, which
' is not valid VBScript. They look like they originally held HTML markup that
' was lost when this listing was extracted - restore from the original file
' before use.
Function BR(Str)
Str = Replace(Str,"{br}","
")
Str = Replace(Str,vbcrlf,"
")
Str = Replace(Str,"

","
")
Str = Replace(Str,"

","
")
Str = Replace(Str,"

","
")
BR = Str
End Function


' Builds the output for a fetched search-result page.
'
' str     - decoded text of the fetched page.
' Returns - the fixed "nothing found" message when the marker text is absent
'           from str; otherwise a string assembled from, in order:
'             1. every regex match of the result-cell pattern, each passed
'                through BR() and then cleaned by several replacements;
'             2. the first match of the "results found ... seconds" summary;
'             3. the first match of a trailing block ending in </div>, with
'                its href values wrapped in double quotes.
'
' The existing inline comment on the replacement that follows the </font>
' pattern reads "separator between each result entry".
'
' NOTE(review): many string literals and regex patterns in this function are
' empty, span several lines, or are cut off (one Replace call is never
' closed). They look like they originally contained HTML markup that was lost
' when this listing was extracted - restore from the original file before use.
function ubb(str)

' Guard: without the summary marker the page is treated as having no results.
if instr(str,"找到相关网页") = 0 then
ubb = "没有搜索到任何内容"
exit function
end if

' Line breaks are first turned into the "{br}" placeholder.
str = Replace(str,vbcrlf,"{br}")
str = Replace(str,"
","{br}")
str = Replace(str,"",""&vbcrlf)
str = Replace(str,"

dim re,Match,Matches
set re = New RegExp
re.Global = True
re.IgnoreCase = True

' Collect every span that ends in a closing </td> tag.
re.Pattern=".*\(.*)\<\/td>"

Set Matches = re.Execute(str)

' Append each match, run through BR(), to the return value.
For Each Match in Matches
ubb=ubb&BR(Match.value)
next
' Remove the links whose pattern contains the "百度快照" text.
re.Pattern="(\- \百度快照\<\/a>)"
ubb = re.replace(ubb,"")
re.Pattern="(\
.[^\<]*\<\/a>)"
ubb = re.replace(ubb,"")
re.Pattern="(\.[^\<]*\<\/font>)"
ubb = re.replace(ubb,"


") '每一条信息的间隔
ubb = Replace(ubb,"","")
ubb = Replace(ubb,"","")
ubb = BR(UBB)


' Append the summary text, from the marker up to the last "秒" on the line.
' NOTE(review): Matches(0) raises if the pattern finds nothing; the guard at
' the top only checks for the marker text, not for the trailing "秒".
re.Pattern="(找到相关网页.*秒)"
Set Matches = re.Execute(str)
set Match = Matches(0)
ubb = ubb & Match & "
"

str = Replace(str,"

","
"&vbcrlf)


re.Pattern="\

(.*)\<\/div>"
Set Matches = re.Execute(str)
set Match = Matches(0)
' Copy the matched text (Match's default property) into a plain string.
Dim TheLink
TheLink = Match
' Wrap what follows "href=" (after an optional "s") in double quotes.
re.Pattern="href=s?(.[^>]*)"
TheLink = re.replace(TheLink,"href=""$1""")

ubb = ubb & TheLink
end function

' Page entry point: run a search only when a non-empty "wd" parameter was
' supplied, and write the result straight to the response.
Dim searchTerm
searchTerm = request("wd")
If Len(searchTerm) > 0 Then response.write dq(searchTerm)
%>




-六神源码网