import urllib2
# Fetch the Baidu home page and print the raw response body.
connect = urllib2.Request('http://www.baidu.com')
url1 = urllib2.urlopen(connect)
try:
    # The response object is bound to `url1`; the original read from the
    # undefined name `url`, which raised NameError.
    print(url1.read())
finally:
    # Release the connection even when the read fails.
    url1.close()
import urllib2
# Download pages 1-480 of one bbs.tianya.cn thread and save each page to its
# own HTML file under D:/noval/.
url1 = "http://bbs.tianya.cn/post-16-835537-"
url3 = ".shtml#ty_vip_look[%E6%8B%89%E9%A3%8E%E7%86%8A%E7%8C%AB"
for i in range(1, 481):
    a = urllib2.Request(url1 + str(i) + url3)
    b = urllib2.urlopen(a)
    try:
        code = b.read()
    finally:
        # Release the connection even when the read fails.
        b.close()
    path = "D:/noval/天眼传人" + str(i) + ".html"
    # Binary mode: the body is written exactly as received, with no newline
    # translation. The `with` block guarantees the file is closed; the
    # original `c.close` lacked parentheses and never closed it.
    with open(path, "wb") as c:
        c.write(code)
    # Progress message: "pages downloaded so far".
    print("当前下载页数: %d" % i)
import urllib2
# Same download as the Request-based variant, but the page URL is passed
# straight to urlopen(): pages 1-480 of one bbs.tianya.cn thread, one HTML
# file per page under D:/noval/.
url1 = "http://bbs.tianya.cn/post-16-835537-"
url3 = ".shtml#ty_vip_look[%E6%8B%89%E9%A3%8E%E7%86%8A%E7%8C%AB"
for i in range(1, 481):
    # The original call had an extra opening parenthesis (syntax error).
    b = urllib2.urlopen(url1 + str(i) + url3)
    try:
        code = b.read()
    finally:
        # Release the connection even when the read fails.
        b.close()
    path = "D:/noval/天眼传人" + str(i) + ".html"
    # Binary mode: the body is written exactly as received, with no newline
    # translation. The `with` block guarantees the file is closed; the
    # original `c.close` lacked parentheses and never closed it.
    with open(path, "wb") as c:
        c.write(code)
    # Progress message: "pages downloaded so far".
    print("当前下载页数: %d" % i)
import cookielib
import urllib2

# Build an opener whose requests share one cookie jar. The original had all
# three statements collapsed onto a single line, which does not parse.
cj = cookielib.CookieJar()
opener = urllib2.build_opener(urllib2.HTTPCookieProcessor(cj))
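# encoding=utf-8
# NOTE: the snippet below lost its line breaks and ended up inside the comment
# above; it is kept as a comment here, one statement per line.
#   import urllib
#   import urllib2
#   import cookielib
#   import re
#   cj=cookielib.CookieJar()
#   opener=urllib2.build_opener(urllib2.HTTPCookieProcessor(cj))
#   url="http://beijing.douban.com/events/future-all?start=0"
#   req=urllib2.Request(url)
#   event=urllib2.urlopen(req)
#   str1=event.read()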
# -*- coding: utf-8 -*-
#---------------------------------------
# program: Douban local-events (豆瓣同城) crawler
# author: GisLu
# date: 2014-02-08
#---------------------------------------
import urllib
import urllib2
import cookielib
import re
# Cookie jar plus an opener whose HTTPCookieProcessor reads from and writes
# to that jar.
cj = cookielib.CookieJar()
cookie_handler = urllib2.HTTPCookieProcessor(cj)
opener = urllib2.build_opener(cookie_handler)
# Regex extraction
def search(str1):
    """Print name, time, place and fee for every event found in *str1*.

    *str1* is the HTML text of one event-listing page. For each regex match
    four lines are printed: the event name, the time text (with any
    ``</span>`` tags and newlines removed), the venue taken from the
    ``<li title="...">`` attribute, and the fee taken from the ``<strong>``
    element. Nothing is printed when the page contains no match.
    """
    # `[\d\D]` matches any character, newlines included, so each lazy group
    # can span several lines of markup. The original pattern had lost its
    # backslashes (`[dD]`) and could only cross runs of the letters d/D.
    regex = re.compile(
        r'summary">([\d\D]*?)</span>[\d\D]*?class="hidden-xs">([\d\D]*?)<time'
        r'[\d\D]*?<li title="([\d\D]*?)">[\d\D]*?strong>([\d\D]*?)</strong>')
    for i in regex.finditer(str1):
        # Label: "event name".
        print("活动名称: " + i.group(1))
        a = i.group(2)
        b = a.replace('</span>', '')
        # Strip newlines; the original replaced the letter 'n' because the
        # backslash of '\n' had been lost.
        print(b.replace('\n', ''))
        # Label: "venue".
        print('活动地点: ' + i.group(3))
        # Label: "fee". Printed as-is like the other fields; the original
        # decoded only this one to unicode, mixing string types in the output.
        print('费用: ' + i.group(4))
# Build each listing-page URL (start offsets 0, 10, 20, 30, 40), download the
# page and print the events found on it.
for i in range(0, 5):
    url = "http://beijing.douban.com/events/future-all?start=" + str(i * 10)
    req = urllib2.Request(url)
    event = urllib2.urlopen(req)
    try:
        str1 = event.read()
    finally:
        # Release the connection even when the read fails.
        event.close()
    search(str1)
import urllib
#---------------------------------------
# @program: library book-loan lookup (图书借阅查询)
# @author: GisLu
# @date: 2014-02-08
#---------------------------------------
import urllib2
import cookielib
import re
# Install a process-wide opener that keeps cookies in `cj` and sends a
# browser-like User-agent header with every request.
cj = cookielib.CookieJar()
cookie_handler = urllib2.HTTPCookieProcessor(cj)
opener = urllib2.build_opener(cookie_handler)
opener.addheaders = [
    ('User-agent', 'Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1)'),
]
urllib2.install_opener(opener)

# Log in to obtain cookies.
# NOTE(review): the account name and password are hard-coded in the form below.
login_form = {
    'user': 'X1234564',
    'pw': 'demacialalala',
    'imageField.x': '0',
    'imageField.y': '0',
}
postdata = urllib.urlencode(login_form)
# Supplying `data` makes urllib2 send this request as a POST.
rep = urllib2.Request('http://210.45.210.6/dzjs/login.asp', postdata)
result = urllib2.urlopen(rep)
# Show the final URL of the response (after any redirect).
print(result.geturl())
import urllib
#---------------------------------------
# @program: library book-loan lookup (图书借阅查询)
# @author: GisLu
# @date: 2014-02-08
#---------------------------------------
import urllib2
import cookielib
import re
# Install a process-wide opener that keeps cookies in `cj` and sends a
# browser-like User-agent header with every request.
cj = cookielib.CookieJar()
opener = urllib2.build_opener(urllib2.HTTPCookieProcessor(cj))
opener.addheaders = [('User-agent', 'Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1)')]
urllib2.install_opener(opener)

# Log in to obtain cookies.
# NOTE(review): the account name and password are hard-coded in the form below.
postdata = urllib.urlencode({
    'user': 'X11134564',
    'pw': 'demacialalala',
    'imageField.x': '0',
    'imageField.y': '0'})
rep = urllib2.Request(
    url='http://210.45.210.6/dzjs/login.asp',
    data=postdata
)
result = urllib2.urlopen(rep)
try:
    # Show the final URL of the login response (after any redirect).
    print(result.geturl())
finally:
    # Release the connection; the cookies are already stored in `cj`.
    result.close()

# Fetch the account table.
Postdata = urllib.urlencode({
    'nCxfs': '1',
    'submit1': '检索'})
aa = urllib2.Request(
    url='http://210.45.210.6/dzjs/jhcx.asp',
    data=Postdata
)
bb = urllib2.urlopen(aa)
try:
    cc = bb.read()
finally:
    # Release the connection even when the read fails.
    bb.close()

# Each captured group is the text of one `tdborder4` table cell.
zhangmu = re.findall('tdborder4 >(.*?)</td>', cc)
for i in zhangmu:
    # gb2312 decode/encode round trip kept from the original; it raises
    # UnicodeDecodeError when a cell is not valid gb2312.
    i = i.decode('gb2312')
    i = i.encode('gb2312')
    print(i.strip(' '))
机械节能产品生产企业官网模板...
大气智能家居家具装修装饰类企业通用网站模板...
礼品公司网站模板
宽屏简约大气婚纱摄影影楼模板...
蓝白WAP手机综合医院类整站源码(独立后台)...苏ICP备2024110244号-2 苏公网安备32050702011978号 增值电信业务经营许可证编号:苏B2-20251499 | Copyright 2018 - 2026 源码网商城 (www.ymwmall.com) 版权所有