Python 采集小程序
分类:CentOS运维 阅读:77404 次
# coding=utf8
#LINUXQQ for crawler data v0.1
import os
import re
import urllib
# Base URL that contact() prepends to each link before opening it.
# NOTE(review): the list pages are fetched from www.51zxw.net while this base
# points at www.centoscn.com -- confirm the links really resolve on this host.
videourl = 'http://www.centoscn.com/'
# Root folder under which contact() creates one subfolder per downloaded item.
rootdir = 'D:\\video\\'
def progress(blocknum, blocksize, totalsize):
    """Print the download progress as a percentage with two decimals.

    The signature matches the report hook accepted by ``urlretrieve``, which
    is how this function is used elsewhere in the file.

    Args:
        blocknum: Number of blocks transferred so far.
        blocksize: Size of one block in bytes.
        totalsize: Total size of the file in bytes; zero or negative when the
            server did not report a size.
    """
    if totalsize <= 0:
        # Size unknown: a percentage cannot be computed, and dividing would
        # either raise ZeroDivisionError or print a negative value.
        return
    # The last block is usually only partly filled, so cap the value at 100.
    per = min(100.0 * blocknum * blocksize / totalsize, 100.0)
    # Parenthesised single-argument form prints the same on Python 2 and 3.
    print("%.2f%%" % per)
# Open the page for one list entry, look for a match in it and, when one is
# found, download the corresponding .swf file into a new folder for that entry.
#
# link      -- link of the entry; appended to the module-level videourl
# directory -- name of the subfolder created under rootdir for this entry
#
# NOTE(review): this listing lost its indentation and part of its text when it
# was extracted; presumably everything from `os.mkdir` down to the final
# `print` sits under `if req:` -- confirm against the original script.
def contact(link,directory):
# NOTE(review): both replace() arguments read as "&" here, which makes the call
# a no-op; presumably the first argument was the HTML entity for "&" before
# extraction decoded it -- confirm.
newlink = link.replace(‘&’,'&’)
newhtml = urllib.urlopen(str(videourl + newlink))
# NOTE(review): the pattern literal below is cut off, and the statement that
# assigns `req` (presumably a search of `newdata` over `newhtml.read()`) is
# missing, so `req` is undefined as written. The original pattern cannot be
# recovered from this listing.
newdata = re.compile(‘
if req:
# os.mkdir raises OSError when the folder already exists.
os.mkdir(rootdir + directory )
# str.replace swaps every occurrence of 'html' in the captured text, not only
# a trailing extension.
download = req.group(1).replace('html','swf')
# urlretrieve returns a (filename, headers) tuple, which is always truthy, and
# signals a failed transfer by raising; the `else` branch is therefore never
# taken.
if urllib.urlretrieve(download, rootdir + directory + '\\study.swf',progress):
print directory + 'download ok'
else:
print directory + 'download failure'
# Fetch a list page, collect every pattern match in it and pass the first two
# items of each match to contact() as (link, directory).
#
# NOTE(review): the `url` parameter is never read -- the function always opens
# the hard-coded list.aspx?cid=359 address, so each call processes the same
# page no matter which page URL the caller built. Presumably `url` was meant
# to be opened here -- confirm.
def crawler(url):
html = urllib.urlopen('http://www.51zxw.net/list.aspx?cid=359')
# NOTE(review): the pattern below was damaged in extraction: its closing quote
# is a typographic quote, and only one capture group is left although the loop
# reads i[0] and i[1] (with a single group, findall yields plain strings, so
# those would be single characters). The original most likely had two groups
# (link, name); it cannot be recovered from this listing.
data = re.compile(r' ]*?>(.*?)‘, re.S|re.U)
req = re.findall(data,html.read())
for i in req:
contact(i[0],i[1])
if __name__ == '__main__':
    # Visit list pages 1 through 8 of category 359, one crawler() call each.
    last_page = 8
    for page in range(1, last_page + 1):
        url = 'http://www.51zxw.net/list.aspx?page=%d&cid=359' % page
        crawler(url)
热门推荐
- Centos6.5搭建bugzilla
- CentOS下通过yum安装svn及配置
- CentOS系统设置Nginx服务自动启动运行
- CentOS6.5下webbench对nginx的压力测试
- CentOS下RPM方式安装MySQL5.6
- 配置Nginx区分PC或手机访问不同网站
- centos6.3下mysql5.5.32源码安装
- CentOS下使用yum安装mysql详解
- CentOS 7搭建SVN服务器
- CentOS 7安装配置Samba服务器
- CentOS下无网络安装Nginx
- CentOS下的apache服务器配置与管理
- CentOS 7 搭建支持 HTTP 协议的 SVN 服务器
- CentOS安装SVN服务器
- CentOS7搭建OpenStack云系统之准备篇
- CentOS使用yum安装mysql详解
- CentOS7.0下nginx+mysql+php环境安装
- CentOS下以RPM方式安装MySQL5.5
- CentOS下Dhcp服务器详细配置
- Centos下转发DNS服务器的架设与测试