从网上看到一篇很有意思的文章,转载过来大家可以试一下
直接上代码吧
#!/usr/bin/env python
#coding:utf-8
import urllib2
import re
class qiubai:
    """Interactive command-line reader for qiushibaike.com weekly pages.

    A page is downloaded, scanned with a regular expression, and the
    captured text fields of each entry are printed one per line.  The
    user then presses Enter for the next page or types ``q`` to quit.

    The code targets Python 2 (``urllib2``, ``raw_input``).
    """

    # Address of one page of the weekly listing; ``%s`` is the page number.
    URL_TEMPLATE = "http://www.qiushibaike.com/week/page/%s"

    # Upper bound on how many entries are printed for a single page.
    ENTRIES_PER_PAGE = 19

    # Three capture groups per entry: the text of the first link after a
    # "detail" marker, the value of the following ``title`` attribute, and
    # the whitespace-trimmed text after that tag.  Whitespace around the
    # attribute's ``=`` and closing quote is optional so that both
    # ``title="x">`` and ``title= "x" >`` are accepted.
    # NOTE(review): the meaning of each field (author / time / body?) is
    # presumed from the markup, not verified against the live site.
    _ENTRY_RE = re.compile(
        r'detail.*?<a.*?>(.*?)<.*?title=\s*"(.*?)"\s*>\s*(.*?)\s*?<',
        re.DOTALL)

    def __init__(self, page=1):
        """Remember the initial page number (kept for API compatibility)."""
        self.page = page

    def _fetch(self, page):
        """Download the raw HTML of *page*, closing the connection afterwards."""
        response = urllib2.urlopen(self.URL_TEMPLATE % page)
        try:
            return response.read()
        finally:
            response.close()

    def _parse(self, html):
        """Return a list of ``(field1, field2, field3)`` tuples found in *html*.

        An empty list is returned when nothing matches.
        """
        return self._ENTRY_RE.findall(html)

    def search(self, page):
        """Show *page*, then keep paging forward until the user types ``q``.

        page -- page number as an int or a string of digits.

        Raises SystemExit when the user answers ``q`` at the prompt.
        """
        # Iterative paging: reading many pages must not grow the call stack.
        while True:
            entries = self._parse(self._fetch(page))
            # Slicing copes with pages that yield fewer entries than the cap
            # (indexing a fixed range would raise IndexError).
            for entry in entries[:self.ENTRIES_PER_PAGE]:
                for field in entry:
                    print(field)
            if raw_input("回车继续") == "q":
                raise SystemExit
            page = int(page) + 1
            print("-" * 18 + "第" + str(page) + "页" + "-" * 18)

    def query(self):
        """Prompt for a starting page number and begin browsing from it.

        The prompt repeats until the answer is a positive integer; ``q``
        quits by raising SystemExit.
        """
        while True:
            answer = raw_input("输入要看的页数:")
            if answer == "q":
                raise SystemExit
            if answer.isdigit() and int(answer) > 0:
                break
        print("-" * 18 + "第" + answer + "页" + "-" * 18)
        self.search(answer)
if __name__ == "__main__":
    # Script entry point: show the banner (framed by two 40-dash rules),
    # then hand control to the interactive page prompt.
    print("\n".join([
        "-" * 40,
        "糗百命令行版",
        '输入 "q" 退出程序',
        "-" * 40,
    ]))
    qb = qiubai()
    qb.query()
|
Copier après la connexion