查看文章 |
备份ycool博客文章的脚本(python)
2009-02-09 20:09
"""Back up the articles of a ycool blog to local HTML files.

The script signs in to ycool with the account configured below, then
fetches ``<blog_name><i>.html`` for every ``i`` in ``range(article_num)``
and stores each response as ``<i>.html`` in the current working directory.

It runs unchanged on Python 2 and Python 3.
"""
import contextlib

try:  # Python 2 module names
    import cookielib
    import urllib2
    from urllib import urlencode
except ImportError:  # Python 3 equivalents, bound to the same names
    import http.cookiejar as cookielib
    import urllib.request as urllib2
    from urllib.parse import urlencode

# Names exported by ``from <module> import *``. The configuration constants
# and the ``test`` login check have to be imported explicitly.
__all__ = ['poster', 'work']

# your blog name, like this
blog_name = "http://***.ycool.com/index"
# your account email here
username = 'overboming@gmail.com'
# your password here
passwd = '*****'
# maximum article list
article_num = 91

# never mind the following
Login_server = 'http://account.ycool.com/signin.php'
Logout_server = ''


class poster:
    """Cookie-keeping HTTP client used to sign in to (and out of) ycool."""

    def __init__(self):
        # Install a process-wide opener backed by a cookie jar, so that every
        # later plain ``urllib2.urlopen`` call (including the downloads in
        # ``work``) sends back whatever cookies the sign-in response set.
        cookie = cookielib.CookieJar()
        opener = urllib2.build_opener(urllib2.HTTPCookieProcessor(cookie))
        urllib2.install_opener(opener)

    def login(self, password):
        """POST the sign-in form for ``username`` to ``Login_server``.

        Args:
            password: Password submitted in the ``signin_passwd`` field.

        Raises:
            urllib2.URLError: If the request fails.
        """
        params = urlencode({
            'signin_token': username,
            'signin_passwd': password,
            'act': 'signin',
            '_yc_dest': 'http://www.ycool.com/index.php?_yc_service=yc',
        })
        # Python 3's urlopen() only accepts a bytes body; urlencode() output
        # is pure ASCII, so this encode is also harmless on Python 2.
        body = params.encode('ascii')
        # The response body is not needed; just make sure the socket closes.
        with contextlib.closing(urllib2.urlopen(Login_server, body)):
            pass

    def logout(self):
        """Request ``Logout_server``; do nothing when no URL is configured."""
        if not Logout_server:
            # An empty URL would make urlopen() raise ValueError.
            return
        with contextlib.closing(urllib2.urlopen(Logout_server)):
            pass


def test():
    """Test bed for login: sign in with the configured credentials."""
    foo = poster()
    foo.login(passwd)
    print('=========================================================')


def work():
    """Sign in, then download all of the articles to ``<i>.html`` files."""
    test()  # login
    for i in range(article_num):
        url = '%s%d.html' % (blog_name, i)
        # Fetch before opening the output file so that a failed request does
        # not leave an empty ``<i>.html`` behind.
        with contextlib.closing(urllib2.urlopen(url)) as response:
            page = response.read()
        # The response is raw bytes: write in binary mode so nothing is
        # re-encoded and no newline translation happens.
        with open('%d.html' % i, 'wb') as out:
            out.write(page)
        print('download complete for page %d' % i)
    print('my job is down for %d pages' % article_num)


if __name__ == '__main__':
    work()