#!/bin/env python # -*- coding: utf-8 -*- import urllib, re, ClientCookie#, socket ZODIAC = u"Близнецы" DAYS = 4 USER_AGENT = "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.0.1) Gecko/2008070206 Firefox/3.0.1" #TIMEOUT = 5 def fetch_page(zodiac): opener = ClientCookie.build_opener(ClientCookie.HTTPCookieProcessor(ClientCookie.CookieJar())) opener.addheaders = [("User-Agent", USER_AGENT)] ClientCookie.install_opener(opener) page = unicode(ClientCookie.urlopen('http://www.icqbot.org/web').read(), 'cp1251') session_id = re.search(r'.*\r\n' + r'
\r\n(.*?)
\r\n(.*?)
\r\n' * (DAYS-1) + r'
\r\n(.*?)
\r\n(.*?)
.*', page, re.S).groups() return '%s:\n%s\n%s\n\n%s\n%s\n\n%s\n%s\n\n%s\n%s' % (header, date1, text1, date2, text2, date3, text3, date4, text4) if __name__ == '__main__': #socket.setdefaulttimeout(TIMEOUT) print parse_page(fetch_page(ZODIAC.encode('cp1251')))
# NOTE(review): this script is not runnable as it stands and looks damaged,
# not merely unformatted. Restore it from the original source before changing
# any logic.
#
# What the text above shows:
#   * All statements are collapsed onto a few physical lines. The first one
#     begins with '#', so Python reads everything on it (the import, the
#     ZODIAC / DAYS / USER_AGENT constants and the opening of fetch_page) as
#     one comment.
#   * fetch_page(zodiac) installs a ClientCookie opener with a cookie jar and
#     the USER_AGENT header, then downloads http://www.icqbot.org/web and
#     decodes it from cp1251. Its `zodiac` argument is not used in the part
#     that survives.
#   * The raw string opened by `session_id = re.search(r'` runs straight into
#     a `.groups()` call and a `return` that formats header, date1..date4 and
#     text1..text4. None of those names is assigned anywhere in the visible
#     text, and session_id is never used.
#   * There is no `def parse_page`, although the __main__ guard calls
#     parse_page(fetch_page(...)). The end of fetch_page and the start of
#     parse_page therefore appear to be missing.
#   * The surviving pattern fragments contain only `\r\n`, `.*` and `(.*?)`.
#     They give 2 * (DAYS - 1) + 2 = 8 capture groups for DAYS = 4, while the
#     return statement formats 9 values. Presumably the literal delimiters
#     between the groups (page markup?) and one group for `header` were
#     stripped -- TODO confirm against the original file.
#   * The pattern repeats its middle part (DAYS - 1) times, but the format
#     string hard-codes exactly four date/text pairs, so DAYS cannot be
#     changed on its own.
#   * The code is Python 2 (`print` statement, `unicode()`, `u"..."` literal).