import urllib2 import logging import re class PageImporter(object): def __init__(self, url, feed): self.url = url self.feed = feed def fetch_page(self): request = urllib2.Request(self.url) try: response = urllib2.urlopen(request) except HTTPError, e: logging.error('The server couldn\'t fulfill the request. Error: %s' % e.code) except URLError, e: logging.error('Failed to reach server. Reason: %s' % e.reason) else: data = response.read() html = data html = self.rewrite_page(html) self.save_page(html) def rewrite_page(self, response): head = response.find('
') + 6 base_code = u'