def postprocess_html(self, soup, first):
    """Remove ``<img>`` tags whose ``src`` starts with ``http:`` and return the soup.

    Args:
        soup: Parsed document exposing a BeautifulSoup-style
            ``findAll(name, **attrs)``; the matching tags must support
            ``tag['src']`` and ``tag.extract()``. It is modified in place.
        first: Not used by this implementation; accepted only to keep the
            method signature.

    Returns:
        The same ``soup`` object that was passed in, after the matching
        images have been detached from it.
    """
    # src=True restricts the search to <img> tags that actually carry a src
    # attribute, so the subscript below cannot fail on a missing key.
    for img in soup.findAll('img', src=True):
        # Only the literal 'http:' prefix is matched; 'https:' and relative
        # sources are left in place.
        if img['src'].startswith('http:'):
            img.extract()
    # NOTE(review): this looks like the calibre recipe hook of the same name,
    # whose documented contract is to return the processed soup -- confirm.
    # Previously the method implicitly returned None.
    return soup