# Tag matchers, in order: every <header> element, the <div> whose class is
# 'leading-xl-loose', and the <div> whose id is 'rev-more-content'.
# NOTE(review): presumably read by the recipe framework to decide which parts
# of the page are retained — confirm against the consumer of this name.
keep_only_tags = [
    {'name': 'header'},
    {'name': 'div', 'attrs': {'class': 'leading-xl-loose'}},
    {'name': 'div', 'attrs': {'id': 'rev-more-content'}},
]