Here's my recipe for ShackNews, a video game news site. Their HTML is already pretty clean, so the recipe doesn't need to do much. Comments and improvements are welcome, as I am just starting out.
Python code:
class AdvancedUserRecipe1312317103(BasicNewsRecipe):
    """Calibre news recipe for the ShackNews feed.

    The recipe is purely declarative: it keeps only the article container
    of each page, removes a few unwanted sub-elements from it, and
    italicises block quotes.
    """

    title = u'ShackNews'

    # Feed limits: article age cut-off (in days, per the calibre recipe
    # API) and the cap on articles taken from each feed.
    oldest_article = 7
    max_articles_per_feed = 100

    # Ignore the site's own stylesheets; only ``extra_css`` below is applied.
    no_stylesheets = True

    # Keep only the <div id="article"> element of each downloaded page.
    keep_only_tags = [dict(name='div', attrs={'id':['article']})]

    # Elements removed from the kept content (presumably share links, tag
    # lists, and promo/embed boxes -- inferred from the class names only).
    remove_tags = [
        dict(name='ul',attrs={'class':['share']}),
        dict(name='div',attrs={'class':['tags']}),
        dict(name='div',attrs={'class':['focalbox']}),
        dict(name='div',attrs={'class':['embedimage']}),
    ]

    # Render quoted passages in italics.
    extra_css = 'blockquote {font-style: italic;}'

    # (feed title, feed URL) pairs to download.
    feeds = [(u'ShackNews', u'http://feed.shacknews.com/shackfeed.xml')]