View Single Post
Old 05-16-2011, 08:37 AM   #2
schuster
Zealot
schuster doesn't litter
 
Posts: 119
Karma: 100
Join Date: Jan 2011
Location: Germany / NRW /Köln
Device: prs-650 / prs-350 /kindle 3
Try this:

Code:
class AdvancedUserRecipe1305470859(BasicNewsRecipe):
    """News recipe for the Cosmopolitan RSS feeds.

    Articles are fetched through the URL produced by ``print_version`` and
    hyperlinks that wrap a single text node are flattened to plain text in
    ``preprocess_html``.
    """

    # --- Recipe metadata and fetch limits --------------------------------
    title = u'Cosmopolitan Magazin'
    oldest_article = 14
    max_articles_per_feed = 20

    # --- Content clean-up switches ---------------------------------------
    no_stylesheets = True
    use_embedded_content = False
    remove_javascript = True

    # The site logo image is used as the cover.
    cover_url = 'http://www.cosmopolitan.com/cm/shared/site_images/print_this/cosmopolitan_logo.gif'

    # Heading fonts applied to the generated output.
    extra_css = '''
                    h2{font-family:Arial,Helvetica,sans-serif; font-size: x-small;}
                    h1{ font-family:Arial,Helvetica,sans-serif;  font-size:x-large; font-weight:bold;}
                '''

    # Drop the <div class="printTools"> element from each page.
    remove_tags = [{'name': 'div', 'attrs': {'class': 'printTools'}}]

    # Feeds as (section title, RSS URL) pairs.
    feeds = [
        (u'Sex&Love', u'http://www.cosmopolitan.com/sex-love/rss/'),
        (u'Hair&Beauty', u'http://www.cosmopolitan.com/hairstyles-beauty/rss/'),
        (u'Celebs & Style', u'http://www.cosmopolitan.com/celebrity/rss/'),
        (u'Secrets & Advice', u'http://www.cosmopolitan.com/advice/rss/'),
        (u'Sexy Beauty Secrets Blog', u'http://www.cosmopolitan.com/hairstyles-beauty/beauty-blog/rss/'),
        (u'Joe Hottie`s Dating Blog', u'http://www.cosmopolitan.com/sex-love/joe-hottie/joe-hottie-rss/'),
        (u'Bedroom Blog', u'http://www.cosmopolitan.com/sex-love/bedroom-blog/rss/'),
    ]

    def print_version(self, url):
        """Return the print-friendly URL derived from an article *url*.

        The URL is split on ``/``. The first three pieces (scheme, empty
        piece and host for an absolute URL) are kept, ``print-this`` is
        inserted, the fourth piece is dropped, and the remaining pieces are
        appended. For example,
        ``http://www.cosmopolitan.com/sex-love/tips/article`` becomes
        ``http://www.cosmopolitan.com/print-this/tips/article``.
        """
        parts = url.split('/')
        site_root = '/'.join(parts[:3])
        article_path = '/'.join(parts[4:])
        return site_root + '/print-this/' + article_path

    def preprocess_html(self, soup):
        """Replace every ``<a>`` tag that has a ``string`` with that string.

        Anchors whose ``string`` is ``None`` are left untouched. The same
        *soup* object is modified in place and returned.
        """
        for anchor in soup.findAll('a'):
            link_text = anchor.string
            if link_text is None:
                continue
            anchor.replaceWith(link_text)
        return soup
schuster is offline   Reply With Quote