#!/usr/bin/env python
"""
Generate an RSS feed for Le Figaro.
copyright (c) 2004 Junichi Uekawa <dancer@netfort.gr.jp>
"""
import re
import urllib

# Pattern for one front-page story.  DOTALL lets the lazy ".*?" gaps span
# line breaks between the headline anchor and the summary anchor.
p = re.compile(
    # Headline anchor: group 1 = href, group 2 = headline text.
    '<A CLASS=TIT[^ ]* HREF="([^"]*)">([^"]*)<BR></A>'
    # Skip ahead (lazily) to the summary span.
    '.*?<SPAN CLASS=TXT-UNE>'
    # Summary anchor: group 3 = summary text.
    '.*?<A HREF="[^"]*" CLASS=TXT-UNE>([^<]*)</A>',
    re.S)

# Download the front page, decode the bytes as ISO-8859-1 and re-encode
# them as UTF-8, the encoding declared in the feed's XML prolog.
raw_page = urllib.urlopen("http://www.lefigaro.fr/index.html").read()
html = unicode(raw_page, "iso-8859-1").encode("utf-8")

# Fixed opening of the feed: XML declaration, RSS 0.91 doctype and the
# channel metadata.  The <channel> and <rss> elements are left open here.
feed_prolog = """<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE rss PUBLIC "-//Netscape Communications//DTD RSS 0.91//EN"
            "http://my.netscape.com/publish/formats/rss-0.91.dtd">
<rss version="0.91">
<channel>
<title>Le Figaro</title>
<link>http://www.lefigaro.fr/</link>
<description>RSS feed for Le Figaro</description>
<language>fr</language>
"""
print(feed_prolog)
            
# Emit one <item> per story matched on the scraped page.
# Regex groups: 1 = article href (appended to the site root to build the
# link), 2 = headline text, 3 = summary text.
# NOTE(review): the captured text is interpolated as-is, without XML
# escaping -- confirm whether the page can contain a bare '&' or '<' in
# these fields that would need escaping here.
for match in p.finditer(html):
    headline = match.group(2)
    article_url = "http://www.lefigaro.fr/" + match.group(1)
    summary = match.group(3)
    # Each <item> has to be closed explicitly; without the end tag the
    # items nest inside each other and the feed is not well-formed XML.
    print("""
    <item>
      <title>%s</title>
      <link>%s</link>
      <description>
%s
      </description>
    </item>
    """ % (headline, article_url, summary))
# Close the <channel> and <rss> elements opened in the feed prolog.
feed_epilogue = """
</channel>
</rss>
"""
print(feed_epilogue)
