diff --git a/update-planet b/update-planet
new file mode 100755
index 0000000..c6f04dd
--- /dev/null
+++ b/update-planet
@@ -0,0 +1,45 @@
+#!/usr/bin/python
+#
+# update-planet
+#
+# Downloads the feeds listed in 'feedlist' and writes the aggregated
+# XHTML output to planet.html.
+#
+# (c) 2004, Davyd Madeley
+#
+
+import sys, urllib2, codecs
+import XMLParse, XMLWriter
+
+# step 1: read in the config and download the feeds
+feeds = []
+for line in open('feedlist').readlines():
+    line = line.strip()
+    # skip blank lines and comment lines
+    if not line or line.startswith('#'):
+        continue
+    storage = line.split('\t')
+    name, feed = storage[0], storage[-1]
+    sys.stdout.write('Downloading feed "%s" from %s... ' % (name, feed))
+    try:
+        # XXX: might want to consider some good caching code in here
+        feeds.append((name, feed, urllib2.urlopen(feed).read()))
+        sys.stdout.write('done.\n')
+    except IOError:
+        # urllib2.URLError is a subclass of IOError, so this catches
+        # network and HTTP failures without masking programming errors
+        sys.stdout.write('failed.\n')
+
+# step 2: parse each feed and tag every entry with its blog's title
+blogs = []
+for name, url, data in feeds:
+    xml = XMLParse.XMLParse(data).parse()
+    for blog in xml:
+        blog.blogTitle = name
+    blogs += xml
+
+# step 3: write the aggregated page to disk
+try:
+    codecs.open('planet.html', 'wb', 'utf-8').write(XMLWriter.XMLWriter(XMLWriter.XHTMLWriter, blogs).write())
+except:
+    sys.stderr.write('update-planet: could not write planet.html, aborting\n')
+    raise
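
For reference, a sample 'feedlist' in the format the script expects: one blog per line, tab-separated, with the display name in the first field and the feed URL in the last (any fields in between are ignored, since the parser takes storage[0] and storage[-1]); lines starting with '#' are comments. The names and URLs here are made up for illustration:

# blog name	feed URL
Example Blog One	http://blog1.example.org/rss.xml
Example Blog Two	http://blog2.example.net/atom.xml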
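
XMLParse and XMLWriter are sibling modules in planet-ucc and are not part of this diff. From the calls above one can infer the interface the script relies on; the stub below is a minimal sketch of that assumed interface, flattening both modules into one file for illustration (all names and bodies are placeholders, not the real implementation):

# Sketch of the interface update-planet assumes; the real
# XMLParse/XMLWriter modules live elsewhere in planet-ucc.

class XMLParse:
    def __init__(self, data):
        # raw feed bytes, as returned by urllib2.urlopen(...).read()
        self.data = data
    def parse(self):
        # must return a list of entry objects; update-planet assigns
        # a blogTitle attribute to each one, so they must accept that
        return []

class XMLWriter:
    def __init__(self, writer, blogs):
        self.writer = writer    # output backend, e.g. XHTMLWriter
        self.blogs = blogs
    def write(self):
        # must return a unicode string, since update-planet writes the
        # result through codecs.open('planet.html', 'wb', 'utf-8')
        return u''

XHTMLWriter = object  # placeholder for the XHTML output backend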
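
The "XXX" comment flags the lack of caching: every run re-downloads every feed, and a feed that fails to download simply drops out of the page. One possible approach (purely illustrative, not part of the commit) is to keep the last good copy of each feed on disk and fall back to it when a fetch fails; CACHE_DIR and fetch_feed are hypothetical names:

import os, md5, urllib2

CACHE_DIR = '.feedcache'    # hypothetical cache location

def fetch_feed(url):
    # cache file named after the URL's md5, to keep filenames safe
    path = os.path.join(CACHE_DIR, md5.new(url).hexdigest())
    try:
        data = urllib2.urlopen(url).read()
        if not os.path.isdir(CACHE_DIR):
            os.makedirs(CACHE_DIR)
        open(path, 'wb').write(data)        # remember the good copy
        return data
    except IOError:
        if os.path.exists(path):
            return open(path, 'rb').read()  # serve the stale copy
        raise

Step 1 would then call fetch_feed(feed) instead of urllib2.urlopen(feed).read().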