#!/usr/bin/env python
"""Fetch a Wikipedia article via Special:Export and print its wikitext.

Command-line usage: pass one argument of the form ``LANG:TITLE``, for
example ``en:Albert Einstein``.  Spaces in the argument are replaced with
underscores before the request is made.

This is a Python 2 script: it depends on ``urllib2`` and on the
``BeautifulStoneSoup`` XML parser from the ``BeautifulSoup`` module.
"""
import sys
import urllib2
from urllib import quote

# Extend the import path before importing BeautifulSoup (presumably the
# package lives in this per-user directory -- confirm on the target host).
sys.path.append('/home/pat/.pylib')
from BeautifulSoup import BeautifulStoneSoup


def snag(query, userAgent="innocentrobot"):
    """Download the Special:Export XML for one article.

    Args:
        query: ``"<lang>:<title>"``.  ``lang`` selects the
            ``<lang>.wikipedia.org`` host; ``title`` is the page title and
            may itself contain colons (``"en:Talk:Foo"``).
        userAgent: value sent in the ``User-agent`` request header.

    Returns:
        The response body decoded from UTF-8.

    Raises:
        ValueError: if ``query`` contains no colon at all.
    """
    # Split on the first colon only, so titles that contain colons
    # (namespaced pages, for instance) no longer fail to unpack.
    lang, title = query.split(':', 1)
    url = 'http://%s.wikipedia.org/w/index.php?title=Special:Export&pages=%s' % (lang, quote(title))
    # Echo the URL being fetched.  The parenthesised single-argument form
    # prints the same thing under the Python 2 print statement.
    print(url)
    req = urllib2.Request(url, None, {'User-agent': userAgent})
    fp = urllib2.urlopen(req)
    try:
        return fp.read().decode('utf-8')
    finally:
        # Always release the connection, even if read/decode raises.
        fp.close()


def doc(xml):
    """Parse ``xml`` and return the resulting BeautifulStoneSoup tree."""
    return BeautifulStoneSoup(xml)


def dump(xml):
    """Return the prettified ``<text>`` element of the page's revision.

    Navigates ``page`` -> ``revision`` -> ``text`` in the parsed export
    document and returns the result of ``prettify()`` on that element.
    """
    soup = doc(xml)
    # Look the <text> child up explicitly by tag name rather than through
    # attribute access.
    # NOTE(review): later BeautifulSoup 3 releases appear to define
    # ``Tag.text`` as a text-content property, which would shadow the
    # child-tag lookup the original ``revision.text`` relied on -- confirm.
    return soup.page.revision.find('text').prettify()


if __name__ == "__main__":
    if len(sys.argv) < 2:
        # Fail with a usage hint instead of an IndexError traceback.
        sys.stderr.write('usage: %s LANG:TITLE\n' % sys.argv[0])
        sys.exit(2)
    article = snag(sys.argv[1].replace(' ', '_'))
    print(dump(article))