#VERSION: 1.11 #AUTHORS: Fabien Devaux (fab@gnux.info) from novaprinter import prettyPrinter import urllib from xml.dom import minidom import re class mininova(object): url = 'http://www.mininova.org' name = 'Mininova' table_items = 'added cat name size seeds leech'.split() def search(self, what): order = 'seeds' # must be one in self.table_items def get_link(lnk): lnks = lnk.getElementsByTagName('a') i = 0 try: while not lnks.item(i).attributes.get('href').value.startswith('/get'): i += 1 except: return None return (self.url+lnks.item(i).attributes.get('href').value).strip() def get_text(txt): if txt.nodeType == txt.TEXT_NODE: return txt.toxml() else: return ''.join([ get_text(n) for n in txt.childNodes]) page = 1 while True: res = 0 dat = urllib.urlopen(self.url+'/search/%s/seeds/%d'%(what, page)).read().decode('utf-8', 'replace') dat = re.sub("