mirror of
https://github.com/vikstrous/pirate-get
synced 2025-01-24 12:14:20 +01:00
add variable number of pages to fetch option
This commit is contained in:
parent
f5e5a5487a
commit
4606e3a32e
@ -40,6 +40,7 @@ def main():
|
|||||||
parser = argparse.ArgumentParser(description='Finds and downloads torrents from the Pirate Bay')
|
parser = argparse.ArgumentParser(description='Finds and downloads torrents from the Pirate Bay')
|
||||||
parser.add_argument('q', metavar='search_term', help="The term to search for")
|
parser.add_argument('q', metavar='search_term', help="The term to search for")
|
||||||
parser.add_argument('--local', dest='database', help="An xml file containing the Pirate Bay database")
|
parser.add_argument('--local', dest='database', help="An xml file containing the Pirate Bay database")
|
||||||
|
parser.add_argument('-p', dest='pages', help="The number of pages to fetch (doesn't work with --local)", default=1)
|
||||||
|
|
||||||
def local(args):
|
def local(args):
|
||||||
xml_str = ''
|
xml_str = ''
|
||||||
@ -51,24 +52,32 @@ def main():
|
|||||||
|
|
||||||
#todo: redo this with html parser instead of regex
|
#todo: redo this with html parser instead of regex
|
||||||
def remote(args):
|
def remote(args):
|
||||||
f = urllib2.urlopen('http://thepiratebay.se/search/' + args.q.replace(" ", "+") + '/0/7/0')
|
|
||||||
res = f.read()
|
|
||||||
found = re.findall(""""(magnet\:\?xt=[^"]*)|<td align="right">([^<]+)</td>""", res)
|
|
||||||
state = "seeds"
|
|
||||||
curr = ['',0,0] #magnet, seeds, leeches
|
|
||||||
res_l = []
|
res_l = []
|
||||||
for f in found:
|
try:
|
||||||
if f[1] == '':
|
pages = int(args.pages)
|
||||||
curr[0] = f[0]
|
if pages < 1:
|
||||||
else:
|
raise Exception('')
|
||||||
if state == 'seeds':
|
except Exception:
|
||||||
curr[1] = f[1]
|
raise Exception("Please provide an integer greater than 0 for the number of pages to fetch.")
|
||||||
state = 'leeches'
|
|
||||||
|
for page in xrange(pages):
|
||||||
|
f = urllib2.urlopen('http://thepiratebay.se/search/' + args.q.replace(" ", "+") + '/' + str(page) + '/7/0')
|
||||||
|
res = f.read()
|
||||||
|
found = re.findall(""""(magnet\:\?xt=[^"]*)|<td align="right">([^<]+)</td>""", res)
|
||||||
|
state = "seeds"
|
||||||
|
curr = ['',0,0] #magnet, seeds, leeches
|
||||||
|
for f in found:
|
||||||
|
if f[1] == '':
|
||||||
|
curr[0] = f[0]
|
||||||
else:
|
else:
|
||||||
curr[2] = f[1]
|
if state == 'seeds':
|
||||||
state = 'seeds'
|
curr[1] = f[1]
|
||||||
res_l.append(curr)
|
state = 'leeches'
|
||||||
curr = ['', 0, 0]
|
else:
|
||||||
|
curr[2] = f[1]
|
||||||
|
state = 'seeds'
|
||||||
|
res_l.append(curr)
|
||||||
|
curr = ['', 0, 0]
|
||||||
return res_l
|
return res_l
|
||||||
|
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
@ -77,9 +86,9 @@ def main():
|
|||||||
else:
|
else:
|
||||||
mags = remote(args)
|
mags = remote(args)
|
||||||
|
|
||||||
print "S=seeders"
|
if mags and len(mags) > 0:
|
||||||
print "L=leechers"
|
print "S=seeders"
|
||||||
if mags:
|
print "L=leechers"
|
||||||
for m in range(len(mags)):
|
for m in range(len(mags)):
|
||||||
magnet = mags[m]
|
magnet = mags[m]
|
||||||
name = re.search("dn=([^\&]*)", magnet[0])
|
name = re.search("dn=([^\&]*)", magnet[0])
|
||||||
|
Loading…
Reference in New Issue
Block a user