1
0
Fork 0
mirror of https://github.com/evilhero/mylar synced 2025-02-02 12:31:44 +00:00

Improved search results by limiting secondary results through filters

This commit is contained in:
evilhero 2012-09-18 10:42:57 -04:00
parent a37ee7638a
commit dffe34cb76

View file

@ -19,6 +19,7 @@ import urllib2
import re import re
import helpers import helpers
import logger import logger
import datetime
from decimal import Decimal from decimal import Decimal
from HTMLParser import HTMLParseError from HTMLParser import HTMLParseError
@ -87,6 +88,7 @@ def MysterBinScrape(comsearch):
return mres return mres
def GCDScraper(ComicName, ComicYear, Total, ComicID): def GCDScraper(ComicName, ComicYear, Total, ComicID):
NOWyr = datetime.date.today().year
comicnm = ComicName comicnm = ComicName
comicyr = ComicYear comicyr = ComicYear
comicis = Total comicis = Total
@ -96,7 +98,8 @@ def GCDScraper(ComicName, ComicYear, Total, ComicID):
#print ( "comichave: " + str(comicis) ) #print ( "comichave: " + str(comicis) )
#print ( "comicid: " + str(comicid) ) #print ( "comicid: " + str(comicid) )
comicnm = re.sub(' ', '%20', comicnm) comicnm = re.sub(' ', '%20', comicnm)
input = 'http://www.comics.org/series/name/' + str(comicnm) + '/sort/alpha/' #input = 'http://www.comics.org/series/name/' + str(comicnm) + '/sort/alpha/'
input = 'http://www.comics.org/search/advanced/process/?target=series&method=icontains&logic=False&order2=date&order3=&start_date=' + str(comicyr) + '-01-01&end_date=' + str(NOWyr) + '-12-31&series=' + str(comicnm) + '&is_indexed=None'
response = urllib2.urlopen ( input ) response = urllib2.urlopen ( input )
soup = BeautifulSoup ( response) soup = BeautifulSoup ( response)