2012-12-16 17:57:02 +00:00
|
|
|
#!/usr/bin/env python
|
|
|
|
|
|
|
|
import os
|
|
|
|
import sys
|
|
|
|
import lib.feedparser as feedparser
|
|
|
|
#import feedparser
|
|
|
|
import re
|
2013-01-02 17:56:46 +00:00
|
|
|
import logger
|
2013-02-09 03:34:02 +00:00
|
|
|
import mylar
|
2013-04-12 02:14:27 +00:00
|
|
|
import unicodedata
|
2012-12-16 17:57:02 +00:00
|
|
|
|
2013-04-12 02:14:27 +00:00
|
|
|
|
|
|
|
def Startit(searchName, searchIssue, searchYear, ComicVersion):
    """Search the nzbindex.nl RSS feed (alt.binaries.comics.dcp) for a comic.

    Parameters:
        searchName  -- series title, possibly URL-encoded ("%20" for spaces)
        searchIssue -- issue number as a string
        searchYear  -- publication year as a string (must parse as int)
        ComicVersion -- currently unused; kept for caller compatibility

    Returns:
        dict {'entries': [{'title': ..., 'link': ...}, ...]} when candidates
        are found, or the string "no results" otherwise.
    """
    #clean up searchName due to webparse.
    searchName = searchName.replace("%20", " ")
    if "," in searchName:
        searchName = searchName.replace(",", "")

    logger.fdebug("name:" + str(searchName))
    logger.fdebug("issue:" + str(searchIssue))
    logger.fdebug("year:" + str(searchYear))

    splitSearch = searchName.split(" ")
    joinSearch = "+".join(splitSearch)+"+"+searchIssue

    # Hyphens (and then every space) become an optional separator pattern so
    # the regexes below tolerate "-", ":" or whitespace between title words.
    if "-" in searchName:
        searchName = searchName.replace("-", '((\\s)?[-:])?(\\s)?')
    regexName = searchName.replace(" ", '((\\s)?[-:])?(\\s)?')

    if mylar.USE_MINSIZE:
        size_constraints = "minsize=" + str(mylar.MINSIZE)
    else:
        size_constraints = "minsize=10"

    if mylar.USE_MAXSIZE:
        size_constraints = size_constraints + "&maxsize=" + str(mylar.MAXSIZE)

    # BUGFIX: max_age was previously assigned only inside the retention
    # check, so a None USENET_RETENTION raised NameError at the feed call.
    max_age = ""
    if mylar.USENET_RETENTION is not None:
        max_age = "&age=" + str(mylar.USENET_RETENTION)

    feed = feedparser.parse("http://nzbindex.nl/rss/alt.binaries.comics.dcp/?sort=agedesc&" + str(size_constraints) + str(max_age) + "&dq=%s&max=50&more=1" %joinSearch)

    totNum = len(feed.entries)

    # title -> NZB download URL (taken from the entry's first enclosure,
    # not entry.link, which points at the web page instead of the file).
    keyPair = {}
    entries = []
    mres = {}

    logger.fdebug(str(totNum) + " results")

    for entry in feed.entries:
        urlParse = entry.enclosures[0]
        keyPair[entry.title] = urlParse["href"]

    # thanks to SpammyHagar for spending the time in compiling these regEx's!
    # NOTE: the regex *filtering* is currently disabled (see commented loop
    # below) -- every quoted filename fragment longer than 10 chars is kept.
    # The patterns are still built so a non-numeric searchYear fails early,
    # matching the original behavior.
    regEx = "(%s\\s*(0)?(0)?%s\\s*\\(%s\\))" %(regexName, searchIssue, searchYear)
    regExOne = "(%s\\s*(0)?(0)?%s\\s*\\(.*?\\)\\s*\\(%s\\))" %(regexName, searchIssue, searchYear)
    #Sometimes comics aren't actually published the same year comicVine says - trying to adjust for these cases
    regExTwo = "(%s\\s*(0)?(0)?%s\\s*\\(%s\\))" %(regexName, searchIssue, int(searchYear)+1)
    regExThree = "(%s\\s*(0)?(0)?%s\\s*\\(%s\\))" %(regexName, searchIssue, int(searchYear)-1)
    regExFour = "(%s\\s*(0)?(0)?%s\\s*\\(.*?\\)\\s*\\(%s\\))" %(regexName, searchIssue, int(searchYear)+1)
    regExFive = "(%s\\s*(0)?(0)?%s\\s*\\(.*?\\)\\s*\\(%s\\))" %(regexName, searchIssue, int(searchYear)-1)

    regexList=[regEx, regExOne, regExTwo, regExThree, regExFour, regExFive]

    for title, link in keyPair.items():
        logger.fdebug("titlesplit: " + str(title.split("\"")))
        splitTitle = title.split("\"")

        for subs in splitTitle:
            logger.fdebug(subs)
            if len(subs) > 10:
                #Looping through dictionary to run each regEx - length + regex is determined by regexList up top.
#                while regExCount < len(regexList):
#                    regExTest = re.findall(regexList[regExCount], subs, flags=re.IGNORECASE)
#                    regExCount = regExCount +1
#                    if regExTest:
#                        logger.fdebug(title)
#                        entries.append({
#                                  'title':   subs,
#                                  'link':    str(link)
#                                  })
                entries.append({
                          'title':   subs,
                          'link':    str(link)
                          })

    if len(entries) >= 1:
        mres['entries'] = entries
        return mres
    else:
        logger.fdebug("No Results Found")
        return "no results"
|