From 6f133be1ef5fdc21e5cee56fdd1144120207f789 Mon Sep 17 00:00:00 2001
From: evilhero <evilhero@gmail.com>
Date: Mon, 11 Dec 2017 13:49:40 -0500
Subject: [PATCH] FIX:(#1796) When performing mass import or a large import via
 selection, would thread each import which would result in a db lock/error in
 some cases when there was a combination of files with and without metadata,
 FIX: Search results would include some common words when filtering, got rid
 of them, FIX: Total parse counter during an import would not reset to 0 on
 subsequent imports resulting in inflated numbers

---
 data/interfaces/default/importresults.html |   2 +-
 mylar/librarysync.py                       |   1 +
 mylar/mb.py                                |  11 +-
 mylar/webserve.py                          | 116 ++++++++++++---------
 4 files changed, 75 insertions(+), 55 deletions(-)
diff --git a/data/interfaces/default/importresults.html b/data/interfaces/default/importresults.html
index 280d5f07..0202660c 100755
--- a/data/interfaces/default/importresults.html
+++ b/data/interfaces/default/importresults.html
@@ -61,7 +61,7 @@
 
         <form action="markImports" method="get" id="markImports">
         <div id="markcomic">
-                <select name="action" onChange="doAjaxCall('markImports',$(this),'table',true);" data-error="You didn't select any comics">
+                <select name="action" onChange="doAjaxCall('markImports',$(this),'table',true);" data-success="Now running background Import" data-error="You didn't select any comics">
                         <option disabled="disabled" selected="selected">Choose...</option>
                         <option value="importselected">Start Import</option>
                         <option value="removeimport">Remove</option>
diff --git a/mylar/librarysync.py b/mylar/librarysync.py
index 3052d992..437d4d78 100755
--- a/mylar/librarysync.py
+++ b/mylar/librarysync.py
@@ -611,6 +611,7 @@ def libraryScan(dir=None, append=False, ComicID=None, ComicName=None, cron=None,
 
 def scanLibrary(scan=None, queue=None):
     mylar.IMPORT_FILES = 0
+    mylar.IMPORT_PARSED_COUNT = 0
     valreturn = []
     if scan:
         try:
diff --git a/mylar/mb.py b/mylar/mb.py
index 7a174eba..9d44b610 100755
--- a/mylar/mb.py
+++ b/mylar/mb.py
@@ -85,10 +85,17 @@ def findComic(name, mode, issue, limityear=None, type=None):
     comiclist = []
     arcinfolist = []
 
-    commons = [' and ', ' the ']
+    commons = ['and', 'the', '&', '-']
     for x in commons:
         if x in name.lower():
-            name = re.sub(x, ' ', name.lower()).strip()
+            for m in re.finditer(x, name.lower()):
+                tehstart = m.start()
+                tehend = m.end()
+                if any([x == 'the', x == 'and']):
+                    if not all([tehstart == 0, name[tehend] == ' ']) or not all([tehstart != 0, name[tehstart-1] == ' ', name[tehend] == ' ']):
+                        continue
+                else:
+                    name = name[tehstart:tehend].replace(x, ' ').strip() + name[tehend+1:]
 
     pattern = re.compile(ur'\w+', re.UNICODE)
     name = pattern.findall(name)
diff --git a/mylar/webserve.py b/mylar/webserve.py
index 58dad252..7835e036 100644
--- a/mylar/webserve.py
+++ b/mylar/webserve.py
@@ -374,11 +374,14 @@ class WebInterface(object):
         raise cherrypy.HTTPRedirect("comicDetails?ComicID=%s" % comicid)
     addComic.exposed = True
 
-    def addbyid(self, comicid, calledby=None, imported=None, ogcname=None):
+    def addbyid(self, comicid, calledby=None, imported=None, ogcname=None, nothread=False):
         mismatch = "no"
         logger.info('Attempting to add directly by ComicVineID: ' + str(comicid))
         if comicid.startswith('4050-'): comicid = re.sub('4050-', '', comicid)
-        threading.Thread(target=importer.addComictoDB, args=[comicid, mismatch, None, imported, ogcname]).start()
+        if nothread is False:
+            threading.Thread(target=importer.addComictoDB, args=[comicid, mismatch, None, imported, ogcname]).start()
+        else:
+            return importer.addComictoDB(comicid, mismatch, None, imported, ogcname)
         if calledby == True or calledby == 'True':
            return
         elif calledby == 'web-import':
@@ -3760,7 +3763,7 @@ class WebInterface(object):
                                 'Volume':        comicinfo['Volume'],
                                 'filelisting':   files,
                                 'srid':          SRID}
-                    self.addbyid(comicinfo['ComicID'], calledby=True, imported=imported, ogcname=comicinfo['ComicName'])
+                    self.addbyid(comicinfo['ComicID'], calledby=True, imported=imported, ogcname=comicinfo['ComicName'], nothread=True)
 
                     #status update.
                     ctrlVal = {"ComicID":     comicinfo['ComicID']}
@@ -4032,48 +4035,64 @@ class WebInterface(object):
 
                 myDB.upsert("importresults", newVal, ctrlVal)
 
-                if len(search_matches) > 1:
-                    # if we matched on more than one series above, just save those results instead of the entire search result set.
-                    for sres in search_matches:
-                        cVal = {"SRID":        SRID,
-                                "comicid":     sres['comicid']}
-                        #should store ogcname in here somewhere to account for naming conversions above.
-                        nVal = {"Series":      ComicName,
-                                "results":     len(search_matches),
-                                "publisher":   sres['publisher'],
-                                "haveit":      sres['haveit'],
-                                "name":        sres['name'],
-                                "deck":        sres['deck'],
-                                "url":         sres['url'],
-                                "description":  sres['description'],
-                                "comicimage":  sres['comicimage'],
-                                "issues":      sres['issues'],
-                                "ogcname":     ogcname,
-                               "comicyear":   sres['comicyear']}
-                        myDB.upsert("searchresults", nVal, cVal)
+                if resultset == 0:
+                    if len(search_matches) > 1:
+                       # if we matched on more than one series above, just save those results instead of the entire search result set.
+                        for sres in search_matches:
+                            cVal = {"SRID":        SRID,
+                                    "comicid":     sres['comicid']}
+                            #should store ogcname in here somewhere to account for naming conversions above.
+                            nVal = {"Series":      ComicName,
+                                    "results":     len(search_matches),
+                                    "publisher":   sres['publisher'],
+                                    "haveit":      sres['haveit'],
+                                    "name":        sres['name'],
+                                    "deck":        sres['deck'],
+                                    "url":         sres['url'],
+                                    "description":  sres['description'],
+                                    "comicimage":  sres['comicimage'],
+                                    "issues":      sres['issues'],
+                                    "ogcname":     ogcname,
+                                    "comicyear":   sres['comicyear']}
+                            myDB.upsert("searchresults", nVal, cVal)
+                        logger.info('[IMPORT] There is more than one result that might be valid - normally this is due to the filename(s) not having enough information for me to use (ie. no volume label/year). Manual intervention is required.')
+                        #force the status here just in case
+                        newVal = {'SRID':     SRID,
+                                  'Status':   'Manual Intervention'}
+                        myDB.upsert("importresults", newVal, ctrlVal)
+
+                    elif len(sresults) > 1:
+                        # store the search results for series that returned more than one result for user to select later / when they want.
+                        # should probably assign some random numeric for an id to reference back at some point.
+                        for sres in sresults:
+                            cVal = {"SRID":        SRID,
+                                    "comicid":     sres['comicid']}
+                            #should store ogcname in here somewhere to account for naming conversions above.
+                            nVal = {"Series":      ComicName,
+                                    "results":     len(sresults),
+                                    "publisher":   sres['publisher'],
+                                    "haveit":      sres['haveit'],
+                                    "name":        sres['name'],
+                                    "deck":        sres['deck'],
+                                    "url":         sres['url'],
+                                    "description":  sres['description'],
+                                    "comicimage":  sres['comicimage'],
+                                    "issues":      sres['issues'],
+                                    "ogcname":     ogcname,
+                                    "comicyear":   sres['comicyear']}
+                            myDB.upsert("searchresults", nVal, cVal)
+                        logger.info('[IMPORT] There is more than one result that might be valid - normally this is due to the filename(s) not having enough information for me to use (ie. no volume label/year). Manual intervention is required.')
+                        #force the status here just in case
+                        newVal = {'SRID':     SRID,
+                                  'Status':   'Manual Intervention'}
+                        myDB.upsert("importresults", newVal, ctrlVal)
+                    else:
+                        logger.info('[IMPORT] Could not find any matching results against CV. Check the logs and perhaps rename the attempted file(s)')
+                        newVal = {'SRID':     SRID,
+                                  'Status':   'No Results'}
+                        myDB.upsert("importresults", newVal, ctrlVal)
 
                 else:
-                    # store the search results for series that returned more than one result for user to select later / when they want.
-                    # should probably assign some random numeric for an id to reference back at some point.
-                    for sres in sresults:
-                        cVal = {"SRID":        SRID,
-                                "comicid":     sres['comicid']}
-                        #should store ogcname in here somewhere to account for naming conversions above.
-                        nVal = {"Series":      ComicName,
-                                "results":     len(sresults),
-                                "publisher":   sres['publisher'],
-                                "haveit":      sres['haveit'],
-                                "name":        sres['name'],
-                                "deck":        sres['deck'],
-                                "url":         sres['url'],
-                                "description":  sres['description'],
-                                "comicimage":  sres['comicimage'],
-                                "issues":      sres['issues'],
-                                "ogcname":     ogcname,
-                               "comicyear":   sres['comicyear']}
-                        myDB.upsert("searchresults", nVal, cVal)
-
-                if resultset == 1:
                     logger.info('[IMPORT] Now adding %s...' % ComicName)
 
                     if volume is None or volume == 'None':
@@ -4095,17 +4114,10 @@ class WebInterface(object):
                                 'filelisting':   files,
                                 'srid':          SRID}
 
-                    self.addbyid(sr['comicid'], calledby=True, imported=imported, ogcname=ogcname)  #imported=yes)
-
-                else:
-                    logger.info('[IMPORT] There is more than one result that might be valid - normally this is due to the filename(s) not having enough information for me to use (ie. no volume label/year). Manual intervention is required.')
-                    #force the status here just in case
-                    newVal = {'SRID':     SRID,
-                              'Status':   'Manual Intervention'}
-                    myDB.upsert("importresults", newVal, ctrlVal)
+                    self.addbyid(sr['comicid'], calledby=True, imported=imported, ogcname=ogcname, nothread=True)
 
         mylar.IMPORTLOCK = False
-        logger.info('[IMPORT] Initial Import complete (I might still be populating the series data).')
+        logger.info('[IMPORT] Import completed.')
 
     preSearchit.exposed = True