bugfix pre-release 0.4.8

2019-11-06 12:49:54 +01:00
parent 4f63e62690
commit a89ac93c3d
5 changed files with 99 additions and 30 deletions
--- a/libs/libgoogle.py
+++ b/libs/libgoogle.py
@@ -22,9 +22,12 @@ def search_pdf(search, args):
            urls.append(url)

    except urllib.error.HTTPError as e:
-        print('Error: %s' % e)
-        return -1
+        #print('Error: %s' % e)
+        return False,e
+
+    except urllib.error.URLError as e:
+        return False,e


-    return urls
+    return True,urls

--- a/libs/libhelper.py
+++ b/libs/libhelper.py
@@ -2,6 +2,14 @@ import os
 import sys
 from Crypto.Hash import SHA256

+def check_file_size(filename):
+    ''' Return True if the file's size is greater than 0 bytes, else False.
+    '''
+    fstat = os.stat(filename)
+    if fstat.st_size == 0:
+        return False
+    return True
+
 def make_directory(outdir):
    ''' naive mkdir function '''
    try:
@@ -27,11 +35,21 @@ def find_name(pdf):
 		i would not be surprised this naive approach can lead to fuckups
 	'''

+    name = ''
    # find the name of the file
-    name = pdf.split("/")
-    a = len(name)
-    name = name[a - 1]
-    # print(name)
+    # 
+    name_list = pdf.split("/")
+    len_list = len(name)
+    # ugly magic ;-)  NOTE(review): len_list is len(name) with name == '', i.e.
+    # 0, so the indices below are -1 and -2; len(name_list) was probably meant.
+    # Files can also sit behind URLs that end in a slash, e.g. http://host/pdf/
+    # Splitting such a URL on "/" leaves an empty last item, so always taking
+    # the last item would give an empty name; in that case we step back one
+    # item in the list and use that as the name.
+    if name_list[len_list - 1] == '':
+        name = name_list[len_list - 2]
+    else:
+        name = name_list[len_list - 1]

    return name