Updated and verified code to change the result message

There is now a new type of result: duplicate files. These are files that already exist in the destination folder and are therefore not imported when importing duplicates is disabled. I have thoroughly verified that my changes do not cause any other part of the code to break or act in an unexpected manner. I have also removed some code that could never be used. In elodie/localstorage.py, checksum() could never return None; the final `return None` was not reachable because of an earlier return. Because of this, in elodie/filesystem.py, process_checksum() did not need to check whether the checksum was None after calculating it. This is what allowed my new code to use None as a flag meaning that the file being imported and skipped is a duplicate file.
D3Zyre · Oct 13, 2023 · 651c373 · D3Zyre · Oct 13, 2023 · D3Zyre
1 parent a620e70
commit 651c373
Show file tree

Hide file tree

Showing 3 changed files with 19 additions and 5 deletions.
diff --git a/elodie/filesystem.py b/elodie/filesystem.py
@@ -487,9 +487,6 @@ def parse_mask_for_location(self, mask, location_parts, place_name):
     def process_checksum(self, _file, allow_duplicate):
         db = Db()
         checksum = db.checksum(_file)
-        if(checksum is None):
-            log.info('Could not get checksum for %s.' % _file)
-            return None
 
         # If duplicates are not allowed then we check if we've seen this file
         #  before via checksum. We also check that the file exists at the

diff --git a/elodie/localstorage.py b/elodie/localstorage.py
@@ -127,7 +127,6 @@ def checksum(self, file_path, blocksize=65536):
                 hasher.update(buf)
                 buf = f.read(blocksize)
             return hasher.hexdigest()
-        return None
 
     def get_hash(self, key):
         """Get the hash value for a given key.

diff --git a/elodie/result.py b/elodie/result.py
@@ -8,17 +8,24 @@ def __init__(self):
         self.success = 0
         self.error = 0
         self.error_items = []
+        self.duplicate = 0
+        self.duplicate_items = []
 
     def append(self, row):
         id, status = row
 
-        if status:
+        # status can only be True, False, or None
+        if status is True:
             self.success += 1
+        elif status is None: # status is only ever None if file checksum matched an existing file checksum and is therefore a duplicate file
+            self.duplicate += 1
+            self.duplicate_items.append(id)
         else:
             self.error += 1
             self.error_items.append(id)
 
     def write(self):
+        print("\n")
         if self.error > 0:
             error_headers = ["File"]
             error_result = []
@@ -29,10 +36,21 @@ def write(self):
             print(tabulate(error_result, headers=error_headers))
             print("\n")
 
+        if self.duplicate > 0:
+            duplicate_headers = ["File"]
+            duplicate_result = []
+            for id in self.duplicate_items:
+                duplicate_result.append([id])
+
+            print("****** DUPLICATE (NOT IMPORTED) DETAILS ******")
+            print(tabulate(duplicate_result, headers=duplicate_headers))
+            print("\n")
+
         headers = ["Metric", "Count"]
         result = [
                     ["Success", self.success],
                     ["Error", self.error],
+                    ["Duplicate, not imported", self.duplicate]
                  ]
 
         print("****** SUMMARY ******")