2018-09-27 20:24:09 +00:00
|
|
|
#!/usr/bin/env python
|
2019-10-23 20:10:03 +00:00
|
|
|
import PySimpleGUI as sg
|
2018-07-25 10:40:14 +00:00
|
|
|
import hashlib
|
|
|
|
import os
|
|
|
|
|
2019-10-23 20:10:03 +00:00
|
|
|
'''
|
|
|
|
Find dups with PySimpleGUI
|
|
|
|
'''
|
2018-07-25 10:40:14 +00:00
|
|
|
|
|
|
|
# ====____====____==== FUNCTION DeDuplicate_folder(path) ====____====____==== #
|
|
|
|
# Function to de-duplicate the folder passed in #
|
|
|
|
# --------------------------------------------------------------------------- #
|
|
|
|
def FindDuplicatesFilesInFolder(path):
|
|
|
|
shatab = []
|
2019-10-23 20:10:03 +00:00
|
|
|
total, small_count, dup_count, error_count = [0]*4
|
2018-07-25 10:40:14 +00:00
|
|
|
pngdir = path
|
|
|
|
if not os.path.exists(path):
|
2019-10-23 20:10:03 +00:00
|
|
|
sg.popup('Duplicate Finder', '** Folder doesn\'t exist***', path)
|
2018-07-25 10:40:14 +00:00
|
|
|
return
|
|
|
|
pngfiles = os.listdir(pngdir)
|
|
|
|
total_files = len(pngfiles)
|
2019-10-23 20:10:03 +00:00
|
|
|
|
2018-07-25 10:40:14 +00:00
|
|
|
for idx, f in enumerate(pngfiles):
|
2019-10-23 20:10:03 +00:00
|
|
|
if not sg.one_line_progress_meter('Counting Duplicates',
|
|
|
|
idx + 1,
|
|
|
|
total_files,
|
|
|
|
'Counting Duplicate Files'):
|
2018-07-25 10:40:14 +00:00
|
|
|
break
|
|
|
|
total += 1
|
|
|
|
fname = os.path.join(pngdir, f)
|
|
|
|
if os.path.isdir(fname):
|
|
|
|
continue
|
|
|
|
x = open(fname, "rb").read()
|
|
|
|
|
|
|
|
m = hashlib.sha256()
|
|
|
|
m.update(x)
|
|
|
|
f_sha = m.digest()
|
|
|
|
if f_sha in shatab:
|
|
|
|
# uncomment next line to remove duplicate files
|
|
|
|
# os.remove(fname)
|
|
|
|
dup_count += 1
|
|
|
|
# sg.Print(f'Duplicate file - {f}') # cannot current use sg.Print with Progress Meter
|
|
|
|
continue
|
|
|
|
shatab.append(f_sha)
|
|
|
|
|
2019-10-23 20:10:03 +00:00
|
|
|
msg = '{} Files processed\n {} Duplicates found'.format(
|
|
|
|
total_files, dup_count)
|
|
|
|
sg.popup('Duplicate Finder Ended', msg)
|
|
|
|
|
2018-07-25 10:40:14 +00:00
|
|
|
|
|
|
|
# ====____====____==== Pseudo-MAIN program ====____====____==== #
|
|
|
|
# This is our main-alike piece of code #
|
|
|
|
# + Starts up the GUI #
|
|
|
|
# + Gets values from GUI #
|
|
|
|
# + Runs DeDupe_folder based on GUI inputs #
|
|
|
|
# ------------------------------------------------------------- #
|
|
|
|
if __name__ == '__main__':
|
|
|
|
|
|
|
|
source_folder = None
|
2019-10-23 20:10:03 +00:00
|
|
|
source_folder = sg.popup_get_folder(
|
|
|
|
'Duplicate Finder - Count number of duplicate files', 'Enter path to folder you wish to find duplicates in')
|
2018-10-29 00:01:03 +00:00
|
|
|
if source_folder is not None:
|
2018-07-25 10:40:14 +00:00
|
|
|
FindDuplicatesFilesInFolder(source_folder)
|
|
|
|
else:
|
2019-10-23 20:10:03 +00:00
|
|
|
sg.popup_cancel('Cancelling', '*** Cancelling ***')
|
2018-07-25 10:40:14 +00:00
|
|
|
exit(0)
|