-
Notifications
You must be signed in to change notification settings - Fork 0
/
remove-dupes.py
50 lines (33 loc) · 1.13 KB
/
remove-dupes.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
import os
import re
from lib.inputs import yesNo
from lib.files import traverse
# Absolute path to the directory you want to search
ROOT = r"C:\Users\[Users]\[pythonFiles]"
def removeDupes(path):
assert os.path.isdir(path)
files = [f for f in os.listdir(path) if os.path.isfile(os.path.join(path, f))]
dupFiles = []
for file in files:
position = re.search('[\w_\ ]+\d+\.\w+', file)
fileNameCut = re.sub(r'_*\s*\d+(?=.)', '', file)
if position is not None and fileNameCut in files:
dupFiles.append(file)
if len(dupFiles) == 0:
print("No duplicate files detected\n")
input("Press ENTER to exit")
return
print("---FILES---")
for file in dupFiles:
print(file)
if yesNo("Delete files (y/n): "):
for file in dupFiles:
os.remove(os.path.join(path, file))
print(f"Deleted {len(dupFiles)} files")
input("Press ENTER to exit")
def main():
assert os.path.isdir(ROOT)
sourceDir = traverse(ROOT, "Choose source directory (press ENTER to choose CWD): ")
removeDupes(sourceDir)
if __name__ == '__main__':
main()