🐛 file does not exist

hang-1n-there · hang-1n-there · commit 8a41dc14358f · 2023-11-14T02:06:34.000+09:00
diff --git a/image_split.py b/image_split.py
@@ -1,6 +1,7 @@
 import os
 import shutil
 from tqdm import tqdm
+
 def split_data():
     # 원본 데이터셋 폴더와 저장할 폴더 지정
     original_dataset_folder = 'C:/cv_project/Recycling_trash/Separate_Collection/trash_dataset'
@@ -11,29 +12,28 @@ def split_data():
         os.makedirs(train_folder)
 
     # 각 batch 폴더를 돌면서 파일을 읽어와 train 폴더에 저장
-    index = 0
+    start_index = 0
     for batch_folder in tqdm(os.listdir(original_dataset_folder), desc="Processing batches"):
-        batch_folder_name = f'batch_{batch_folder}'
-        batch_folder_path = os.path.join(original_dataset_folder, batch_folder_name)
+        batch_folder_path = os.path.join(original_dataset_folder, batch_folder)
 
         # batch 폴더가 존재하는지 확인
-        if os.path.exists(batch_folder_path):
+        if os.path.isdir(batch_folder_path):
             # batch 폴더 안에 있는 파일들을 정렬
             file_list = sorted(os.listdir(batch_folder_path))
 
             # train 폴더에 파일을 복사하면서 이름을 변경
             for i, file_name in enumerate(file_list):
                 # 숫자 부분을 4자리로 맞추고 0을 추가
+                index = start_index + i
                 padded_number = f"{index:04d}" if index < 1000 else str(index)
                 new_file_name = f"{padded_number}.jpg"
 
                 source_path = os.path.join(batch_folder_path, file_name)
                 destination_path = os.path.join(train_folder, new_file_name)
                 shutil.copyfile(source_path, destination_path)
 
-                # 다음 batch 폴더에서 시작할 인덱스 업데이트
-                index += i
-
+            # 다음 batch 폴더에서 시작할 인덱스 업데이트
+            start_index += len(file_list)
 
 if __name__ == '__main__':
     split_data()