-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathsplit.py
More file actions
66 lines (49 loc) · 1.68 KB
/
Copy pathsplit.py
File metadata and controls
66 lines (49 loc) · 1.68 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
import os
import random
import shutil
# ---------------- CONFIG ---------------- #
SOURCE_DIR = "mobilenet_data"
TARGET_DIR = "dataset"
TRAIN_RATIO = 0.8 # 80% train, 20% val
RANDOM_SEED = 42 # reproducibility
# ---------------------------------------- #
def split_train_val():
random.seed(RANDOM_SEED)
classes = [
d for d in os.listdir(SOURCE_DIR)
if os.path.isdir(os.path.join(SOURCE_DIR, d))
]
if not classes:
raise RuntimeError("No class folders found. Check SOURCE_DIR.")
for split in ["train", "val"]:
for cls in classes:
os.makedirs(os.path.join(TARGET_DIR, split, cls), exist_ok=True)
for cls in classes:
cls_path = os.path.join(SOURCE_DIR, cls)
images = [
f for f in os.listdir(cls_path)
if f.lower().endswith((".jpg", ".jpeg", ".png"))
]
if len(images) < 5:
print(f"⚠️ Very few samples in class '{cls}'")
random.shuffle(images)
split_idx = int(len(images) * TRAIN_RATIO)
train_imgs = images[:split_idx]
val_imgs = images[split_idx:]
for img in train_imgs:
shutil.copy2(
os.path.join(cls_path, img),
os.path.join(TARGET_DIR, "train", cls, img)
)
for img in val_imgs:
shutil.copy2(
os.path.join(cls_path, img),
os.path.join(TARGET_DIR, "val", cls, img)
)
print(
f"Class '{cls}': "
f"{len(train_imgs)} train | {len(val_imgs)} val"
)
print("\n✅ Train/Val split completed successfully.")
if __name__ == "__main__":
split_train_val()