# poser/data_loader.py

import os
import numpy as np
from sklearn.model_selection import train_test_split
from PIL import Image
from colorama import Fore, init

# Initialize colorama. autoreset=True makes colorama reset the colour/style
# after every print, so the Fore.* prefixes used below do not need an explicit
# reset and do not bleed into later output.
init(autoreset=True)

def resize_and_crop(img, target_size):
    """Scale ``img`` to cover ``target_size`` and center-crop it to that size.

    The image is resized with its aspect ratio preserved so that both of its
    dimensions are at least as large as the target. Whatever overflows along
    the longer axis is then trimmed equally from both sides.

    Args:
        img: A ``PIL.Image.Image``. It is not modified.
        target_size: ``(width, height)`` of the desired output, in pixels.

    Returns:
        A new image whose size is exactly ``target_size``.

    Raises:
        ValueError: If the image or the target has a non-positive dimension.
    """
    target_w, target_h = target_size
    width, height = img.size
    if width <= 0 or height <= 0:
        raise ValueError(f"Cannot resize an empty image of size {img.size}")
    if target_w <= 0 or target_h <= 0:
        raise ValueError(f"Invalid target size {target_size}")

    # Scale by the LARGER of the two ratios so the resized image covers the
    # whole target box. Fitting the image inside the box instead (as
    # Image.thumbnail does) leaves the shorter axis smaller than the target,
    # and the crop below would then reach outside the image.
    scale = max(target_w / width, target_h / height)

    # max() guards against float rounding leaving a dimension one pixel short.
    new_w = max(target_w, round(width * scale))
    new_h = max(target_h, round(height * scale))

    # resize() returns a new image, so the caller's image is left untouched.
    resized = img.resize((new_w, new_h), Image.LANCZOS)

    # Center the crop window inside the (possibly larger) resized image.
    left = (new_w - target_w) // 2
    top = (new_h - target_h) // 2
    return resized.crop((left, top, left + target_w, top + target_h))

def _load_class_images(class_dir, img_size):
    """Load every regular file in ``class_dir`` as an RGB array of ``img_size``."""
    arrays = []
    # os.listdir returns entries in arbitrary order; sorting keeps the sample
    # order, and therefore the seeded train/validation split, reproducible.
    for img_name in sorted(os.listdir(class_dir)):
        img_path = os.path.join(class_dir, img_name)
        # Nested directories cannot be opened as images; skip them.
        if not os.path.isfile(img_path):
            continue
        # The context manager closes the underlying file handle promptly, so
        # large datasets do not exhaust the process's open-file limit.
        with Image.open(img_path) as raw:
            img = resize_and_crop(raw.convert('RGB'), img_size)
            arrays.append(np.array(img))
    return arrays


def load_datasets(dataset_path, img_size=(224, 224)):
    """Load the good/bad posture images and split them into train/validation.

    Images are read from the ``good`` and ``bad`` subdirectories of
    ``dataset_path``, converted to RGB, resized/cropped to ``img_size`` and
    scaled to the ``[0, 1]`` range as ``float32``. Good posture is labelled
    ``1`` and bad posture ``0``.

    Args:
        dataset_path: Directory containing the ``good`` and ``bad`` folders.
        img_size: ``(width, height)`` every image is resized/cropped to.

    Returns:
        A tuple ``(train_data, train_labels, val_data, val_labels)`` produced
        by an 80/20 split with a fixed random seed.
    """
    good_path = os.path.join(dataset_path, 'good')
    bad_path = os.path.join(dataset_path, 'bad')

    good_arrays = _load_class_images(good_path, img_size)
    bad_arrays = _load_class_images(bad_path, img_size)

    # Good samples first, then bad, with labels built to match that order.
    X = np.array(good_arrays + bad_arrays)
    y = np.array([1] * len(good_arrays) + [0] * len(bad_arrays))

    # Normalize pixel values to be between 0 and 1
    X = X.astype('float32') / 255.0

    # Counts reflect the samples actually loaded, not the raw directory listing.
    print(Fore.CYAN + f"Total number of samples: {len(X)}")
    print(Fore.CYAN + f"Number of good posture samples: {len(good_arrays)}")
    print(Fore.CYAN + f"Number of bad posture samples: {len(bad_arrays)}")
    print(Fore.CYAN + f"Shape of X: {X.shape}")
    print(Fore.CYAN + f"Shape of y: {y.shape}")

    # Split the data into training and validation sets
    train_data, val_data, train_labels, val_labels = train_test_split(
        X, y, test_size=0.2, random_state=42
    )

    print(Fore.CYAN + f"Shape of train_data: {train_data.shape}")
    print(Fore.CYAN + f"Shape of train_labels: {train_labels.shape}")
    print(Fore.CYAN + f"Shape of val_data: {val_data.shape}")
    print(Fore.CYAN + f"Shape of val_labels: {val_labels.shape}")

    return train_data, train_labels, val_data, val_labels