-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathdata_provider.py
150 lines (103 loc) · 5.18 KB
/
data_provider.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
from config import *
from sklearn.model_selection import train_test_split
#==========================================================================================
# Collect every (image, label) PNG pair from the per-series dataset folders.
# Each series directory is expected to contain an "images" and a "labels"
# subfolder; a label file shares its basename with its image.
series_dirs = [
    entry for entry in os.listdir(DATASET_DIR)
    if os.path.isdir(os.path.join(DATASET_DIR, entry))
]
image_paths = []
label_paths = []
for series in series_dirs:
    images_dir = os.path.join(DATASET_DIR, series, "images")
    labels_dir = os.path.join(DATASET_DIR, series, "labels")
    found_images = glob.glob(os.path.join(images_dir, '*.png'))
    image_paths.extend(found_images)
    label_paths.extend(
        os.path.join(labels_dir, os.path.splitext(os.path.basename(p))[0] + '.png')
        for p in found_images
    )
print("Number of images:", len(image_paths))
print("Number of labels:", len(label_paths))
#==========================================================================================
# Target (height, width) used when resizing both images and labels below.
IMAGE_SIZE = (INPUT_HEIGHT, INPUT_WIDTH)
def convert_rgb_to_class(rgb_label):
    """Convert an RGB-encoded label image into a 2-D tensor of class indices.

    Args:
        rgb_label: (H, W, 3) tensor whose pixel colors match entries of
            COLOR_MAP. Pixels matching no entry stay at class 0.

    Returns:
        (H, W) int32 tensor of class indices, in COLOR_MAP key order.
    """
    int_label = tf.zeros((rgb_label.shape[0], rgb_label.shape[1]), dtype=tf.int32)
    # enumerate replaces the original's per-iteration
    # list(COLOR_MAP.keys()).index(class_name), an O(n) lookup inside the loop.
    # NOTE(review): this treats each COLOR_MAP value as a single color, while
    # _one_hot_encode iterates it as a list of colors — confirm which layout
    # COLOR_MAP actually uses.
    for class_idx, color in enumerate(COLOR_MAP.values()):
        mask = tf.reduce_all(tf.equal(rgb_label, color), axis=-1)
        int_label = tf.where(mask, class_idx, int_label)
    return int_label
# ball, Class number: 0
# field, Class number: 1
# line, Class number: 2
# background, Class number: 3
def _one_hot_encode(x: tf.Tensor, y: tf.Tensor) -> tuple:
    """One-hot encode an RGB label tensor against COLOR_MAP.

    A pixel activates a class channel when it equals *any* of the colors
    listed for that class in COLOR_MAP.

    Args:
        x: input image tensor, passed through unchanged.
        y: RGB label tensor to encode.

    Returns:
        Tuple of (x unchanged, float32 one-hot label with one channel per
        COLOR_MAP class stacked on the last axis).
    """
    # NOTE(review): the original annotated the return type as tf.Tensor but
    # returns a tuple; fixed to `tuple` here. Also note this helper iterates
    # COLOR_MAP[class_name] as a list of colors, unlike convert_rgb_to_class —
    # confirm which COLOR_MAP layout is current.
    one_hot_map = []
    for class_name in COLOR_MAP:
        matches = [
            tf.reduce_all(tf.equal(y, color), axis=-1)
            for color in COLOR_MAP[class_name]
        ]
        any_match = tf.reduce_any(matches, axis=0)
        one_hot_map.append(tf.cast(any_match, tf.float32))
    one_hot_map = tf.stack(one_hot_map, axis=-1)
    y = tf.cast(one_hot_map, tf.float32)
    return x, y
def load_and_preprocess_data(image_path, label_path):
    """Read one image/label PNG pair and prepare it for training.

    Decodes both files, resizes them to IMAGE_SIZE (nearest-neighbor for the
    label so class colors stay exact), scales the image into [0, 1], and
    one-hot encodes the label via convert_rgb_to_class.

    Returns:
        (image, label): float32 image in [0, 1] and a one-hot label with
        NUMBER_OF_CLASSES channels.
    """
    raw_image = tf.io.read_file(image_path)
    raw_label = tf.io.read_file(label_path)

    image = tf.cast(tf.image.decode_png(raw_image, channels=3), tf.float32)
    label = tf.cast(tf.image.decode_png(raw_label, channels=3), tf.float32)

    image = tf.image.resize(image, IMAGE_SIZE) / 255.0
    label = tf.image.resize(label, IMAGE_SIZE,
                            method=tf.image.ResizeMethod.NEAREST_NEIGHBOR)

    label = tf.one_hot(convert_rgb_to_class(label), depth=NUMBER_OF_CLASSES)
    return image, label
def data_augmentation(image, label):
    """Apply random flips and color jitter to one training pair.

    Geometric flips are applied identically to image and label so they stay
    aligned; color jitter (saturation, brightness, contrast) touches the
    image only.

    Note: images arrive normalized to [0, 1] (see load_and_preprocess_data),
    so values are clipped to [0, 1] *after* the jitter. The original clipped
    to [0, 255] before the color ops — a no-op for normalized input that left
    the jittered values unclipped.
    """
    if tf.random.uniform([]) > 0.5:
        image = tf.image.flip_left_right(image)
        label = tf.image.flip_left_right(label)
    if tf.random.uniform([]) > 0.5:
        image = tf.image.flip_up_down(image)
        label = tf.image.flip_up_down(label)
    image = tf.image.random_saturation(image, lower=0.8, upper=1.2)
    image = tf.image.random_brightness(image, max_delta=0.05)
    image = tf.image.random_contrast(image, lower=0.7, upper=1.3)
    # Bring out-of-range jittered values back into the valid normalized range.
    image = tf.clip_by_value(image, 0.0, 1.0)
    return image, label
def display_something(dataset, num_samples=5):
    """Show a few (image, label) pairs from the dataset using OpenCV windows.

    Builds a BGR color lookup table from COLOR_MAP, then displays element 1
    of each of the first `num_samples` dataset entries; press any key to
    advance. NOTE(review): indexing `image[1]` presumably picks the second
    element of a batch, so this assumes a batched dataset with batch size
    >= 2 — confirm against callers.
    """
    # Per-class BGR colors indexed by class id (COLOR_MAP stores RGB triples).
    color_lookup_bgr = np.array(
        [[color[2], color[1], color[0]] for color in COLOR_MAP.values()],
        dtype=np.uint8,
    )
    for i, (image, label) in enumerate(dataset.take(num_samples)):
        image_np = image[1].numpy()
        label_np = label[1].numpy()
        # One-hot labels carry a trailing class axis; collapse it to indices.
        label_indices = (
            np.argmax(label_np, axis=-1) if label_np.ndim > 2 else label_np
        )
        colored_label = color_lookup_bgr[label_indices]
        image_np = cv2.cvtColor(image_np, cv2.COLOR_BGR2RGB)
        cv2.imshow(f'Image {i + 1}', image_np)
        cv2.imshow(f'Label {i + 1}', colored_label)
        cv2.waitKey(0)
    cv2.destroyAllWindows()
def getData():
    """Build the train/test tf.data pipelines from the collected file lists.

    Splits the module-level image/label path lists 85/15 (fixed seed so the
    split is reproducible), maps decoding + preprocessing onto both
    pipelines, applies augmentation and shuffling to the training one only,
    then batches, prefetches, and repeats each pipeline 5 times.

    Returns:
        (train_dataset, test_dataset) as tf.data.Dataset objects.
    """
    train_images, test_images, train_labels, test_labels = train_test_split(
        image_paths, label_paths, test_size=0.15, random_state=42
    )

    autotune = tf.data.experimental.AUTOTUNE

    train_dataset = (
        tf.data.Dataset.from_tensor_slices((train_images, train_labels))
        .map(load_and_preprocess_data, num_parallel_calls=autotune)
        .map(data_augmentation, num_parallel_calls=autotune)
        .shuffle(buffer_size=64)
        .batch(BATCH_SIZE)
        .prefetch(buffer_size=autotune)
        .repeat(5)
    )

    test_dataset = (
        tf.data.Dataset.from_tensor_slices((test_images, test_labels))
        .map(load_and_preprocess_data, num_parallel_calls=autotune)
        .batch(BATCH_SIZE)
        .prefetch(buffer_size=autotune)
        .repeat(5)
    )

    # display_something(train_dataset)
    return train_dataset, test_dataset