FelixChan9527
diff --git a/‎ML/Kaggles/DiabeticRetinopathy/config.py‎
Lines changed: 48 additions & 0 deletions b/‎ML/Kaggles/DiabeticRetinopathy/config.py‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎ML/Kaggles/DiabeticRetinopathy/dataset.py‎
Lines changed: 56 additions & 0 deletions b/‎ML/Kaggles/DiabeticRetinopathy/dataset.py‎
Lines changed: 56 additions & 0 deletions
diff --git a/‎ML/Kaggles/DiabeticRetinopathy/preprocess_images.py‎
Lines changed: 82 additions & 0 deletions b/‎ML/Kaggles/DiabeticRetinopathy/preprocess_images.py‎
Lines changed: 82 additions & 0 deletions
diff --git a/‎ML/Kaggles/DiabeticRetinopathy/train.py‎
Lines changed: 125 additions & 0 deletions b/‎ML/Kaggles/DiabeticRetinopathy/train.py‎
Lines changed: 125 additions & 0 deletions
@@ -0,0 +1,48 @@
+import torch
+import albumentations as A
+from albumentations.pytorch import ToTensorV2
+
# --- Runtime / data loading -------------------------------------------------
# Use the GPU whenever torch reports one, otherwise stay on the CPU.
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
NUM_WORKERS = 6
PIN_MEMORY = True

# --- Optimisation hyper-parameters ------------------------------------------
LEARNING_RATE = 3e-5
WEIGHT_DECAY = 5e-4
BATCH_SIZE = 20
NUM_EPOCHS = 100

# --- Checkpointing ----------------------------------------------------------
CHECKPOINT_FILE = "b3.pth.tar"
SAVE_MODEL = True
LOAD_MODEL = True
+
# Per-channel normalisation statistics used by both pipelines below
# (presumably measured on the training images -- TODO confirm).
_NORM_MEAN = [0.3199, 0.2240, 0.1609]
_NORM_STD = [0.3020, 0.2183, 0.1741]


def _normalize_and_tensorize():
    """Build the Normalize + ToTensorV2 tail shared by every pipeline.

    New transform objects are created on each call so the train and
    validation pipelines never share instances.
    """
    return [
        A.Normalize(
            mean=list(_NORM_MEAN),
            std=list(_NORM_STD),
            max_pixel_value=255.0,
        ),
        ToTensorV2(),
    ]


# Data augmentation for images: resize slightly larger than the target,
# take a random 728x728 crop, then apply random flips / rotations and
# photometric perturbations before normalising.
# NOTE(review): A.IAAAffine is deprecated in newer albumentations releases
# in favour of A.Affine -- confirm against the installed version.
_train_augmentations = [
    A.Resize(height=760, width=760),
    A.RandomCrop(height=728, width=728),
    A.HorizontalFlip(p=0.5),
    A.VerticalFlip(p=0.5),
    A.RandomRotate90(p=0.5),
    A.Blur(p=0.3),
    A.CLAHE(p=0.3),
    A.ColorJitter(p=0.3),
    A.CoarseDropout(max_holes=12, max_height=20, max_width=20, p=0.3),
    A.IAAAffine(shear=30, rotate=0, p=0.2, mode="constant"),
]
train_transforms = A.Compose(_train_augmentations + _normalize_and_tensorize())

# Validation pipeline: deterministic resize to 728x728 followed by the same
# normalisation as training.
val_transforms = A.Compose(
    [A.Resize(height=728, width=728)] + _normalize_and_tensorize()
)
@@ -0,0 +1,56 @@
+import config
+import os
+import pandas as pd
+import numpy as np
+from torch.utils.data import Dataset, DataLoader
+from PIL import Image
+from tqdm import tqdm
+
+
class DRDataset(Dataset):
    """Image dataset backed by a folder of ``.jpeg`` files.

    In training mode (``train=True``) samples are taken row by row from the
    CSV at ``path_to_csv``; each row is unpacked as ``(image name, label)``,
    so the CSV is expected to have exactly two columns. In test mode every
    ``.jpeg`` file found in ``images_folder`` is served with the placeholder
    label ``-1`` so the same class can be reused for the submission.

    Args:
        images_folder: Directory containing the ``.jpeg`` images.
        path_to_csv: CSV file read with pandas (read in both modes, only
            used for lookups in training mode).
        train: Selects CSV-driven (True) or folder-driven (False) indexing.
        transform: Optional callable invoked as ``transform(image=array)``
            and expected to return a mapping with an ``"image"`` entry.
    """

    _IMAGE_EXT = ".jpeg"

    def __init__(self, images_folder, path_to_csv, train=True, transform=None):
        super().__init__()
        self.data = pd.read_csv(path_to_csv)
        self.images_folder = images_folder
        # Sorted so test-mode indexing is reproducible across runs and
        # platforms; restricted to .jpeg because __getitem__ always opens
        # "<name>.jpeg", so stray files (labels, thumbnails, ...) would crash.
        self.image_files = sorted(
            name
            for name in os.listdir(images_folder)
            if name.endswith(self._IMAGE_EXT)
        )
        self.transform = transform
        self.train = train

    def __len__(self):
        return len(self.data) if self.train else len(self.image_files)

    def __getitem__(self, index):
        """Return ``(image, label, image name without extension)``."""
        if self.train:
            image_file, label = self.data.iloc[index]
        else:
            # No ground truth for the test set: -1 is a placeholder label.
            image_file, label = self.image_files[index], -1

        # Strip the extension only when it is a true suffix, so a name that
        # merely contains ".jpeg" somewhere in the middle is left intact.
        if image_file.endswith(self._IMAGE_EXT):
            image_file = image_file[: -len(self._IMAGE_EXT)]

        image_path = os.path.join(self.images_folder, image_file + self._IMAGE_EXT)
        # The context manager releases the file handle promptly; converting
        # to RGB guarantees three channels for the 3-channel normalisation.
        with Image.open(image_path) as pil_image:
            image = np.array(pil_image.convert("RGB"))

        if self.transform:
            image = self.transform(image=image)["image"]

        return image, label, image_file
+
+
if __name__ == "__main__":
    # Smoke test: build the dataset and a loader, print the tensor shapes of
    # the first batch, then stop.
    import sys

    smoke_dataset = DRDataset(
        "../train/images_resized_650/",
        "../train/trainLabels.csv",
        transform=config.val_transforms,
    )
    smoke_loader = DataLoader(
        smoke_dataset,
        batch_size=32,
        shuffle=True,
        num_workers=2,
        pin_memory=True,
    )

    for images, labels, _names in tqdm(smoke_loader):
        print(images.shape)
        print(labels.shape)
        # One batch is enough to confirm the pipeline works.
        sys.exit()
@@ -0,0 +1,82 @@
+"""
+Tries to remove unnecessary black borders around the images, and
+"trim" the images so they take up the entirety of the image.
+It's hacky & not very nice but it works :))
+"""
+
+import os
+import numpy as np
+from PIL import Image
+import warnings
+from multiprocessing import Pool
+from tqdm import tqdm
+import cv2
+
+
def trim(im, percentage=0.02):
    """Crop away the dark border surrounding the bright content of an image.

    The image is converted to grayscale and thresholded at 10% of the mean
    of its non-zero pixels. A row (column) counts as content when more than
    ``percentage`` of its pixels are above that threshold; the crop spans
    from the first to the last content row and column, inclusive.

    Args:
        im: Image convertible with ``np.array`` (e.g. a PIL image), either
            single-channel or with colour channels in RGB order.
        percentage: Fraction of a row's/column's pixels that must exceed the
            threshold for that row/column to be kept.

    Returns:
        A PIL image with the cropped pixels. If nothing passes the threshold
        (for example a completely black image) the image is returned
        uncropped instead of raising.
    """
    img = np.array(im)
    if img.ndim == 2:
        # Already single-channel: nothing to convert.
        img_gray = img
    else:
        # Arrays built from PIL images are RGB, so use the RGB conversion
        # code (the BGR one would swap the red and blue weights).
        img_gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)

    non_black = img_gray[img_gray != 0]
    if non_black.size == 0:
        # All-black image: there is no content to crop against.
        return Image.fromarray(img)

    bright = img_gray > 0.1 * np.mean(non_black)
    row_sums = np.sum(bright, axis=1)
    col_sums = np.sum(bright, axis=0)
    rows = np.where(row_sums > img.shape[1] * percentage)[0]
    cols = np.where(col_sums > img.shape[0] * percentage)[0]
    if rows.size == 0 or cols.size == 0:
        # No row/column is bright enough; keep the image as it is.
        return Image.fromarray(img)

    # np.where returns indices in ascending order, so the ends are min/max.
    min_row, max_row = rows[0], rows[-1]
    min_col, max_col = cols[0], cols[-1]
    im_crop = img[min_row : max_row + 1, min_col : max_col + 1]
    return Image.fromarray(im_crop)
+
+
def resize_maintain_aspect(image, desired_size):
    """Scale an image to fit a square canvas, padding to keep its aspect ratio.

    The longer side is scaled to ``desired_size`` and the shorter side by the
    same factor; the result is pasted centred onto a new
    ``desired_size`` x ``desired_size`` RGB canvas.

    Args:
        image: PIL image to resize.
        desired_size: Side length, in pixels, of the square output.

    Returns:
        A new RGB PIL image of size ``(desired_size, desired_size)``.
    """
    desired_size = int(desired_size)
    old_size = image.size  # PIL reports (width, height)
    longest_side = max(old_size)
    # Exact integer arithmetic avoids float round-off (which could make the
    # long side come out one pixel short); clamping to 1 keeps very
    # elongated images from collapsing to a zero-sized dimension.
    new_size = tuple(max(1, side * desired_size // longest_side) for side in old_size)
    # Image.ANTIALIAS was removed in Pillow 10; LANCZOS is the same filter.
    resized = image.resize(new_size, Image.LANCZOS)
    canvas = Image.new("RGB", (desired_size, desired_size))
    offset = (
        (desired_size - new_size[0]) // 2,
        (desired_size - new_size[1]) // 2,
    )
    canvas.paste(resized, offset)
    return canvas
+
+
def save_single(args):
    """Trim, resize and save one image.

    Takes a single tuple so it can be dispatched through ``Pool.imap*``.

    Args:
        args: ``(img_file, input_path_folder, output_path_folder,
            output_size)`` where ``output_size`` is either an int or a
            sequence whose first element is the side length of the square
            output.
    """
    img_file, input_path_folder, output_path_folder, output_size = args
    # Accept both output_size=150 and output_size=(150, 150).
    side = output_size if isinstance(output_size, int) else output_size[0]

    # Close the source file as soon as the pixel data has been extracted.
    with Image.open(os.path.join(input_path_folder, img_file)) as image_original:
        image = trim(image_original)

    image = resize_maintain_aspect(image, desired_size=side)
    # Join folder and file name as separate components so the output folder
    # does not need a trailing path separator.
    image.save(os.path.join(output_path_folder, img_file))
+
+
def fast_image_resize(input_path_folder, output_path_folder, output_size=None):
    """Preprocess every file in a folder in parallel with a process pool.

    Each regular file in ``input_path_folder`` is handed to ``save_single``,
    which writes the result under the same name to ``output_path_folder``
    (created if missing).

    Args:
        input_path_folder: Directory holding the source images.
        output_path_folder: Directory receiving the processed images.
        output_size: Required. Side length as an int, or a sequence whose
            first element is the side length.

    Raises:
        ValueError: If ``output_size`` is missing or falsy.
    """
    if not output_size:
        raise ValueError("Need to specify output_size! For example: output_size=100")
    if isinstance(output_size, int):
        # Workers index into output_size, so always hand them a pair.
        output_size = (output_size, output_size)

    # exist_ok avoids the check-then-create race of a separate exists() test.
    os.makedirs(output_path_folder, exist_ok=True)

    jobs = [
        (file, input_path_folder, output_path_folder, output_size)
        for file in os.listdir(input_path_folder)
        # Sub-directories cannot be opened as images; skip them.
        if os.path.isfile(os.path.join(input_path_folder, file))
    ]
    if not jobs:
        return

    with Pool() as p:
        # Drain the iterator so every job runs; tqdm shows overall progress.
        list(tqdm(p.imap_unordered(save_single, jobs), total=len(jobs)))
+
+
if __name__ == "__main__":
    # Preprocess the train split first, then the test split, to 150x150.
    for source_dir, target_dir in (
        ("../train/images/", "../train/images_resized_150/"),
        ("../test/images/", "../test/images_resized_150/"),
    ):
        fast_image_resize(source_dir, target_dir, output_size=(150, 150))
@@ -0,0 +1,125 @@
+import torch
+from torch import nn, optim
+import os
+import config
+from torch.utils.data import DataLoader
+from tqdm import tqdm
+from sklearn.metrics import cohen_kappa_score
+from efficientnet_pytorch import EfficientNet
+from dataset import DRDataset
+from torchvision.utils import save_image
+from utils import (
+ load_checkpoint,
+ save_checkpoint,
+ check_accuracy,
+ make_prediction,
+ get_csv_for_blend,
+)
+
+
def train_one_epoch(loader, model, optimizer, loss_fn, scaler, device):
    """Run one pass over ``loader`` with mixed-precision training.

    Args:
        loader: Iterable yielding ``(data, targets, _)`` batches.
        model: Network to optimise; called as ``model(data)``.
        optimizer: Optimiser stepped once per batch through ``scaler``.
        loss_fn: Called as ``loss_fn(scores, targets)`` with the targets
            reshaped to ``(batch, 1)`` and cast to float.
        scaler: Gradient scaler providing ``scale``, ``step`` and ``update``.
        device: Device the batches are moved to.

    Returns:
        The mean batch loss of the epoch, or ``None`` if the loader yielded
        no batches.
    """
    # Make sure layers such as dropout / batch-norm are in training mode,
    # whatever an earlier evaluation pass left the model in.
    model.train()

    losses = []
    loop = tqdm(loader)
    for data, targets, _ in loop:
        # Tip: to eyeball the augmentations, dump `data` with
        # torchvision's save_image here, first setting mean=[0,0,0] and
        # std=[1,1,1] in the Normalize step so the images look "normal".
        data = data.to(device=device)
        targets = targets.to(device=device)

        # forward
        with torch.cuda.amp.autocast():
            scores = model(data)
            loss = loss_fn(scores, targets.unsqueeze(1).float())

        # Read the scalar once; it is reused for logging below.
        batch_loss = loss.item()
        losses.append(batch_loss)

        # backward
        optimizer.zero_grad()
        scaler.scale(loss).backward()
        scaler.step(optimizer)
        scaler.update()
        loop.set_postfix(loss=batch_loss)

    if not losses:
        # Empty loader: there is nothing to average.
        print("Loss average over epoch: n/a (loader yielded no batches)")
        return None

    mean_loss = sum(losses) / len(losses)
    print(f"Loss average over epoch: {mean_loss}")
    return mean_loss
+
+
def main(export_only=True):
    """Export blend CSVs and a submission, or train the EfficientNet-b3 model.

    Args:
        export_only: When true (the default) the model is built, the
            checkpoint is loaded if available, the blend CSVs and the
            submission file are written, and the function returns without
            training. When false the export step is skipped and the training
            loop runs for ``config.NUM_EPOCHS`` epochs, reporting the
            quadratic weighted kappa on the validation set and saving a
            checkpoint after each epoch.
    """
    # NOTE(review): in training mode the augmenting pipeline and shuffling
    # are used for the training set; in export mode the deterministic
    # validation pipeline and a fixed order are kept -- confirm this matches
    # the intended workflow.
    train_ds = DRDataset(
        images_folder="train/images_preprocessed_1000/",
        path_to_csv="train/trainLabels.csv",
        transform=config.val_transforms if export_only else config.train_transforms,
    )
    val_ds = DRDataset(
        images_folder="train/images_preprocessed_1000/",
        path_to_csv="train/valLabels.csv",
        transform=config.val_transforms,
    )
    # With train=False the dataset indexes the folder contents; the CSV is
    # only read, not used for lookups.
    test_ds = DRDataset(
        images_folder="test/images_preprocessed_1000",
        path_to_csv="train/trainLabels.csv",
        transform=config.val_transforms,
        train=False,
    )
    test_loader = DataLoader(
        test_ds,
        batch_size=config.BATCH_SIZE,
        num_workers=config.NUM_WORKERS,
        shuffle=False,
    )
    train_loader = DataLoader(
        train_ds,
        batch_size=config.BATCH_SIZE,
        num_workers=config.NUM_WORKERS,
        pin_memory=config.PIN_MEMORY,
        shuffle=not export_only,
    )
    val_loader = DataLoader(
        val_ds,
        batch_size=config.BATCH_SIZE,
        num_workers=2,
        pin_memory=config.PIN_MEMORY,
        shuffle=False,
    )
    loss_fn = nn.MSELoss()

    # Replace the classifier head with a single output so the network
    # predicts one continuous value, matching the MSE loss above.
    model = EfficientNet.from_pretrained("efficientnet-b3")
    model._fc = nn.Linear(1536, 1)
    model = model.to(config.DEVICE)
    optimizer = optim.Adam(
        model.parameters(),
        lr=config.LEARNING_RATE,
        weight_decay=config.WEIGHT_DECAY,
    )
    scaler = torch.cuda.amp.GradScaler()

    if config.LOAD_MODEL and os.path.isfile(config.CHECKPOINT_FILE):
        # map_location lets a checkpoint saved on a GPU load on a CPU-only
        # machine (and vice versa).
        checkpoint = torch.load(config.CHECKPOINT_FILE, map_location=config.DEVICE)
        load_checkpoint(checkpoint, model, optimizer, config.LEARNING_RATE)

    if export_only:
        # Run after training is done and you've achieved good result
        # on validation set, then run train_blend.py file to use information
        # about both eyes concatenated
        get_csv_for_blend(val_loader, model, "../train/val_blend.csv")
        get_csv_for_blend(train_loader, model, "../train/train_blend.csv")
        get_csv_for_blend(test_loader, model, "../train/test_blend.csv")
        make_prediction(model, test_loader, "submission_.csv")
        return

    for epoch in range(config.NUM_EPOCHS):
        train_one_epoch(train_loader, model, optimizer, loss_fn, scaler, config.DEVICE)

        # get on validation
        preds, labels = check_accuracy(val_loader, model, config.DEVICE)
        kappa = cohen_kappa_score(labels, preds, weights="quadratic")
        print(f"QuadraticWeightedKappa (Validation): {kappa}")

        if config.SAVE_MODEL:
            checkpoint = {
                "state_dict": model.state_dict(),
                "optimizer": optimizer.state_dict(),
            }
            save_checkpoint(checkpoint, filename=f"b3_{epoch}.pth.tar")


if __name__ == "__main__":
    main()