ImageImpaint_Python_II/ImageImpaint.py

import os
import sys

import PIL
import numpy as np
import torch
from matplotlib import pyplot as plt
from packaging.version import Version

import DataLoader
from DataLoader import get_image_loader
from Net import ImageNN
from netio import save_model, eval_evalset


def get_train_device():
    """Pick the device to train on, announce it on stdout and return it.

    Returns:
        torch.device: the CUDA device when `torch.cuda.is_available()` reports
        one, otherwise the CPU device.
    """
    if torch.cuda.is_available():
        backend = 'cuda'
    else:
        backend = 'cpu'
    print(f'Device to train net: {backend}')
    return torch.device(backend)


def train_model():
    """Train the network, checkpoint the best model, then run the final evaluation.

    Seeds numpy and torch, loads the train/test loaders from "training/",
    trains an `ImageNN` with AdamW and MSE loss for a fixed number of epochs,
    and finally calls `eval_evalset()`.

    During training the model is evaluated on the test loader roughly every
    3000 samples (and saved via `save_model` whenever the evaluation loss
    improves), and a comparison figure is written to "plots/" roughly every
    100 samples.
    """
    # Set a known random seed for reproducibility
    np.random.seed(0)
    torch.manual_seed(0)
    device = get_train_device()

    # Prepare a path to plot to
    plotpath = "plots/"
    os.makedirs(plotpath, exist_ok=True)

    # Load datasets
    train_loader, test_loader = get_image_loader("training/", precision=np.float32)

    # The network input is the image concatenated with its mask along dim 1
    # (presumably 3 image + 3 mask channels = 6 -- TODO confirm against DataLoader).
    model = ImageNN(n_in_channels=6, precision=np.float32)  # todo net params
    model.train()  # start in train mode
    model.to(device)  # send net to the available device

    optimizer = torch.optim.AdamW(model.parameters(), lr=1e-3, weight_decay=1e-5)  # todo adjust parameters and lr
    loss_function = torch.nn.MSELoss()
    loss_function.to(device)
    n_epochs = 5  # todo epochs here

    # Cadence (in samples) of evaluation/checkpointing and of plotting.
    eval_interval = 3000
    plot_interval = 100

    train_sample_size = len(train_loader)
    batch_size = train_loader.batch_size
    best_eval_loss = np.inf
    for epoch in range(n_epochs):
        print(f"Epoch {epoch}/{n_epochs}\n")
        i = 0
        for input_tensor, mask, target_tensor in train_loader:
            input_tensor = input_tensor.to(device)
            mask = mask.to(device)
            target_tensor = target_tensor.to(device)

            optimizer.zero_grad()  # reset gradients
            input_tensor = torch.cat((input_tensor, mask), 1)

            output = model(input_tensor)  # forward pass

            # The loss only covers the elements where `1 - mask > 0`
            # (presumably the pixels that were removed from the input --
            # TODO confirm the mask convention in DataLoader).
            inverse_mask = 1 - mask
            selected = inverse_mask > 0
            output_flat = (output * inverse_mask)[selected]
            rest = (target_tensor * inverse_mask)[selected]

            loss = loss_function(output_flat, rest)  # loss between model output and true target
            loss.backward()  # compute gradients (backward pass)
            optimizer.step()  # perform gradient descent update step

            loss_value = loss.item()

            previous = i
            i += batch_size
            print(
                f'\rTraining epoch {epoch} [{i}/{train_sample_size * train_loader.batch_size}] (curr loss: {loss_value:.3})',
                end='')

            # Evaluate whenever the running sample count crosses a multiple of
            # the interval. A plain `i % interval == 0` test only fires when
            # the batch size divides the interval, so with e.g. batch size 16
            # the model would be evaluated (and saved) far less often than
            # intended.
            if i // eval_interval > previous // eval_interval:
                print(f"\nEvaluating model")
                eval_loss = eval_model(model, test_loader, loss_function, device)
                print(f"Evalution loss={eval_loss}")
                if eval_loss < best_eval_loss:
                    best_eval_loss = eval_loss
                    save_model(model)

                # eval_model switched the net to eval mode; switch back
                model.train()

            # Plot the first sample of the current batch
            if i // plot_interval > previous // plot_interval:
                plot(input_tensor.detach().cpu().numpy()[0], target_tensor.detach().cpu().numpy()[0],
                     output.detach().cpu().numpy()[0],
                     plotpath, i, epoch)

    # evaluate model with submission pkl file
    eval_evalset()


# func to evaluate our trained model
def eval_model(model: torch.nn.Module, dataloader: torch.utils.data.DataLoader, loss_fn, device: torch.device):
    """Compute the mean per-batch loss of `model` over `dataloader`.

    The model is switched to eval mode (and left in it) and gradients are
    disabled. Each batch yields `(input, mask, target)`; input and mask are
    concatenated along dim 1 before the forward pass, and the loss is taken
    only over the elements where `1 - mask > 0`. Progress is printed to stdout.

    Args:
        model: network to evaluate.
        dataloader: iterable of `(input, mask, target)` batches that also
            provides `len()` and a `batch_size` attribute.
        loss_fn: callable returning a scalar tensor for `(prediction, target)`.
        device: device the batches are moved to.

    Returns:
        float: sum of the per-batch losses divided by `len(dataloader)`.
    """
    model.eval()
    total = .0
    seen = 0
    with torch.no_grad():
        for image, mask, target in dataloader:
            image, mask, target = image.to(device), mask.to(device), target.to(device)

            prediction = model(torch.cat((image, mask), 1))

            inv_mask = 1 - mask
            keep = inv_mask > 0
            masked_prediction = (prediction * inv_mask)[keep]
            masked_target = (target * inv_mask)[keep]

            total += loss_fn(masked_prediction, masked_target).item()
            # The counter is printed before it is advanced, so it starts at 0.
            print(f'\rEval prog[{seen}/{len(dataloader) * dataloader.batch_size}]', end='')
            seen += dataloader.batch_size
    print()
    return total / len(dataloader)


def plot(inputs, targets, predictions, path, update, epoch):
    """Save a four-panel figure (input, target, prediction, diff) into `path`.

    For every panel only the first three channels of the channel-first array
    are used; they are moved to channel-last order and passed through
    `DataLoader.postprocess` before being shown. The "diff" panel shows
    `predictions - targets`. The file is named `<epoch>_<update>.png` with
    zero-padded numbers, and the directory is created if it is missing.
    """
    os.makedirs(path, exist_ok=True)
    fig, axes = plt.subplots(ncols=4, figsize=(15, 5))

    panels = (
        ("Input", inputs),
        ("Target", targets),
        ("Prediction", predictions),
        ("diff", predictions - targets),
    )
    for ax, (title, data) in zip(axes, panels):
        ax.clear()
        ax.set_title(title)
        first_three = data[:3, :, :]
        channel_last = np.transpose(first_three, (1, 2, 0))
        ax.imshow(DataLoader.postprocess(channel_last), interpolation="none")
        ax.set_axis_off()

    filename = f"{epoch:02d}_{update:07d}.png"
    fig.savefig(os.path.join(path, filename), dpi=100)

    # Close the figure so repeated calls do not accumulate open figures.
    plt.close(fig)


def check_module_versions() -> None:
    """Print the installed Python/numpy/PyTorch/PIL versions and verify them.

    Each line is suffixed with a check mark when the installed version meets
    the minimum (Python 3.8, numpy 1.18, PyTorch 1.6.0, PIL 6.0.0) and with a
    cross otherwise.

    Raises:
        AssertionError: if any of the four requirements is not met.
    """
    passed, failed = '(\u2713)', '(\u2717)'

    python_ok = sys.version_info >= (3, 8)
    numpy_ok = Version(np.__version__) >= Version('1.18')
    torch_ok = Version(torch.__version__) >= Version('1.6.0')
    pil_ok = Version(PIL.__version__) >= Version('6.0.0')

    print(f'Installed Python version: {sys.version_info.major}.{sys.version_info.minor} '
          f'{passed if python_ok else failed}')
    print(f'Installed numpy version: {np.__version__} {passed if numpy_ok else failed}')
    print(f'Installed PyTorch version: {torch.__version__} {passed if torch_ok else failed}')
    print(f'Installed PIL version: {PIL.__version__} {passed if pil_ok else failed}')

    # Every requirement has to hold; `any` would let the check pass as soon
    # as a single module is recent enough.
    assert all((python_ok, numpy_ok, torch_ok, pil_ok)), \
        'At least one installed module is older than the required minimum version'


# Script entry point: print/verify the module versions first, then train.
if __name__ == '__main__':
    check_module_versions()
    train_model()
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`import os`
			`import sys`

			`import PIL`
basic training logic 2022-06-28 16:28:36 +00:00			`import numpy as np`
implement basic structure of project 2022-06-01 10:27:58 +00:00			`import torch`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`from matplotlib import pyplot as plt`
			`from packaging.version import Version`
implement basic structure of project 2022-06-01 10:27:58 +00:00
saving of model 2022-07-01 13:35:12 +00:00			`import DataLoader`
implement basic structure of project 2022-06-01 10:27:58 +00:00			`from DataLoader import get_image_loader`
			`from Net import ImageNN`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`from netio import save_model, eval_evalset`
implmente save/load, eval structure 2022-06-01 14:07:32 +00:00

basic training logic 2022-06-28 16:28:36 +00:00			`def get_train_device():`
			`device = 'cuda' if torch.cuda.is_available() else 'cpu'`
			`print(f'Device to train net: {device}')`
			`return torch.device(device)`


implement basic structure of project 2022-06-01 10:27:58 +00:00			`def train_model():`
basic training logic 2022-06-28 16:28:36 +00:00			`# Set a known random seed for reproducibility`
			`np.random.seed(0)`
			`torch.manual_seed(0)`
			`device = get_train_device()`

lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`# Prepare a path to plot to`
			`plotpath = "plots/"`
			`os.makedirs(plotpath, exist_ok=True)`

basic training logic 2022-06-28 16:28:36 +00:00			`# Load datasets`
saving of model 2022-07-01 13:35:12 +00:00			`train_loader, test_loader = get_image_loader("training/", precision=np.float32)`
add mask to training export trainpickle file in correct format 2022-07-09 23:22:28 +00:00
			`nn = ImageNN(n_in_channels=6, precision=np.float32) # todo net params`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`nn.train() # init with train modeAdam`
basic training logic 2022-06-28 16:28:36 +00:00			`nn.to(device) # send net to device available`
implement basic structure of project 2022-06-01 10:27:58 +00:00
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`optimizer = torch.optim.AdamW(nn.parameters(), lr=1e-3, weight_decay=1e-5) # todo adjust parameters and lr`
basic training logic 2022-06-28 16:28:36 +00:00			`loss_function = torch.nn.MSELoss()`
saving of model 2022-07-01 13:35:12 +00:00			`loss_function.to(device)`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`n_epochs = 5 # todo epcchs here`
basic training logic 2022-06-28 16:28:36 +00:00
			`train_sample_size = len(train_loader)`
implement basic structure of project 2022-06-01 10:27:58 +00:00			`losses = []`
add lots of validation code and correct saving of pickle file 2022-06-29 15:20:16 +00:00			`best_eval_loss = np.inf`
implement basic structure of project 2022-06-01 10:27:58 +00:00			`for epoch in range(n_epochs):`
implmente save/load, eval structure 2022-06-01 14:07:32 +00:00			`print(f"Epoch {epoch}/{n_epochs}\n")`
basic training logic 2022-06-28 16:28:36 +00:00			`i = 0`
add mask to training export trainpickle file in correct format 2022-07-09 23:22:28 +00:00			`for input_tensor, mask, target_tensor in train_loader:`
rm wrong file edit net a bit 2022-07-11 21:36:07 +00:00			`input_tensor = input_tensor.to(device)`
			`mask = mask.to(device)`
			`target_tensor = target_tensor.to(device)`

lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`optimizer.zero_grad() # reset gradients`
add mask to training export trainpickle file in correct format 2022-07-09 23:22:28 +00:00			`input_tensor = torch.cat((input_tensor, mask), 1)`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00
rm wrong file edit net a bit 2022-07-11 21:36:07 +00:00			`output = nn(input_tensor) # get model output (forward pass)`

			`output_flat = output * (1 - mask)`
			`output_flat = output_flat[1 - mask > 0]`

			`rest = target_tensor * (1 - mask)`
			`rest = rest[1 - mask > 0]`
basic training logic 2022-06-28 16:28:36 +00:00
rm wrong file edit net a bit 2022-07-11 21:36:07 +00:00			`loss = loss_function(output_flat, rest) # compute loss given model output and true target`
implement basic structure of project 2022-06-01 10:27:58 +00:00			`loss.backward() # compute gradients (backward pass)`
			`optimizer.step() # perform gradient descent update step`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00
implement basic structure of project 2022-06-01 10:27:58 +00:00			`losses.append(loss.item())`

saving of model 2022-07-01 13:35:12 +00:00			`i += train_loader.batch_size`
basic training logic 2022-06-28 16:28:36 +00:00			`print(`
			`f'\rTraining epoch {epoch} [{i}/{train_sample_size * train_loader.batch_size}] (curr loss: {loss.item():.3})',`
			`end='')`

add lots of validation code and correct saving of pickle file 2022-06-29 15:20:16 +00:00			`# eval model every 3000th sample`
saving of model 2022-07-01 13:35:12 +00:00			`if i % 3000 == 0:`
basic training logic 2022-06-28 16:28:36 +00:00			`print(f"\nEvaluating model")`
			`eval_loss = eval_model(nn, test_loader, loss_function, device)`
			`print(f"Evalution loss={eval_loss}")`
add lots of validation code and correct saving of pickle file 2022-06-29 15:20:16 +00:00			`if eval_loss < best_eval_loss:`
basic training logic 2022-06-28 16:28:36 +00:00			`best_eval_loss = eval_loss`
			`save_model(nn)`

saving of model 2022-07-01 13:35:12 +00:00			`nn.train()`

lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`# Plot output`
			`if i % 100 == 0:`
add mask to training export trainpickle file in correct format 2022-07-09 23:22:28 +00:00			`plot(input_tensor.detach().cpu().numpy()[0], target_tensor.detach().cpu().numpy()[0],`
			`output.detach().cpu().numpy()[0],`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`plotpath, i, epoch)`

saving of model 2022-07-01 13:35:12 +00:00			`# evaluate model with submission pkl file`
			`eval_evalset()`
implmente save/load, eval structure 2022-06-01 14:07:32 +00:00

basic training logic 2022-06-28 16:28:36 +00:00			`# func to evaluate our trained model`
			`def eval_model(model: torch.nn.Module, dataloader: torch.utils.data.DataLoader, loss_fn, device: torch.device):`
			`# switch to eval mode`
			`model.eval()`
			`loss = .0`
			`# disable gradient calculations`
			`with torch.no_grad():`
			`i = 0`
add mask to training export trainpickle file in correct format 2022-07-09 23:22:28 +00:00			`for input, mask, target in dataloader:`
saving of model 2022-07-01 13:35:12 +00:00			`input = input.to(device)`
			`target = target.to(device)`
add mask to training export trainpickle file in correct format 2022-07-09 23:22:28 +00:00			`mask = mask.to(device)`
basic training logic 2022-06-28 16:28:36 +00:00
add mask to training export trainpickle file in correct format 2022-07-09 23:22:28 +00:00			`input = torch.cat((input, mask), 1)`
basic training logic 2022-06-28 16:28:36 +00:00			`out = model(input)`
rm wrong file edit net a bit 2022-07-11 21:36:07 +00:00
			`out = out * (1 - mask)`
			`out = out[1 - mask > 0]`

			`rest = target * (1 - mask)`
			`rest = rest[1 - mask > 0]`

			`loss += loss_fn(out, rest).item()`
basic training logic 2022-06-28 16:28:36 +00:00			`print(f'\rEval prog[{i}/{len(dataloader) * dataloader.batch_size}]', end='')`
			`i += dataloader.batch_size`
			`print()`
			`loss /= len(dataloader)`
			`return loss`
implement basic structure of project 2022-06-01 10:27:58 +00:00

lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`def plot(inputs, targets, predictions, path, update, epoch):`
			"""Plotting the inputs, targets and predictions to file `path`"""
			`os.makedirs(path, exist_ok=True)`
rm wrong file edit net a bit 2022-07-11 21:36:07 +00:00			`fig, axes = plt.subplots(ncols=4, figsize=(15, 5))`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00
rm wrong file edit net a bit 2022-07-11 21:36:07 +00:00			`for ax, data, title in zip(axes, [inputs, targets, predictions, predictions-targets], ["Input", "Target", "Prediction", "diff"]):`
add mask to training export trainpickle file in correct format 2022-07-09 23:22:28 +00:00			`ax.clear()`
			`ax.set_title(title)`
			`ax.imshow(DataLoader.postprocess(np.transpose(data[:3, :, :], (1, 2, 0))), interpolation="none")`
			`# ax.imshow(np.transpose((data[i]), (1, 2, 0)), interpolation="none")`
			`ax.set_axis_off()`
			`fig.savefig(os.path.join(path, f"{epoch:02d}_{update:07d}.png"), dpi=100)`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00
			`plt.close(fig)`


			`def check_module_versions() -> None:`
			`python_check = '(\u2713)' if sys.version_info >= (3, 8) else '(\u2717)'`
			`numpy_check = '(\u2713)' if Version(np.__version__) >= Version('1.18') else '(\u2717)'`
			`torch_check = '(\u2713)' if Version(torch.__version__) >= Version('1.6.0') else '(\u2717)'`
			`pil_check = '(\u2713)' if Version(PIL.__version__) >= Version('6.0.0') else '(\u2717)'`
			`print(f'Installed Python version: {sys.version_info.major}.{sys.version_info.minor} {python_check}')`
			`print(f'Installed numpy version: {np.__version__} {numpy_check}')`
			`print(f'Installed PyTorch version: {torch.__version__} {torch_check}')`
			`print(f'Installed PIL version: {PIL.__version__} {pil_check}')`
			`assert any(x == '(\u2713)' for x in [python_check, numpy_check, torch_check, pil_check])`

implmente save/load, eval structure 2022-06-01 14:07:32 +00:00
saving of model 2022-07-01 13:35:12 +00:00			`if __name__ == '__main__':`
lots of improvements data augmentation plotting of intermediate pics 2022-07-02 14:11:27 +00:00			`check_module_versions()`
saving of model 2022-07-01 13:35:12 +00:00			`train_model()`