main.py
import os
import sys
import cv2
import numpy as np
import math
from skimage.metrics import peak_signal_noise_ratio as psnr, structural_similarity as ssim, mean_squared_error
from PyQt5 import QtWidgets, QtGui, uic
from PyQt5.QtGui import QPixmap, QPalette, QImage, QCursor, QPainter, QPen
from PyQt5.QtCore import Qt, QMimeData
from PyQt5.QtWidgets import QApplication, QMainWindow, QScrollArea, QFileDialog, QLabel, QMessageBox, QAction, QMenu, QSizePolicy
import torch
from image_label import ImageLabel, RoiImageLabel
from fsrcnn_ir_model import FSRCNN
from vdsr_ir_model import VDSR
from edsr_ir_model import EDSR
from espcn_ir_model import ESPCN
from srgan_ir_model import SRGAN
from utils import round_to_multiple
main_window = None
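# PyQt5 GUI for infrared image super-resolution. The window has two modes:
# a research mode that crops a ground-truth ROI, degrades it, restores it with
# bicubic interpolation and a chosen SR model, and reports PSNR/SSIM for both,
# and a production mode that simply upscales a whole input image with the chosen model.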
class MainWindow(QMainWindow):
    def __init__(self):
        super(MainWindow, self).__init__()
        uic.loadUi('isr.ui', self)
        global main_window
        main_window = self
        self.labelResearchInputImage = RoiImageLabel()
        self.labelResearchInputImage.setROICallback(self.roi_chosen_callback)
        self.labelResearchBicubicImage = ImageLabel()
        self.labelResearchSRImage = ImageLabel()
        self.labelResearchGTImage = ImageLabel()
        self.labelProductionInputImage = ImageLabel()
        self.labelProductionSRImage = ImageLabel()
        self.btnResearchChooseImage.clicked.connect(self.research_process_input_image)
        self.btnProductionChooseImage.clicked.connect(self.production_process_input_image)
        self.btnResearchChooseROI.clicked.connect(self.research_choose_roi)
        self.cbResearchChooseModel.currentTextChanged.connect(self.research_model_changed)
        self.rbResearch_x2.toggled.connect(self.research_model_changed)
        self.cbProductionChooseModel.currentTextChanged.connect(self.production_model_changed)
        self.rbProduction_x2.toggled.connect(self.production_model_changed)
        self.actionShowHelp.triggered.connect(self.show_help)
        self.actionAbout.triggered.connect(self.show_about)
        self.research_input_image_filename = ""
        self.prod_input_image_filename = ""
        self.roi_gt = None
        self.prod_input = None
        self.sr_models = dict()
        self.torch_device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
        print(f"torch device is {self.torch_device}")
    def show_help(self):
        QMessageBox.information(self, "Help", "Select a model from the drop-down list and the upscaling factor - 2 or 4.\n\nThen select an image. In research mode, additionally select the image fragment of interest. Wait for the resulting images to appear on the form.\n\nThe resulting images can be copied to the clipboard or saved to a file by right-clicking them and choosing Copy/Save.")

    def show_about(self):
        QMessageBox.information(self, "About", "Infrared Super Resolution, Рустем Гимадутдинов, 2022-2023")
    def research_choose_roi(self):
        if self.labelResearchInputImage.pixmap() is not None:
            self.labelResearchInputImage.enableROIChoose()
    def research_process_input_image(self):
        self.research_input_image_filename, _ = QFileDialog.getOpenFileName(self, "Select image", "", "Images (*.png *.jpg *.bmp)")
        if self.research_input_image_filename == "":
            return
        self.labelResearchInputImage.loadImage(self.research_input_image_filename, self.saResearchInputImage.width() - 5, self.saResearchInputImage.height() - 5, round_to_multiple(self.saResearchGTImage.width() - 10, 4))
        self.saResearchInputImage.setWidget(self.labelResearchInputImage)

    def production_process_input_image(self):
        self.prod_input_image_filename, _ = QFileDialog.getOpenFileName(self, "Select image", "", "Images (*.png *.jpg *.bmp)")
        if self.prod_input_image_filename == "":
            return
        self.prod_input = cv2.imread(self.prod_input_image_filename, cv2.IMREAD_GRAYSCALE)
        self.labelProductionInputImage.setPixmapFromGrayscaleNumpy(self.prod_input)
        self.labelProductionInputImage.setToolTip("File: " + self.prod_input_image_filename + f"\nResolution: {self.prod_input.shape[1]}x{self.prod_input.shape[0]}")
        self.saProductionInputImage.setWidget(self.labelProductionInputImage)
        self.production_perform_sr()
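    # Production-mode pipeline: load the selected model for the selected scale,
    # run it on the full grayscale input (after bicubic pre-upsampling for VDSR),
    # and show the result with a resolution tooltip and an export-friendly image name.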
    def production_perform_sr(self):
        QApplication.setOverrideCursor(Qt.WaitCursor)
        cur_scale = self.production_get_current_scale()
        model_name, model_fname = self.production_get_current_model_name()
        self.load_model(model_name, model_fname, cur_scale)
        # Inference
        if model_name == "VDSR":  # For pre-upsampling methods we pass the bicubic-interpolated image to the model
            bicub = cv2.resize(self.prod_input, (self.prod_input.shape[1] * cur_scale, self.prod_input.shape[0] * cur_scale), interpolation=cv2.INTER_CUBIC)
            sr = self.model_inference(self.sr_models[model_fname], bicub)
        else:  # For post-upsampling methods we pass the LR image to the model
            sr = self.model_inference(self.sr_models[model_fname], self.prod_input)
        self.labelProductionSRImage.setPixmapFromGrayscaleNumpy(sr)
        self.labelProductionSRImage.setToolTip(f"{sr.shape[1]}x{sr.shape[0]}")
        self.labelProductionSRImage.setImageName(os.path.basename(self.prod_input_image_filename) + "_" + model_name.lower() + "_x" + str(cur_scale))
        self.saProductionSRImage.setWidget(self.labelProductionSRImage)
        QApplication.restoreOverrideCursor()
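    # Single-image inference helper: takes a 2-D uint8 grayscale array, feeds it
    # to the network as a (1, 1, H, W) float tensor in [0, 1], and returns the
    # restored image as a 2-D uint8 array.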
    def model_inference(self, model, img):
        input_img = img.astype(np.float32) / 255.
        input_img = np.expand_dims(input_img, axis=0)  # Add a channel dimension
        input_img = np.expand_dims(input_img, axis=0)  # Add a batch dimension
        input_tensor = torch.from_numpy(input_img).to(self.torch_device)
        with torch.no_grad():
            output_tensor = model(input_tensor)
        output_img = output_tensor.cpu().detach().numpy()[0][0]  # Drop the batch and channel dimensions
        output_img = (output_img * 255.0).clip(0, 255).astype(np.uint8)  # Clip and convert to uint8
        return output_img
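    # Called by RoiImageLabel once the user has drawn a region of interest.
    # The ROI is treated as ground truth: it is downscaled by the current factor,
    # restored both by bicubic interpolation and by the selected SR model, and
    # PSNR/SSIM of each restoration against the ground truth are displayed.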
    def roi_chosen_callback(self, roi_gt):
        self.roi_gt = roi_gt.copy()
        self.labelResearchGTImage.setPixmap(QPixmap(QImage(roi_gt.data, roi_gt.shape[1], roi_gt.shape[0], roi_gt.shape[1], QImage.Format_Grayscale8)))
        self.labelResearchGTImage.setToolTip(f"{roi_gt.shape[1]}x{roi_gt.shape[0]}")
        self.labelResearchBicubicImage.setToolTip(f"{roi_gt.shape[1]}x{roi_gt.shape[0]}")
        self.labelResearchSRImage.setToolTip(f"{roi_gt.shape[1]}x{roi_gt.shape[0]}")
        self.saResearchGTImage.setWidget(self.labelResearchGTImage)
        cur_scale = self.research_get_current_scale()
        roi_lr = cv2.resize(roi_gt, (roi_gt.shape[1] // cur_scale, roi_gt.shape[0] // cur_scale), interpolation=cv2.INTER_CUBIC)
        roi_bicubic = cv2.resize(roi_lr, (roi_gt.shape[1], roi_gt.shape[0]), interpolation=cv2.INTER_CUBIC)
        self.labelResearchBicubicImage.setPixmap(QPixmap(QImage(roi_bicubic.data, roi_gt.shape[1], roi_gt.shape[0], roi_gt.shape[1], QImage.Format_Grayscale8)))
        self.saResearchBicubicImage.setWidget(self.labelResearchBicubicImage)
        # Calculate metrics for the bicubic baseline
        psnr_bicubic = psnr(roi_gt, roi_bicubic)
        ssim_bicubic = ssim(roi_gt, roi_bicubic)
        self.lbResearchBicubicMetrics.setText(f"PSNR: {psnr_bicubic:.2f} dB\nSSIM: {ssim_bicubic:.4f}")
        QApplication.setOverrideCursor(Qt.WaitCursor)
        model_name, model_fname = self.research_get_current_model_name()
        self.load_model(model_name, model_fname, cur_scale)
        # Inference
        if model_name == "VDSR":  # For pre-upsampling methods we pass the bicubic-interpolated ROI to the model
            roi_sr = self.model_inference(self.sr_models[model_fname], roi_bicubic)
        else:  # For post-upsampling methods we pass the LR ROI to the model
            roi_sr = self.model_inference(self.sr_models[model_fname], roi_lr)
        self.labelResearchSRImage.setPixmap(QPixmap(QImage(roi_sr.data, roi_sr.shape[1], roi_sr.shape[0], roi_sr.shape[1], QImage.Format_Grayscale8)))
        self.saResearchSRImage.setWidget(self.labelResearchSRImage)
        # Calculate metrics for the SR result
        psnr_sr = psnr(roi_gt, roi_sr)
        ssim_sr = ssim(roi_gt, roi_sr)
        self.lbResearchSRMetrics.setText(f"PSNR: {psnr_sr:.2f} dB\nSSIM: {ssim_sr:.4f}")
        QApplication.restoreOverrideCursor()
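    # Models are instantiated lazily and cached in self.sr_models, keyed by the
    # checkpoint filename, so switching back to an already-used model/scale pair
    # does not reload the weights.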
    def load_model(self, model_name, model_fname, scale):
        # Load the model and its weights if not loaded yet
        if model_fname not in self.sr_models:
            if model_name == "FSRCNN":
                self.sr_models[model_fname] = FSRCNN(scale)
            elif model_name == "EDSR":
                self.sr_models[model_fname] = EDSR(scale)
            elif model_name == "VDSR":
                self.sr_models[model_fname] = VDSR()
            elif model_name == "ESPCN":
                self.sr_models[model_fname] = ESPCN(scale)
            elif model_name == "SRGAN":
                self.sr_models[model_fname] = SRGAN(scale)
            else:
                print(f"Unknown model {model_name}")
                return
            self.sr_models[model_fname].load_state_dict(torch.load(model_fname, map_location=('cpu' if self.torch_device.type != 'cuda' else None))['state_dict'])
            self.sr_models[model_fname].to(self.torch_device)
            self.sr_models[model_fname].eval()
            print(f"Model {model_fname} loaded and ready")
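    # Checkpoint filenames follow the convention "<model>_ir_x<scale>.pth.tar",
    # e.g. "fsrcnn_ir_x2.pth.tar", and are resolved relative to the working directory.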
    def research_get_current_model_name(self):
        model_name = self.cbResearchChooseModel.currentText()
        return model_name, model_name.lower() + "_ir_" + ("x2" if self.rbResearch_x2.isChecked() else "x4") + ".pth.tar"

    def production_get_current_model_name(self):
        model_name = self.cbProductionChooseModel.currentText()
        return model_name, model_name.lower() + "_ir_" + ("x2" if self.rbProduction_x2.isChecked() else "x4") + ".pth.tar"

    def research_get_current_scale(self):
        return 2 if self.rbResearch_x2.isChecked() else 4

    def production_get_current_scale(self):
        return 2 if self.rbProduction_x2.isChecked() else 4
    def research_model_changed(self):
        if self.roi_gt is not None:
            self.roi_chosen_callback(self.roi_gt)

    def production_model_changed(self):
        if self.prod_input is not None:
            self.production_perform_sr()
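# Standard Qt entry point: create the application, show the main window, and
# hand control to the Qt event loop.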
if __name__ == '__main__':
    app = QApplication(sys.argv)
    main_window = MainWindow()
    main_window.show()
    sys.exit(app.exec_())