update 2023

mv-lab · Jun 13, 2023 · 6f25d76 · 6f25d76
2 parents 5968c5b + d0afb83
commit 6f25d76
Show file tree

Hide file tree

Showing 5 changed files with 105 additions and 1 deletion.
diff --git a/cog.yaml b/cog.yaml
@@ -0,0 +1,13 @@
+build:
+ gpu: true
+ cuda: "11.6.2"
+ python_version: "3.10"
+ system_packages:
+ - "libgl1-mesa-glx"
+ - "libglib2.0-0"
+ python_packages:
+ - "ipython==8.4.0"
+ - "torch==1.12.1 --extra-index-url=https://download.pytorch.org/whl/cu116"
+ - "opencv-python==4.6.0.66"
+ - "timm==0.6.11"
+predict: "predict.py:Predictor"
diff --git a/media/swin2sr-figlr.gif b/media/swin2sr-figlr.gif
diff --git a/media/swin2sr-gifhr.gif b/media/swin2sr-gifhr.gif
diff --git a/models/network_swin2sr.py b/models/network_swin2sr.py
@@ -1,5 +1,5 @@
 # -----------------------------------------------------------------------------------
-# Swin2SR: Swin2SR: SwinV2 Transformer for Compressed Image Super-Resolution and Restoration, https://arxiv.org/abs/
+# Swin2SR: Swin2SR: SwinV2 Transformer for Compressed Image Super-Resolution and Restoration, https://arxiv.org/abs/2209.11345
 # Written by Conde and Choi et al.
 # -----------------------------------------------------------------------------------
 

diff --git a/predict.py b/predict.py
@@ -0,0 +1,91 @@
+import argparse
+import cv2
+import numpy as np
+import torch
+from cog import BasePredictor, Input, Path
+
+from main_test_swin2sr import define_model, test
+
+
+class Predictor(BasePredictor):
+ def setup(self):
+ """Load the model into memory to make running multiple predictions efficient"""
+ print("Loading pipeline...")
+
+ self.device = "cuda:0"
+
+ args = argparse.Namespace()
+ args.scale = 4
+ args.large_model = False
+
+ tasks = ["classical_sr", "compressed_sr", "real_sr"]
+ paths = [
+ "weights/Swin2SR_ClassicalSR_X4_64.pth",
+ "weights/Swin2SR_CompressedSR_X4_48.pth",
+ "weights/Swin2SR_RealworldSR_X4_64_BSRGAN_PSNR.pth",
+ ]
+ sizes = [64, 48, 128]
+
+ self.models = {}
+ for task, path, size in zip(tasks, paths, sizes):
+ args.training_patch_size = size
+ args.task, args.model_path = task, path
+ self.models[task] = define_model(args)
+ self.models[task].eval()
+ self.models[task] = self.models[task].to(self.device)
+
+ def predict(
+ self,
+ image: Path = Input(description="Input image"),
+ task: str = Input(
+ description="Choose a task",
+ choices=["classical_sr", "real_sr", "compressed_sr"],
+ default="real_sr",
+ ),
+ ) -> Path:
+ """Run a single prediction on the model"""
+
+ model = self.models[task]
+
+ window_size = 8
+ scale = 4
+
+ img_lq = cv2.imread(str(image), cv2.IMREAD_COLOR).astype(np.float32) / 255.0
+ img_lq = np.transpose(
+ img_lq if img_lq.shape[2] == 1 else img_lq[:, :, [2, 1, 0]], (2, 0, 1)
+ ) # HCW-BGR to CHW-RGB
+ img_lq = (
+ torch.from_numpy(img_lq).float().unsqueeze(0).to(self.device)
+ ) # CHW-RGB to NCHW-RGB
+
+ # inference
+ with torch.no_grad():
+ # pad input image to be a multiple of window_size
+ _, _, h_old, w_old = img_lq.size()
+ h_pad = (h_old // window_size + 1) * window_size - h_old
+ w_pad = (w_old // window_size + 1) * window_size - w_old
+ img_lq = torch.cat([img_lq, torch.flip(img_lq, [2])], 2)[
+ :, :, : h_old + h_pad, :
+ ]
+ img_lq = torch.cat([img_lq, torch.flip(img_lq, [3])], 3)[
+ :, :, :, : w_old + w_pad
+ ]
+
+ output = model(img_lq)
+
+ if task == "compressed_sr":
+ output = output[0][..., : h_old * scale, : w_old * scale]
+ else:
+ output = output[..., : h_old * scale, : w_old * scale]
+
+ # save image
+ output = output.data.squeeze().float().cpu().clamp_(0, 1).numpy()
+ if output.ndim == 3:
+ output = np.transpose(
+ output[[2, 1, 0], :, :], (1, 2, 0)
+ ) # CHW-RGB to HCW-BGR
+ output = (output * 255.0).round().astype(np.uint8) # float32 to uint8
+ output_path = "/tmp/out.png"
+ cv2.imwrite(output_path, output)
+
+ return Path(output_path)