import torch
import numpy as np
import os
from tqdm import tqdm

from submodules.GAN_stability.gan_training.train import toggle_grad, Trainer as TrainerBase
from submodules.GAN_stability.gan_training.eval import Evaluator as EvaluatorBase
from submodules.GAN_stability.gan_training.metrics import FIDEvaluator, KIDEvaluator

from .utils import save_video, color_depth_map


class Trainer(TrainerBase):
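    """Thin wrapper around the GAN_stability Trainer that optionally runs the
    generator step with automatic mixed precision (AMP).
    """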
    def __init__(self, *args, use_amp=False, **kwargs):
        super(Trainer, self).__init__(*args, **kwargs)
        self.use_amp = use_amp
        if self.use_amp:
            self.scaler = torch.cuda.amp.GradScaler()

    def generator_trainstep(self, y, z):
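        """Perform a single generator update on labels y and latents z.

        Uses the autocast/GradScaler mixed-precision path when use_amp is set,
        otherwise falls back to the base class implementation.
        """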
        if not self.use_amp:
            return super(Trainer, self).generator_trainstep(y, z)
        assert (y.size(0) == z.size(0))
        toggle_grad(self.generator, True)
        toggle_grad(self.discriminator, False)
        self.generator.train()
        self.discriminator.train()
        self.g_optimizer.zero_grad()

        with torch.cuda.amp.autocast():
            x_fake = self.generator(z, y)
            d_fake = self.discriminator(x_fake, y)
            gloss = self.compute_loss(d_fake, 1)
        self.scaler.scale(gloss).backward()

        self.scaler.step(self.g_optimizer)
        self.scaler.update()

        return gloss.item()

    def discriminator_trainstep(self, x_real, y, z, data_aug):
        return super(Trainer, self).discriminator_trainstep(x_real, y, z, data_aug)  # spectral norm raises an error when using amp


class Evaluator(EvaluatorBase):
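    """Evaluation helper built on the GAN_stability Evaluator: renders RGB/depth samples
    from the generator and optionally computes FID and KID.
    """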
    def __init__(self, eval_fid_kid, *args, **kwargs):
        super(Evaluator, self).__init__(*args, **kwargs)
        if eval_fid_kid:
            self.inception_eval = FIDEvaluator(
                device=self.device,
                batch_size=self.batch_size,
                resize=True,
                n_samples=20000,
                n_samples_fake=1000,
            )

    def get_rays(self, pose):
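        """Return the full set of rays for a single camera pose, using the generator's
        validation ray sampler at the generator's resolution and focal length.
        """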
        return self.generator.val_ray_sampler(self.generator.H, self.generator.W,
                                              self.generator.focal, pose)[0]

    def create_samples(self, z, poses=None):
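        """Render the given latent codes into RGB images, color-coded depth maps and
        accumulation maps. If poses is None, ray sampling is left to the generator;
        otherwise one camera pose per latent code is expected.
        """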
        self.generator.eval()
        N_samples = len(z)
        device = self.generator.device
        if self.batch_size > 1:
            z = z.to(device).split(self.batch_size)
        if poses is None:
            rays = [None] * len(z)
        else:
            rays = torch.stack([self.get_rays(poses[i].to(device)) for i in range(N_samples)])
            rays = rays.split(self.batch_size)

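        # render the samples without tracking gradients, chunking by batch_size when possible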
        rgb, disp, acc = [], [], []
        with torch.no_grad():
            if self.batch_size > 1:
                for z_i, rays_i in tqdm(zip(z, rays), total=len(z), desc='Create samples...'):
                    bs = len(z_i)
                    if rays_i is not None:
                        rays_i = rays_i.permute(1, 0, 2, 3).flatten(1, 2)  # (B, 2, H*W, 3) -> (2, B*H*W, 3)
                    rgb_i, disp_i, acc_i, _ = self.generator(z_i, rays=rays_i)

                    reshape = lambda x: x.view(bs, self.generator.H, self.generator.W, x.shape[1]).permute(0, 3, 1, 2)  # (N*H*W, C) -> (N, C, H, W)
                    rgb.append(reshape(rgb_i).cpu())
                    disp.append(reshape(disp_i).cpu())
                    acc.append(reshape(acc_i).cpu())
            else:
                for rays_i in rays:
                    bs = len(z)
                    if rays_i is not None:
                        rays_i = rays_i.permute(1, 0, 2, 3).flatten(1, 2)  # (B, 2, H*W, 3) -> (2, B*H*W, 3)
                    rgb_i, disp_i, acc_i, _ = self.generator(z, rays=rays_i)

                    reshape = lambda x: x.view(bs, self.generator.H, self.generator.W, x.shape[1]).permute(0, 3, 1, 2)  # (N*H*W, C) -> (N, C, H, W)
                    rgb.append(reshape(rgb_i).cpu())
                    disp.append(reshape(disp_i).cpu())
                    acc.append(reshape(acc_i).cpu())

        rgb = torch.cat(rgb)
        disp = torch.cat(disp)
        acc = torch.cat(acc)

        depth = self.disp_to_cdepth(disp)

        return rgb, depth, acc

    def make_video(self, basename, z, poses, as_gif=True):
        """Generate images for each latent code along the given camera path and save them as videos.

        z (N_samples, zdim): latent codes
        poses (N_frames, 3, 4): camera poses for all frames of the video
        """
        N_samples, N_frames = len(z), len(poses)

        # reshape inputs
        z = z.unsqueeze(1).expand(-1, N_frames, -1).flatten(0, 1)  # (N_samples*N_frames, z_dim)
        poses = poses.unsqueeze(0) \
            .expand(N_samples, -1, -1, -1).flatten(0, 1)  # (N_samples*N_frames, 3, 4)

        rgbs, depths, accs = self.create_samples(z, poses=poses)

        reshape = lambda x: x.view(N_samples, N_frames, *x.shape[1:])
        rgbs = reshape(rgbs)
        depths = reshape(depths)
        print('Done, saving', rgbs.shape)

        fps = min(int(N_frames / 2.), 25)  # aim for a video of at least 2 seconds
        for i in range(N_samples):
            save_video(rgbs[i], basename + '{:04d}_rgb.mp4'.format(i), as_gif=as_gif, fps=fps)
            save_video(depths[i], basename + '{:04d}_depth.mp4'.format(i), as_gif=as_gif, fps=fps)

    def disp_to_cdepth(self, disps):
        """Convert disparity maps to color-coded depth maps for visualization."""
        if (disps == 2e10).all():  # no values predicted
            return torch.ones_like(disps)

        near, far = self.generator.render_kwargs_test['near'], self.generator.render_kwargs_test['far']

        disps = disps / 2 + 0.5  # [-1, 1] -> [0, 1]

        depth = 1. / torch.max(1e-10 * torch.ones_like(disps), disps)  # disparity -> depth
        depth[disps == 1e10] = far  # set undefined values to far plane

        # scale between near and far plane for better visualization
        depth = (depth - near) / (far - near)

        depth = np.stack([color_depth_map(d) for d in depth[:, 0].detach().cpu().numpy()])  # convert to color
        depth = (torch.from_numpy(depth).permute(0, 3, 1, 2) / 255.) * 2 - 1  # [0, 255] -> [-1, 1]

        return depth

    def compute_fid_kid(self, sample_generator=None):
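        """Compute FID and KID with the Inception evaluator. If no sample generator is
        given, latent codes are drawn from self.zdist and rendered via create_samples.
        """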
        if sample_generator is None:
            def sample():
                while True:
                    z = self.zdist.sample((self.batch_size,))
                    rgb, _, _ = self.create_samples(z)
                    # convert to uint8 and back to get correct binning
                    rgb = (rgb / 2 + 0.5).mul_(255).clamp_(0, 255).to(torch.uint8).to(torch.float) / 255. * 2 - 1
                    yield rgb.cpu()

            sample_generator = sample()

        fid, (kids, vars) = self.inception_eval.get_fid_kid(sample_generator)
        kid = np.mean(kids)
        return fid, kid
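

# Illustrative usage sketch (not part of the original module). Constructor arguments other
# than `use_amp` / `eval_fid_kid` are forwarded to the GAN_stability base classes, so the
# exact keywords below are assumptions that depend on that submodule's API:
#
#   evaluator = Evaluator(eval_fid_kid=True, generator=generator_test, zdist=zdist,
#                         ydist=ydist, batch_size=8, device=device)
#   z = zdist.sample((4,))                            # latent codes for 4 objects
#   rgb, depth, acc = evaluator.create_samples(z)     # rendered images + color-coded depth
#   evaluator.make_video('eval/video_', z, poses)     # poses: (N_frames, 3, 4) camera path
#   fid, kid = evaluator.compute_fid_kid()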