apply_script_diffusion.py

#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Created on Tue Jan 14 13:46:20 2020

@author: eschweiler
"""

import os
import numpy as np
import torch
import csv
from skimage import io
from scipy.ndimage import gaussian_filter
from argparse import ArgumentParser
from torch.autograd import Variable

from dataloader.h5_dataloader import MeristemH5Tiler as Tiler
from ThirdParty.diffusion import GaussianDiffusionTrainer, GaussianDiffusionSampler
from utils.utils import print_timestamp

SEED = 1337
torch.manual_seed(SEED)
np.random.seed(SEED)


def main(hparams):
    
    
    """
    Main testing routine specific for this project
    :param hparams:
    """

    # ------------------------
    # 0 SANITY CHECKS
    # ------------------------
    if not isinstance(hparams.overlap, (tuple, list)):
        hparams.overlap = (hparams.overlap,) * len(hparams.patch_size)
    if not isinstance(hparams.crop, (tuple, list)):
        hparams.crop = (hparams.crop,) * len(hparams.patch_size)
    assert all([p-2*o-2*c>0 for p,o,c in zip(hparams.patch_size, hparams.overlap, hparams.crop)]), 'Invalid combination of patch size, overlap and crop size.'
    
    # ------------------------
    # 1 INIT LIGHTNING MODEL
    # ------------------------
    model = network(hparams=hparams)
    model = model.load_from_checkpoint(hparams.ckpt_path)
    model = model.cuda()
    
    # ------------------------
    # 2 INIT DIFFUSION PARAMETERS
    # ------------------------
    device="cuda" if torch.cuda.is_available() else "cpu"
    
    if 'diffusionmodel' in hparams.pipeline.lower():
        DiffusionTrainer = GaussianDiffusionTrainer(hparams.num_timesteps, schedule=hparams.diffusion_schedule).to(device)
        DiffusionSampler = GaussianDiffusionSampler(model, hparams.num_timesteps, t_start=hparams.timesteps_start,\
                                                    t_save=hparams.timesteps_save, t_step=hparams.timesteps_step,\
                                                    schedule=hparams.diffusion_schedule,\
                                                    mean_type='epsilon', var_type='fixedlarge').to(device)
    else :
        raise NotImplementedError()
    
    hparams.out_channels *= DiffusionSampler.__len__()
    
    # ------------------------
    # 3 INIT DATA TILER
    # ------------------------
    tiler = Tiler(hparams.test_list, no_mask=hparams.input_batch=='image', no_img=hparams.input_batch=='mask',\
                  boundary_handling='none', reduce_dim='2d' in hparams.pipeline.lower(), **vars(hparams))
    fading_map = tiler.get_fading_map()
    fading_map = np.repeat(fading_map[np.newaxis,...], hparams.out_channels, axis=0)
    
    # ------------------------
    # 4 FILE AND FOLDER CHECKS
    # ------------------------
    os.makedirs(hparams.output_path, exist_ok=True)
    file_checklist = []
    
    # ------------------------
    # 5 PROCESS EACH IMAGE
    # ------------------------
    if hparams.num_files is None or hparams.num_files < 0:
        hparams.num_files = len(tiler.data_list)
    else:
        hparams.num_files = np.minimum(len(tiler.data_list), hparams.num_files)
        
    with torch.no_grad():
            
        for image_idx in range(hparams.num_files):
            
            # Get the current state of the processed files
            if os.path.isfile(os.path.join(hparams.output_path, 'tmp_file_checklist.csv')):
                file_checklist = []
                with open(os.path.join(hparams.output_path, 'tmp_file_checklist.csv'), 'r') as f:
                    reader = csv.reader(f, delimiter=';')
                    for row in reader:
                        if not len(row)==0:
                            file_checklist.append(row[0])
            
            # Check if current file has already been processed
            if not any([f==tiler.data_list[image_idx][0 if hparams.input_batch=='image' else 1] for f in file_checklist]):
                        
                print_timestamp('_'*20)
                print_timestamp('Processing file {0}', [tiler.data_list[image_idx][0 if hparams.input_batch=='image' else 1]])
            
                # Initialize current file        
                tiler.set_data_idx(image_idx)
                
                # Determine if the patch size exceeds the image size
                working_size = tuple(np.max(np.array(tiler.locations), axis=0) - np.min(np.array(tiler.locations), axis=0) + np.array(hparams.patch_size))
                    
                # Initialize maps      
                predicted_img = np.full((hparams.out_channels,)+working_size, 0, dtype=np.float32)        
                norm_map = np.full((hparams.out_channels,)+working_size, 0, dtype=np.float32)
                
                for patch_idx in range(tiler.__len__()):
                
                    print_timestamp('Generating patch {0}/{1}...',(patch_idx+1, tiler.__len__()))
                    
                    # Get the input
                    sample = tiler.__getitem__(patch_idx)
                    
                    # Apply gaussian blur to image data
                    if hparams.blur_sigma>0:
                        for ndim in range(sample[hparams.input_batch].shape[0]-1):
                            sample[hparams.input_batch][ndim,...] = gaussian_filter(sample[hparams.input_batch][ndim,...], hparams.blur_sigma, order=0)
                    
                    data = Variable(torch.from_numpy(sample[hparams.input_batch][np.newaxis,...]).cuda())
                    data = data.float() 

                    pred_patch = data[:,:-1,...].clone()      
                    pred_patch,_,_ = DiffusionTrainer(pred_patch, hparams.timesteps_start-1)
                    
                    cond = data[:,-1:,...].clone()
                    
                    _,pred_patch = DiffusionSampler(pred_patch, cond)
                    
                    # Convert final patch to numpy for saving
                    pred_patch = [p.cpu().data.numpy() for p in pred_patch]
                    pred_patch = np.array(pred_patch)
                    #if '2d' in hparams.pipeline.lower():
                    #    pred_patch = pred_patch[:,0,...] #remove batch dimension
                    #else:
                    #    pred_patch = np.squeeze(pred_patch)
                    pred_patch = pred_patch[:,0,...] #remove batch dimension
                    pred_patch = np.reshape(pred_patch, (pred_patch.shape[0]*pred_patch.shape[1],)+pred_patch.shape[2:])
                    
                    #pred_patch = np.squeeze(pred_patch)
                    pred_patch = np.clip(pred_patch, hparams.clip[0], hparams.clip[1])
                                
                    # Get the current slice position
                    slicing = tuple(map(slice, (0,)+tuple(tiler.patch_start+tiler.global_crop_before), (hparams.out_channels,)+tuple(tiler.patch_end+tiler.global_crop_before)))
                                
                    # Add predicted patch and fading weights to the corresponding maps
                    predicted_img[slicing] = predicted_img[slicing]+pred_patch*fading_map
                    norm_map[slicing] = norm_map[slicing]+fading_map
                    
                # Normalize the predicted image
                norm_map = np.clip(norm_map, 1e-5, np.inf)
                predicted_img = predicted_img / norm_map          
                
                # Crop the predicted image to its original size
                slicing = tuple(map(slice, (0,)+tuple(tiler.global_crop_before), (hparams.out_channels,)+tuple(np.array(predicted_img.shape[1:])+np.array(tiler.global_crop_after))))
                predicted_img = predicted_img[slicing]
                
                # Save the predicted image
                predicted_img = np.transpose(predicted_img, (1,2,3,0))
                predicted_img = predicted_img.astype(np.float32)
                if hparams.out_channels > 1:       
                    for channel in range(hparams.out_channels):
                        io.imsave(os.path.join(hparams.output_path, 'pred_'+str(channel)+'_'+os.path.split(tiler.data_list[image_idx][0 if hparams.input_batch=='image' else 1])[-1][:-3]+'.tif'), predicted_img[...,channel])
                else:   
                    io.imsave(os.path.join(hparams.output_path, 'pred_'+os.path.split(tiler.data_list[image_idx][0 if hparams.input_batch=='image' else 1])[-1][:-3]+'.tif'), predicted_img[...,0])
        
                # Mark current file as processed
                file_checklist.append(tiler.data_list[image_idx][0 if hparams.input_batch=='image' else 1])
                with open(os.path.join(hparams.output_path, 'tmp_file_checklist.csv'), 'w') as f:
                    writer = csv.writer(f, delimiter=';')
                    for check_file in file_checklist:
                        writer.writerow([check_file])
                    
            else:
                print_timestamp('_'*20)
                print_timestamp('Skipping file {0}', [tiler.data_list[image_idx][0 if hparams.input_batch=='image' else 1]])
                
        # Delete temporary checklist if everything has been processed
        os.remove(os.path.join(hparams.output_path, 'tmp_file_checklist.csv'))


if __name__ == '__main__':
    # ------------------------
    # TRAINING ARGUMENTS
    # ------------------------
    # these are project-wide arguments

    parent_parser = ArgumentParser(add_help=False)

    parent_parser.add_argument(
        '--output_path',
        type=str,
        default=r'results/experiment1',
        help='output path for test results'
    )
    
    parent_parser.add_argument(
        '--ckpt_path',
        type=str,
        default=r'results/experiment1/checkpoint.ckpt',
        help='output path for test results'
    )
    
    parent_parser.add_argument(
        '--gpus',
        type=int,
        default=1,
        help='number of GPUs to use'
    )
    
    parent_parser.add_argument(
        '--overlap',
        type=int,
        default=(0,0,0),
        help='overlap of adjacent patches',
        nargs='+'
    )
    
    parent_parser.add_argument(
        '--crop',
        type=int,
        default=(0,0,0),
        help='safety crop of patches',
        nargs='+'
    )
    
    parent_parser.add_argument(
        '--input_batch',
        type=str,
        default='mask',
        help='which part of the batch is used as input (image | mask)'
    )
    
    parent_parser.add_argument(
        '--clip',
        type=float,
        default=(-1000.0, 1000.0),
        help='clipping values for network outputs',
        nargs='+'
    )
    
    parent_parser.add_argument(
        '--num_files',
        type=int,
        default=1,
        help='number of files to process'
    )
    
    parent_parser.add_argument(
        '--timesteps_start',
        type=int,
        default=400,
        help='number of steps between saves'
    )
    
    parent_parser.add_argument(
        '--timesteps_save',
        type=int,
        default=100,
        help='number of steps between saves'
    )
    
    parent_parser.add_argument(
        '--blur_sigma',
        type=int,
        default=1,
        help='sigma of gaussian blur used on input data'
    )
    
    parent_parser.add_argument(
        '--timesteps_step',
        type=int,
        default=1,
        help='timesteps skipped between iterations'
    )
    
    parent_parser.add_argument(
        '--pipeline',
        type=str,
        default='DiffusionModel3D',
        help='which pipeline to load (DiffusionModel3D | DiffusionModel2D)'
    )
        
    parent_args = parent_parser.parse_known_args()[0]
    
    # load the desired network architecture
    
    if parent_args.pipeline.lower() == 'diffusionmodel3d':
        from models.DiffusionModel3D import DiffusionModel3D as network
    elif parent_args.pipeline.lower() == 'diffusionmodel2d':
        from models.DiffusionModel2D import DiffusionModel2D as network
    else:
        raise ValueError('Unknown pipeline "{0}".'.format(parent_args.pipeline))
        
    # each LightningModule defines arguments relevant to it
    parser = network.add_model_specific_args(parent_parser)
    hyperparams = parser.parse_args()

    # ---------------------
    # RUN TRAINING
    # ---------------------
    main(hyperparams)