generate.py

import torch
import torch.nn.functional as F
from torch.autograd import Variable
import random
import time
import os
import numpy as np
import imutil
from PIL import Image
import pathlib
from datasets.datasets import EMNIST, ImageNet
import argparse
from models import gan
from vast.tools import set_device_gpu, set_device_cpu, device
from torchvision import transforms
import matplotlib.pyplot as plt

parser = argparse.ArgumentParser("Generating Images")

# Dataset
parser.add_argument('--dataset', type=str, default='mnist', help="mnist | svhn | cifar10 | cifar100 | tiny_imagenet")
parser.add_argument('--dataroot', type=str, default='/home/user/heizmann/data/EMNIST/')
parser.add_argument('--outf', type=str, default='./log')
parser.add_argument('--protocol', type=int, default=2, help='imagenet protocol')

# optimization
parser.add_argument('--batch-size', type=int, default=64)
parser.add_argument('--lr', type=float, default=0.1, help="learning rate for model")
parser.add_argument('--gan_lr', type=float, default=0.0002, help="learning rate for gan")
parser.add_argument('--max_epoch', type=int, default=1, help='Maximum number of epochs')
parser.add_argument('--stepsize', type=int, default=30)
parser.add_argument('--temp', type=float, default=1.0, help="temp")
parser.add_argument('--num-centers', type=int, default=1)

# model
parser.add_argument('--weight-pl', type=float, default=0.1, help="weight for center loss")
parser.add_argument('--beta', type=float, default=0.1, help="weight for entropy loss")
parser.add_argument('--model', type=str, default='classifier32')

# misc
parser.add_argument('--nz', type=int, default=100)
parser.add_argument('--ns', type=int, default=1)
parser.add_argument('--eval-freq', type=int, default=1)
parser.add_argument('--print-freq', type=int, default=100)
parser.add_argument('--gpu', type=str, default='0')
parser.add_argument('--seed', type=int, default=0)
parser.add_argument('--use-cpu', action='store_true')
parser.add_argument('--save-dir', type=str, default='../log')
parser.add_argument('--result_dir', type=str, default='../generated_emnist')

parser.add_argument('--loss', type=str, default='ARPLoss')
parser.add_argument('--eval', action='store_true', help="Eval", default=False)
parser.add_argument('--cs', action='store_true', help="Confusing Sample", default=False)

parser.add_argument('--generate', action='store_true', help="Confusing Sample", default=False)
parser.add_argument('--number_images', type= int, help="number of images to create", default = 100)


def generate_arpl_images(netG, options):

    if options["dataset"] == "imagenet":
        
        imagenet_path = '/local/scratch/datasets/ImageNet/ILSVRC2012/'
        train_file = 'protocols/p{}_train.csv'
        
        train_tr = transforms.Compose(
            [transforms.Resize(256),
            transforms.RandomCrop(224),
            transforms.RandomHorizontalFlip(0.5),
            transforms.ToTensor()])
        
        train_file = pathlib.Path(train_file.format(options["protocol"]))
            
        train_data = ImageNet(
                csv_file=train_file,
                imagenet_path=imagenet_path,
                transform=train_tr
            )
            
        trainloader = torch.utils.data.DataLoader(
            train_data,
            batch_size=options["batch_size"],
            shuffle=True,
            num_workers=4,
            pin_memory=True)
        
        options['num_classes'] = train_data.label_count
    else:
        Data = EMNIST(options=options, val = False, test = False)
        trainloader = Data.train_loader
        
    iterations = options["number_images"]    
    
    images = generate_images(netG, iterations, trainloader, options)
    
    result_dir = options["result_dir"]
    images = export_images( options=options, images=images, result_dir=result_dir, dataloader=trainloader)
    print("DONE")

def generate_images(netG, iterations, trainloader, options):
    
    # setup device
    '''if options['use_gpu'] is not None:
        set_device_gpu(index=options['gpu'] )
        print(" ============== GPU Selected! =============")
    else:
        print("No GPU device selected, training will be extremely slow")
        set_device_cpu()
    '''
    netG.train()
    
    # netG = device(netG)

    torch.cuda.empty_cache()
     
    images = []  
    for _ in range(iterations):
        total_batches = len(trainloader)  
        random_index = random.randint(0, total_batches - 1) 
        
        #select a rondom batch from the trainloader
        for i, (data, label) in enumerate(trainloader):
            if i == random_index:
                start_images = data        
                break
        
        # Skip batches that do not match the expected size
        if data.size(0) != 64:
            continue  
        
        noise = torch.FloatTensor(start_images.size(0), options['nz'], options['ns'], options['ns']).normal_(0, 1)
        noise = Variable(noise)
        noise = device(noise)
        start_images = device(start_images)
     
        #create fake data from generator
        
        fake = netG(noise)
        images.append(fake.cpu().detach())  # Append to list and ensure tensor is on CPU and detached
        
        if _ % 100 == 0:
            print("CREATED " + str(_ * 64)+ " IMAGES")

        
    # Convert list of tensors to a single tensor
    images_tensor = torch.stack(images)
    '''# NumPy array:
    images_np = images_tensor.numpy()'''
    
    return images_tensor
        
# Trajectories are written to result_dir/trajectories/
def make_video_filename(result_dir, dataloader, label_type='active'):
    trajectory_id = '{}_{}'.format(dataloader.dsf.name, int(time.time() * 1000))
    video_filename = '{}-{}-{}-{}.mjpeg'.format(label_type, trajectory_id)
    video_filename = os.path.join('trajectories', video_filename)
    video_filename = os.path.join(result_dir, video_filename)
    path = os.path.join(result_dir, 'trajectories')
    if not os.path.exists(path):
        print("Creating trajectories directory {}".format(path))
        os.mkdir(path)
    return video_filename

def export_images(options, images, result_dir, dataloader):

    if options["dataset"] != "imagenet":
        # Squeeze single color channel of non-RGB images
        images = images.data.cpu().numpy().squeeze(2)
    else:
        images = images.data.cpu().numpy()
    
    # Ensure images are scaled to 0-255 and adjust if needed
    print("Image values before scaling:", images.min(), images.max())
    if images.max() <= 1.0:
        images *= 255
    print("Image values after scaling:", images.min(), images.max())

    images_dir = os.path.join(result_dir, 'images')
    if not os.path.exists(images_dir):
        os.makedirs(images_dir)

    for batch_index, seq in enumerate(images):
        batch_images = []  
        for frame_index, frame in enumerate(seq):
            if options["dataset"] == "imagenet":
                # For ImageNet, transpose the frame to move the channel dimension to the end
                frame = np.transpose(frame, (1, 2, 0))
                img = Image.fromarray(frame.astype('uint8'), 'RGB')
            else:
                # Squeeze the single color channel for grayscale images
                frame = frame.squeeze()
                # Create a grayscale image
                img = Image.fromarray(frame.astype('uint8'), 'L')
            

            filename = f'arpl_batch{batch_index}_frame{frame_index}_{int(time.time())}.jpg'
            img.save(os.path.join(images_dir, filename))
            batch_images.append(img)

        # Create and save the grid image for each batch
        if len(batch_images) > 0:
            num_cols = max(int(np.sqrt(len(batch_images))), 1)  # Ensure at least 1 column
            num_rows = (len(batch_images) + num_cols - 1) // num_cols  # Calculate rows ensuring at least 1 row
            
            if options["dataset"] == "imagenet":
                # Create a new empty image for RGB
                grid_image = Image.new('RGB', (num_cols * frame.shape[1], num_rows * frame.shape[0]))
            else:
                # Create a new empty image for grayscale
                grid_image = Image.new('L', (num_cols * frame.shape[1], num_rows * frame.shape[0]))
                        
            # Place images in the grid
            for index, image in enumerate(batch_images):
                row = index // num_cols
                col = index % num_cols
                grid_image.paste(image, (col * frame.shape[1], row * frame.shape[0]))
            
            # Save the grid image
            grid_filename = f'arpl_batch{batch_index}_grid_{int(time.time())}.jpg'
            grid_image.save(os.path.join(images_dir, grid_filename))
        else:
            print(f"No images to process in batch {batch_index}")

    return images


def get_network(options):
    
    # setup device
    if options['use_gpu'] is not None:
        set_device_gpu(index=options['gpu'] )
        print(" ============== GPU Selected! =============")
    else:
        print("No GPU device selected, training will be extremely slow")
        set_device_cpu()
    
    nz, ns = options['nz'], 1
    
    if options["dataset"] == "imagenet":
        network = gan.Generator256(1, nz, 64, 3)
    else:
        network = gan.Generator32(1, nz, 64, 1)
    
    epoch = options["max_epoch"]
    pth = get_pth_by_epoch(options['result_dir'], "netG", epoch)
    if pth:
        print("Loading {} from checkpoint {}".format("netG", pth))
 
        state_dict = torch.load(pth, map_location=torch.device('cpu'))
        # Move to GPU if necessary after some operations or checks
        # For some reason there is a "module" prefix to the keys that is not expected in the network init"
        state_dict = {key.replace('module.', ''): value for key, value in state_dict.items()}
        network.load_state_dict(state_dict)
        
        network = device(network) 
           
        return network
    else:
        raise FileNotFoundError("could not load file from checkpoint")
     
def ensure_directory_exists(filename):
    # Assume whatever comes after the last / is the filename
    tokens = filename.split('/')[:-1]
    # Perform a mkdir -p on the rest of the path
    path = '/'.join(tokens)
    print(f"Ensuring directory exists: {path}")  # Debugging print
    pathlib.Path(path).mkdir(parents=True, exist_ok=True)
    
def get_pth_by_epoch(result_dir, name, epoch=None):
    checkpoint_path = os.path.join(result_dir, 'checkpoints/')
    ensure_directory_exists(checkpoint_path)
    files = os.listdir(checkpoint_path)
    suffix = '.pth'
    if epoch is not None:
        suffix = f'_epoch_{epoch:04d}.pth'
    target_files = [f for f in files if name in f and f.endswith(suffix)]
    if not target_files:
        return None
    full_paths = [os.path.join(checkpoint_path, fn) for fn in target_files]
    full_paths.sort(key=lambda x: os.stat(x).st_mtime, reverse=True)
    return full_paths[0] if full_paths else None


if __name__ == '__main__':
    args = parser.parse_args()
    options = vars(args)
    
    # FOR NOW HAVE THIS HARDCODED
    options.update({'use_gpu':  True})
    options['dataroot'] = os.path.join(options['dataroot'], options['dataset'])

    network = get_network(options=options)
    
    generate_arpl_images(netG=network, options=options)