# adain/test.py
# NOTE: the following lines are Hugging Face file-viewer chrome captured when
# this file was scraped ("MasaTate's picture", "changed out_path", commit
# fdf102d, "raw / history blame / 6.04 kB"); kept as comments so the file
# remains valid Python.
import os
import argparse
from turtle import end_fill
import torch
import time
import numpy as np
from pathlib import Path
from AdaIN import AdaINNet
from PIL import Image
from torchvision.utils import save_image
from torchvision.transforms import ToPILImage
from utils import adaptive_instance_normalization, grid_image, transform, Range
from glob import glob
# Command-line interface: source images, model weights, and transfer options.
parser = argparse.ArgumentParser()
parser.add_argument('--content_image', type=str, help='Content image file path')
parser.add_argument('--content_dir', type=str, help='Content image folder path')
parser.add_argument('--style_image', type=str, help='Style image file path')
parser.add_argument('--style_dir', type=str, help='Style image folder path')
parser.add_argument('--decoder_weight', type=str, default='decoder.pth', help='Decoder weight file path')
parser.add_argument('--alpha', type=float, default=1.0, choices=[Range(0.0, 1.0)], help='Alpha [0.0, 1.0] controls style transfer level')
parser.add_argument('--cuda', action='store_true', help='Use CUDA')
parser.add_argument('--grid_pth', type=str, default=None, help='Specify a grid image path (default=None) if generate a grid image that contains all style transferred images')
parser.add_argument('--color_control', action='store_true', help='Preserve content color')
args = parser.parse_args()

# Validate argument combinations via parser.error() rather than bare asserts:
# asserts are stripped under `python -O` and give no usage message on failure.
if not (args.content_image or args.content_dir):
    parser.error('one of --content_image or --content_dir is required')
if not (args.style_image or args.style_dir):
    parser.error('one of --style_image or --style_dir is required')
if not args.decoder_weight:
    parser.error('--decoder_weight must be a non-empty path')

# Fall back to CPU when CUDA was not requested or is not available.
device = torch.device('cuda' if args.cuda and torch.cuda.is_available() else 'cpu')
def style_transfer(content_tensor, style_tensor, encoder, decoder, alpha=1.0):
    """
    Run AdaIN style transfer on one content/style pair.

    Both images are pushed through the encoder, the content features are
    re-normalized to the style feature statistics with adaptive instance
    normalization, and the (optionally blended) features are decoded back
    into an image.

    Args:
        content_tensor (torch.FloatTensor): Content image
        style_tensor (torch.FloatTensor): Style image
        encoder: Encoder (vgg19) network
        decoder: Decoder network
        alpha (float, default=1.0): Weight of the stylized features;
            0.0 keeps the content features, 1.0 uses fully stylized ones.

    Return:
        output_tensor (torch.FloatTensor): Style transfer output image
    """
    content_feat = encoder(content_tensor)
    style_feat = encoder(style_tensor)
    stylized_feat = adaptive_instance_normalization(content_feat, style_feat)
    # Linear blend between the stylized and the original content features.
    blended_feat = alpha * stylized_feat + (1-alpha) * content_feat
    return decoder(blended_feat)
def linear_histogram_matching(content_tensor, style_tensor):
    """
    Match the per-channel first/second moments of the style image to those of
    the content image (linear histogram matching).

    Bug fixed: the original code called torch.var_mean(), which returns
    (variance, mean), but used the variance as if it were the standard
    deviation — so outputs were scaled by a variance ratio instead of a std
    ratio and their statistics did not actually match the content's.
    torch.std_mean() gives the intended (std, mean) pair. The input style
    tensor is also no longer mutated in place; a matched copy is returned.

    Args:
        content_tensor (torch.FloatTensor): Content image, shape (1, C, H, W)
        style_tensor (torch.FloatTensor): Style image, shape (1, C, H, W)
    Return:
        torch.FloatTensor: Histogram-matched copy of the style image
    """
    matched = style_tensor.clone()
    # Channel-wise: shift/scale style stats onto the content stats.
    for ch in range(3):
        std_c, mean_c = torch.std_mean(content_tensor[0][ch], unbiased=False)
        std_s, mean_s = torch.std_mean(style_tensor[0][ch], unbiased=False)
        matched[0][ch] = (style_tensor[0][ch] - mean_s) * std_c / std_s + mean_c
    return matched
def main() -> None:
    """
    Command-line driver: style-transfer every content image with every style
    image, save each result under ./results/, print per-pair and average
    runtimes, and optionally assemble all outputs into one grid image.

    Reads configuration from the module-level `args` namespace and runs the
    model on the module-level `device`.
    """
    # Read content images and style images.
    # A single --content_image/--style_image wins over the directory option;
    # otherwise every file in the given directory is used.
    if args.content_image:
        content_pths = [Path(args.content_image)]
    else:
        content_pths = [Path(f) for f in glob(args.content_dir+'/*')]

    if args.style_image:
        style_pths = [Path(args.style_image)]
    else:
        style_pths = [Path(f) for f in glob(args.style_dir+'/*')]

    assert len(content_pths) > 0, 'Failed to load content image'
    assert len(style_pths) > 0, 'Failed to load style image'

    # Prepare directory for saving results
    out_dir = './results/'
    os.makedirs(out_dir, exist_ok=True)

    # Load AdaIN model: pretrained VGG weights for the encoder plus the
    # decoder weights given on the command line; eval mode for inference.
    vgg = torch.load('vgg_normalized.pth')
    model = AdaINNet(vgg).to(device)
    model.decoder.load_state_dict(torch.load(args.decoder_weight))
    model.eval()

    # Prepare image transform (target size 512 — see utils.transform)
    t = transform(512)

    # Prepare grid image, add style images to the first row
    if args.grid_pth:
        # Add empty image as the top-left grid cell (rows = contents, cols = styles)
        imgs = [np.ones((1, 1, 3), np.uint8) * 255]
        for style_pth in style_pths:
            imgs.append(Image.open(style_pth))

    # Timer
    times = []

    for content_pth in content_pths:
        content_img = Image.open(content_pth)
        content_tensor = t(content_img).unsqueeze(0).to(device)

        if args.grid_pth:
            imgs.append(content_img)

        for style_pth in style_pths:
            style_tensor = t(Image.open(style_pth)).unsqueeze(0).to(device)

            # Linear Histogram Matching if needed (--color_control keeps the
            # content image's color statistics in the style input)
            if args.color_control:
                style_tensor = linear_histogram_matching(content_tensor,style_tensor)

            # Start time
            tic = time.perf_counter()

            # Execute style transfer (no grads needed at inference)
            with torch.no_grad():
                out_tensor = style_transfer(content_tensor, style_tensor, model.encoder, model.decoder, args.alpha).cpu()

            # End time
            toc = time.perf_counter()
            print("Content: " + content_pth.stem + ". Style: " \
                + style_pth.stem + '. Alpha: ' + str(args.alpha) + '. Style Transfer time: %.4f seconds' % (toc-tic))
            times.append(toc-tic)

            # Save image as <content>_style_<style>_alpha<a>[_colorcontrol]<ext>
            out_pth = out_dir + content_pth.stem + '_style_' + style_pth.stem + '_alpha' + str(args.alpha)
            if args.color_control: out_pth += '_colorcontrol'
            out_pth += content_pth.suffix
            save_image(out_tensor, out_pth)

            if args.grid_pth:
                imgs.append(Image.open(out_pth))

    # Remove runtime of first iteration because it is flawed for some unknown reason
    # NOTE(review): presumably one-time warm-up cost (CUDA context / model
    # initialization) — confirm before relying on the reported average.
    if len(times) > 1:
        times.pop(0)
    avg = sum(times)/len(times)
    print("Average style transfer time: %.4f seconds" % (avg))

    # Generate grid image: (contents+1) x (styles+1) cells including headers
    if args.grid_pth:
        print("Generating grid image")
        grid_image(len(content_pths) + 1, len(style_pths) + 1, imgs, save_pth=args.grid_pth)
        print("Finished")
# Run the driver only when executed as a script, not when imported.
if __name__ == '__main__':
    main()