NeuralSpline.py

import os,sys, math, argparse
import torch
import torch.nn as nn
import torch.nn.init as winit
import torch.nn.functional as F
import torch.optim as optim
from torchvision import datasets, transforms, utils
import torch.utils.data as data
from multiprocessing import cpu_count
import numpy as np
from tqdm import tqdm
from sklearn.preprocessing import OneHotEncoder
import ptcolor


class NeuralSpline(nn.Module):
	def __init__(self, n, nc, nexperts, colorspace='srgb', apply_to='rgb', abs=False, downsample_strategy='avgpool', dropout=0.0, n_input_channels=3):
		super(NeuralSpline, self).__init__()
		# define class params
		self.n = n
		self.x0 = 0
		self.step = 1.0 / (n-1.0)
		self.nexperts = nexperts
		self.colorspace = colorspace
		self.apply_to = apply_to
		self.abs = abs
		self.dropout = dropout
		# define white point and gamma correction for conversion to lab
		if self.colorspace=='srgb':
			self.white_point = 'd65'
			self.gamma_correction = 'srgb'
		else:
			self.white_point = 'd50'
			self.gamma_correction = 1.8
		# define fixed tensors to speed up computation
		self.xs = torch.arange(0,1,1.0/255.).cuda()
		momentum = 0.01
		# compute interpolation matrix (will be stored in self.matrix)
		self._precalc()
		# define net layers
		self.c1 = nn.Conv2d(n_input_channels, nc, kernel_size=5, stride=4, padding=0)
		self.c2 = nn.Conv2d(nc, 2*nc, kernel_size=3, stride=2, padding=0)
		self.b2 = nn.BatchNorm2d(2*nc, momentum=momentum)
		self.c3 = nn.Conv2d(2*nc, 4*nc, kernel_size=3, stride=2, padding=0)
		self.b3 = nn.BatchNorm2d(4*nc, momentum=momentum)
		self.c4 = nn.Conv2d(4*nc, 8*nc, kernel_size=3, stride=2, padding=0)
		self.b4 = nn.BatchNorm2d(8*nc, momentum=momentum)
		# define downsample layers
		if downsample_strategy=='maxpool':
			self.downsample = nn.MaxPool2d(7, stride=1)
			self.fc = nn.ModuleList([])
			for i in range(nexperts):
				self.fc.append(
					nn.Sequential(
						nn.Linear(8*nc, 8*nc),
						nn.ReLU(True),
						nn.Linear(8*nc, 3*n)
					)
				)
		elif downsample_strategy=='avgpool':
			self.downsample = nn.AvgPool2d(7, stride=1)
			self.fc = nn.ModuleList([])
			for i in range(nexperts):
				self.fc.append(
					nn.Sequential(
						nn.Linear(8*nc, 8*nc),
						nn.ReLU(True),
						nn.Linear(8*nc, 3*n)
					)
				)
		elif downsample_strategy=='convs':
			self.downsample = nn.Sequential(
				nn.Conv2d(8*nc, 16*nc, kernel_size=3, stride=2, padding=0),
				nn.BatchNorm2d(16*nc, momentum=momentum),
				nn.ReLU(True),
				nn.Conv2d(16*nc, 32*nc, kernel_size=3, stride=2, padding=0),
				nn.BatchNorm2d(32*nc, momentum=momentum),
				nn.ReLU(True),
			)
			self.fc = nn.ModuleList([])
			for i in range(nexperts):
				self.fc.append(
					nn.Sequential(
						nn.Linear(32*nc, 16*nc),
						nn.ReLU(True),
						nn.Linear(16*nc, 3*n)
					)
				)
		else:
			self.downsample = nn.Sequential(
				nn.Conv2d(8*nc, 8*nc, kernel_size=1, stride=1, padding=0),
				nn.BatchNorm2d(8*nc, momentum=momentum),
				nn.ReLU(True),
				nn.Conv2d(8*nc, 3*n, kernel_size=1, stride=1, padding=0),
				nn.BatchNorm2d(3*n, momentum=momentum),
				nn.ReLU(True),
				nn.AvgPool2d(7, stride=1)
			)
			self.fc = nn.ModuleList([])
			for i in range(nexperts): self.fc.append(lambda x: x)
		# init weights
		for m in self.modules():
			if isinstance(m, nn.Conv2d):
				nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')
			elif isinstance(m, nn.BatchNorm2d):
				nn.init.constant_(m.weight, 1)
				nn.init.constant_(m.bias, 0)


	def rgb2lab(self, x):
		return ptcolor.rgb2lab(x,	white_point=self.white_point,           \
									gamma_correction=self.gamma_correction, \
									clip_rgb=not self.training,				\
									space=self.colorspace)

	def lab2rgb(self, x):
		return ptcolor.lab2rgb(x, 	white_point=self.white_point,           \
									gamma_correction=self.gamma_correction, \
									clip_rgb=not self.training,				\
									space=self.colorspace)

	def _precalc(self):
		""" Calculate interpolation mat for finding Ms.
			It will be stored in self.matrix.
		"""
		n = self.n
		mat = 4 * np.eye(n - 2)
		np.fill_diagonal(mat[1:, :-1], 1)
		np.fill_diagonal(mat[:-1, 1:], 1)
		A = 6 * np.linalg.inv(mat) / (self.step ** 2)
		z = np.zeros(n - 2)
		A = np.vstack([z, A, z])

		B = np.zeros([n - 2, n])
		np.fill_diagonal(B, 1)
		np.fill_diagonal(B[:, 1:], -2)
		np.fill_diagonal(B[:, 2:], 1)
		self.matrix = np.dot(A, B)
		self.matrix = torch.from_numpy(self.matrix).float()
		self.matrix = self.matrix.cuda()

	def interpolate(self, ys):
		""" compute the coefficients of the polynomials
		"""
		# get coefficients of the polinomials that compose the spline
		h = self.step
		#M = self.matrix.dot(ys)
		M = torch.mm(self.matrix,ys.view(-1,1)).squeeze()
		a = (M[1:] - M[:-1]) / (6 * h)
		b = M[:-1] / 2
		c = (ys[1:] - ys[:-1]) / h - (M[1:] + 2 * M[:-1]) * (h / 6)
		d = ys[:-1]
		coeffs = torch.stack([a,b,c,d], dim=0)
		return coeffs

	def apply(self, coeffs, x):
		""" interpolate new data using coefficients
		"""
		xi = torch.clamp((x - self.x0) / self.step, 0, self.n-2)
		xi = torch.floor(xi)
		xf = x - self.x0 - xi*self.step
		ones = torch.ones(xf.size()).cuda()
		ex = torch.stack([xf ** 3, xf ** 2, xf, ones], dim=0)
		#y = np.dot(coeffs.transpose(0,1), ex)
		y = torch.mm(coeffs.transpose(0,1), ex)
		# create constant mat
		sel_mat = torch.zeros(y.size(0),xi.size(0)).cuda()
		rng = torch.arange(0,xi.size(0)).cuda()
		sel_mat[xi.data.long(),rng.long()]=1
		# multiply to get the right coeffs
		res = y*sel_mat
		res = res.sum(0)
		# return
		return res


	def enhanceImage(self, input_image, ys):
		image = input_image.clone()[:3,:,:]
		splines = torch.zeros(3,self.xs.size(0))
		# for each channel of the image, define spline and apply it
		for ch in range(min(3,image.size(0))):
			cur_ch = image[ch,:,:].clone()
			cur_ys = ys[ch,:].clone()
			# calculate spline upon identity + found ys
			identity = torch.arange(0,cur_ys.size(0)).float()/(cur_ys.size(0)-1)
			identity = identity.cuda()
			cur_coeffs = self.interpolate(cur_ys+identity)
			image[ch,:,:] = self.apply(cur_coeffs, cur_ch.view(-1)).view(cur_ch.size())
			splines[ch,:] = self.apply(cur_coeffs,self.xs).data.cpu()
		return image, splines


	def forward(self, batch):
		# convert to lab if required
		if self.apply_to=='lab': batch = self.rgb2lab(batch)
		# resize if needed
		if not (batch.size(2) == 256 and batch.size(3) == 256):
			smallbatch = F.interpolate(batch, size=(256,256),mode='bilinear')
		else:
			smallbatch = batch
		# get xs of the points with CNN
		ys = F.relu(self.c1(smallbatch))
		ys = self.b2(F.relu(self.c2(ys)))
		ys = self.b3(F.relu(self.c3(ys)))
		ys = self.b4(F.relu(self.c4(ys)))
		ys = self.downsample(ys)
		ys = ys.view(ys.size(0),-1)
		if self.dropout > 0.0 and self.training: ys = F.dropout(ys, p=self.dropout, training=self.training)
		ys = torch.cat([l(ys).view(-1,3,self.n).unsqueeze(1) for l in self.fc],1) # nexp*(bs,3*n) -> (bs,nexp,3,n)
		# now we got xs and ys. We need to create the interpolating spline
		# out = [torch.zeros(batch.size()).cuda() for i in range(self.nexperts)]
		out = [torch.zeros(batch.size(0),3,batch.size(2),batch.size(3)).cuda() for i in range(self.nexperts)]
		splines = [torch.zeros(batch.size(0),3,self.xs.size(0)) for i in range(self.nexperts)]
		# for each expert
		for nexp in range(self.nexperts):
			# init output vars
			cur_out = torch.zeros(batch.size()).cuda()
			# cur_splines = torch.zeros(batch.size(0),3,self.xs.size(0))
			# for each image
			for nimg in range(batch.size(0)):
				cur_img = batch[nimg,:,:,:]
				cur_ys = ys[nimg,nexp,:,:]
				# enhance the image with the expert spline
				if self.apply_to=='rgb':
					out[nexp][nimg,:,:,:], splines[nexp][nimg,:,:] = self.enhanceImage(cur_img, cur_ys)
				else:
					# squeeze lab range to use spline in the range [0,1]
					l,a,b = cur_img[0,:,:], cur_img[1,:,:], cur_img[2,:,:]
					l,a,b = l.clone(), a.clone(), b.clone()
					l = l / 100.
					a = (a+110.)/220.
					b = (b+110.)/220.
					cur_img = torch.stack((l,a,b),0)
					# calculate and apply spline
					cur_out, cur_spline = self.enhanceImage(cur_img, cur_ys)
					# expand back to lab range
					cur_out[0,:,:] = cur_out[0,:,:].clone() * 100.
					cur_out[1,:,:] = (cur_out[1,:,:].clone()*220.)-110.
					cur_out[2,:,:] = (cur_out[2,:,:].clone()*220.)-110.
					out[nexp][nimg,:,:,:] = cur_out
					splines[nexp][nimg,:,:] = cur_spline
			# if required, apply abs
			if self.abs:
				out[nexp] = torch.abs(out[nexp])
			# convert back if in test
			if not self.training:
				if self.apply_to=='lab':
					out[nexp] = self.lab2rgb(out[nexp])
				out[nexp] = torch.clamp(out[nexp],0,1)
		return out, splines


def unique(tensor1d):
    t, idx = np.unique(tensor1d.numpy(), return_inverse=True)
    return torch.from_numpy(t), torch.from_numpy(idx)

if __name__ == "__main__":
	n = 10
	nf = 100
	spline = NeuralSpline(n,nf)
	spline.cuda()
	# img = torch.rand(1,3,256,256)
	# px_vals = unique(img)
	img = torch.rand(5,3,256,256).cuda()
	out, splines = spline(img)
	print(out.size())
	import ipdb; ipdb.set_trace()
	#ris = spline(img)