CA_Basic/basic_large.py

import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import matplotlib.pyplot as plt
import numpy as np
import skimage
from skimage import io
import random
import math
import argparse
random.seed(2574)

def to_alpha(x):
    return torch.clamp(x[3:4,:,:], 0.0, 1.0)

def to_rgb(x):
    rgb, a = x[:3,:,:], to_alpha(x)
    return torch.clamp(1.0-a+rgb, 0.0, 1.0)

def show_tensor(t):
    plt.imshow(to_rgb(t).cpu().detach().permute(1,2,0))

def show_hidden(t, section):
    plt.imshow(torch.clamp(t[(4+section*3):(7+section*3), :, :], 0.0, 1.0).cpu().detach().permute(1,2,0))

def make_initial_state(d,x,y):
    i_state = torch.zeros(d, x, y)
    i_state[3:, x//2, y//2] = 1.0
    return i_state
    
class CAModel(nn.Module):
    
    def __init__(self, env_d):
        super(CAModel, self).__init__()
        self.conv1 = nn.Conv2d(env_d*3,144,1)
        self.conv2 = nn.Conv2d(144,env_d,1)
        nn.init.zeros_(self.conv2.weight)
        nn.init.zeros_(self.conv2.bias)
        
    def forward(self, x):
        x = F.relu(self.conv1(x))
        return self.conv2(x)
    
class CASimulator():
    
    def __init__(self):
        self.ENV_X = 256
        self.ENV_Y = 256
        self.ENV_D = 16
        self.step_size = 1.0
        self.update_probability = 0.5
        self.cur_batch_size = 1
        self.train_steps = 64000
        self.sim_min_steps = 160
        self.sim_max_steps = 208
        self.device = torch.device('cuda:1')
        self.normalize_grads = True
        self.initial_state = make_initial_state(self.ENV_D, self.ENV_X, self.ENV_Y)
        self.initial_state = self.initial_state.to(self.device)
        self.current_states = self.initial_state.repeat(self.cur_batch_size,1,1,1)
        self.current_states = self.current_states.to(self.device)
        self.ca_model = CAModel(self.ENV_D)
        self.ca_model = self.ca_model.to(self.device)
        #self.ca_model = nn.DataParallel(self.ca_model)
        self.output_path = 'output'
        self.checkpoint_path = 'checkpoints'
        image_paths = [f'img/{p}.png' for p in ['tree']]
        self.target_count = len(image_paths)
        if (self.cur_batch_size % len(image_paths) != 0):
            raise 'batch size must be divisible by number of image targets'
        self.sims_per_image = self.cur_batch_size//self.target_count

        first_img = skimage.img_as_float(io.imread(image_paths[0]))
        first_tens = torch.tensor(first_img).float().permute(2,0,1).repeat(self.sims_per_image,1,1,1)
        for im_path in image_paths[1:]:
            next_img = skimage.img_as_float(io.imread(im_path))
            next_tens = torch.tensor(next_img).float().permute(2,0,1).repeat(self.sims_per_image,1,1,1)
            first_tens = torch.cat((first_tens, next_tens), 0)
        self.target_states = first_tens.to(self.device)
        print(self.target_states.shape)

        #targ_img = skimage.img_as_float(io.imread('img/poke/bulb.png'))
        #self.target_states = torch.tensor(targ_img).float().permute(2,0,1).repeat(self.cur_batch_size,1,1,1)
        self.optimizer = optim.Adam(self.ca_model.parameters(), lr=2e-3)
        self.frames_out_count = 0
        self.losses = []

    def load_pretrained(self, path):
        self.ca_model.load_state_dict(torch.load(path))
        
    def wrap_edges(self, x):
        return F.pad(x, (1,1,1,1), 'circular', 0)
    
    def living_mask(self):
        alpha = self.current_states[:,3:4,:,:]
        return F.max_pool2d(self.wrap_edges(alpha), 3, stride=1) > 0.1
        
    def raw_senses(self):
        # state - (batch, depth, x, y)
        sobel_x = torch.tensor([[-1.0,0.0,1.0],[-2.0,0.0,2.0],[-1.0,0.0,1.0]])/8
        sobel_y = torch.tensor([[1.0,2.0,1.0],[0.0,0.0,0.0],[-1.0,-2.0,-1.0]])/8
        identity = torch.tensor([[0.0,0.0,0.0],[0.0,1.0,0.0],[0.0,0.0,0.0]])
        all_filters = torch.stack((identity, sobel_x, sobel_y))
        all_filters_batch = all_filters.repeat(self.ENV_D,1,1).unsqueeze(1)
        all_filters_batch = all_filters_batch.to(self.device)
        return F.conv2d(
            self.wrap_edges(self.current_states), 
            all_filters_batch, 
            groups=self.ENV_D
        )
    
    def sim_step(self):
        pre_update_life_mask = self.living_mask()
        state_updates = self.ca_model(self.raw_senses())*self.step_size
        # randomly block updates to enforce
        # asynchronous communication between cells
        rand_mask = torch.rand_like(
            self.current_states[:, :1, :, :]) < self.update_probability
        self.current_states += state_updates*(rand_mask.float().to(self.device))
        post_update_life_mask = self.living_mask()
        life_mask = pre_update_life_mask & post_update_life_mask
        life_mask = life_mask.to(self.device)
        self.current_states *= life_mask.float()

    def set_experiment_control_channel(self, s_index):
        # set image target channels
        self.current_states[:,-self.target_count:,:,:] = 0.0
        #self.current_states[:,-3] = 1.0
        # swap x and y here?
        #self.current_states[:,-2] = torch.clamp(torch.linspace(-1,2,self.ENV_X).repeat(self.ENV_Y, 1), 0.0, 1.0)
        #self.current_states[:,-3] = torch.clamp(torch.linspace(2,-1,self.ENV_X).repeat(self.ENV_Y, 1), 0.0, 1.0)
        #phase = s_index/200
        #self.current_states[:,-2] = torch.full_like(self.current_states[0][0], 0.5-0.5*math.cos(phase))
        #self.current_states[:,-3] = torch.full_like(self.current_states[0][0], 0.5*math.cos(phase)+0.5)
        wig = lambda x : 1/math.exp(min(x**4.0,16.0))
        k = 1.825
        phase = s_index / 200
        self.current_states[:,-3] = wig(phase)
        self.current_states[:,-2] = wig(phase-k)
        self.current_states[:,-1] = wig(phase-2*k)
        self.current_states[:,-5] = wig(phase-3*k)
        self.current_states[:,-7] = wig(phase-4*k)

    def set_unique_control_channel(self):
        # set image target channels
        self.current_states[:,-self.target_count:,:,:] = 0.0
        for i in range(self.target_count):
            self.current_states[i*self.sims_per_image:(i+1)*self.sims_per_image][:,-(i+1)] = 1.0

    def run_pretrained(self, steps, save_all):
        self.ca_model.eval()
        with torch.no_grad():
            dat_to_vis = random.randint(0,self.cur_batch_size-1)
            for i in range(steps):
                if i%50 == 0:
                    print(f'step: {i}')
                if (save_all):
                    show_tensor(self.current_states[dat_to_vis])
                    plt.savefig(f'pretrained_output/out{self.frames_out_count:06d}.png')
                    plt.clf()
                    show_hidden(self.current_states[dat_to_vis], 0)
                    plt.savefig(f'pretrained_output/out_hidden_{self.frames_out_count:06d}.png')
                    plt.clf()
                    self.frames_out_count += 1
                self.sim_step()
                self.set_experiment_control_channel(i)

    def run_sim(self, steps, run_idx, save_all):
        self.optimizer.zero_grad()
        dat_to_vis = random.randint(0,self.cur_batch_size-1)
        for i in range(steps):
            if (save_all):
                show_tensor(self.current_states[dat_to_vis])
                plt.savefig(f'{self.output_path}/all_figs/out{self.frames_out_count:06d}.png')
                plt.clf()
                show_hidden(self.current_states[dat_to_vis], 0)
                plt.savefig(f'{self.output_path}/all_figs/out_hidden_{self.frames_out_count:06d}.png')
                plt.clf()
                self.frames_out_count += 1
            self.sim_step()
            #self.set_unique_control_channel()

        loss = F.mse_loss(self.current_states[:,:4,:,:], self.target_states )
        loss.backward()
        if self.normalize_grads:
            with torch.no_grad():
                self.ca_model.conv1.weight.grad = self.ca_model.conv1.weight.grad/(self.ca_model.conv1.weight.grad.norm()+1e-8)
                self.ca_model.conv1.bias.grad = self.ca_model.conv1.bias.grad/(self.ca_model.conv1.bias.grad.norm()+1e-8)
                self.ca_model.conv2.weight.grad = self.ca_model.conv2.weight.grad/(self.ca_model.conv2.weight.grad.norm()+1e-8)
                self.ca_model.conv2.bias.grad = self.ca_model.conv2.bias.grad/(self.ca_model.conv2.bias.grad.norm()+1e-8)
        self.optimizer.step()
        lsv = loss.item()
        del loss
        self.losses.insert(0, lsv)
        self.losses = self.losses[:100]
        print(f'running loss: {sum(self.losses)/len(self.losses)}')
        print(f'loss run {run_idx} : {lsv}')
        
    def train_ca(self):
        for idx in range(self.train_steps):
            
            if (idx < 5000):
                for g in self.optimizer.param_groups:
                    g['lr'] = 6e-4
            elif (idx < 15000):
                for g in self.optimizer.param_groups:
                    g['lr'] = 3e-4
            elif (idx < 25000):
                for g in self.optimizer.param_groups:
                    g['lr'] = 2e-4
            elif (idx < 40000):
                for g in self.optimizer.param_groups:
                    g['lr'] = 1e-4
            else:
                for g in self.optimizer.param_groups:
                    g['lr'] = 7e-6
            
            self.current_states = self.initial_state.repeat(self.cur_batch_size,1,1,1)
            self.run_sim(random.randint(self.sim_min_steps, self.sim_min_steps), idx, (idx+1)%5000 == 0)
            if (idx % 10 == 0):
                show_tensor(self.current_states[random.randint(0,self.cur_batch_size-1)])
                plt.savefig(f'{self.output_path}/out{idx:06d}.png')
                plt.clf()
            if (idx % 5000 == 0):
                torch.save(self.ca_model.state_dict(), f'{self.checkpoint_path}/ca_model_step_{idx:06d}.pt')
            
if __name__ == '__main__':

    parser = argparse.ArgumentParser()

    parser.add_argument('--run-pretrained', dest='run_pretrained', action='store_true')

    parser.add_argument('--pretrained-path', type=str, default='ca_model_step_063500_multi_12')

    args = parser.parse_args()

    ca_sim = CASimulator()

    if args.run_pretrained:
        print('running pretained')
        ca_sim.load_pretrained(f'{self.checkpoint_path}/{args.pretrained_path}.pt')
        ca_sim.run_pretrained(2000, True)
    else:
        ca_sim.train_ca()