95 lines
3.1 KiB
Python
95 lines
3.1 KiB
Python
import jax, jax.numpy as jnp
|
|
from utils import State
|
|
from .. import BaseAlgorithm
|
|
from .genome import *
|
|
from .species import *
|
|
from .ga import *
|
|
|
|
class NEAT(BaseAlgorithm):
|
|
|
|
def __init__(
|
|
self,
|
|
genome: BaseGenome,
|
|
species: BaseSpecies,
|
|
mutation: BaseMutation = DefaultMutation(),
|
|
crossover: BaseCrossover = DefaultCrossover(),
|
|
):
|
|
self.genome = genome
|
|
self.species = species
|
|
self.mutation = mutation
|
|
self.crossover = crossover
|
|
|
|
def setup(self, randkey):
|
|
k1, k2 = jax.random.split(randkey, 2)
|
|
return State(
|
|
randkey=k1,
|
|
generation=0,
|
|
next_node_key=max(*self.genome.input_idx, *self.genome.output_idx) + 2,
|
|
# inputs nodes, output nodes, 1 hidden node
|
|
species=self.species.setup(k2),
|
|
)
|
|
|
|
def ask(self, state: State):
|
|
return self.species.ask(state)
|
|
|
|
def tell(self, state: State, fitness):
|
|
k1, k2, randkey = jax.random.split(state.randkey, 3)
|
|
|
|
state = state.update(
|
|
generation=state.generation + 1,
|
|
randkey=randkey
|
|
)
|
|
|
|
state, winner, loser, elite_mask = self.species.update_species(state, fitness, state.generation)
|
|
|
|
state = self.create_next_generation(k2, state, winner, loser, elite_mask)
|
|
|
|
state = self.species.speciate(state, state.generation)
|
|
|
|
return state
|
|
|
|
def transform(self, state: State):
|
|
"""transform the genome into a neural network"""
|
|
raise NotImplementedError
|
|
|
|
def forward(self, inputs, transformed):
|
|
raise NotImplementedError
|
|
|
|
def create_next_generation(self, randkey, state, winner, loser, elite_mask):
|
|
# prepare random keys
|
|
pop_size = self.species.pop_size
|
|
new_node_keys = jnp.arange(pop_size) + state.species.next_node_key
|
|
|
|
k1, k2 = jax.random.split(randkey, 2)
|
|
crossover_rand_keys = jax.random.split(k1, pop_size)
|
|
mutate_rand_keys = jax.random.split(k2, pop_size)
|
|
|
|
wpn, wpc = state.species.pop_nodes[winner], state.species.pop_conns[winner]
|
|
lpn, lpc = state.species.pop_nodes[loser], state.species.pop_conns[loser]
|
|
|
|
# batch crossover
|
|
n_nodes, n_conns = (jax.vmap(self.crossover, in_axes=(0, None, 0, 0, 0, 0))
|
|
(crossover_rand_keys, self.genome, wpn, wpc, lpn, lpc))
|
|
|
|
# batch mutation
|
|
m_n_nodes, m_n_conns = (jax.vmap(self.mutation, in_axes=(0, None, 0, 0, 0))
|
|
(mutate_rand_keys, self.genome, n_nodes, n_conns, new_node_keys))
|
|
|
|
# elitism don't mutate
|
|
pop_nodes = jnp.where(elite_mask[:, None, None], n_nodes, m_n_nodes)
|
|
pop_conns = jnp.where(elite_mask[:, None, None], n_conns, m_n_conns)
|
|
|
|
# update next node key
|
|
all_nodes_keys = pop_nodes[:, :, 0]
|
|
max_node_key = jnp.max(jnp.where(jnp.isnan(all_nodes_keys), -jnp.inf, all_nodes_keys))
|
|
next_node_key = max_node_key + 1
|
|
|
|
return state.update(
|
|
species=state.species.update(
|
|
pop_nodes=pop_nodes,
|
|
pop_conns=pop_conns,
|
|
),
|
|
next_node_key=next_node_key,
|
|
)
|
|
|