new architecture

2024-01-27 00:52:39 +08:00
parent 4efe9a53c1
commit aac41a089d
65 changed files with 1651 additions and 1783 deletions
--- a/algorithm/init.py
+++ b/algorithm/init.py
@@ -1,2 +1,2 @@
 from .base import BaseAlgorithm
 from .neat import NEAT
 from .hyperneat import HyperNEAT
--- a/algorithm/base.py
+++ b/algorithm/base.py
@@ -0,0 +1,24 @@
 from utils import State
 class BaseAlgorithm:
    def setup(self, randkey):
        """initialize the state of the algorithm"""
        raise NotImplementedError
    def ask(self, state: State):
        """require the population to be evaluated"""
        raise NotImplementedError
    def tell(self, state: State, fitness):
        """update the state of the algorithm"""
        raise NotImplementedError
    def transform(self, state: State):
        """transform the genome into a neural network"""
        raise NotImplementedError
    def forward(self, inputs, transformed):
        raise NotImplementedError
--- a/algorithm/hyperneat/init.py
+++ b/algorithm/hyperneat/init.py
@@ -1,2 +0,0 @@
 from .hyperneat import HyperNEAT
 from .substrate import NormalSubstrate, NormalSubstrateConfig
--- a/algorithm/hyperneat/hyperneat.py
+++ b/algorithm/hyperneat/hyperneat.py
@@ -1,113 +0,0 @@
 from typing import Type
 import jax
 from jax import numpy as jnp, Array, vmap
 import numpy as np
 from config import Config, HyperNeatConfig
 from core import Algorithm, Substrate, State, Genome, Gene
 from .substrate import analysis_substrate
 from algorithm import NEAT
 class HyperNEAT(Algorithm):
    def __init__(self, config: Config, gene: Type[Gene], substrate: Type[Substrate]):
        self.config = config
        self.neat = NEAT(config, gene)
        self.substrate = substrate
    def setup(self, randkey, state=State()):
        neat_key, randkey = jax.random.split(randkey)
        state = state.update(
            below_threshold=self.config.hyperneat.below_threshold,
            max_weight=self.config.hyperneat.max_weight,
        )
        state = self.neat.setup(neat_key, state)
        state = self.substrate.setup(self.config.substrate, state)
        assert self.config.hyperneat.inputs + 1 == state.input_coors.shape[0]  # +1 for bias
        assert self.config.hyperneat.outputs == state.output_coors.shape[0]
        h_input_idx, h_output_idx, h_hidden_idx, query_coors, correspond_keys = analysis_substrate(state)
        h_nodes = np.concatenate((h_input_idx, h_output_idx, h_hidden_idx))[..., np.newaxis]
        h_conns = np.zeros((correspond_keys.shape[0], 3), dtype=np.float32)
        h_conns[:, 0:2] = correspond_keys
        state = state.update(
            h_input_idx=h_input_idx,
            h_output_idx=h_output_idx,
            h_hidden_idx=h_hidden_idx,
            h_nodes=h_nodes,
            h_conns=h_conns,
            query_coors=query_coors,
        )
        return state
    def ask_algorithm(self, state: State):
        return state.pop_genomes
    def tell_algorithm(self, state: State, fitness):
        return self.neat.tell(state, fitness)
    def forward(self, state, inputs: Array, transformed: Array):
        return HyperNEATGene.forward(self.config.hyperneat, state, inputs, transformed)
    def forward_transform(self, state: State, genome: Genome):
        t = self.neat.forward_transform(state, genome)
        query_res = vmap(self.neat.forward, in_axes=(None, 0, None))(state, state.query_coors, t)
        # mute the connection with weight below threshold
        query_res = jnp.where((-state.below_threshold < query_res) & (query_res < state.below_threshold), 0., query_res)
        # make query res in range [-max_weight, max_weight]
        query_res = jnp.where(query_res > 0, query_res - state.below_threshold, query_res)
        query_res = jnp.where(query_res < 0, query_res + state.below_threshold, query_res)
        query_res = query_res / (1 - state.below_threshold) * state.max_weight
        h_conns = state.h_conns.at[:, 2:].set(query_res)
        return HyperNEATGene.forward_transform(Genome(state.h_nodes, h_conns))
 class HyperNEATGene:
    node_attrs = []  # no node attributes
    conn_attrs = ['weight']
    @staticmethod
    def forward_transform(genome: Genome):
        N = genome.nodes.shape[0]
        u_conns = jnp.zeros((N, N), dtype=jnp.float32)
        in_keys = jnp.asarray(genome.conns[:, 0], jnp.int32)
        out_keys = jnp.asarray(genome.conns[:, 1], jnp.int32)
        weights = genome.conns[:, 2]
        u_conns = u_conns.at[in_keys, out_keys].set(weights)
        return genome.nodes, u_conns
    @staticmethod
    def forward(config: HyperNeatConfig, state: State, inputs, transformed):
        batch_act, batch_agg = jax.vmap(config.activation), jax.vmap(config.aggregation)
        nodes, weights = transformed
        inputs_with_bias = jnp.concatenate((inputs, jnp.ones((1,))), axis=0)
        input_idx = state.h_input_idx
        output_idx = state.h_output_idx
        N = nodes.shape[0]
        vals = jnp.full((N,), 0.)
        def body_func(i, values):
            values = values.at[input_idx].set(inputs_with_bias)
            nodes_ins = values * weights.T
            values = batch_agg(nodes_ins)  # z = agg(ins)
            # values = values * nodes[:, 2] + nodes[:, 1]  # z = z * response + bias
            values = batch_act(values)  # z = act(z)
            return values
        vals = jax.lax.fori_loop(0, config.activate_times, body_func, vals)
        return vals[output_idx]
--- a/algorithm/hyperneat/substrate/init.py
+++ b/algorithm/hyperneat/substrate/init.py
@@ -1,2 +0,0 @@
 from .normal import NormalSubstrate, NormalSubstrateConfig
 from .tools import analysis_substrate
--- a/algorithm/hyperneat/substrate/normal.py
+++ b/algorithm/hyperneat/substrate/normal.py
@@ -1,25 +0,0 @@
 from dataclasses import dataclass
 from typing import Tuple
 import numpy as np
 from core import Substrate, State
 from config import SubstrateConfig
@dataclass(frozen=True)
 class NormalSubstrateConfig(SubstrateConfig):
    input_coors: Tuple = ((-1, -1), (0, -1), (1, -1))
    hidden_coors: Tuple = ((-1, 0), (0, 0), (1, 0))
    output_coors: Tuple = ((0, 1),)
 class NormalSubstrate(Substrate):
    @staticmethod
    def setup(config: NormalSubstrateConfig, state: State = State()):
        return state.update(
            input_coors=np.asarray(config.input_coors, dtype=np.float32),
            output_coors=np.asarray(config.output_coors, dtype=np.float32),
            hidden_coors=np.asarray(config.hidden_coors, dtype=np.float32),
        )
--- a/algorithm/hyperneat/substrate/tools.py
+++ b/algorithm/hyperneat/substrate/tools.py
@@ -1,49 +0,0 @@
 import numpy as np
 def analysis_substrate(state):
    cd = state.input_coors.shape[1]  # coordinate dimensions
    si = state.input_coors.shape[0]  # input coordinate size
    so = state.output_coors.shape[0]  # output coordinate size
    sh = state.hidden_coors.shape[0]  # hidden coordinate size
    input_idx = np.arange(si)
    output_idx = np.arange(si, si + so)
    hidden_idx = np.arange(si + so, si + so + sh)
    total_conns = si * sh + sh * sh + sh * so
    query_coors = np.zeros((total_conns, cd * 2))
    correspond_keys = np.zeros((total_conns, 2))
    # connect input to hidden
    aux_coors, aux_keys = cartesian_product(input_idx, hidden_idx, state.input_coors, state.hidden_coors)
    query_coors[0: si * sh, :] = aux_coors
    correspond_keys[0: si * sh, :] = aux_keys
    # connect hidden to hidden
    aux_coors, aux_keys = cartesian_product(hidden_idx, hidden_idx, state.hidden_coors, state.hidden_coors)
    query_coors[si * sh: si * sh + sh * sh, :] = aux_coors
    correspond_keys[si * sh: si * sh + sh * sh, :] = aux_keys
    # connect hidden to output
    aux_coors, aux_keys = cartesian_product(hidden_idx, output_idx, state.hidden_coors, state.output_coors)
    query_coors[si * sh + sh * sh:, :] = aux_coors
    correspond_keys[si * sh + sh * sh:, :] = aux_keys
    return input_idx, output_idx, hidden_idx, query_coors, correspond_keys
 def cartesian_product(keys1, keys2, coors1, coors2):
    len1 = keys1.shape[0]
    len2 = keys2.shape[0]
    repeated_coors1 = np.repeat(coors1, len2, axis=0)
    repeated_keys1 = np.repeat(keys1, len2)
    tiled_coors2 = np.tile(coors2, (len1, 1))
    tiled_keys2 = np.tile(keys2, len1)
    new_coors = np.concatenate((repeated_coors1, tiled_coors2), axis=1)
    correspond_keys = np.column_stack((repeated_keys1, tiled_keys2))
    return new_coors, correspond_keys
--- a/algorithm/neat/init.py
+++ b/algorithm/neat/init.py
@@ -1,2 +1,3 @@
 from .neat import NEAT
 from .gene import *
 from .genome import *
 from .neat import NEAT
--- a/algorithm/neat/ga/init.py
+++ b/algorithm/neat/ga/init.py
@@ -1,3 +1,2 @@
-from .crossover import crossover
+from .crossover import BaseCrossover, DefaultCrossover
-from .mutate import mutate
+from .mutation import BaseMutation, DefaultMutation
 from .operation import create_next_generation
--- a/algorithm/neat/ga/crossover.py
+++ b/algorithm/neat/ga/crossover.py
@@ -1,70 +0,0 @@
 import jax
 from jax import Array, numpy as jnp
 from core import Genome
 def crossover(randkey, genome1: Genome, genome2: Genome):
    """
    use genome1 and genome2 to generate a new genome
    notice that genome1 should have higher fitness than genome2 (genome1 is winner!)
    """
    randkey_1, randkey_2, key = jax.random.split(randkey, 3)
    # crossover nodes
    keys1, keys2 = genome1.nodes[:, 0], genome2.nodes[:, 0]
    # make homologous genes align in nodes2 align with nodes1
    nodes2 = align_array(keys1, keys2, genome2.nodes, False)
    nodes1 = genome1.nodes
    # For not homologous genes, use the value of nodes1(winner)
    # For homologous genes, use the crossover result between nodes1 and nodes2
    new_nodes = jnp.where(jnp.isnan(nodes1) | jnp.isnan(nodes2), nodes1, crossover_gene(randkey_1, nodes1, nodes2))
    # crossover connections
    con_keys1, con_keys2 = genome1.conns[:, :2], genome2.conns[:, :2]
    conns2 = align_array(con_keys1, con_keys2, genome2.conns, True)
    conns1 = genome1.conns
    new_cons = jnp.where(jnp.isnan(conns1) | jnp.isnan(conns2), conns1, crossover_gene(randkey_2, conns1, conns2))
    return genome1.update(new_nodes, new_cons)
 def align_array(seq1: Array, seq2: Array, ar2: Array, is_conn: bool) -> Array:
    """
    After I review this code, I found that it is the most difficult part of the code. Please never change it!
    make ar2 align with ar1.
    :param seq1:
    :param seq2:
    :param ar2:
    :param is_conn:
    :return:
    align means to intersect part of ar2 will be at the same position as ar1,
    non-intersect part of ar2 will be set to Nan
    """
    seq1, seq2 = seq1[:, jnp.newaxis], seq2[jnp.newaxis, :]
    mask = (seq1 == seq2) & (~jnp.isnan(seq1))
    if is_conn:
        mask = jnp.all(mask, axis=2)
    intersect_mask = mask.any(axis=1)
    idx = jnp.arange(0, len(seq1))
    idx_fixed = jnp.dot(mask, idx)
    refactor_ar2 = jnp.where(intersect_mask[:, jnp.newaxis], ar2[idx_fixed], jnp.nan)
    return refactor_ar2
 def crossover_gene(rand_key: Array, g1: Array, g2: Array) -> Array:
    """
    crossover two genes
    :param rand_key:
    :param g1:
    :param g2:
    :return:
    only gene with the same key will be crossover, thus don't need to consider change key
    """
    r = jax.random.uniform(rand_key, shape=g1.shape)
    return jnp.where(r > 0.5, g1, g2)
--- a/algorithm/neat/ga/crossover/init.py
+++ b/algorithm/neat/ga/crossover/init.py
@@ -0,0 +1,2 @@
 from .base import BaseCrossover
 from .default import DefaultCrossover
--- a/algorithm/neat/ga/crossover/base.py
+++ b/algorithm/neat/ga/crossover/base.py
@@ -0,0 +1,3 @@
 class BaseCrossover:
    def __call__(self, randkey, genome, nodes1, nodes2, conns1, conns2):
        raise NotImplementedError
--- a/algorithm/neat/ga/crossover/default.py
+++ b/algorithm/neat/ga/crossover/default.py
@@ -0,0 +1,66 @@
 import jax, jax.numpy as jnp
 from .base import BaseCrossover
 class DefaultCrossover(BaseCrossover):
    def __call__(self, randkey, genome, nodes1, nodes2, conns1, conns2):
        """
        use genome1 and genome2 to generate a new genome
        notice that genome1 should have higher fitness than genome2 (genome1 is winner!)
        """
        randkey_1, randkey_2, key = jax.random.split(randkey, 3)
        # crossover nodes
        keys1, keys2 = nodes1[:, 0], nodes2[:, 0]
        # make homologous genes align in nodes2 align with nodes1
        nodes2 = self.align_array(keys1, keys2, nodes2, False)
        # For not homologous genes, use the value of nodes1(winner)
        # For homologous genes, use the crossover result between nodes1 and nodes2
        new_nodes = jnp.where(jnp.isnan(nodes1) | jnp.isnan(nodes2), nodes1, self.crossover_gene(randkey_1, nodes1, nodes2))
        # crossover connections
        con_keys1, con_keys2 = conns1[:, :2], conns2[:, :2]
        conns2 = self.align_array(con_keys1, con_keys2, conns2, True)
        new_conns = jnp.where(jnp.isnan(conns1) | jnp.isnan(conns2), conns1, self.crossover_gene(randkey_2, conns1, conns2))
        return new_nodes, new_conns
    def align_array(self, seq1, seq2, ar2, is_conn: bool):
        """
        After I review this code, I found that it is the most difficult part of the code. Please never change it!
        make ar2 align with ar1.
        :param seq1:
        :param seq2:
        :param ar2:
        :param is_conn:
        :return:
        align means to intersect part of ar2 will be at the same position as ar1,
        non-intersect part of ar2 will be set to Nan
        """
        seq1, seq2 = seq1[:, jnp.newaxis], seq2[jnp.newaxis, :]
        mask = (seq1 == seq2) & (~jnp.isnan(seq1))
        if is_conn:
            mask = jnp.all(mask, axis=2)
        intersect_mask = mask.any(axis=1)
        idx = jnp.arange(0, len(seq1))
        idx_fixed = jnp.dot(mask, idx)
        refactor_ar2 = jnp.where(intersect_mask[:, jnp.newaxis], ar2[idx_fixed], jnp.nan)
        return refactor_ar2
    def crossover_gene(self, rand_key, g1, g2):
        """
        crossover two genes
        :param rand_key:
        :param g1:
        :param g2:
        :return:
        only gene with the same key will be crossover, thus don't need to consider change key
        """
        r = jax.random.uniform(rand_key, shape=g1.shape)
        return jnp.where(r > 0.5, g1, g2)
--- a/algorithm/neat/ga/mutate.py
+++ b/algorithm/neat/ga/mutate.py
@@ -1,186 +0,0 @@
 from typing import Tuple
 import jax
 from jax import Array, numpy as jnp, vmap
 from config import NeatConfig
 from core import State, Gene, Genome
 from utils import check_cycles, fetch_random, fetch_first, I_INT, unflatten_conns
 def mutate(config: NeatConfig, gene: Gene, state: State, randkey, genome: Genome, new_node_key):
    """
    Mutate a population of genomes
    """
    k1, k2 = jax.random.split(randkey)
    genome = mutate_structure(config, gene, state, k1, genome, new_node_key)
    genome = mutate_values(gene, state, randkey, genome)
    return genome
 def mutate_structure(config: NeatConfig, gene: Gene, state: State, randkey, genome: Genome, new_node_key):
    def mutate_add_node(key_, genome_: Genome):
        i_key, o_key, idx = choice_connection_key(key_, genome_.conns)
        def nothing():
            return genome_
        def successful_add_node():
            # disable the connection
            new_genome = genome_.update_conns(genome_.conns.at[idx, 2].set(False))
            # add a new node
            new_genome = new_genome.add_node(new_node_key, gene.new_node_attrs(state))
            # add two new connections
            new_genome = new_genome.add_conn(i_key, new_node_key, True, gene.new_conn_attrs(state))
            new_genome = new_genome.add_conn(new_node_key, o_key, True, gene.new_conn_attrs(state))
            return new_genome
        # if from_idx == I_INT, that means no connection exist, do nothing
        return jax.lax.cond(idx == I_INT, nothing, successful_add_node)
    def mutate_delete_node(key_, genome_: Genome):
        # TODO: Do we really need to delete a node?
        # randomly choose a node
        key, idx = choice_node_key(key_, genome_.nodes, state.input_idx, state.output_idx,
                                   allow_input_keys=False, allow_output_keys=False)
        def nothing():
            return genome_
        def successful_delete_node():
            # delete the node
            new_genome = genome_.delete_node_by_pos(idx)
            # delete all connections
            new_conns = jnp.where(((new_genome.conns[:, 0] == key) | (new_genome.conns[:, 1] == key))[:, None],
                                  jnp.nan, new_genome.conns)
            return new_genome.update_conns(new_conns)
        return jax.lax.cond(idx == I_INT, nothing, successful_delete_node)
    def mutate_add_conn(key_, genome_: Genome):
        # randomly choose two nodes
        k1_, k2_ = jax.random.split(key_, num=2)
        i_key, from_idx = choice_node_key(k1_, genome_.nodes, state.input_idx, state.output_idx,
                                          allow_input_keys=True, allow_output_keys=True)
        o_key, to_idx = choice_node_key(k2_, genome_.nodes, state.input_idx, state.output_idx,
                                        allow_input_keys=False, allow_output_keys=True)
        conn_pos = fetch_first((genome_.conns[:, 0] == i_key) & (genome_.conns[:, 1] == o_key))
        def nothing():
            return genome_
        def successful():
            return genome_.add_conn(i_key, o_key, True, gene.new_conn_attrs(state))
        def already_exist():
            return genome_.update_conns(genome_.conns.at[conn_pos, 2].set(True))
        is_already_exist = conn_pos != I_INT
        if config.network_type == 'feedforward':
            u_cons = unflatten_conns(genome_.nodes, genome_.conns)
            cons_exist = jnp.where(~jnp.isnan(u_cons[0, :, :]), True, False)
            is_cycle = check_cycles(genome_.nodes, cons_exist, from_idx, to_idx)
            choice = jnp.where(is_already_exist, 0, jnp.where(is_cycle, 1, 2))
            return jax.lax.switch(choice, [already_exist, nothing, successful])
        elif config.network_type == 'recurrent':
            return jax.lax.cond(is_already_exist, already_exist, successful)
        else:
            raise ValueError(f"Invalid network type: {config.network_type}")
    def mutate_delete_conn(key_, genome_: Genome):
        # randomly choose a connection
        i_key, o_key, idx = choice_connection_key(key_, genome_.conns)
        def nothing():
            return genome_
        def successfully_delete_connection():
            return genome_.delete_conn_by_pos(idx)
        return jax.lax.cond(idx == I_INT, nothing, successfully_delete_connection)
    k1, k2, k3, k4 = jax.random.split(randkey, num=4)
    r1, r2, r3, r4 = jax.random.uniform(k1, shape=(4,))
    def no(k, g):
        return g
    genome = jax.lax.cond(r1 < config.node_add, mutate_add_node, no, k1, genome)
    genome = jax.lax.cond(r2 < config.node_delete, mutate_delete_node, no, k2, genome)
    genome = jax.lax.cond(r3 < config.conn_add, mutate_add_conn, no, k3, genome)
    genome = jax.lax.cond(r4 < config.conn_delete, mutate_delete_conn, no, k4, genome)
    return genome
 def mutate_values(gene: Gene, state: State, randkey, genome: Genome):
    k1, k2 = jax.random.split(randkey, num=2)
    nodes_keys = jax.random.split(k1, num=genome.nodes.shape[0])
    conns_keys = jax.random.split(k2, num=genome.conns.shape[0])
    nodes_attrs, conns_attrs = genome.nodes[:, 1:], genome.conns[:, 3:]
    new_nodes_attrs = vmap(gene.mutate_node, in_axes=(None, 0, 0))(state, nodes_keys, nodes_attrs)
    new_conns_attrs = vmap(gene.mutate_conn, in_axes=(None, 0, 0))(state, conns_keys, conns_attrs)
    # nan nodes not changed
    new_nodes_attrs = jnp.where(jnp.isnan(nodes_attrs), jnp.nan, new_nodes_attrs)
    new_conns_attrs = jnp.where(jnp.isnan(conns_attrs), jnp.nan, new_conns_attrs)
    new_nodes = genome.nodes.at[:, 1:].set(new_nodes_attrs)
    new_conns = genome.conns.at[:, 3:].set(new_conns_attrs)
    return genome.update(new_nodes, new_conns)
 def choice_node_key(rand_key: Array, nodes: Array,
                    input_keys: Array, output_keys: Array,
                    allow_input_keys: bool = False, allow_output_keys: bool = False) -> Tuple[Array, Array]:
    """
    Randomly choose a node key from the given nodes. It guarantees that the chosen node not be the input or output node.
    :param rand_key:
    :param nodes:
    :param input_keys:
    :param output_keys:
    :param allow_input_keys:
    :param allow_output_keys:
    :return: return its key and position(idx)
    """
    node_keys = nodes[:, 0]
    mask = ~jnp.isnan(node_keys)
    if not allow_input_keys:
        mask = jnp.logical_and(mask, ~jnp.isin(node_keys, input_keys))
    if not allow_output_keys:
        mask = jnp.logical_and(mask, ~jnp.isin(node_keys, output_keys))
    idx = fetch_random(rand_key, mask)
    key = jnp.where(idx != I_INT, nodes[idx, 0], jnp.nan)
    return key, idx
 def choice_connection_key(rand_key: Array, conns: Array):
    """
    Randomly choose a connection key from the given connections.
    :return: i_key, o_key, idx
    """
    idx = fetch_random(rand_key, ~jnp.isnan(conns[:, 0]))
    i_key = jnp.where(idx != I_INT, conns[idx, 0], jnp.nan)
    o_key = jnp.where(idx != I_INT, conns[idx, 1], jnp.nan)
    return i_key, o_key, idx
--- a/algorithm/neat/ga/mutation/init.py
+++ b/algorithm/neat/ga/mutation/init.py
@@ -0,0 +1,2 @@
 from .base import BaseMutation
 from .default import DefaultMutation
--- a/algorithm/neat/ga/mutation/base.py
+++ b/algorithm/neat/ga/mutation/base.py
@@ -0,0 +1,3 @@
 class BaseMutation:
    def __call__(self, key, genome, nodes, conns, new_node_key):
        raise NotImplementedError
--- a/algorithm/neat/ga/mutation/default.py
+++ b/algorithm/neat/ga/mutation/default.py
@@ -0,0 +1,201 @@
 import jax, jax.numpy as jnp
 from . import BaseMutation
 from utils import fetch_first, fetch_random, I_INT, unflatten_conns, check_cycles
 class DefaultMutation(BaseMutation):
    def __init__(
            self,
            conn_add: float = 0.4,
            conn_delete: float = 0,
            node_add: float = 0.2,
            node_delete: float = 0,
    ):
        self.conn_add = conn_add
        self.conn_delete = conn_delete
        self.node_add = node_add
        self.node_delete = node_delete
    def __call__(self, randkey, genome, nodes, conns, new_node_key):
        k1, k2 = jax.random.split(randkey)
        nodes, conns = self.mutate_structure(k1, genome, nodes, conns, new_node_key)
        nodes, conns = self.mutate_values(k2, genome, nodes, conns)
        return nodes, conns
    def mutate_structure(self, randkey, genome, nodes, conns, new_node_key):
        def mutate_add_node(key_, nodes_, conns_):
            i_key, o_key, idx = self.choice_connection_key(key_, conns_)
            def successful_add_node():
                # disable the connection
                new_conns = conns_.at[idx, 2].set(False)
                # add a new node
                new_nodes = genome.add_node(nodes_, new_node_key, genome.node_gene.new_custom_attrs())
                # add two new connections
                new_conns = genome.add_conn(new_conns, i_key, new_node_key, True, genome.conn_gene.new_custom_attrs())
                new_conns = genome.add_conn(new_conns, new_node_key, o_key, True, genome.conn_gene.new_custom_attrs())
                return new_nodes, new_conns
            return jax.lax.cond(
                idx == I_INT,
                lambda: (nodes_, conns_),  # do nothing
                successful_add_node
            )
        def mutate_delete_node(key_, nodes_, conns_):
            # randomly choose a node
            key, idx = self.choice_node_key(key_, nodes_, genome.input_idx, genome.output_idx,
                                            allow_input_keys=False, allow_output_keys=False)
            def successful_delete_node():
                # delete the node
                new_nodes = genome.delete_node_by_pos(nodes_, idx)
                # delete all connections
                new_conns = jnp.where(
                    ((conns_[:, 0] == key) | (conns_[:, 1] == key))[:, None],
                    jnp.nan,
                    conns_
                )
                return new_nodes, new_conns
            return jax.lax.cond(
                idx == I_INT,
                lambda: (nodes_, conns_),  # do nothing
                successful_delete_node
            )
        def mutate_add_conn(key_, nodes_, conns_):
            # randomly choose two nodes
            k1_, k2_ = jax.random.split(key_, num=2)
            # input node of the connection can be any node
            i_key, from_idx = self.choice_node_key(k1_, nodes_, genome.input_idx, genome.output_idx,
                                                   allow_input_keys=True, allow_output_keys=True)
            # output node of the connection can be any node except input node
            o_key, to_idx = self.choice_node_key(k2_, nodes_, genome.input_idx, genome.output_idx,
                                                 allow_input_keys=False, allow_output_keys=True)
            conn_pos = fetch_first((conns_[:, 0] == i_key) & (conns_[:, 1] == o_key))
            is_already_exist = conn_pos != I_INT
            def nothing():
                return nodes_, conns_
            def successful():
                return nodes_, genome.add_conn(conns_, i_key, o_key, True, genome.conns.new_custom_attrs())
            def already_exist():
                return nodes_, conns_.at[conn_pos, 2].set(True)
            if genome.network_type == 'feedforward':
                u_cons = unflatten_conns(nodes_, conns_)
                cons_exist = ~jnp.isnan(u_cons[0, :, :])
                is_cycle = check_cycles(nodes_, cons_exist, from_idx, to_idx)
                return jax.lax.cond(
                    is_already_exist,
                    already_exist,
                    jax.lax.cond(
                        is_cycle,
                        nothing,
                        successful
                    )
                )
            elif genome.network_type == 'recurrent':
                return jax.lax.cond(
                    is_already_exist,
                    already_exist,
                    successful
                )
            else:
                raise ValueError(f"Invalid network type: {genome.network_type}")
        def mutate_delete_conn(key_, nodes_, conns_):
            # randomly choose a connection
            i_key, o_key, idx = self.choice_connection_key(key_, conns_)
            def successfully_delete_connection():
                return nodes_, genome.delete_conn_by_pos(conns_, idx)
            return jax.lax.cond(
                idx == I_INT,
                lambda: (nodes_, conns_),  # nothing
                successfully_delete_connection
            )
        k1, k2, k3, k4 = jax.random.split(randkey, num=4)
        r1, r2, r3, r4 = jax.random.uniform(k1, shape=(4,))
        def no(k, g):
            return g
        genome = jax.lax.cond(r1 < self.node_add, mutate_add_node, no, k1, nodes, conns)
        genome = jax.lax.cond(r2 < self.node_delete, mutate_delete_node, no, k2, nodes, conns)
        genome = jax.lax.cond(r3 < self.conn_add, mutate_add_conn, no, k3, nodes, conns)
        genome = jax.lax.cond(r4 < self.conn_delete, mutate_delete_conn, no, k4, nodes, conns)
        return genome
    def mutate_values(self, randkey, genome, nodes, conns):
        k1, k2 = jax.random.split(randkey, num=2)
        nodes_keys = jax.random.split(k1, num=genome.nodes.shape[0])
        conns_keys = jax.random.split(k2, num=genome.conns.shape[0])
        new_nodes = jax.vmap(genome.nodes.mutate, in_axes=(0, 0))(nodes_keys, nodes)
        new_conns = jax.vmap(genome.conns.mutate, in_axes=(0, 0))(conns_keys, conns)
        # nan nodes not changed
        new_nodes = jnp.where(jnp.isnan(nodes), jnp.nan, new_nodes)
        new_conns = jnp.where(jnp.isnan(conns), jnp.nan, new_conns)
        return new_nodes, new_conns
    def choice_node_key(self, rand_key, nodes, input_idx, output_idx,
                        allow_input_keys: bool = False, allow_output_keys: bool = False):
        """
        Randomly choose a node key from the given nodes. It guarantees that the chosen node not be the input or output node.
        :param rand_key:
        :param nodes:
        :param input_idx:
        :param output_idx:
        :param allow_input_keys:
        :param allow_output_keys:
        :return: return its key and position(idx)
        """
        node_keys = nodes[:, 0]
        mask = ~jnp.isnan(node_keys)
        if not allow_input_keys:
            mask = jnp.logical_and(mask, ~jnp.isin(node_keys, input_idx))
        if not allow_output_keys:
            mask = jnp.logical_and(mask, ~jnp.isin(node_keys, output_idx))
        idx = fetch_random(rand_key, mask)
        key = jnp.where(idx != I_INT, nodes[idx, 0], jnp.nan)
        return key, idx
    def choice_connection_key(self, rand_key, conns):
        """
        Randomly choose a connection key from the given connections.
        :return: i_key, o_key, idx
        """
        idx = fetch_random(rand_key, ~jnp.isnan(conns[:, 0]))
        i_key = jnp.where(idx != I_INT, conns[idx, 0], jnp.nan)
        o_key = jnp.where(idx != I_INT, conns[idx, 1], jnp.nan)
        return i_key, o_key, idx
--- a/algorithm/neat/ga/operation.py
+++ b/algorithm/neat/ga/operation.py
@@ -1,40 +0,0 @@
 import jax
 from jax import numpy as jnp, vmap
 from config import NeatConfig
 from core import Genome, State, Gene
 from .mutate import mutate
 from .crossover import crossover
 def create_next_generation(config: NeatConfig, gene: Gene, state: State, randkey, winner, loser, elite_mask):
    # prepare random keys
    pop_size = state.idx2species.shape[0]
    new_node_keys = jnp.arange(pop_size) + state.next_node_key
    k1, k2 = jax.random.split(randkey, 2)
    crossover_rand_keys = jax.random.split(k1, pop_size)
    mutate_rand_keys = jax.random.split(k2, pop_size)
    # batch crossover
    wpn, wpc = state.pop_genomes.nodes[winner], state.pop_genomes.conns[winner]
    lpn, lpc = state.pop_genomes.nodes[loser], state.pop_genomes.conns[loser]
    n_genomes = vmap(crossover)(crossover_rand_keys, Genome(wpn, wpc), Genome(lpn, lpc))
    # batch mutation
    mutate_func = vmap(mutate, in_axes=(None, None, None, 0, 0, 0))
    m_n_genomes = mutate_func(config, gene, state, mutate_rand_keys, n_genomes, new_node_keys)  # mutate_new_pop_nodes
    # elitism don't mutate
    pop_nodes = jnp.where(elite_mask[:, None, None], n_genomes.nodes, m_n_genomes.nodes)
    pop_conns = jnp.where(elite_mask[:, None, None], n_genomes.conns, m_n_genomes.conns)
    # update next node key
    all_nodes_keys = pop_nodes[:, :, 0]
    max_node_key = jnp.max(jnp.where(jnp.isnan(all_nodes_keys), -jnp.inf, all_nodes_keys))
    next_node_key = max_node_key + 1
    return state.update(
        pop_genomes=Genome(pop_nodes, pop_conns),
        next_node_key=next_node_key,
    )
--- a/algorithm/neat/gene/init.py
+++ b/algorithm/neat/gene/init.py
@@ -1,3 +1,3 @@
-from .normal import NormalGene, NormalGeneConfig
+from .base import BaseGene
-from .recurrent import RecurrentGene, RecurrentGeneConfig
+from .conn import *
-
+from .node import *
--- a/algorithm/neat/gene/base.py
+++ b/algorithm/neat/gene/base.py
@@ -0,0 +1,23 @@
 class BaseGene:
    "Base class for node genes or connection genes."
    fixed_attrs = []
    custom_attrs = []
    def __init__(self):
        pass
    def new_custom_attrs(self):
        raise NotImplementedError
    def mutate(self, randkey, gene):
        raise NotImplementedError
    def distance(self, gene1, gene2):
        raise NotImplementedError
    def forward(self, attrs, inputs):
        raise NotImplementedError
    @property
    def length(self):
        return len(self.fixed_attrs) + len(self.custom_attrs)
--- a/algorithm/neat/gene/conn/init.py
+++ b/algorithm/neat/gene/conn/init.py
@@ -0,0 +1,2 @@
 from .base import BaseConnGene
 from .default import DefaultConnGene
--- a/algorithm/neat/gene/conn/base.py
+++ b/algorithm/neat/gene/conn/base.py
@@ -0,0 +1,12 @@
 from .. import BaseGene
 class BaseConnGene(BaseGene):
    "Base class for connection genes."
    fixed_attrs = ['input_index', 'output_index', 'enabled']
    def __init__(self):
        super().__init__()
    def forward(self, attrs, inputs):
        raise NotImplementedError
--- a/algorithm/neat/gene/conn/default.py
+++ b/algorithm/neat/gene/conn/default.py
@@ -0,0 +1,51 @@
 import jax.numpy as jnp
 from utils import mutate_float
 from . import BaseConnGene
 class DefaultConnGene(BaseConnGene):
    "Default connection gene, with the same behavior as in NEAT-python."
    fixed_attrs = ['input_index', 'output_index', 'enabled']
    attrs = ['weight']
    def __init__(
            self,
            weight_init_mean: float = 0.0,
            weight_init_std: float = 1.0,
            weight_mutate_power: float = 0.5,
            weight_mutate_rate: float = 0.8,
            weight_replace_rate: float = 0.1,
    ):
        super().__init__()
        self.weight_init_mean = weight_init_mean
        self.weight_init_std = weight_init_std
        self.weight_mutate_power = weight_mutate_power
        self.weight_mutate_rate = weight_mutate_rate
        self.weight_replace_rate = weight_replace_rate
    def new_custom_attrs(self):
        return jnp.array([self.weight_init_mean])
    def mutate(self, key, conn):
        input_index = conn[0]
        output_index = conn[1]
        enabled = conn[2]
        weight = mutate_float(key,
                              conn[3],
                              self.weight_init_mean,
                              self.weight_init_std,
                              self.weight_mutate_power,
                              self.weight_mutate_rate,
                              self.weight_replace_rate
                              )
        return jnp.array([input_index, output_index, enabled, weight])
    def distance(self, attrs1, attrs2):
        return (attrs1[2] != attrs2[2]) + jnp.abs(attrs1[3] - attrs2[3])  # enable + weight
    def forward(self, attrs, inputs):
        weight = attrs[0]
        return inputs * weight
--- a/algorithm/neat/gene/node/init.py
+++ b/algorithm/neat/gene/node/init.py
@@ -0,0 +1,2 @@
 from .base import BaseNodeGene
 from .default import DefaultNodeGene
--- a/algorithm/neat/gene/node/base.py
+++ b/algorithm/neat/gene/node/base.py
@@ -0,0 +1,12 @@
 from .. import BaseGene
 class BaseNodeGene(BaseGene):
    "Base class for node genes."
    fixed_attrs = ["index"]
    def __init__(self):
        super().__init__()
    def forward(self, attrs, inputs):
        raise NotImplementedError
--- a/algorithm/neat/gene/node/default.py
+++ b/algorithm/neat/gene/node/default.py
@@ -0,0 +1,96 @@
 from typing import Tuple
 import jax, jax.numpy as jnp
 from utils import Act, Agg, act, agg, mutate_int, mutate_float
 from . import BaseNodeGene
 class DefaultNodeGene(BaseNodeGene):
    "Default node gene, with the same behavior as in NEAT-python."
    fixed_attrs = ['index']
    custom_attrs = ['bias', 'response', 'aggregation', 'activation']
    def __init__(
            self,
            bias_init_mean: float = 0.0,
            bias_init_std: float = 1.0,
            bias_mutate_power: float = 0.5,
            bias_mutate_rate: float = 0.7,
            bias_replace_rate: float = 0.1,
            response_init_mean: float = 1.0,
            response_init_std: float = 0.0,
            response_mutate_power: float = 0.5,
            response_mutate_rate: float = 0.7,
            response_replace_rate: float = 0.1,
            activation_default: callable = Act.sigmoid,
            activation_options: Tuple = (Act.sigmoid,),
            activation_replace_rate: float = 0.1,
            aggregation_default: callable = Agg.sum,
            aggregation_options: Tuple = (Agg.sum,),
            aggregation_replace_rate: float = 0.1,
    ):
        super().__init__()
        self.bias_init_mean = bias_init_mean
        self.bias_init_std = bias_init_std
        self.bias_mutate_power = bias_mutate_power
        self.bias_mutate_rate = bias_mutate_rate
        self.bias_replace_rate = bias_replace_rate
        self.response_init_mean = response_init_mean
        self.response_init_std = response_init_std
        self.response_mutate_power = response_mutate_power
        self.response_mutate_rate = response_mutate_rate
        self.response_replace_rate = response_replace_rate
        self.activation_default = activation_options.index(activation_default)
        self.activation_options = activation_options
        self.activation_indices = jnp.arange(len(activation_options))
        self.activation_replace_rate = activation_replace_rate
        self.aggregation_default = aggregation_options.index(aggregation_default)
        self.aggregation_options = aggregation_options
        self.aggregation_indices = jnp.arange(len(aggregation_options))
        self.aggregation_replace_rate = aggregation_replace_rate
    def new_custom_attrs(self):
        return jnp.array(
            [self.bias_init_mean, self.response_init_mean, self.activation_default, self.aggregation_default]
        )
    def mutate(self, key, node):
        k1, k2, k3, k4 = jax.random.split(key, num=4)
        index = node[0]
        bias = mutate_float(k1, node[1], self.bias_init_mean, self.bias_init_std,
                            self.bias_mutate_power, self.bias_mutate_rate, self.bias_replace_rate)
        res = mutate_float(k2, node[2], self.response_init_mean, self.response_init_std,
                           self.response_mutate_power, self.response_mutate_rate, self.response_replace_rate)
        act = mutate_int(k3, node[3], self.activation_indices, self.activation_replace_rate)
        agg = mutate_int(k4, node[4], self.aggregation_indices, self.aggregation_replace_rate)
        return jnp.array([index, bias, res, act, agg])
    def distance(self, node1, node2):
        return (
                jnp.abs(node1[1] - node2[1]) +
                jnp.abs(node1[2] - node2[2]) +
                node1[3] != node2[3] +
                node1[4] != node2[4]
        )
    def forward(self, attrs, inputs):
        bias, res, act_idx, agg_idx = attrs
        z = agg(agg_idx, inputs, self.aggregation_options)
        z = bias + res * z
        z = act(act_idx, z, self.activation_options)
        return z
--- a/algorithm/neat/gene/normal.py
+++ b/algorithm/neat/gene/normal.py
@@ -1,210 +0,0 @@
 from dataclasses import dataclass
 from typing import Tuple
 import jax
 from jax import Array, numpy as jnp
 from config import GeneConfig
 from core import Gene, Genome, State
 from utils import Act, Agg, unflatten_conns, topological_sort, I_INT, act, agg
@dataclass(frozen=True)
 class NormalGeneConfig(GeneConfig):
    bias_init_mean: float = 0.0
    bias_init_std: float = 1.0
    bias_mutate_power: float = 0.5
    bias_mutate_rate: float = 0.7
    bias_replace_rate: float = 0.1
    response_init_mean: float = 1.0
    response_init_std: float = 0.0
    response_mutate_power: float = 0.5
    response_mutate_rate: float = 0.7
    response_replace_rate: float = 0.1
    activation_default: callable = Act.sigmoid
    activation_options: Tuple = (Act.sigmoid, )
    activation_replace_rate: float = 0.1
    aggregation_default: callable = Agg.sum
    aggregation_options: Tuple = (Agg.sum, )
    aggregation_replace_rate: float = 0.1
    weight_init_mean: float = 0.0
    weight_init_std: float = 1.0
    weight_mutate_power: float = 0.5
    weight_mutate_rate: float = 0.8
    weight_replace_rate: float = 0.1
    def __post_init__(self):
        assert self.bias_init_std >= 0.0
        assert self.bias_mutate_power >= 0.0
        assert self.bias_mutate_rate >= 0.0
        assert self.bias_replace_rate >= 0.0
        assert self.response_init_std >= 0.0
        assert self.response_mutate_power >= 0.0
        assert self.response_mutate_rate >= 0.0
        assert self.response_replace_rate >= 0.0
        assert self.activation_default == self.activation_options[0]
        assert self.aggregation_default == self.aggregation_options[0]
 class NormalGene(Gene):
    node_attrs = ['bias', 'response', 'aggregation', 'activation']
    conn_attrs = ['weight']
    def __init__(self, config: NormalGeneConfig = NormalGeneConfig()):
        self.config = config
    def setup(self, state: State = State()):
        return state.update(
            bias_init_mean=self.config.bias_init_mean,
            bias_init_std=self.config.bias_init_std,
            bias_mutate_power=self.config.bias_mutate_power,
            bias_mutate_rate=self.config.bias_mutate_rate,
            bias_replace_rate=self.config.bias_replace_rate,
            response_init_mean=self.config.response_init_mean,
            response_init_std=self.config.response_init_std,
            response_mutate_power=self.config.response_mutate_power,
            response_mutate_rate=self.config.response_mutate_rate,
            response_replace_rate=self.config.response_replace_rate,
            activation_replace_rate=self.config.activation_replace_rate,
            activation_default=0,
            activation_options=jnp.arange(len(self.config.activation_options)),
            aggregation_replace_rate=self.config.aggregation_replace_rate,
            aggregation_default=0,
            aggregation_options=jnp.arange(len(self.config.aggregation_options)),
            weight_init_mean=self.config.weight_init_mean,
            weight_init_std=self.config.weight_init_std,
            weight_mutate_power=self.config.weight_mutate_power,
            weight_mutate_rate=self.config.weight_mutate_rate,
            weight_replace_rate=self.config.weight_replace_rate,
        )
    def update(self, state):
        return state
    def new_node_attrs(self, state):
        return jnp.array([state.bias_init_mean, state.response_init_mean,
                          state.activation_default, state.aggregation_default])
    def new_conn_attrs(self, state):
        return jnp.array([state.weight_init_mean])
    def mutate_node(self, state, key, attrs: Array):
        k1, k2, k3, k4 = jax.random.split(key, num=4)
        bias = NormalGene._mutate_float(k1, attrs[0], state.bias_init_mean, state.bias_init_std,
                                        state.bias_mutate_power, state.bias_mutate_rate, state.bias_replace_rate)
        res = NormalGene._mutate_float(k2, attrs[1], state.response_init_mean, state.response_init_std,
                                       state.response_mutate_power, state.response_mutate_rate,
                                       state.response_replace_rate)
        act = NormalGene._mutate_int(k3, attrs[2], state.activation_options, state.activation_replace_rate)
        agg = NormalGene._mutate_int(k4, attrs[3], state.aggregation_options, state.aggregation_replace_rate)
        return jnp.array([bias, res, act, agg])
    def mutate_conn(self, state, key, attrs: Array):
        weight = NormalGene._mutate_float(key, attrs[0], state.weight_init_mean, state.weight_init_std,
                                          state.weight_mutate_power, state.weight_mutate_rate,
                                          state.weight_replace_rate)
        return jnp.array([weight])
    def distance_node(self, state, node1: Array, node2: Array):
        # bias + response + activation + aggregation
        return jnp.abs(node1[1] - node2[1]) + jnp.abs(node1[2] - node2[2]) + \
            (node1[3] != node2[3]) + (node1[4] != node2[4])
    def distance_conn(self, state, con1: Array, con2: Array):
        return (con1[2] != con2[2]) + jnp.abs(con1[3] - con2[3])  # enable + weight
    def forward_transform(self, state: State, genome: Genome):
        u_conns = unflatten_conns(genome.nodes, genome.conns)
        conn_enable = jnp.where(~jnp.isnan(u_conns[0]), True, False)
        # remove enable attr
        u_conns = jnp.where(conn_enable, u_conns[1:, :], jnp.nan)
        seqs = topological_sort(genome.nodes, conn_enable)
        return seqs, genome.nodes, u_conns
    def forward(self, state: State, inputs, transformed):
        cal_seqs, nodes, cons = transformed
        input_idx = state.input_idx
        output_idx = state.output_idx
        N = nodes.shape[0]
        ini_vals = jnp.full((N,), jnp.nan)
        ini_vals = ini_vals.at[input_idx].set(inputs)
        weights = cons[0, :]
        def cond_fun(carry):
            values, idx = carry
            return (idx < N) & (cal_seqs[idx] != I_INT)
        def body_func(carry):
            values, idx = carry
            i = cal_seqs[idx]
            def hit():
                ins = values * weights[:, i]
                z = agg(nodes[i, 4], ins, self.config.aggregation_options)  # z = agg(ins)
                z = z * nodes[i, 2] + nodes[i, 1]  # z = z * response + bias
                z = act(nodes[i, 3], z, self.config.activation_options)  # z = act(z)
                new_values = values.at[i].set(z)
                return new_values
            def miss():
                return values
            # the val of input nodes is obtained by the task, not by calculation
            values = jax.lax.cond(jnp.isin(i, input_idx), miss, hit)
            return values, idx + 1
        vals, _ = jax.lax.while_loop(cond_fun, body_func, (ini_vals, 0))
        return vals[output_idx]
    @staticmethod
    def _mutate_float(key, val, init_mean, init_std, mutate_power, mutate_rate, replace_rate):
        k1, k2, k3 = jax.random.split(key, num=3)
        noise = jax.random.normal(k1, ()) * mutate_power
        replace = jax.random.normal(k2, ()) * init_std + init_mean
        r = jax.random.uniform(k3, ())
        val = jnp.where(
            r < mutate_rate,
            val + noise,
            jnp.where(
                (mutate_rate < r) & (r < mutate_rate + replace_rate),
                replace,
                val
            )
        )
        return val
    @staticmethod
    def _mutate_int(key, val, options, replace_rate):
        k1, k2 = jax.random.split(key, num=2)
        r = jax.random.uniform(k1, ())
        val = jnp.where(
            r < replace_rate,
            jax.random.choice(k2, options),
            val
        )
        return val
--- a/algorithm/neat/gene/recurrent.py
+++ b/algorithm/neat/gene/recurrent.py
@@ -1,57 +0,0 @@
 from dataclasses import dataclass
 import jax
 from jax import numpy as jnp, vmap
 from .normal import NormalGene, NormalGeneConfig
 from core import State, Genome
 from utils import unflatten_conns, act, agg
@dataclass(frozen=True)
 class RecurrentGeneConfig(NormalGeneConfig):
    activate_times: int = 10
    def __post_init__(self):
        super().__post_init__()
        assert self.activate_times > 0
 class RecurrentGene(NormalGene):
    def __init__(self, config: RecurrentGeneConfig = RecurrentGeneConfig()):
        self.config = config
        super().__init__(config)
    def forward_transform(self, state: State, genome: Genome):
        u_conns = unflatten_conns(genome.nodes, genome.conns)
        # remove un-enable connections and remove enable attr
        conn_enable = jnp.where(~jnp.isnan(u_conns[0]), True, False)
        u_conns = jnp.where(conn_enable, u_conns[1:, :], jnp.nan)
        return genome.nodes, u_conns
    def forward(self, state: State, inputs, transformed):
        nodes, conns = transformed
        batch_act, batch_agg = vmap(act, in_axes=(0, 0, None)), vmap(agg, in_axes=(0, 0, None))
        input_idx = state.input_idx
        output_idx = state.output_idx
        N = nodes.shape[0]
        vals = jnp.full((N,), 0.)
        weights = conns[0, :]
        def body_func(i, values):
            values = values.at[input_idx].set(inputs)
            nodes_ins = values * weights.T
            values = batch_agg(nodes[:, 4], nodes_ins, self.config.aggregation_options)  # z = agg(ins)
            values = values * nodes[:, 2] + nodes[:, 1]  # z = z * response + bias
            values = batch_act(nodes[:, 3], values, self.config.activation_options)  # z = act(z)
            return values
        vals = jax.lax.fori_loop(0, self.config.activate_times, body_func, vals)
        return vals[output_idx]
--- a/algorithm/neat/genome/init.py
+++ b/algorithm/neat/genome/init.py
@@ -0,0 +1,3 @@
 from .base import BaseGenome
 from .default import DefaultGenome
 from .recurrent import RecurrentGenome
--- a/algorithm/neat/genome/base.py
+++ b/algorithm/neat/genome/base.py
@@ -0,0 +1,66 @@
 import jax.numpy as jnp
 from ..gene import BaseNodeGene, BaseConnGene, DefaultNodeGene, DefaultConnGene
 from utils import fetch_first
 class BaseGenome:
    network_type = None
    def __init__(
            self,
            num_inputs: int,
            num_outputs: int,
            max_nodes: int,
            max_conns: int,
            node_gene: BaseNodeGene = DefaultNodeGene(),
            conn_gene: BaseConnGene = DefaultConnGene(),
    ):
        self.num_inputs = num_inputs
        self.num_outputs = num_outputs
        self.input_idx = jnp.arange(num_inputs)
        self.output_idx = jnp.arange(num_inputs, num_inputs + num_outputs)
        self.max_nodes = max_nodes
        self.max_conns = max_conns
        self.node_gene = node_gene
        self.conn_gene = conn_gene
    def transform(self, nodes, conns):
        raise NotImplementedError
    def forward(self, inputs, transformed):
        raise NotImplementedError
    def add_node(self, nodes, new_key: int, attrs):
        """
        Add a new node to the genome.
        The new node will place at the first NaN row.
        """
        exist_keys = nodes[:, 0]
        pos = fetch_first(jnp.isnan(exist_keys))
        new_nodes = nodes.at[pos, 0].set(new_key)
        return new_nodes.at[pos, 1:].set(attrs)
    def delete_node_by_pos(self, nodes, pos):
        """
        Delete a node from the genome.
        Delete the node by its pos in nodes.
        """
        return nodes.at[pos].set(jnp.nan)
    def add_conn(self, conns, i_key, o_key, enable: bool, attrs):
        """
        Add a new connection to the genome.
        The new connection will place at the first NaN row.
        """
        con_keys = conns[:, 0]
        pos = fetch_first(jnp.isnan(con_keys))
        new_conns = conns.at[pos, 0:3].set(jnp.array([i_key, o_key, enable]))
        return new_conns.at[pos, 3:].set(attrs)
    def delete_conn_by_pos(self, conns, pos):
        """
        Delete a connection from the genome.
        Delete the connection by its idx.
        """
        return conns.at[pos].set(jnp.nan)
--- a/algorithm/neat/genome/default.py
+++ b/algorithm/neat/genome/default.py
@@ -0,0 +1,75 @@
 import jax, jax.numpy as jnp
 from utils import unflatten_conns, topological_sort, I_INT
 from . import BaseGenome
 from ..gene import BaseNodeGene, BaseConnGene, DefaultNodeGene, DefaultConnGene
 class DefaultGenome(BaseGenome):
    """Default genome class, with the same behavior as the NEAT-Python"""
    network_type = 'feedforward'
    def __init__(self,
                 num_inputs: int,
                 num_outputs: int,
                 node_gene: BaseNodeGene = DefaultNodeGene(),
                 conn_gene: BaseConnGene = DefaultConnGene(),
                 ):
        super().__init__(num_inputs, num_outputs, node_gene, conn_gene)
    def transform(self, nodes, conns):
        u_conns = unflatten_conns(nodes, conns)
        # DONE: Seems like there is a bug in this line
        # conn_enable = jnp.where(~jnp.isnan(u_conns[0]), True, False)
        # modified: exist conn and enable is true
        # conn_enable = jnp.where( (~jnp.isnan(u_conns[0])) & (u_conns[0] == 1), True, False)
        # advanced modified: when and only when enabled is True
        conn_enable = u_conns[0] == 1
        # remove enable attr
        u_conns = jnp.where(conn_enable, u_conns[1:, :], jnp.nan)
        seqs = topological_sort(nodes, conn_enable)
        return seqs, nodes, u_conns
    def forward(self, inputs, transformed):
        cal_seqs, nodes, conns = transformed
        N = nodes.shape[0]
        ini_vals = jnp.full((N,), jnp.nan)
        ini_vals = ini_vals.at[self.input_idx].set(inputs)
        nodes_attrs = nodes[:, 1:]
        def cond_fun(carry):
            values, idx = carry
            return (idx < N) & (cal_seqs[idx] != I_INT)
        def body_func(carry):
            values, idx = carry
            i = cal_seqs[idx]
            def hit():
                ins = jax.vmap(self.conn_gene.forward, in_axes=(1, 0))(conns[:, :, i], values)
                # ins = values * weights[:, i]
                z = self.node_gene.forward(nodes_attrs[i], ins)
                # z = agg(nodes[i, 4], ins, self.config.aggregation_options)  # z = agg(ins)
                # z = z * nodes[i, 2] + nodes[i, 1]  # z = z * response + bias
                # z = act(nodes[i, 3], z, self.config.activation_options)  # z = act(z)
                new_values = values.at[i].set(z)
                return new_values
            def miss():
                return values
            # the val of input nodes is obtained by the task, not by calculation
            values = jax.lax.cond(jnp.isin(i, self.input_idx), miss, hit)
            return values, idx + 1
        vals, _ = jax.lax.while_loop(cond_fun, body_func, (ini_vals, 0))
        return vals[self.output_idx]
--- a/algorithm/neat/genome/recurrent.py
+++ b/algorithm/neat/genome/recurrent.py
@@ -0,0 +1,58 @@
 import jax, jax.numpy as jnp
 from utils import unflatten_conns
 from . import BaseGenome
 from ..gene import BaseNodeGene, BaseConnGene, DefaultNodeGene, DefaultConnGene
 class RecurrentGenome(BaseGenome):
    """Default genome class, with the same behavior as the NEAT-Python"""
    network_type = 'recurrent'
    def __init__(self,
                 num_inputs: int,
                 num_outputs: int,
                 node_gene: BaseNodeGene = DefaultNodeGene(),
                 conn_gene: BaseConnGene = DefaultConnGene(),
                 activate_time: int = 10,
                 ):
        super().__init__(num_inputs, num_outputs, node_gene, conn_gene)
        self.activate_time = activate_time
    def transform(self, nodes, conns):
        u_conns = unflatten_conns(nodes, conns)
        # remove un-enable connections and remove enable attr
        conn_enable = u_conns[0] == 1
        u_conns = jnp.where(conn_enable, u_conns[1:, :], jnp.nan)
        return nodes, u_conns
    def forward(self, inputs, transformed):
        nodes, conns = transformed
        N = nodes.shape[0]
        vals = jnp.full((N,), jnp.nan)
        nodes_attrs = nodes[:, 1:]
        def body_func(_, values):
            # set input values
            values = values.at[self.input_idx].set(inputs)
            # calculate connections
            node_ins = jax.vmap(
                jax.vmap(
                    self.conn_gene.forward,
                    in_axes=(1, None)
                ),
                in_axes=(1, 0)
            )(conns, values)
            # calculate nodes
            values = jax.vmap(self.node_gene.forward)(nodes_attrs, node_ins.T)
            return values
        vals = jax.lax.fori_loop(0, self.activate_time, body_func, vals)
        return vals[self.output_idx]
--- a/algorithm/neat/neat.py
+++ b/algorithm/neat/neat.py
@@ -1,87 +1,38 @@
-from typing import Type
+import jax, jax.numpy as jnp
 from utils import State
 from .. import BaseAlgorithm
 from .genome import *
 from .species import *
 from .ga import *
-import jax
+class NEAT(BaseAlgorithm):
 from jax import numpy as jnp
 import numpy as np
-from config import Config
+    def __init__(
-from core import Algorithm, State, Gene, Genome
+            self,
-from .ga import create_next_generation
+            genome: BaseGenome,
-from .species import SpeciesInfo, update_species, speciate
+            species: BaseSpecies,
            mutation: BaseMutation = DefaultMutation(),
            crossover: BaseCrossover = DefaultCrossover(),
    ):
        self.genome = genome
        self.species = species
        self.mutation = mutation
        self.crossover = crossover
-
+    def setup(self, randkey):
-class NEAT(Algorithm):
+        k1, k2 = jax.random.split(randkey, 2)
-
+        return State(
-    def __init__(self, config: Config, gene_type: Type[Gene]):
+            randkey=k1,
-        self.config = config
+            generation=0,
-        self.gene = gene_type(config.gene)
+            next_node_key=max(*self.genome.input_idx, *self.genome.output_idx) + 2,
-
+            # inputs nodes, output nodes, 1 hidden node
-        self.forward_func = None
+            species=self.species.setup(k2),
        self.tell_func = None
    def setup(self, randkey, state: State = State()):
        """initialize the state of the algorithm"""
        input_idx = np.arange(self.config.neat.inputs)
        output_idx = np.arange(self.config.neat.inputs,
                               self.config.neat.inputs + self.config.neat.outputs)
        state = state.update(
            P=self.config.basic.pop_size,
            N=self.config.neat.max_nodes,
            C=self.config.neat.max_conns,
            S=self.config.neat.max_species,
            NL=1 + len(self.gene.node_attrs),  # node length = (key) + attributes
            CL=3 + len(self.gene.conn_attrs),  # conn length = (in, out, key) + attributes
            max_stagnation=self.config.neat.max_stagnation,
            species_elitism=self.config.neat.species_elitism,
            spawn_number_change_rate=self.config.neat.spawn_number_change_rate,
            genome_elitism=self.config.neat.genome_elitism,
            survival_threshold=self.config.neat.survival_threshold,
            compatibility_threshold=self.config.neat.compatibility_threshold,
            compatibility_disjoint=self.config.neat.compatibility_disjoint,
            compatibility_weight=self.config.neat.compatibility_weight,
            input_idx=input_idx,
            output_idx=output_idx,
        )
-        state = self.gene.setup(state)
+    def ask(self, state: State):
-        pop_genomes = self._initialize_genomes(state)
+        return self.species.ask(state)
        species_info = SpeciesInfo.initialize(state)
        idx2species = jnp.zeros(state.P, dtype=jnp.float32)
        center_nodes = jnp.full((state.S, state.N, state.NL), jnp.nan, dtype=jnp.float32)
        center_conns = jnp.full((state.S, state.C, state.CL), jnp.nan, dtype=jnp.float32)
        center_genomes = Genome(center_nodes, center_conns)
        center_genomes = center_genomes.set(0, pop_genomes[0])
        generation = 0
        next_node_key = max(*state.input_idx, *state.output_idx) + 2
        next_species_key = 1
        state = state.update(
            randkey=randkey,
            pop_genomes=pop_genomes,
            species_info=species_info,
            idx2species=idx2species,
            center_genomes=center_genomes,
            # avoid jax auto cast from int to float. that would cause re-compilation.
            generation=jnp.asarray(generation, dtype=jnp.int32),
            next_node_key=jnp.asarray(next_node_key, dtype=jnp.float32),
            next_species_key=jnp.asarray(next_species_key, dtype=jnp.float32),
        )
        return jax.device_put(state)
    def ask_algorithm(self, state: State):
        return state.pop_genomes
    def tell_algorithm(self, state: State, fitness):
        state = self.gene.update(state)
    def tell(self, state: State, fitness):
        k1, k2, randkey = jax.random.split(state.randkey, 3)
        state = state.update(
@@ -89,46 +40,55 @@ class NEAT(Algorithm):
            randkey=randkey
        )
-        state, winner, loser, elite_mask = update_species(state, k1, fitness)
+        state, winner, loser, elite_mask = self.species.update_species(state, fitness, state.generation)
-        state = create_next_generation(self.config.neat, self.gene, state, k2, winner, loser, elite_mask)
+        state = self.create_next_generation(k2, state, winner, loser, elite_mask)
-        state = speciate(self.gene, state)
+        state = self.species.speciate(state, state.generation)
        return state
-    def forward_transform(self, state: State, genome: Genome):
+    def transform(self, state: State):
-        return self.gene.forward_transform(state, genome)
+        """transform the genome into a neural network"""
        raise NotImplementedError
-    def forward(self, state: State, inputs, genome: Genome):
+    def forward(self, inputs, transformed):
-        return self.gene.forward(state, inputs, genome)
+        raise NotImplementedError
-    def _initialize_genomes(self, state):
+    def create_next_generation(self, randkey, state, winner, loser, elite_mask):
-        o_nodes = np.full((state.N, state.NL), np.nan, dtype=np.float32)  # original nodes
+        # prepare random keys
-        o_conns = np.full((state.C, state.CL), np.nan, dtype=np.float32)  # original connections
+        pop_size = self.species.pop_size
        new_node_keys = jnp.arange(pop_size) + state.species.next_node_key
-        input_idx = state.input_idx
+        k1, k2 = jax.random.split(randkey, 2)
-        output_idx = state.output_idx
+        crossover_rand_keys = jax.random.split(k1, pop_size)
-        new_node_key = max([*input_idx, *output_idx]) + 1
+        mutate_rand_keys = jax.random.split(k2, pop_size)
-        o_nodes[input_idx, 0] = input_idx
+        wpn, wpc = state.species.pop_nodes[winner], state.species.pop_conns[winner]
-        o_nodes[output_idx, 0] = output_idx
+        lpn, lpc = state.species.pop_nodes[loser], state.species.pop_conns[loser]
        o_nodes[new_node_key, 0] = new_node_key
        o_nodes[np.concatenate([input_idx, output_idx]), 1:] = self.gene.new_node_attrs(state)
        o_nodes[new_node_key, 1:] = self.gene.new_node_attrs(state)
-        input_conns = np.c_[input_idx, np.full_like(input_idx, new_node_key)]
+        # batch crossover
-        o_conns[input_idx, 0:2] = input_conns  # in key, out key
+        n_nodes, n_conns = (jax.vmap(self.crossover, in_axes=(0, None, 0, 0, 0, 0))
-        o_conns[input_idx, 2] = True  # enabled
+                     (crossover_rand_keys, self.genome, wpn, wpc, lpn, lpc))
        o_conns[input_idx, 3:] = self.gene.new_conn_attrs(state)
-        output_conns = np.c_[np.full_like(output_idx, new_node_key), output_idx]
+        # batch mutation
-        o_conns[output_idx, 0:2] = output_conns  # in key, out key
+        m_n_nodes, m_n_conns = (jax.vmap(self.mutation, in_axes=(0, None, 0, 0, 0))
-        o_conns[output_idx, 2] = True  # enabled
+                       (mutate_rand_keys, self.genome, n_nodes, n_conns, new_node_keys))
        o_conns[output_idx, 3:] = self.gene.new_conn_attrs(state)
-        # repeat origin genome for P times to create population
+        # elitism don't mutate
-        pop_nodes = np.tile(o_nodes, (state.P, 1, 1))
+        pop_nodes = jnp.where(elite_mask[:, None, None], n_nodes, m_n_nodes)
-        pop_conns = np.tile(o_conns, (state.P, 1, 1))
+        pop_conns = jnp.where(elite_mask[:, None, None], n_conns, m_n_conns)
        # update next node key
        all_nodes_keys = pop_nodes[:, :, 0]
        max_node_key = jnp.max(jnp.where(jnp.isnan(all_nodes_keys), -jnp.inf, all_nodes_keys))
        next_node_key = max_node_key + 1
        return state.update(
            species=state.species.update(
                pop_nodes=pop_nodes,
                pop_conns=pop_conns,
            ),
            next_node_key=next_node_key,
        )
        return Genome(pop_nodes, pop_conns)
--- a/algorithm/neat/species/init.py
+++ b/algorithm/neat/species/init.py
@@ -1,2 +1,2 @@
-from .species_info import SpeciesInfo
+from .base import BaseSpecies
-from .operations import update_species, speciate
+from .default import DefaultSpecies
--- a/algorithm/neat/species/base.py
+++ b/algorithm/neat/species/base.py
@@ -0,0 +1,14 @@
 from utils import State
 class BaseSpecies:
    def setup(self, randkey):
        raise NotImplementedError
    def ask(self, state: State):
        raise NotImplementedError
    def update_species(self, state, fitness, generation):
        raise NotImplementedError
    def speciate(self, state, generation):
        raise NotImplementedError
--- a/algorithm/neat/species/default.py
+++ b/algorithm/neat/species/default.py
@@ -0,0 +1,514 @@
 import numpy as np
 import jax, jax.numpy as jnp
 from utils import State, rank_elements, argmin_with_mask, fetch_first
 from ..genome import BaseGenome
 class DefaultSpecies:
    def __init__(self,
                 genome: BaseGenome,
                 pop_size,
                 species_size,
                 compatibility_disjoint: float = 1.0,
                 compatibility_weight: float = 0.4,
                 max_stagnation: int = 15,
                 species_elitism: int = 2,
                 spawn_number_change_rate: float = 0.5,
                 genome_elitism: int = 2,
                 survival_threshold: float = 0.2,
                 min_species_size: int = 1,
                 compatibility_threshold: float = 3.5
                 ):
        self.genome = genome
        self.pop_size = pop_size
        self.species_size = species_size
        self.compatibility_disjoint = compatibility_disjoint
        self.compatibility_weight = compatibility_weight
        self.max_stagnation = max_stagnation
        self.species_elitism = species_elitism
        self.spawn_number_change_rate = spawn_number_change_rate
        self.genome_elitism = genome_elitism
        self.survival_threshold = survival_threshold
        self.min_species_size = min_species_size
        self.compatibility_threshold = compatibility_threshold
        self.species_arange = jnp.arange(self.species_size)
    def setup(self, randkey):
        pop_nodes, pop_conns = initialize_population(self.pop_size, self.genome)
        species_keys = jnp.full((self.species_size,), jnp.nan)  # the unique index (primary key) for each species
        best_fitness = jnp.full((self.species_size,), jnp.nan)  # the best fitness of each species
        last_improved = jnp.full((self.species_size,), jnp.nan)  # the last generation that the species improved
        member_count = jnp.full((self.species_size,), jnp.nan)  # the number of members of each species
        idx2species = jnp.zeros(self.pop_size)  # the species index of each individual
        # nodes for each center genome of each species
        center_nodes = jnp.full((self.species_size, self.genome.max_nodes, self.genome.node_gene.length), jnp.nan)
        # connections for each center genome of each species
        center_conns = jnp.full((self.species_size, self.genome.max_conns, self.genome.conn_gene.length), jnp.nan)
        species_keys = species_keys.at[0].set(0)
        best_fitness = best_fitness.at[0].set(-jnp.inf)
        last_improved = last_improved.at[0].set(0)
        member_count = member_count.at[0].set(self.pop_size)
        center_nodes = center_nodes.at[0].set(pop_nodes[0])
        center_conns = center_conns.at[0].set(pop_conns[0])
        return State(
            randkey=randkey,
            species_keys=species_keys,
            best_fitness=best_fitness,
            last_improved=last_improved,
            member_count=member_count,
            idx2species=idx2species,
            center_nodes=center_nodes,
            center_conns=center_conns,
            next_species_key=1,  # 0 is reserved for the first species
        )
    def ask(self, state):
        return state.pop_nodes, state.pop_conns
    def update_species(self, state, fitness, generation):
        # update the fitness of each species
        species_fitness = self.update_species_fitness(state, fitness)
        # stagnation species
        state, species_fitness = self.stagnation(state, generation, species_fitness)
        # sort species_info by their fitness. (also push nan to the end)
        sort_indices = jnp.argsort(species_fitness)[::-1]
        state = state.update(
            species_keys=state.species_keys[sort_indices],
            best_fitness=state.best_fitness[sort_indices],
            last_improved=state.last_improved[sort_indices],
            member_count=state.member_count[sort_indices],
            center_nodes=state.center_nodes[sort_indices],
            center_conns=state.center_conns[sort_indices],
        )
        # decide the number of members of each species by their fitness
        spawn_number = self.cal_spawn_numbers(state)
        k1, k2 = jax.random.split(state.randkey)
        # crossover info
        winner, loser, elite_mask = self.create_crossover_pair(state, k1, spawn_number, fitness)
        return state(randkey=k2), winner, loser, elite_mask
    def update_species_fitness(self, state, fitness):
        """
        obtain the fitness of the species by the fitness of each individual.
        use max criterion.
        """
        def aux_func(idx):
            s_fitness = jnp.where(state.idx2species == state.species_keys[idx], fitness, -jnp.inf)
            val = jnp.max(s_fitness)
            return val
        return jax.vmap(aux_func)(self.species_arange)
    def stagnation(self, state, generation, species_fitness):
        """
        stagnation species.
        those species whose fitness is not better than the best fitness of the species for a long time will be stagnation.
        elitism species never stagnation
        generation: the current generation
        """
        def check_stagnation(idx):
            # determine whether the species stagnation
            st = (
                    (species_fitness[idx] <= state.best_fitness[
                        idx]) &  # not better than the best fitness of the species
                    (generation - state.last_improved[idx] > self.max_stagnation)  # for a long time
            )
            # update last_improved and best_fitness
            li, bf = jax.lax.cond(
                species_fitness[idx] > state.best_fitness[idx],
                lambda: (generation, species_fitness[idx]),  # update
                lambda: (state.last_improved[idx], state.best_fitness[idx])  # not update
            )
            return st, bf, li
        spe_st, best_fitness, last_improved = jax.vmap(check_stagnation)(self.species_arange)
        # elite species will not be stagnation
        species_rank = rank_elements(species_fitness)
        spe_st = jnp.where(species_rank < self.species_elitism, False, spe_st)  # elitism never stagnation
        # set stagnation species to nan
        def update_func(idx):
            return jax.lax.cond(
                spe_st[idx],
                lambda: (
                    jnp.nan,  # species_key
                    jnp.nan,  # best_fitness
                    jnp.nan,  # last_improved
                    jnp.nan,  # member_count
                    -jnp.inf,  # species_fitness
                    jnp.full_like(center_nodes[idx], jnp.nan),  # center_nodes
                    jnp.full_like(center_conns[idx], jnp.nan),  # center_conns
                ),  # stagnation species
                lambda: (
                    species_keys[idx],
                    best_fitness[idx],
                    last_improved[idx],
                    state.member_count[idx],
                    species_fitness[idx],
                    center_nodes[idx],
                    center_conns[idx]
                )  # not stagnation species
            )
        (
            species_keys,
            best_fitness,
            last_improved,
            member_count,
            species_fitness,
            center_nodes,
            center_conns
        ) = (
            jax.vmap(update_func)(self.species_arange))
        return state.update(
            species_keys=species_keys,
            best_fitness=best_fitness,
            last_improved=last_improved,
            member_count=member_count,
            center_nodes=center_nodes,
            center_conns=center_conns,
        ), species_fitness
    def cal_spawn_numbers(self, state):
        """
        decide the number of members of each species by their fitness rank.
        the species with higher fitness will have more members
        Linear ranking selection
            e.g. N = 3, P=10 -> probability = [0.5, 0.33, 0.17], spawn_number = [5, 3, 2]
        """
        species_keys = state.species_keys
        is_species_valid = ~jnp.isnan(species_keys)
        valid_species_num = jnp.sum(is_species_valid)
        denominator = (valid_species_num + 1) * valid_species_num / 2  # obtain 3 + 2 + 1 = 6
        rank_score = valid_species_num - self.species_arange  # obtain [3, 2, 1]
        spawn_number_rate = rank_score / denominator  # obtain [0.5, 0.33, 0.17]
        spawn_number_rate = jnp.where(is_species_valid, spawn_number_rate, 0)  # set invalid species to 0
        target_spawn_number = jnp.floor(spawn_number_rate * self.pop_size)  # calculate member
        # Avoid too much variation of numbers for a species
        previous_size = state.member_count
        spawn_number = previous_size + (target_spawn_number - previous_size) * self.spawn_number_change_rate
        spawn_number = spawn_number.astype(jnp.int32)
        # must control the sum of spawn_number to be equal to pop_size
        error = state.P - jnp.sum(spawn_number)
        # add error to the first species to control the sum of spawn_number
        spawn_number = spawn_number.at[0].add(error)
        return spawn_number
    def create_crossover_pair(self, state, randkey, spawn_number, fitness):
        s_idx = self.species_arange
        p_idx = jnp.arange(self.pop_size)
        def aux_func(key, idx):
            members = state.idx2species == state.species_keys[idx]
            members_num = jnp.sum(members)
            members_fitness = jnp.where(members, fitness, -jnp.inf)
            sorted_member_indices = jnp.argsort(members_fitness)[::-1]
            survive_size = jnp.floor(self.survival_threshold * members_num).astype(jnp.int32)
            select_pro = (p_idx < survive_size) / survive_size
            fa, ma = jax.random.choice(key, sorted_member_indices, shape=(2, self.pop_size), replace=True, p=select_pro)
            # elite
            fa = jnp.where(p_idx < self.genome_elitism, sorted_member_indices, fa)
            ma = jnp.where(p_idx < self.genome_elitism, sorted_member_indices, ma)
            elite = jnp.where(p_idx < self.genome_elitism, True, False)
            return fa, ma, elite
        fas, mas, elites = jax.vmap(aux_func)(jax.random.split(randkey, self.species_size), s_idx)
        spawn_number_cum = jnp.cumsum(spawn_number)
        def aux_func(idx):
            loc = jnp.argmax(idx < spawn_number_cum)
            # elite genomes are at the beginning of the species
            idx_in_species = jnp.where(loc > 0, idx - spawn_number_cum[loc - 1], idx)
            return fas[loc, idx_in_species], mas[loc, idx_in_species], elites[loc, idx_in_species]
        part1, part2, elite_mask = jax.vmap(aux_func)(p_idx)
        is_part1_win = fitness[part1] >= fitness[part2]
        winner = jnp.where(is_part1_win, part1, part2)
        loser = jnp.where(is_part1_win, part2, part1)
        return winner, loser, elite_mask
    def speciate(self, state, generation):
        # prepare distance functions
        o2p_distance_func = jax.vmap(self.distance, in_axes=(None, None, 0, 0))  # one to population
        # idx to specie key
        idx2species = jnp.full((self.pop_size,), jnp.nan)  # NaN means not assigned to any species
        # the distance between genomes to its center genomes
        o2c_distances = jnp.full((self.pop_size,), jnp.inf)
        # step 1: find new centers
        def cond_func(carry):
            # i, idx2species, center_nodes, center_conns, o2c_distances
            i, i2s, cns, ccs, o2c = carry
            return (
                    (i < self.species_size) &
                    (~jnp.isnan(state.species_keys[i]))
            )  # current species is existing
        def body_func(carry):
            i, i2s, cns, ccs, o2c = carry
            distances = o2p_distance_func(cns, ccs, state.pop_nodes, state.pop_conns)
            # find the closest one
            closest_idx = argmin_with_mask(distances, mask=jnp.isnan(i2s))
            i2s = i2s.at[closest_idx].set(state.species_info.species_keys[i])
            cns = cns.set(i, state.pop_nodes[closest_idx])
            ccs = ccs.set(i, state.pop_conns[closest_idx])
            # the genome with closest_idx will become the new center, thus its distance to center is 0.
            o2c = o2c.at[closest_idx].set(0)
            return i + 1, i2s, cns, ccs, o2c
        _, idx2species, center_nodes, center_conns, o2c_distances = \
            jax.lax.while_loop(cond_func, body_func,
                               (0, idx2species, state.center_nodes, state.center_conns, o2c_distances))
        state = state.update(
            idx2species=idx2species,
            center_nodes=center_nodes,
            center_conns=center_conns,
        )
        # part 2: assign members to each species
        def cond_func(carry):
            # i, idx2species, center_nodes, center_conns, species_keys, o2c_distances, next_species_key
            i, i2s, cns, ccs, sk, o2c, nsk = carry
            current_species_existed = ~jnp.isnan(sk[i])
            not_all_assigned = jnp.any(jnp.isnan(i2s))
            not_reach_species_upper_bounds = i < self.species_size
            return not_reach_species_upper_bounds & (current_species_existed | not_all_assigned)
        def body_func(carry):
            i, i2s, cns, ccs, sk, o2c, nsk = carry
            _, i2s, cns, ccs, sk, o2c, nsk = jax.lax.cond(
                jnp.isnan(sk[i]),  # whether the current species is existing or not
                create_new_species,  # if not existing, create a new specie
                update_exist_specie,  # if existing, update the specie
                (i, i2s, cns, ccs, sk, o2c, nsk)
            )
            return i + 1, i2s, cns, ccs, sk, o2c, nsk
        def create_new_species(carry):
            i, i2s, cns, ccs, sk, o2c, nsk = carry
            # pick the first one who has not been assigned to any species
            idx = fetch_first(jnp.isnan(i2s))
            # assign it to the new species
            # [key, best score, last update generation, member_count]
            sk = sk.at[i].set(nsk)  # nsk -> next species key
            i2s = i2s.at[idx].set(nsk)
            o2c = o2c.at[idx].set(0)
            # update center genomes
            cns = cns.set(i, state.pop_nodes[idx])
            ccs = ccs.set(i, state.pop_conns[idx])
            # find the members for the new species
            i2s, o2c = speciate_by_threshold(i, i2s, cns, ccs, sk, o2c)
            return i, i2s, cns, ccs, sk, o2c, nsk + 1  # change to next new speciate key
        def update_exist_specie(carry):
            i, i2s, cns, ccs, sk, o2c, nsk = carry
            i2s, o2c = speciate_by_threshold(i, i2s, cns, ccs, sk, o2c)
            # turn to next species
            return i + 1, i2s, cns, ccs, sk, o2c, nsk
        def speciate_by_threshold(i, i2s, cns, ccs, sk, o2c):
            # distance between such center genome and ppo genomes
            o2p_distance = o2p_distance_func(cns[i], ccs[i], state.pop_nodes, state.pop_conns)
            close_enough_mask = o2p_distance < self.compatibility_threshold
            # when a genome is not assigned or the distance between its current center is bigger than this center
            catchable_mask = jnp.isnan(i2s) | (o2p_distance < o2c)
            mask = close_enough_mask & catchable_mask
            # update species info
            i2s = jnp.where(mask, sk[i], i2s)
            # update distance between centers
            o2c = jnp.where(mask, o2p_distance, o2c)
            return i2s, o2c
        # update idx2species
        _, idx2species, center_nodes, center_conns, species_keys, _, next_species_key = jax.lax.while_loop(
            cond_func,
            body_func,
            (0, state.idx2species, state.center_nodes, center_conns, state.species_info.species_keys, o2c_distances,
             state.next_species_key)
        )
        # if there are still some pop genomes not assigned to any species, add them to the last genome
        # this condition can only happen when the number of species is reached species upper bounds
        idx2species = jnp.where(jnp.isnan(idx2species), species_keys[-1], idx2species)
        # complete info of species which is created in this generation
        new_created_mask = (~jnp.isnan(species_keys)) & jnp.isnan(state.best_fitness)
        best_fitness = jnp.where(new_created_mask, -jnp.inf, state.best_fitness)
        last_improved = jnp.where(new_created_mask, generation, state.last_improved)
        # update members count
        def count_members(idx):
            return jax.lax.cond(
                jnp.isnan(species_keys[idx]),  # if the species is not existing
                lambda _: jnp.nan,  # nan
                lambda _: jnp.sum(idx2species == species_keys[idx], dtype=jnp.float32)  # count members
            )
        member_count = jax.vmap(count_members)(self.species_arange)
        return state.update(
            species_keys=species_keys,
            best_fitness=best_fitness,
            last_improved=last_improved,
            member_count=member_count,
            idx2species=idx2species,
            center_nodes=center_nodes,
            center_conns=center_conns,
            next_species_key=next_species_key
        )
    def distance(self, nodes1, conns1, nodes2, conns2):
        """
        The distance between two genomes
        """
        return self.node_distance(nodes1, nodes2) + self.conn_distance(conns1, conns2)
    def node_distance(self, nodes1, nodes2):
        """
        The distance of the nodes part for two genomes
        """
        node_cnt1 = jnp.sum(~jnp.isnan(nodes1[:, 0]))
        node_cnt2 = jnp.sum(~jnp.isnan(nodes2[:, 0]))
        max_cnt = jnp.maximum(node_cnt1, node_cnt2)
        # align homologous nodes
        # this process is similar to np.intersect1d.
        nodes = jnp.concatenate((nodes1, nodes2), axis=0)
        keys = nodes[:, 0]
        sorted_indices = jnp.argsort(keys, axis=0)
        nodes = nodes[sorted_indices]
        nodes = jnp.concatenate([nodes, jnp.full((1, nodes.shape[1]), jnp.nan)], axis=0)  # add a nan row to the end
        fr, sr = nodes[:-1], nodes[1:]  # first row, second row
        # flag location of homologous nodes
        intersect_mask = (fr[:, 0] == sr[:, 0]) & ~jnp.isnan(nodes[:-1, 0])
        # calculate the count of non_homologous of two genomes
        non_homologous_cnt = node_cnt1 + node_cnt2 - 2 * jnp.sum(intersect_mask)
        # calculate the distance of homologous nodes
        hnd = jax.vmap(self.genome.node_gene.distance, in_axes=(0, 0))(fr, sr)
        hnd = jnp.where(jnp.isnan(hnd), 0, hnd)
        homologous_distance = jnp.sum(hnd * intersect_mask)
        val = non_homologous_cnt * self.compatibility_disjoint + homologous_distance * self.compatibility_weight
        return jnp.where(max_cnt == 0, 0, val / max_cnt)  # avoid zero division
    def conn_distance(self, conns1, conns2):
        """
        The distance of the conns part for two genomes
        """
        con_cnt1 = jnp.sum(~jnp.isnan(conns1[:, 0]))
        con_cnt2 = jnp.sum(~jnp.isnan(conns2[:, 0]))
        max_cnt = jnp.maximum(con_cnt1, con_cnt2)
        cons = jnp.concatenate((conns1, conns2), axis=0)
        keys = cons[:, :2]
        sorted_indices = jnp.lexsort(keys.T[::-1])
        cons = cons[sorted_indices]
        cons = jnp.concatenate([cons, jnp.full((1, cons.shape[1]), jnp.nan)], axis=0)  # add a nan row to the end
        fr, sr = cons[:-1], cons[1:]  # first row, second row
        # both genome has such connection
        intersect_mask = jnp.all(fr[:, :2] == sr[:, :2], axis=1) & ~jnp.isnan(fr[:, 0])
        non_homologous_cnt = con_cnt1 + con_cnt2 - 2 * jnp.sum(intersect_mask)
        hcd = jax.vmap(self.genome.conn_gene.distance, in_axes=(0, 0))(fr, sr)
        hcd = jnp.where(jnp.isnan(hcd), 0, hcd)
        homologous_distance = jnp.sum(hcd * intersect_mask)
        val = non_homologous_cnt * self.compatibility_disjoint + homologous_distance * self.compatibility_weight
        return jnp.where(max_cnt == 0, 0, val / max_cnt)
 def initialize_population(pop_size, genome):
    o_nodes = np.full((genome.max_nodes, genome.node_gene.length), np.nan)  # original nodes
    o_conns = np.full((genome.max_conns, genome.conn_gene.length), np.nan)  # original connections
    input_idx, output_idx = genome.input_idx, genome.output_idx
    new_node_key = max([*input_idx, *output_idx]) + 1
    o_nodes[input_idx, 0] = genome.input_idx
    o_nodes[output_idx, 0] = genome.output_idx
    o_nodes[new_node_key, 0] = new_node_key  # one hidden node
    o_nodes[np.concatenate([input_idx, output_idx]), 1:] = genome.node_gene.new_attrs()
    o_nodes[new_node_key, 1:] = genome.node_gene.new_attrs()  # one hidden node
    input_conns = np.c_[input_idx, np.full_like(input_idx, new_node_key)]  # input nodes to hidden
    o_conns[input_idx, 0:2] = input_conns  # in key, out key
    o_conns[input_idx, 2] = True  # enabled
    o_conns[input_idx, 3:] = genome.conn_gene.new_conn_attrs()
    output_conns = np.c_[np.full_like(output_idx, new_node_key), output_idx]  # hidden to output nodes
    o_conns[output_idx, 0:2] = output_conns  # in key, out key
    o_conns[output_idx, 2] = True  # enabled
    o_conns[output_idx, 3:] = genome.conn_gene.new_conn_attrs()
    # repeat origin genome for P times to create population
    pop_nodes = np.tile(o_nodes, (pop_size, 1, 1))
    pop_conns = np.tile(o_conns, (pop_size, 1, 1))
    return pop_nodes, pop_conns
--- a/algorithm/neat/species/distance.py
+++ b/algorithm/neat/species/distance.py
@@ -1,71 +0,0 @@
 from jax import Array, numpy as jnp, vmap
 from core import Gene
 def distance(gene: Gene, state, genome1, genome2):
    return node_distance(gene, state, genome1.nodes, genome2.nodes) + \
        connection_distance(gene, state, genome1.conns, genome2.conns)
 def node_distance(gene: Gene, state, nodes1: Array, nodes2: Array):
    """
    Calculate the distance between nodes of two genomes.
    """
    # statistics nodes count of two genomes
    node_cnt1 = jnp.sum(~jnp.isnan(nodes1[:, 0]))
    node_cnt2 = jnp.sum(~jnp.isnan(nodes2[:, 0]))
    max_cnt = jnp.maximum(node_cnt1, node_cnt2)
    # align homologous nodes
    # this process is similar to np.intersect1d.
    nodes = jnp.concatenate((nodes1, nodes2), axis=0)
    keys = nodes[:, 0]
    sorted_indices = jnp.argsort(keys, axis=0)
    nodes = nodes[sorted_indices]
    nodes = jnp.concatenate([nodes, jnp.full((1, nodes.shape[1]), jnp.nan)], axis=0)  # add a nan row to the end
    fr, sr = nodes[:-1], nodes[1:]  # first row, second row
    # flag location of homologous nodes
    intersect_mask = (fr[:, 0] == sr[:, 0]) & ~jnp.isnan(nodes[:-1, 0])
    # calculate the count of non_homologous of two genomes
    non_homologous_cnt = node_cnt1 + node_cnt2 - 2 * jnp.sum(intersect_mask)
    # calculate the distance of homologous nodes
    hnd = vmap(gene.distance_node, in_axes=(None, 0, 0))(state, fr, sr)
    hnd = jnp.where(jnp.isnan(hnd), 0, hnd)
    homologous_distance = jnp.sum(hnd * intersect_mask)
    val = non_homologous_cnt * state.compatibility_disjoint + homologous_distance * state.compatibility_weight
    return jnp.where(max_cnt == 0, 0, val / max_cnt)  # avoid zero division
 def connection_distance(gene: Gene, state, cons1: Array, cons2: Array):
    """
    Calculate the distance between connections of two genomes.
    Similar process as node_distance.
    """
    con_cnt1 = jnp.sum(~jnp.isnan(cons1[:, 0]))
    con_cnt2 = jnp.sum(~jnp.isnan(cons2[:, 0]))
    max_cnt = jnp.maximum(con_cnt1, con_cnt2)
    cons = jnp.concatenate((cons1, cons2), axis=0)
    keys = cons[:, :2]
    sorted_indices = jnp.lexsort(keys.T[::-1])
    cons = cons[sorted_indices]
    cons = jnp.concatenate([cons, jnp.full((1, cons.shape[1]), jnp.nan)], axis=0)  # add a nan row to the end
    fr, sr = cons[:-1], cons[1:]  # first row, second row
    # both genome has such connection
    intersect_mask = jnp.all(fr[:, :2] == sr[:, :2], axis=1) & ~jnp.isnan(fr[:, 0])
    non_homologous_cnt = con_cnt1 + con_cnt2 - 2 * jnp.sum(intersect_mask)
    hcd = vmap(gene.distance_conn, in_axes=(None, 0, 0))(state, fr, sr)
    hcd = jnp.where(jnp.isnan(hcd), 0, hcd)
    homologous_distance = jnp.sum(hcd * intersect_mask)
    val = non_homologous_cnt * state.compatibility_disjoint + homologous_distance * state.compatibility_weight
    return jnp.where(max_cnt == 0, 0, val / max_cnt)
--- a/algorithm/neat/species/operations.py
+++ b/algorithm/neat/species/operations.py
@@ -1,319 +0,0 @@
 import jax
 from jax import numpy as jnp, vmap
 from core import Gene, Genome, State
 from utils import rank_elements, fetch_first
 from .distance import distance
 from .species_info import SpeciesInfo
 def update_species(state, randkey, fitness):
    # update the fitness of each species
    species_fitness = update_species_fitness(state, fitness)
    # stagnation species
    state, species_fitness = stagnation(state, species_fitness)
    # sort species_info by their fitness. (push nan to the end)
    sort_indices = jnp.argsort(species_fitness)[::-1]
    state = state.update(
        species_info=state.species_info[sort_indices],
        center_genomes=state.center_genomes[sort_indices],
    )
    # decide the number of members of each species by their fitness
    spawn_number = cal_spawn_numbers(state)
    # crossover info
    winner, loser, elite_mask = create_crossover_pair(state, randkey, spawn_number, fitness)
    return state, winner, loser, elite_mask
 def update_species_fitness(state, fitness):
    """
    obtain the fitness of the species by the fitness of each individual.
    use max criterion.
    """
    def aux_func(idx):
        s_fitness = jnp.where(state.idx2species == state.species_info.species_keys[idx], fitness, -jnp.inf)
        f = jnp.max(s_fitness)
        return f
    return vmap(aux_func)(jnp.arange(state.species_info.size()))
 def stagnation(state, species_fitness):
    """
    stagnation species.
    those species whose fitness is not better than the best fitness of the species for a long time will be stagnation.
    elitism species never stagnation
    """
    def aux_func(idx):
        s_fitness = species_fitness[idx]
        sk, bf, li, _ = state.species_info.get(idx)
        st = (s_fitness <= bf) & (state.generation - li > state.max_stagnation)
        li = jnp.where(s_fitness > bf, state.generation, li)
        bf = jnp.where(s_fitness > bf, s_fitness, bf)
        return st, sk, bf, li
    spe_st, species_keys, best_fitness, last_improved = vmap(aux_func)(jnp.arange(species_fitness.shape[0]))
    # elite species will not be stagnation
    species_rank = rank_elements(species_fitness)
    spe_st = jnp.where(species_rank < state.species_elitism, False, spe_st)  # elitism never stagnation
    # set stagnation species to nan
    species_keys = jnp.where(spe_st, jnp.nan, species_keys)
    best_fitness = jnp.where(spe_st, jnp.nan, best_fitness)
    last_improved = jnp.where(spe_st, jnp.nan, last_improved)
    member_count = jnp.where(spe_st, jnp.nan, state.species_info.member_count)
    species_fitness = jnp.where(spe_st, -jnp.inf, species_fitness)
    species_info = SpeciesInfo(species_keys, best_fitness, last_improved, member_count)
    # TODO: Simplify the coded
    center_nodes = jnp.where(spe_st[:, None, None], jnp.nan, state.center_genomes.nodes)
    center_conns = jnp.where(spe_st[:, None, None], jnp.nan, state.center_genomes.conns)
    state = state.update(
        species_info=species_info,
        center_genomes=Genome(center_nodes, center_conns)
    )
    return state, species_fitness
 def cal_spawn_numbers(state):
    """
    decide the number of members of each species by their fitness rank.
    the species with higher fitness will have more members
    Linear ranking selection
        e.g. N = 3, P=10 -> probability = [0.5, 0.33, 0.17], spawn_number = [5, 3, 2]
    """
    species_keys = state.species_info.species_keys
    is_species_valid = ~jnp.isnan(species_keys)
    valid_species_num = jnp.sum(is_species_valid)
    denominator = (valid_species_num + 1) * valid_species_num / 2  # obtain 3 + 2 + 1 = 6
    rank_score = valid_species_num - jnp.arange(species_keys.shape[0])  # obtain [3, 2, 1]
    spawn_number_rate = rank_score / denominator  # obtain [0.5, 0.33, 0.17]
    spawn_number_rate = jnp.where(is_species_valid, spawn_number_rate, 0)  # set invalid species to 0
    target_spawn_number = jnp.floor(spawn_number_rate * state.P)  # calculate member
    # Avoid too much variation of numbers in a species
    previous_size = state.species_info.member_count
    spawn_number = previous_size + (target_spawn_number - previous_size) * state.spawn_number_change_rate
    # jax.debug.print("previous_size: {}, spawn_number: {}", previous_size, spawn_number)
    spawn_number = spawn_number.astype(jnp.int32)
    # must control the sum of spawn_number to be equal to pop_size
    error = state.P - jnp.sum(spawn_number)
    spawn_number = spawn_number.at[0].add(error)  # add error to the first species to control the sum of spawn_number
    return spawn_number
 def create_crossover_pair(state, randkey, spawn_number, fitness):
    species_size = state.species_info.size()
    pop_size = fitness.shape[0]
    s_idx = jnp.arange(species_size)
    p_idx = jnp.arange(pop_size)
    # def aux_func(key, idx):
    def aux_func(key, idx):
        members = state.idx2species == state.species_info.species_keys[idx]
        members_num = jnp.sum(members)
        members_fitness = jnp.where(members, fitness, -jnp.inf)
        sorted_member_indices = jnp.argsort(members_fitness)[::-1]
        elite_size = state.genome_elitism
        survive_size = jnp.floor(state.survival_threshold * members_num).astype(jnp.int32)
        select_pro = (p_idx < survive_size) / survive_size
        fa, ma = jax.random.choice(key, sorted_member_indices, shape=(2, pop_size), replace=True, p=select_pro)
        # elite
        fa = jnp.where(p_idx < elite_size, sorted_member_indices, fa)
        ma = jnp.where(p_idx < elite_size, sorted_member_indices, ma)
        elite = jnp.where(p_idx < elite_size, True, False)
        return fa, ma, elite
    fas, mas, elites = vmap(aux_func)(jax.random.split(randkey, species_size), s_idx)
    spawn_number_cum = jnp.cumsum(spawn_number)
    def aux_func(idx):
        loc = jnp.argmax(idx < spawn_number_cum)
        # elite genomes are at the beginning of the species
        idx_in_species = jnp.where(loc > 0, idx - spawn_number_cum[loc - 1], idx)
        return fas[loc, idx_in_species], mas[loc, idx_in_species], elites[loc, idx_in_species]
    part1, part2, elite_mask = vmap(aux_func)(p_idx)
    is_part1_win = fitness[part1] >= fitness[part2]
    winner = jnp.where(is_part1_win, part1, part2)
    loser = jnp.where(is_part1_win, part2, part1)
    return winner, loser, elite_mask
 def speciate(gene: Gene, state: State):
    pop_size, species_size = state.idx2species.shape[0], state.species_info.size()
    # prepare distance functions
    o2p_distance_func = vmap(distance, in_axes=(None, None, None, 0))  # one to population
    # idx to specie key
    idx2species = jnp.full((pop_size,), jnp.nan)  # NaN means not assigned to any species
    # the distance between genomes to its center genomes
    o2c_distances = jnp.full((pop_size,), jnp.inf)
    # step 1: find new centers
    def cond_func(carry):
        i, i2s, cgs, o2c = carry
        return (i < species_size) & (~jnp.isnan(state.species_info.species_keys[i]))  # current species is existing
    def body_func(carry):
        i, i2s, cgs, o2c = carry
        distances = o2p_distance_func(gene, state, cgs[i], state.pop_genomes)
        # find the closest one
        closest_idx = argmin_with_mask(distances, mask=jnp.isnan(i2s))
        i2s = i2s.at[closest_idx].set(state.species_info.species_keys[i])
        cgs = cgs.set(i, state.pop_genomes[closest_idx])
        # the genome with closest_idx will become the new center, thus its distance to center is 0.
        o2c = o2c.at[closest_idx].set(0)
        return i + 1, i2s, cgs, o2c
    _, idx2species, center_genomes, o2c_distances = \
        jax.lax.while_loop(cond_func, body_func, (0, idx2species, state.center_genomes, o2c_distances))
    state = state.update(
        idx2species=idx2species,
        center_genomes=center_genomes,
    )
    # part 2: assign members to each species
    def cond_func(carry):
        i, i2s, cgs, sk, o2c, nsk = carry
        current_species_existed = ~jnp.isnan(sk[i])
        not_all_assigned = jnp.any(jnp.isnan(i2s))
        not_reach_species_upper_bounds = i < species_size
        return not_reach_species_upper_bounds & (current_species_existed | not_all_assigned)
    def body_func(carry):
        i, i2s, cgs, sk, o2c, nsk = carry
        _, i2s, cgs, sk, o2c, nsk = jax.lax.cond(
            jnp.isnan(sk[i]),  # whether the current species is existing or not
            create_new_species,  # if not existing, create a new specie
            update_exist_specie,  # if existing, update the specie
            (i, i2s, cgs, sk, o2c, nsk)
        )
        return i + 1, i2s, cgs, sk, o2c, nsk
    def create_new_species(carry):
        i, i2s, cgs, sk, o2c, nsk = carry
        # pick the first one who has not been assigned to any species
        idx = fetch_first(jnp.isnan(i2s))
        # assign it to the new species
        # [key, best score, last update generation, member_count]
        sk = sk.at[i].set(nsk)
        i2s = i2s.at[idx].set(nsk)
        o2c = o2c.at[idx].set(0)
        # update center genomes
        cgs = cgs.set(i, state.pop_genomes[idx])
        i2s, o2c = speciate_by_threshold(i, i2s, cgs, sk, o2c)
        # when a new species is created, it needs to be updated, thus do not change i
        return i + 1, i2s, cgs, sk, o2c, nsk + 1  # change to next new speciate key
    def update_exist_specie(carry):
        i, i2s, cgs, sk, o2c, nsk = carry
        i2s, o2c = speciate_by_threshold(i, i2s, cgs, sk, o2c)
        # turn to next species
        return i + 1, i2s, cgs, sk, o2c, nsk
    def speciate_by_threshold(i, i2s, cgs, sk, o2c):
        # distance between such center genome and ppo genomes
        o2p_distance = o2p_distance_func(gene, state, cgs[i], state.pop_genomes)
        close_enough_mask = o2p_distance < state.compatibility_threshold
        # when a genome is not assigned or the distance between its current center is bigger than this center
        cacheable_mask = jnp.isnan(i2s) | (o2p_distance < o2c)
        # jax.debug.print("{}", o2p_distance)
        mask = close_enough_mask & cacheable_mask
        # update species info
        i2s = jnp.where(mask, sk[i], i2s)
        # update distance between centers
        o2c = jnp.where(mask, o2p_distance, o2c)
        return i2s, o2c
    # update idx2species
    _, idx2species, center_genomes, species_keys, _, next_species_key = jax.lax.while_loop(
        cond_func,
        body_func,
        (0, state.idx2species, state.center_genomes, state.species_info.species_keys, o2c_distances,
         state.next_species_key)
    )
    # if there are still some pop genomes not assigned to any species, add them to the last genome
    # this condition can only happen when the number of species is reached species upper bounds
    idx2species = jnp.where(jnp.isnan(idx2species), species_keys[-1], idx2species)
    # complete info of species which is created in this generation
    new_created_mask = (~jnp.isnan(species_keys)) & jnp.isnan(state.species_info.best_fitness)
    best_fitness = jnp.where(new_created_mask, -jnp.inf, state.species_info.best_fitness)
    last_improved = jnp.where(new_created_mask, state.generation, state.species_info.last_improved)
    # update members count
    def count_members(idx):
        key = species_keys[idx]
        count = jnp.sum(idx2species == key, dtype=jnp.float32)
        count = jnp.where(jnp.isnan(key), jnp.nan, count)
        return count
    member_count = vmap(count_members)(jnp.arange(species_size))
    return state.update(
        species_info=SpeciesInfo(species_keys, best_fitness, last_improved, member_count),
        idx2species=idx2species,
        center_genomes=center_genomes,
        next_species_key=next_species_key
    )
 def argmin_with_mask(arr, mask):
    masked_arr = jnp.where(mask, arr, jnp.inf)
    min_idx = jnp.argmin(masked_arr)
    return min_idx
--- a/algorithm/neat/species/species_info.py
+++ b/algorithm/neat/species/species_info.py
@@ -1,55 +0,0 @@
 from jax.tree_util import register_pytree_node_class
 import numpy as np
 import jax.numpy as jnp
@register_pytree_node_class
 class SpeciesInfo:
    def __init__(self, species_keys, best_fitness, last_improved, member_count):
        self.species_keys = species_keys
        self.best_fitness = best_fitness
        self.last_improved = last_improved
        self.member_count = member_count
    @classmethod
    def initialize(cls, state):
        species_keys = np.full((state.S,), np.nan, dtype=np.float32)
        best_fitness = np.full((state.S,), np.nan, dtype=np.float32)
        last_improved = np.full((state.S,), np.nan, dtype=np.float32)
        member_count = np.full((state.S,), np.nan, dtype=np.float32)
        species_keys[0] = 0
        best_fitness[0] = -np.inf
        last_improved[0] = 0
        member_count[0] = state.P
        return cls(species_keys, best_fitness, last_improved, member_count)
    def __getitem__(self, i):
        return SpeciesInfo(self.species_keys[i], self.best_fitness[i], self.last_improved[i], self.member_count[i])
    def get(self, i):
        return self.species_keys[i], self.best_fitness[i], self.last_improved[i], self.member_count[i]
    def set(self, idx, value):
        species_keys = self.species_keys.at[idx].set(value[0])
        best_fitness = self.best_fitness.at[idx].set(value[1])
        last_improved = self.last_improved.at[idx].set(value[2])
        member_count = self.member_count.at[idx].set(value[3])
        return SpeciesInfo(species_keys, best_fitness, last_improved, member_count)
    def remove(self, idx):
        return self.set(idx, jnp.array([jnp.nan] * 4))
    def size(self):
        return self.species_keys.shape[0]
    def tree_flatten(self):
        children = self.species_keys, self.best_fitness, self.last_improved, self.member_count
        aux_data = None
        return children, aux_data
    @classmethod
    def tree_unflatten(cls, aux_data, children):
        return cls(*children)
--- a/config/init.py
+++ b/config/init.py
@@ -1 +0,0 @@
 from .config import *
--- a/config/config.py
+++ b/config/config.py
@@ -1,107 +0,0 @@
 from dataclasses import dataclass
 from utils import Act, Agg
@dataclass(frozen=True)
 class BasicConfig:
    seed: int = 42
    fitness_target: float = 1
    generation_limit: int = 1000
    pop_size: int = 100
    def __post_init__(self):
        assert self.pop_size > 0, "the population size must be greater than 0"
@dataclass(frozen=True)
 class NeatConfig:
    network_type: str = "feedforward"
    inputs: int = 2
    outputs: int = 1
    max_nodes: int = 50
    max_conns: int = 100
    max_species: int = 10
    # genome config
    compatibility_disjoint: float = 1
    compatibility_weight: float = 0.5
    conn_add: float = 0.4
    conn_delete: float = 0
    node_add: float = 0.2
    node_delete: float = 0
    # species config
    compatibility_threshold: float = 3.5
    species_elitism: int = 2
    max_stagnation: int = 15
    genome_elitism: int = 2
    survival_threshold: float = 0.2
    min_species_size: int = 1
    spawn_number_change_rate: float = 0.5
    def __post_init__(self):
        assert self.network_type in ["feedforward", "recurrent"], "the network type must be feedforward or recurrent"
        assert self.inputs > 0, "the inputs number of neat must be greater than 0"
        assert self.outputs > 0, "the outputs number of neat must be greater than 0"
        assert self.max_nodes > 0, "the maximum nodes must be greater than 0"
        assert self.max_conns > 0, "the maximum connections must be greater than 0"
        assert self.max_species > 0, "the maximum species must be greater than 0"
        assert self.compatibility_disjoint > 0, "the compatibility disjoint must be greater than 0"
        assert self.compatibility_weight > 0, "the compatibility weight must be greater than 0"
        assert self.conn_add >= 0, "the connection add probability must be greater than 0"
        assert self.conn_delete >= 0, "the connection delete probability must be greater than 0"
        assert self.node_add >= 0, "the node add probability must be greater than 0"
        assert self.node_delete >= 0, "the node delete probability must be greater than 0"
        assert self.compatibility_threshold > 0, "the compatibility threshold must be greater than 0"
        assert self.species_elitism > 0, "the species elitism must be greater than 0"
        assert self.max_stagnation > 0, "the max stagnation must be greater than 0"
        assert self.genome_elitism > 0, "the genome elitism must be greater than 0"
        assert self.survival_threshold > 0, "the survival threshold must be greater than 0"
        assert self.min_species_size > 0, "the min species size must be greater than 0"
        assert self.spawn_number_change_rate > 0, "the spawn number change rate must be greater than 0"
@dataclass(frozen=True)
 class HyperNeatConfig:
    below_threshold: float = 0.2
    max_weight: float = 3
    activation: callable = Act.sigmoid
    aggregation: callable = Agg.sum
    activate_times: int = 5
    inputs: int = 2
    outputs: int = 1
    def __post_init__(self):
        assert self.below_threshold > 0, "the below threshold must be greater than 0"
        assert self.max_weight > 0, "the max weight must be greater than 0"
        assert self.activate_times > 0, "the activate times must be greater than 0"
        assert self.inputs > 0, "the inputs number of hyper neat must be greater than 0"
        assert self.outputs > 0, "the outputs number of hyper neat must be greater than 0"
@dataclass(frozen=True)
 class GeneConfig:
    pass
@dataclass(frozen=True)
 class SubstrateConfig:
    pass
@dataclass(frozen=True)
 class ProblemConfig:
    pass
@dataclass(frozen=True)
 class Config:
    basic: BasicConfig = BasicConfig()
    neat: NeatConfig = NeatConfig()
    hyperneat: HyperNeatConfig = HyperNeatConfig()
    gene: GeneConfig = GeneConfig()
    substrate: SubstrateConfig = SubstrateConfig()
    problem: ProblemConfig = ProblemConfig()
--- a/core/init.py
+++ b/core/init.py
@@ -1,6 +0,0 @@
 from .algorithm import Algorithm
 from .state import State
 from .genome import Genome
 from .gene import Gene
 from .substrate import Substrate
 from .problem import Problem
--- a/core/algorithm.py
+++ b/core/algorithm.py
@@ -1,50 +0,0 @@
 from functools import partial
 import jax
 from .state import State
 from .genome import Genome
 class Algorithm:
    def setup(self, randkey, state: State = State()):
        """initialize the state of the algorithm"""
        raise NotImplementedError
    @partial(jax.jit, static_argnums=(0,))
    def ask(self, state: State):
        """require the population to be evaluated"""
        return self.ask_algorithm(state)
    @partial(jax.jit, static_argnums=(0,))
    def tell(self, state: State, fitness):
        """update the state of the algorithm"""
        return self.tell_algorithm(state, fitness)
    @partial(jax.jit, static_argnums=(0,))
    def transform(self, state: State, genome: Genome):
        """transform the genome into a neural network"""
        return self.forward_transform(state, genome)
    @partial(jax.jit, static_argnums=(0,))
    def act(self, state: State, inputs, genome: Genome):
        return self.forward(state, inputs, genome)
    def forward_transform(self, state: State, genome: Genome):
        raise NotImplementedError
    def forward(self, state: State, inputs, genome: Genome):
        raise NotImplementedError
    def ask_algorithm(self, state: State):
        """ask the specific algorithm for a new population"""
        raise NotImplementedError
    def tell_algorithm(self, state: State, fitness):
        """tell the specific algorithm the fitness of the population"""
        raise NotImplementedError
--- a/core/gene.py
+++ b/core/gene.py
@@ -1,40 +0,0 @@
 from config import GeneConfig
 from .state import State
 class Gene:
    node_attrs = []
    conn_attrs = []
    def __init__(self, config: GeneConfig = GeneConfig()):
        raise NotImplementedError
    def setup(self, state=State()):
        raise NotImplementedError
    def update(self, state):
        raise NotImplementedError
    def new_node_attrs(self, state: State):
        raise NotImplementedError
    def new_conn_attrs(self, state: State):
        raise NotImplementedError
    def mutate_node(self, state: State, randkey, node_attrs):
        raise NotImplementedError
    def mutate_conn(self, state: State, randkey, conn_attrs):
        raise NotImplementedError
    def distance_node(self, state: State, node_attrs1, node_attrs2):
        raise NotImplementedError
    def distance_conn(self, state: State, conn_attrs1, conn_attrs2):
        raise NotImplementedError
    def forward_transform(self, state: State, genome):
        raise NotImplementedError
    def forward(self, state: State, inputs, transform):
        raise NotImplementedError
--- a/core/genome.py
+++ b/core/genome.py
@@ -1,90 +0,0 @@
 from __future__ import annotations
 from jax.tree_util import register_pytree_node_class
 from jax import numpy as jnp
 from utils.tools import fetch_first
@register_pytree_node_class
 class Genome:
    def __init__(self, nodes, conns):
        self.nodes = nodes
        self.conns = conns
    def __repr__(self):
        return f"Genome(nodes={self.nodes}, conns={self.conns})"
    def __getitem__(self, idx):
        return self.__class__(self.nodes[idx], self.conns[idx])
    def __eq__(self, other):
        nodes_eq = jnp.alltrue((self.nodes == other.nodes) | (jnp.isnan(self.nodes) & jnp.isnan(other.nodes)))
        conns_eq = jnp.alltrue((self.conns == other.conns) | (jnp.isnan(self.conns) & jnp.isnan(other.conns)))
        return nodes_eq & conns_eq
    def set(self, idx, value: Genome):
        return self.__class__(self.nodes.at[idx].set(value.nodes), self.conns.at[idx].set(value.conns))
    def update(self, nodes, conns):
        return self.__class__(nodes, conns)
    def update_nodes(self, nodes):
        return self.update(nodes, self.conns)
    def update_conns(self, conns):
        return self.update(self.nodes, conns)
    def count(self):
        """Count how many nodes and connections are in the genome."""
        nodes_cnt = jnp.sum(~jnp.isnan(self.nodes[:, 0]))
        conns_cnt = jnp.sum(~jnp.isnan(self.conns[:, 0]))
        return nodes_cnt, conns_cnt
    def add_node(self, new_key: int, attrs):
        """
        Add a new node to the genome.
        The new node will place at the first NaN row.
        """
        exist_keys = self.nodes[:, 0]
        pos = fetch_first(jnp.isnan(exist_keys))
        new_nodes = self.nodes.at[pos, 0].set(new_key)
        new_nodes = new_nodes.at[pos, 1:].set(attrs)
        return self.update_nodes(new_nodes)
    def delete_node_by_pos(self, pos):
        """
        Delete a node from the genome.
        Delete the node by its pos in nodes.
        """
        nodes = self.nodes.at[pos].set(jnp.nan)
        return self.update_nodes(nodes)
    def add_conn(self, i_key, o_key, enable: bool, attrs):
        """
        Add a new connection to the genome.
        The new connection will place at the first NaN row.
        """
        con_keys = self.conns[:, 0]
        pos = fetch_first(jnp.isnan(con_keys))
        new_conns = self.conns.at[pos, 0:3].set(jnp.array([i_key, o_key, enable]))
        new_conns = new_conns.at[pos, 3:].set(attrs)
        return self.update_conns(new_conns)
    def delete_conn_by_pos(self, pos):
        """
        Delete a connection from the genome.
        Delete the connection by its idx.
        """
        conns = self.conns.at[pos].set(jnp.nan)
        return self.update_conns(conns)
    def tree_flatten(self):
        children = self.nodes, self.conns
        aux_data = None
        return children, aux_data
    @classmethod
    def tree_unflatten(cls, aux_data, children):
        return cls(*children)
--- a/core/problem.py
+++ b/core/problem.py
@@ -1,29 +0,0 @@
 from typing import Callable
 from config import ProblemConfig
 from .state import State
 class Problem:
    jitable = None
    def __init__(self, problem_config: ProblemConfig = ProblemConfig()):
        self.config = problem_config
    def evaluate(self, randkey, state: State, act_func: Callable, params):
        raise NotImplementedError
    @property
    def input_shape(self):
        raise NotImplementedError
    @property
    def output_shape(self):
        raise NotImplementedError
    def show(self, randkey, state: State, act_func: Callable, params, *args, **kwargs):
        """
        show how a genome perform in this problem
        """
        raise NotImplementedError
--- a/core/substrate.py
+++ b/core/substrate.py
@@ -1,8 +0,0 @@
 from config import SubstrateConfig
 class Substrate:
    @staticmethod
    def setup(state, config: SubstrateConfig = SubstrateConfig()):
        return state
--- a/examples/brax/ant.py
+++ b/examples/brax/ant.py
@@ -12,7 +12,7 @@ def example_conf():
        basic=BasicConfig(
            seed=42,
            fitness_target=10000,
-            pop_size=1000
+            pop_size=100
        ),
        neat=NeatConfig(
            inputs=27,
--- a/pipeline.py
+++ b/pipeline.py
@@ -1,7 +1,3 @@
 """
 pipeline for jitable env like func_fit, gymnax
 """
 from functools import partial
 from typing import Type
@@ -16,24 +12,28 @@ from core import State, Algorithm, Problem
 class Pipeline:
-    def __init__(self, config: Config, algorithm: Algorithm, problem_type: Type[Problem]):
+    def __init__(
        self,
        algorithm: Algorithm,
        problem: Problem,
        seed: int = 42,
        fitness_target: float = 1,
        generation_limit: int = 1000,
        pop_size: int = 100,
    ):
        assert problem.jitable, "Currently, problem must be jitable"
        assert problem_type.jitable, "problem must be jitable"
        self.config = config
        self.algorithm = algorithm
-        self.problem = problem_type(config.problem)
+        self.problem = problem
        self.seed = seed
        self.fitness_target = fitness_target
        self.generation_limit = generation_limit
        self.pop_size = pop_size
        print(self.problem.input_shape, self.problem.output_shape)
-        if isinstance(algorithm, NEAT):
+        # TODO: make each algorithm's input_num and output_num
-            assert config.neat.inputs == self.problem.input_shape[-1], f"problem input shape {self.problem.input_shape}"
+        assert algorithm.input_num == self.problem.input_shape[-1], f"problem input shape {self.problem.input_shape}"
        elif isinstance(algorithm, HyperNEAT):
            assert config.hyperneat.inputs == self.problem.input_shape[-1], f"problem input shape {self.problem.input_shape}"
        else:
            raise NotImplementedError
        self.act_func = self.algorithm.act
@@ -45,19 +45,19 @@ class Pipeline:
        self.generation_timestamp = None
    def setup(self):
-        key = jax.random.PRNGKey(self.config.basic.seed)
+        key = jax.random.PRNGKey(self.seed)
        algorithm_key, evaluate_key = jax.random.split(key, 2)
-        state = State()
+
-        state = self.algorithm.setup(algorithm_key, state)
+        # TODO: Problem should has setup function to maintain state
-        return state.update(
+        return State(
-            evaluate_key=evaluate_key
+            alg=self.algorithm.setup(algorithm_key),
            pro=self.problem.setup(evaluate_key),
        )
    @partial(jax.jit, static_argnums=(0,))
    def step(self, state):
        key, sub_key = jax.random.split(state.evaluate_key)
-        keys = jax.random.split(key, self.config.basic.pop_size)
+        keys = jax.random.split(key, self.pop_size)
        pop = self.algorithm.ask(state)
@@ -72,7 +72,7 @@ class Pipeline:
    def auto_run(self, ini_state):
        state = ini_state
-        for _ in range(self.config.basic.generation_limit):
+        for _ in range(self.generation_limit):
            self.generation_timestamp = time.time()
@@ -84,7 +84,7 @@ class Pipeline:
            self.analysis(state, previous_pop, fitnesses)
-            if max(fitnesses) >= self.config.basic.fitness_target:
+            if max(fitnesses) >= self.fitness_target:
                print("Fitness limit reached!")
                return state, self.best_genome
@@ -120,3 +120,4 @@ class Pipeline:
        print("start compile")
        self.step.lower(self, state).compile()
        print(f"compile finished, cost time: {time.time() - tic}s")
--- a/problem/init.py
+++ b/problem/init.py
@@ -0,0 +1 @@
 from .base import BaseProblem
--- a/problem/base.py
+++ b/problem/base.py
@@ -0,0 +1,44 @@
 from typing import Callable
 from config import ProblemConfig
 from core.state import State
 class BaseProblem:
    jitable = None
    def __init__(self):
        pass
    def setup(self, randkey, state: State = State()):
        """initialize the state of the problem"""
        raise NotImplementedError
    def evaluate(self, randkey, state: State, act_func: Callable, params):
        """evaluate one individual"""
        raise NotImplementedError
    @property
    def input_shape(self):
        """
        The input shape for the problem to evaluate
        In RL problem, it is the observation space
        In function fitting problem, it is the input shape of the function
        """
        raise NotImplementedError
    @property
    def output_shape(self):
        """
        The output shape for the problem to evaluate
        In RL problem, it is the action space
        In function fitting problem, it is the output shape of the function
        """
        raise NotImplementedError
    def show(self, randkey, state: State, act_func: Callable, params, *args, **kwargs):
        """
        show how a genome perform in this problem
        """
        raise NotImplementedError
--- a/problem/func_fit/init.py
+++ b/problem/func_fit/init.py
@@ -1,3 +1,3 @@
-from .func_fit import FuncFit, FuncFitConfig
+from .func_fit import FuncFit
 from .xor import XOR
 from .xor3d import XOR3d
--- a/problem/func_fit/func_fit.py
+++ b/problem/func_fit/func_fit.py
@@ -1,42 +1,35 @@
 from typing import Callable
 from dataclasses import dataclass
 import jax
 import jax.numpy as jnp
 from config import ProblemConfig
 from core import Problem, State
 from .. import BaseProblem
-@dataclass(frozen=True)
+class FuncFit(BaseProblem):
 class FuncFitConfig(ProblemConfig):
    error_method: str = 'mse'
    def __post_init__(self):
        assert self.error_method in {'mse', 'rmse', 'mae', 'mape'}
 class FuncFit(Problem):
    jitable = True
-    def __init__(self, config: FuncFitConfig = FuncFitConfig()):
+    def __init__(self,
-        self.config = config
+        error_method: str = 'mse'
-        super().__init__(config)
+    ):
        super().__init__()
-    def evaluate(self, randkey, state: State, act_func: Callable, params):
+        assert error_method in {'mse', 'rmse', 'mae', 'mape'}
        self.error_method = error_method
    def evaluate(self, randkey, state, act_func, params):
        predict = act_func(state, self.inputs, params)
-        if self.config.error_method == 'mse':
+        if self.error_method == 'mse':
            loss = jnp.mean((predict - self.targets) ** 2)
-        elif self.config.error_method == 'rmse':
+        elif self.error_method == 'rmse':
            loss = jnp.sqrt(jnp.mean((predict - self.targets) ** 2))
-        elif self.config.error_method == 'mae':
+        elif self.error_method == 'mae':
            loss = jnp.mean(jnp.abs(predict - self.targets))
-        elif self.config.error_method == 'mape':
+        elif self.error_method == 'mape':
            loss = jnp.mean(jnp.abs((predict - self.targets) / self.targets))
        else:
@@ -44,7 +37,7 @@ class FuncFit(Problem):
        return -loss
-    def show(self, randkey, state: State, act_func: Callable, params, *args, **kwargs):
+    def show(self, randkey, state, act_func, params, *args, **kwargs):
        predict = act_func(state, self.inputs, params)
        inputs, target, predict = jax.device_get([self.inputs, self.targets, predict])
        loss = -self.evaluate(randkey, state, act_func, params)
--- a/problem/func_fit/xor.py
+++ b/problem/func_fit/xor.py
@@ -1,13 +1,12 @@
 import numpy as np
-from .func_fit import FuncFit, FuncFitConfig
+from .func_fit import FuncFit
 class XOR(FuncFit):
-    def __init__(self, config: FuncFitConfig = FuncFitConfig()):
+    def __init__(self, error_method: str = 'mse'):
-        self.config = config
+        super().__init__(error_method)
        super().__init__(config)
    @property
    def inputs(self):
--- a/problem/func_fit/xor3d.py
+++ b/problem/func_fit/xor3d.py
@@ -1,13 +1,12 @@
 import numpy as np
-from .func_fit import FuncFit, FuncFitConfig
+from .func_fit import FuncFit
 class XOR3d(FuncFit):
-    def __init__(self, config: FuncFitConfig = FuncFitConfig()):
+    def __init__(self, error_method: str = 'mse'):
-        self.config = config
+        super().__init__(error_method)
        super().__init__(config)
    @property
    def inputs(self):
@@ -37,8 +36,8 @@ class XOR3d(FuncFit):
    @property
    def input_shape(self):
-        return (8, 3)
+        return 8, 3
    @property
    def output_shape(self):
-        return (8, 1)
+        return 8, 1
--- a/problem/rl_env/brax_env.py
+++ b/problem/rl_env/brax_env.py
@@ -1,28 +1,13 @@
 from dataclasses import dataclass
 from typing import Callable
 import jax.numpy as jnp
 from brax import envs
 from core import State
 from .rl_jit import RLEnv, RLEnvConfig
-
+from .rl_jit import RLEnv
@dataclass(frozen=True)
 class BraxConfig(RLEnvConfig):
    env_name: str = "ant"
    backend: str = "generalized"
    def __post_init__(self):
        # TODO: Check if env_name is registered
        # assert self.env_name in gymnax.registered_envs, f"Env {self.env_name} not registered"
        pass
 class BraxEnv(RLEnv):
-    def __init__(self, config: BraxConfig = BraxConfig()):
+    def __init__(self, env_name: str = "ant", backend: str = "generalized"):
-        super().__init__(config)
+        super().__init__()
-        self.config = config
+        self.env = envs.create(env_name=env_name, backend=backend)
        self.env = envs.create(env_name=config.env_name, backend=config.backend)
    def env_step(self, randkey, env_state, action):
        state = self.env.step(env_state, action)
@@ -40,9 +25,7 @@ class BraxEnv(RLEnv):
    def output_shape(self):
        return (self.env.action_size,)
-    def show(self, randkey, state: State, act_func: Callable, params, save_path=None, height=512, width=512,
+    def show(self, randkey, state, act_func, params, save_path=None, height=512, width=512, duration=0.1, *args, **kwargs):
             duration=0.1, *args,
             **kwargs):
        import jax
        import imageio
@@ -56,8 +39,7 @@ class BraxEnv(RLEnv):
        def step(key, env_state, obs):
            key, _ = jax.random.split(key)
-            net_out = act_func(state, obs, params)
+            action = act_func(state, obs, params)
            action = self.config.output_transform(net_out)
            obs, env_state, r, done, _ = self.step(randkey, env_state, action)
            return key, env_state, obs, r, done
@@ -72,7 +54,6 @@ class BraxEnv(RLEnv):
        def create_gif(image_list, gif_name, duration):
            with imageio.get_writer(gif_name, mode='I', duration=duration) as writer:
                for image in image_list:
                    # 确保图像的数据类型正确
                    formatted_image = np.array(image, dtype=np.uint8)
                    writer.append_data(formatted_image)
--- a/problem/rl_env/gymnax_env.py
+++ b/problem/rl_env/gymnax_env.py
@@ -1,26 +1,15 @@
 from dataclasses import dataclass
 from typing import Callable
 import gymnax
-from core import State
+from .rl_jit import RLEnv
 from .rl_jit import RLEnv, RLEnvConfig
@dataclass(frozen=True)
 class GymNaxConfig(RLEnvConfig):
    env_name: str = "CartPole-v1"
    def __post_init__(self):
        assert self.env_name in gymnax.registered_envs, f"Env {self.env_name} not registered"
 class GymNaxEnv(RLEnv):
-    def __init__(self, config: GymNaxConfig = GymNaxConfig()):
+    def __init__(self, env_name):
-        super().__init__(config)
+        super().__init__()
-        self.config = config
+        assert env_name in gymnax.registered_envs, f"Env {env_name} not registered"
-        self.env, self.env_params = gymnax.make(config.env_name)
+        self.env, self.env_params = gymnax.make(env_name)
    def env_step(self, randkey, env_state, action):
        return self.env.step(randkey, env_state, action, self.env_params)
@@ -36,5 +25,5 @@ class GymNaxEnv(RLEnv):
    def output_shape(self):
        return self.env.action_space(self.env_params).shape
-    def show(self, randkey, state: State, act_func: Callable, params):
+    def show(self, randkey, state, act_func, params, *args, **kwargs):
        raise NotImplementedError("GymNax render must rely on gym 0.19.0(old version).")
--- a/problem/rl_env/rl_jit.py
+++ b/problem/rl_env/rl_jit.py
@@ -1,28 +1,18 @@
 from dataclasses import dataclass
 from typing import Callable
 from functools import partial
 import jax
-from config import ProblemConfig
+from .. import BaseProblem
-from core import Problem, State
+class RLEnv(BaseProblem):
@dataclass(frozen=True)
 class RLEnvConfig(ProblemConfig):
    output_transform: Callable = lambda x: x
 class RLEnv(Problem):
    jitable = True
-    def __init__(self, config: RLEnvConfig = RLEnvConfig()):
+    # TODO: move output transform to algorithm
-        super().__init__(config)
+    def __init__(self):
-        self.config = config
+        super().__init__()
-    def evaluate(self, randkey, state: State, act_func: Callable, params):
+    def evaluate(self, randkey, state, act_func, params):
        rng_reset, rng_episode = jax.random.split(randkey)
        init_obs, init_env_state = self.reset(rng_reset)
@@ -31,8 +21,7 @@ class RLEnv(Problem):
            return ~done
        def body_func(carry):
            obs, env_state, rng, _, tr = carry  # total reward
-            net_out = act_func(state, obs, params)
+            action = act_func(state, obs, params)
            action = self.config.output_transform(net_out)
            next_obs, next_env_state, reward, done, _ = self.step(rng, env_state, action)
            next_rng, _ = jax.random.split(rng)
            return next_obs, next_env_state, next_rng, done, tr + reward
@@ -67,5 +56,5 @@ class RLEnv(Problem):
    def output_shape(self):
        raise NotImplementedError
-    def show(self, randkey, state: State, act_func: Callable, params, *args, **kwargs):
+    def show(self, randkey, state, act_func, params, *args, **kwargs):
        raise NotImplementedError
--- a/t.py
+++ b/t.py
@@ -0,0 +1,64 @@
 from algorithm.neat import *
 from utils import Act, Agg
 import jax, jax.numpy as jnp
 def main():
    # index, bias, response, activation, aggregation
    nodes = jnp.array([
        [0, 0, 1, 0, 0], # in[0]
        [1, 0, 1, 0, 0], # in[1]
        [2, 0.5, 1, 0, 0],  # out[0],
        [3, 1, 1, 0, 0],  # hidden[0],
        [4, -1, 1, 0, 0],  # hidden[1],
    ])
    # in_node, out_node, enable, weight
    conns = jnp.array([
        [0, 3, 1, 0.5], # in[0] -> hidden[0]
        [1, 4, 1, 0.5], # in[1] -> hidden[1]
        [3, 2, 1, 0.5], # hidden[0] -> out[0]
        [4, 2, 1, 0.5], # hidden[1] -> out[0]
    ])
    genome = RecurrentGenome(
        num_inputs=2,
        num_outputs=1,
        node_gene=DefaultNodeGene(
            activation_default=Act.identity,
            activation_options=(Act.identity, ),
            aggregation_default=Agg.sum,
            aggregation_options=(Agg.sum, ),
        ),
        activate_time=3
    )
    transformed = genome.transform(nodes, conns)
    print(*transformed, sep='\n')
    inputs = jnp.array([0, 0])
    outputs = genome.forward(inputs, transformed)
    print(outputs)
    inputs = jnp.array([[0, 0],[0, 1], [1, 0], [1, 1]])
    outputs = jax.jit(jax.vmap(genome.forward, in_axes=(0, None)))(inputs, transformed)
    print(outputs)
    expected: [[0.5], [0.75], [0.75], [1]]
    print('\n-------------------------------------------------------\n')
    conns = conns.at[0, 2].set(False)  # disable in[0] -> hidden[0]
    print(conns)
    transformed = genome.transform(nodes, conns)
    print(*transformed, sep='\n')
    inputs = jnp.array([[0, 0],[0, 1], [1, 0], [1, 1]])
    outputs = jax.vmap(genome.forward, in_axes=(0, None))(inputs, transformed)
    print(outputs)
    expected: [[0.5], [0.75], [0.5], [0.75]]
 if __name__ == '__main__':
    main()
--- a/test/init.py
+++ b/test/init.py
--- a/test/test_genome.py
+++ b/test/test_genome.py
@@ -0,0 +1,113 @@
 from algorithm.neat import *
 from utils import Act, Agg
 import jax, jax.numpy as jnp
 def test_default():
    # index, bias, response, activation, aggregation
    nodes = jnp.array([
        [0, 0, 1, 0, 0], # in[0]
        [1, 0, 1, 0, 0], # in[1]
        [2, 0.5, 1, 0, 0],  # out[0],
        [3, 1, 1, 0, 0],  # hidden[0],
        [4, -1, 1, 0, 0],  # hidden[1],
    ])
    # in_node, out_node, enable, weight
    conns = jnp.array([
        [0, 3, 1, 0.5], # in[0] -> hidden[0]
        [1, 4, 1, 0.5], # in[1] -> hidden[1]
        [3, 2, 1, 0.5], # hidden[0] -> out[0]
        [4, 2, 1, 0.5], # hidden[1] -> out[0]
    ])
    genome = DefaultGenome(
        num_inputs=2,
        num_outputs=1,
        node_gene=DefaultNodeGene(
            activation_default=Act.identity,
            activation_options=(Act.identity, ),
            aggregation_default=Agg.sum,
            aggregation_options=(Agg.sum, ),
        ),
    )
    transformed = genome.transform(nodes, conns)
    print(*transformed, sep='\n')
    inputs = jnp.array([[0, 0],[0, 1], [1, 0], [1, 1]])
    outputs = jax.jit(jax.vmap(genome.forward, in_axes=(0, None)))(inputs, transformed)
    print(outputs)
    assert jnp.allclose(outputs, jnp.array([[0.5], [0.75], [0.75], [1]]))
    # expected: [[0.5], [0.75], [0.75], [1]]
    print('\n-------------------------------------------------------\n')
    conns = conns.at[0, 2].set(False)  # disable in[0] -> hidden[0]
    print(conns)
    transformed = genome.transform(nodes, conns)
    print(*transformed, sep='\n')
    inputs = jnp.array([[0, 0],[0, 1], [1, 0], [1, 1]])
    outputs = jax.vmap(genome.forward, in_axes=(0, None))(inputs, transformed)
    print(outputs)
    assert jnp.allclose(outputs, jnp.array([[0], [0.25], [0], [0.25]]))
    # expected: [[0.5], [0.75], [0.5], [0.75]]
 def test_recurrent():
    # index, bias, response, activation, aggregation
    nodes = jnp.array([
        [0, 0, 1, 0, 0], # in[0]
        [1, 0, 1, 0, 0], # in[1]
        [2, 0.5, 1, 0, 0],  # out[0],
        [3, 1, 1, 0, 0],  # hidden[0],
        [4, -1, 1, 0, 0],  # hidden[1],
    ])
    # in_node, out_node, enable, weight
    conns = jnp.array([
        [0, 3, 1, 0.5], # in[0] -> hidden[0]
        [1, 4, 1, 0.5], # in[1] -> hidden[1]
        [3, 2, 1, 0.5], # hidden[0] -> out[0]
        [4, 2, 1, 0.5], # hidden[1] -> out[0]
    ])
    genome = RecurrentGenome(
        num_inputs=2,
        num_outputs=1,
        node_gene=DefaultNodeGene(
            activation_default=Act.identity,
            activation_options=(Act.identity, ),
            aggregation_default=Agg.sum,
            aggregation_options=(Agg.sum, ),
        ),
        activate_time=3,
    )
    transformed = genome.transform(nodes, conns)
    print(*transformed, sep='\n')
    inputs = jnp.array([[0, 0],[0, 1], [1, 0], [1, 1]])
    outputs = jax.jit(jax.vmap(genome.forward, in_axes=(0, None)))(inputs, transformed)
    print(outputs)
    assert jnp.allclose(outputs, jnp.array([[0.5], [0.75], [0.75], [1]]))
    # expected: [[0.5], [0.75], [0.75], [1]]
    print('\n-------------------------------------------------------\n')
    conns = conns.at[0, 2].set(False)  # disable in[0] -> hidden[0]
    print(conns)
    transformed = genome.transform(nodes, conns)
    print(*transformed, sep='\n')
    inputs = jnp.array([[0, 0],[0, 1], [1, 0], [1, 1]])
    outputs = jax.vmap(genome.forward, in_axes=(0, None))(inputs, transformed)
    print(outputs)
    assert jnp.allclose(outputs, jnp.array([[0], [0.25], [0], [0.25]]))
    # expected: [[0.5], [0.75], [0.5], [0.75]]
--- a/utils/init.py
+++ b/utils/init.py
@@ -2,3 +2,4 @@ from .activation import Act, act
 from .aggregation import Agg, agg
 from .tools import *
 from .graph import *
 from .state import State
--- a/utils/aggregation.py
+++ b/utils/aggregation.py
@@ -57,10 +57,8 @@ def agg(idx, z, agg_funcs):
    """
    idx = jnp.asarray(idx, dtype=jnp.int32)
-    def all_nan():
+    return jax.lax.cond(
-        return 0.
+        jnp.all(jnp.isnan(z)),
-
+        lambda: jnp.nan,  # all inputs are nan
-    def not_all_nan():
+        lambda: jax.lax.switch(idx, agg_funcs, z)  # otherwise
-        return jax.lax.switch(idx, agg_funcs, z)
+    )
    return jax.lax.cond(jnp.all(jnp.isnan(z)), all_nan, not_all_nan)
--- a/utils/state.py
+++ b/utils/state.py
--- a/utils/tools.py
+++ b/utils/tools.py
@@ -5,13 +5,11 @@ import jax
 from jax import numpy as jnp, Array, jit, vmap
 I_INT = np.iinfo(jnp.int32).max  # infinite int
 EMPTY_NODE = np.full((1, 5), jnp.nan)
 EMPTY_CON = np.full((1, 4), jnp.nan)
 def unflatten_conns(nodes, conns):
    """
-    transform the (C, CL) connections to (CL-2, N, N)
+    transform the (C, CL) connections to (CL-2, N, N), 2 is for the input index and output index)
    :return:
    """
    N = nodes.shape[0]
@@ -67,3 +65,42 @@ def rank_elements(array, reverse=False):
    if not reverse:
        array = -array
    return jnp.argsort(jnp.argsort(array))
@jit
 def mutate_float(key, val, init_mean, init_std, mutate_power, mutate_rate, replace_rate):
    k1, k2, k3 = jax.random.split(key, num=3)
    noise = jax.random.normal(k1, ()) * mutate_power
    replace = jax.random.normal(k2, ()) * init_std + init_mean
    r = jax.random.uniform(k3, ())
    val = jnp.where(
        r < mutate_rate,
        val + noise,
        jnp.where(
            (mutate_rate < r) & (r < mutate_rate + replace_rate),
            replace,
            val
        )
    )
    return val
@jit
 def mutate_int(key, val, options, replace_rate):
    k1, k2 = jax.random.split(key, num=2)
    r = jax.random.uniform(k1, ())
    val = jnp.where(
        r < replace_rate,
        jax.random.choice(k2, options),
        val
    )
    return val
 def argmin_with_mask(arr, mask):
    masked_arr = jnp.where(mask, arr, jnp.inf)
    min_idx = jnp.argmin(masked_arr)
    return min_idx
		`@@ -1,2 +0,0 @@`
			`from .hyperneat import HyperNEAT`
			`from .substrate import NormalSubstrate, NormalSubstrateConfig`
		`@@ -1,2 +0,0 @@`
			`from .normal import NormalSubstrate, NormalSubstrateConfig`
			`from .tools import analysis_substrate`
		`@@ -0,0 +1,2 @@`
							`from .base import BaseCrossover`
							`from .default import DefaultCrossover`
		`@@ -0,0 +1,2 @@`
							`from .base import BaseMutation`
							`from .default import DefaultMutation`
		`@@ -0,0 +1,2 @@`
							`from .base import BaseConnGene`
							`from .default import DefaultConnGene`
		`@@ -0,0 +1,2 @@`
							`from .base import BaseNodeGene`
							`from .default import DefaultNodeGene`
`@@ -1,2 +1,2 @@`
	`from .species_info import SpeciesInfo`	`from .base import BaseSpecies`
	`from .operations import update_species, speciate`	`from .default import DefaultSpecies`