update hyperneat and related examples

2024-07-11 15:08:02 +08:00
parent 9bad577d89
commit 3cb5fbf581
7 changed files with 102 additions and 136 deletions
--- a/examples/brax/walker.py
+++ b/examples/brax/walker.py
@@ -1,60 +0,0 @@
 from pipeline import Pipeline
 from algorithm.neat import *
 from problem.rl_env import BraxEnv
 from tensorneat.common import Act
 import jax, jax.numpy as jnp
 def split_right_left(randkey, forward_func, obs):
    right_obs_keys = jnp.array([2, 3, 4, 11, 12, 13])
    left_obs_keys = jnp.array([5, 6, 7, 14, 15, 16])
    right_action_keys = jnp.array([0, 1, 2])
    left_action_keys = jnp.array([3, 4, 5])
    right_foot_obs = obs
    left_foot_obs = obs
    left_foot_obs = left_foot_obs.at[right_obs_keys].set(obs[left_obs_keys])
    left_foot_obs = left_foot_obs.at[left_obs_keys].set(obs[right_obs_keys])
    right_action, left_action = jax.vmap(forward_func)(jnp.stack([right_foot_obs, left_foot_obs]))
    # print(right_action.shape)
    # print(left_action.shape)
    return jnp.concatenate([right_action, left_action])
 if __name__ == "__main__":
    pipeline = Pipeline(
        algorithm=NEAT(
            species=DefaultSpecies(
                genome=DefaultGenome(
                    num_inputs=17,
                    num_outputs=3,
                    max_nodes=50,
                    max_conns=100,
                    node_gene=DefaultNodeGene(
                        activation_options=(Act.tanh,),
                        activation_default=Act.tanh,
                    ),
                    output_transform=Act.tanh,
                ),
                pop_size=1000,
                species_size=10,
            ),
        ),
        problem=BraxEnv(
            env_name="walker2d",
            max_step=1000,
            action_policy=split_right_left
        ),
        generation_limit=10000,
        fitness_target=5000,
    )
    # initialize state
    state = pipeline.setup()
    # print(state)
    # run until terminate
    state, best = pipeline.auto_run(state)
--- a/examples/brax/walker2d.py
+++ b/examples/brax/walker2d.py
@@ -0,0 +1,51 @@
 from tensorneat.pipeline import Pipeline
 from tensorneat.algorithm.neat import NEAT
 from tensorneat.genome import DefaultGenome, BiasNode
 from tensorneat.problem.rl_env import BraxEnv
 from tensorneat.common import Act, Agg
 import jax, jax.numpy as jnp
 def random_sample_policy(randkey, obs):
    return jax.random.uniform(randkey, (6,))
 if __name__ == "__main__":
    pipeline = Pipeline(
        algorithm=NEAT(
            pop_size=1000,
            species_size=20,
            survival_threshold=0.1,
            compatibility_threshold=1.0,
            genome=DefaultGenome(
                max_nodes=100,
                max_conns=200,
                num_inputs=17,
                num_outputs=6,
                init_hidden_layers=(),
                node_gene=BiasNode(
                    activation_options=Act.tanh,
                    aggregation_options=Agg.sum,
                ),
                output_transform=Act.standard_tanh,
            ),
        ),
        problem=BraxEnv(
            env_name="walker2d",
            max_step=1000,
            obs_normalization=True,
            sample_episodes=1000,
            sample_policy=random_sample_policy,
        ),
        seed=42,
        generation_limit=100,
        fitness_target=5000,
    )
    # initialize state
    state = pipeline.setup()
    # print(state)
    # run until terminate
    state, best = pipeline.auto_run(state)
--- a/examples/func_fit/xor_hyperneat.py
+++ b/examples/func_fit/xor_hyperneat.py
@@ -1,53 +1,33 @@
-from pipeline import Pipeline
+from tensorneat.pipeline import Pipeline
-from algorithm.neat import *
+from tensorneat.algorithm.neat import NEAT
-from algorithm.hyperneat import *
+from tensorneat.algorithm.hyperneat import HyperNEAT, FullSubstrate
 from tensorneat.genome import DefaultGenome
 from tensorneat.common import Act
-from problem.func_fit import XOR3d
+from tensorneat.problem.func_fit import XOR3d
 if __name__ == "__main__":
    pipeline = Pipeline(
        algorithm=HyperNEAT(
            substrate=FullSubstrate(
-                input_coors=[(-1, -1), (0.333, -1), (-0.333, -1), (1, -1)],  # 3(XOR3d inputs) + 1(bias)
+                input_coors=((-1, -1), (-0.33, -1), (0.33, -1), (1, -1)),
-                hidden_coors=[
+                hidden_coors=((-1, 0), (0, 0), (1, 0)),
-                    (-1, -0.5), (0.333, -0.5), (-0.333, -0.5),
+                output_coors=((0, 1),),
                    (1, -0.5),
                    (-1, 0),
                    (0.333, 0),
                    (-0.333, 0),
                    (1, 0),
                    (-1, 0.5),
                    (0.333, 0.5),
                    (-0.333, 0.5),
                    (1, 0.5),
                ],
                output_coors=[
                    (0, 1),  # one output
                ],
            ),
            neat=NEAT(
-                species=DefaultSpecies(
+                pop_size=10000,
-                    genome=DefaultGenome(
+                species_size=20,
-                        num_inputs=4,  # [*coor1, *coor2]
+                survival_threshold=0.01,
-                        num_outputs=1,  # the weight of connection between two coor1 and coor2
+                genome=DefaultGenome(
-                        max_nodes=50,
+                    num_inputs=4,  # size of query coors
-                        max_conns=100,
+                    num_outputs=1,
-                        node_gene=DefaultNodeGene(
+                    init_hidden_layers=(),
-                            activation_default=Act.tanh,
+                    output_transform=Act.standard_tanh,
                            activation_options=(Act.tanh,),
                        ),
                        output_transform=Act.tanh,  # the activation function for output node in NEAT
                    ),
                    pop_size=1000,
                    species_size=10,
                    compatibility_threshold=2,
                    survival_threshold=0.03,
                ),
            ),
            activation=Act.tanh,
            activate_time=10,
-            output_transform=Act.sigmoid,  # the activation function for output node in HyperNEAT
+            output_transform=Act.standard_sigmoid,
        ),
        problem=XOR3d(),
        generation_limit=300,
--- a/tensorneat/algorithm/init.py
+++ b/tensorneat/algorithm/init.py
@@ -1,2 +1,3 @@
 from .base import BaseAlgorithm
 from .neat import NEAT
 from .hyperneat import HyperNEAT
--- a/tensorneat/algorithm/hyperneat/hyperneat.py
+++ b/tensorneat/algorithm/hyperneat/hyperneat.py
@@ -1,12 +1,12 @@
 from typing import Callable
-import jax, jax.numpy as jnp
+import jax
 from jax import vmap, numpy as jnp
 from tensorneat.common import State, Act, Agg
 from .. import BaseAlgorithm, NEAT
 from ..neat.gene import BaseNodeGene, BaseConnGene
 from ..neat.genome import RecurrentGenome
 from .substrate import *
 from tensorneat.common import State, Act, Agg
 from tensorneat.algorithm import BaseAlgorithm, NEAT
 from tensorneat.genome import BaseNode, BaseConn, RecurrentGenome
 class HyperNEAT(BaseAlgorithm):
@@ -14,64 +14,65 @@ class HyperNEAT(BaseAlgorithm):
        self,
        substrate: BaseSubstrate,
        neat: NEAT,
-        below_threshold: float = 0.3,
+        weight_threshold: float = 0.3,
        max_weight: float = 5.0,
-        aggregation=Agg.sum,
+        aggregation: Callable = Agg.sum,
-        activation=Act.sigmoid,
+        activation: Callable = Act.sigmoid,
        activate_time: int = 10,
-        output_transform: Callable = Act.sigmoid,
+        output_transform: Callable = Act.standard_sigmoid,
    ):
        assert (
            substrate.query_coors.shape[1] == neat.num_inputs
-        ), "Substrate input size should be equal to NEAT input size"
+        ), "Query coors of Substrate should be equal to NEAT input size"
-
+        
        self.substrate = substrate
        self.neat = neat
-        self.below_threshold = below_threshold
+        self.weight_threshold = weight_threshold
        self.max_weight = max_weight
        self.hyper_genome = RecurrentGenome(
            num_inputs=substrate.num_inputs,
            num_outputs=substrate.num_outputs,
            max_nodes=substrate.nodes_cnt,
            max_conns=substrate.conns_cnt,
-            node_gene=HyperNodeGene(aggregation, activation),
+            node_gene=HyperNEATNode(aggregation, activation),
-            conn_gene=HyperNEATConnGene(),
+            conn_gene=HyperNEATConn(),
            activate_time=activate_time,
            output_transform=output_transform,
        )
        self.pop_size = neat.pop_size
    def setup(self, state=State()):
        state = self.neat.setup(state)
        state = self.substrate.setup(state)
        return self.hyper_genome.setup(state)
-    def ask(self, state: State):
+    def ask(self, state):
        return self.neat.ask(state)
-    def tell(self, state: State, fitness):
+    def tell(self, state, fitness):
        state = self.neat.tell(state, fitness)
        return state
    def transform(self, state, individual):
        transformed = self.neat.transform(state, individual)
-        query_res = jax.vmap(self.neat.forward, in_axes=(None, None, 0))(
+        query_res = vmap(self.neat.forward, in_axes=(None, None, 0))(
            state, transformed, self.substrate.query_coors
        )
-        # mute the connection with weight below threshold
+        # mute the connection with weight weight threshold
        query_res = jnp.where(
-            (-self.below_threshold < query_res) & (query_res < self.below_threshold),
+            (-self.weight_threshold < query_res) & (query_res < self.weight_threshold),
            0.0,
            query_res,
        )
        # make query res in range [-max_weight, max_weight]
        query_res = jnp.where(
-            query_res > 0, query_res - self.below_threshold, query_res
+            query_res > 0, query_res - self.weight_threshold, query_res
        )
        query_res = jnp.where(
-            query_res < 0, query_res + self.below_threshold, query_res
+            query_res < 0, query_res + self.weight_threshold, query_res
        )
-        query_res = query_res / (1 - self.below_threshold) * self.max_weight
+        query_res = query_res / (1 - self.weight_threshold) * self.max_weight
        h_nodes, h_conns = self.substrate.make_nodes(
            query_res
@@ -79,11 +80,11 @@ class HyperNEAT(BaseAlgorithm):
        return self.hyper_genome.transform(state, h_nodes, h_conns)
-    def forward(self, state, inputs, transformed):
+    def forward(self, state, transformed, inputs):
        # add bias
        inputs_with_bias = jnp.concatenate([inputs, jnp.array([1])])
-        res = self.hyper_genome.forward(state, inputs_with_bias, transformed)
+        res = self.hyper_genome.forward(state, transformed, inputs_with_bias)
        return res
    @property
@@ -94,18 +95,11 @@ class HyperNEAT(BaseAlgorithm):
    def num_outputs(self):
        return self.substrate.num_outputs
-    @property
+    def show_details(self, state, fitness):
-    def pop_size(self):
+        return self.neat.show_details(state, fitness)
        return self.neat.pop_size
    def member_count(self, state: State):
        return self.neat.member_count(state)
    def generation(self, state: State):
        return self.neat.generation(state)
-class HyperNodeGene(BaseNodeGene):
+class HyperNEATNode(BaseNode):
    def __init__(
        self,
        aggregation=Agg.sum,
@@ -123,7 +117,7 @@ class HyperNodeGene(BaseNodeGene):
        )
-class HyperNEATConnGene(BaseConnGene):
+class HyperNEATConn(BaseConn):
    custom_attrs = ["weight"]
    def forward(self, state, attrs, inputs):
--- a/tensorneat/genome/operations/mutation/default.py
+++ b/tensorneat/genome/operations/mutation/default.py
@@ -23,10 +23,10 @@ from ...utils import (
 class DefaultMutation(BaseMutation):
    def __init__(
        self,
-        conn_add: float = 0.1,
+        conn_add: float = 0.2,
-        conn_delete: float = 0,
+        conn_delete: float = 0.2,
        node_add: float = 0.1,
-        node_delete: float = 0,
+        node_delete: float = 0.1,
    ):
        self.conn_add = conn_add
        self.conn_delete = conn_delete
--- a/tensorneat/pipeline.py
+++ b/tensorneat/pipeline.py
@@ -34,7 +34,7 @@ class Pipeline(StatefulBaseClass):
        self.generation_limit = generation_limit
        self.pop_size = self.algorithm.pop_size
-        # print(self.problem.input_shape, self.problem.output_shape)
+        np.random.seed(self.seed)
        # TODO: make each algorithm's input_num and output_num
        assert (