modify genome for the official release

2024-07-10 11:24:11 +08:00
parent 075460f896
commit ee8ec84202
83 changed files with 588 additions and 611 deletions
--- a/examples/gymnax/arcbot.py
+++ b/examples/gymnax/arcbot.py
@@ -0,0 +1,36 @@
+import jax.numpy as jnp
+
+from pipeline import Pipeline
+from algorithm.neat import *
+
+from problem.rl_env import GymNaxEnv
+
+if __name__ == "__main__":
+    pipeline = Pipeline(
+        algorithm=NEAT(
+            species=DefaultSpecies(
+                genome=DefaultGenome(
+                    num_inputs=6,
+                    num_outputs=3,
+                    max_nodes=50,
+                    max_conns=100,
+                    output_transform=lambda out: jnp.argmax(
+                        out
+                    ),  # the action of acrobot is {0, 1, 2}
+                ),
+                pop_size=10000,
+                species_size=10,
+            ),
+        ),
+        problem=GymNaxEnv(
+            env_name="Acrobot-v1",
+        ),
+        generation_limit=10000,
+        fitness_target=-62,
+    )
+
+    # initialize state
+    state = pipeline.setup()
+    # print(state)
+    # run until termination
+    state, best = pipeline.auto_run(state)
--- a/examples/gymnax/cartpole.py
+++ b/examples/gymnax/cartpole.py
@@ -0,0 +1,41 @@
+import jax.numpy as jnp
+
+from pipeline import Pipeline
+from algorithm.neat import *
+
+from problem.rl_env import GymNaxEnv
+
+
+def action_policy(randkey, forward_func, obs):
+    return jnp.argmax(forward_func(obs))
+
+
+if __name__ == "__main__":
+    pipeline = Pipeline(
+        algorithm=NEAT(
+            species=DefaultSpecies(
+                genome=DefaultGenome(
+                    num_inputs=4,
+                    num_outputs=2,
+                    max_nodes=50,
+                    max_conns=100,
+                    # output_transform=lambda out: jnp.argmax(
+                    #     out
+                    # ),  # the action of cartpole is {0, 1}
+                ),
+                pop_size=10000,
+                species_size=10,
+            ),
+        ),
+        problem=GymNaxEnv(
+            env_name="CartPole-v1", repeat_times=5, action_policy=action_policy
+        ),
+        generation_limit=10000,
+        fitness_target=500,
+    )
+
+    # initialize state
+    state = pipeline.setup()
+    # print(state)
+    # run until termination
+    state, best = pipeline.auto_run(state)
--- a/examples/gymnax/cartpole_hyperneat.py
+++ b/examples/gymnax/cartpole_hyperneat.py
@@ -0,0 +1,74 @@
+import jax
+
+from pipeline import Pipeline
+from algorithm.neat import *
+from algorithm.hyperneat import *
+from tensorneat.common import Act
+
+from problem.rl_env import GymNaxEnv
+
+if __name__ == "__main__":
+    pipeline = Pipeline(
+        algorithm=HyperNEAT(
+            substrate=FullSubstrate(
+                input_coors=[
+                    (-1, -1),
+                    (-0.5, -1),
+                    (0, -1),
+                    (0.5, -1),
+                    (1, -1),
+                ],  # 4(problem inputs) + 1(bias)
+                hidden_coors=[
+                    (-1, -0.5),
+                    (0.333, -0.5),
+                    (-0.333, -0.5),
+                    (1, -0.5),
+                    (-1, 0),
+                    (0.333, 0),
+                    (-0.333, 0),
+                    (1, 0),
+                    (-1, 0.5),
+                    (0.333, 0.5),
+                    (-0.333, 0.5),
+                    (1, 0.5),
+                ],
+                output_coors=[
+                    (-1, 1),
+                    (1, 1),  # two outputs, one per action in {0, 1}
+                ],
+            ),
+            neat=NEAT(
+                species=DefaultSpecies(
+                    genome=DefaultGenome(
+                        num_inputs=4,  # [*coor1, *coor2]
+                        num_outputs=1,  # the weight of the connection between coor1 and coor2
+                        max_nodes=50,
+                        max_conns=100,
+                        node_gene=DefaultNodeGene(
+                            activation_default=Act.tanh,
+                            activation_options=(Act.tanh,),
+                        ),
+                        output_transform=Act.tanh,  # the activation function for output node in NEAT
+                    ),
+                    pop_size=10000,
+                    species_size=10,
+                    compatibility_threshold=3.5,
+                    survival_threshold=0.03,
+                ),
+            ),
+            activation=Act.tanh,  # the activation function for output node in HyperNEAT
+            activate_time=10,
+            output_transform=jax.numpy.argmax,  # action of cartpole is in {0, 1}
+        ),
+        problem=GymNaxEnv(
+            env_name="CartPole-v1",
+        ),
+        generation_limit=300,
+        fitness_target=500,
+    )
+
+    # initialize state
+    state = pipeline.setup()
+    # print(state)
+    # run until termination
+    state, best = pipeline.auto_run(state)
--- a/examples/gymnax/mountain_car.py
+++ b/examples/gymnax/mountain_car.py
@@ -0,0 +1,36 @@
+import jax.numpy as jnp
+
+from pipeline import Pipeline
+from algorithm.neat import *
+
+from problem.rl_env import GymNaxEnv
+
+if __name__ == "__main__":
+    pipeline = Pipeline(
+        algorithm=NEAT(
+            species=DefaultSpecies(
+                genome=DefaultGenome(
+                    num_inputs=2,
+                    num_outputs=3,
+                    max_nodes=50,
+                    max_conns=100,
+                    output_transform=lambda out: jnp.argmax(
+                        out
+                    ),  # the action of mountain car is {0, 1, 2}
+                ),
+                pop_size=10000,
+                species_size=10,
+            ),
+        ),
+        problem=GymNaxEnv(
+            env_name="MountainCar-v0",
+        ),
+        generation_limit=10000,
+        fitness_target=-86,
+    )
+
+    # initialize state
+    state = pipeline.setup()
+    # print(state)
+    # run until termination
+    state, best = pipeline.auto_run(state)
--- a/examples/gymnax/mountain_car_continuous.py
+++ b/examples/gymnax/mountain_car_continuous.py
@@ -0,0 +1,37 @@
+from pipeline import Pipeline
+from algorithm.neat import *
+
+from problem.rl_env import GymNaxEnv
+from tensorneat.common import Act
+
+if __name__ == "__main__":
+    pipeline = Pipeline(
+        algorithm=NEAT(
+            species=DefaultSpecies(
+                genome=DefaultGenome(
+                    num_inputs=2,
+                    num_outputs=1,
+                    max_nodes=50,
+                    max_conns=100,
+                    node_gene=DefaultNodeGene(
+                        activation_options=(Act.tanh,),
+                        activation_default=Act.tanh,
+                    ),
+                    output_transform=Act.tanh
+                ),
+                pop_size=10000,
+                species_size=10,
+            ),
+        ),
+        problem=GymNaxEnv(
+            env_name="MountainCarContinuous-v0",
+        ),
+        generation_limit=10000,
+        fitness_target=99,
+    )
+
+    # initialize state
+    state = pipeline.setup()
+    # print(state)
+    # run until termination
+    state, best = pipeline.auto_run(state)
--- a/examples/gymnax/pendulum.py
+++ b/examples/gymnax/pendulum.py
@@ -0,0 +1,38 @@
+from pipeline import Pipeline
+from algorithm.neat import *
+
+from problem.rl_env import GymNaxEnv
+from tensorneat.common import Act
+
+if __name__ == "__main__":
+    pipeline = Pipeline(
+        algorithm=NEAT(
+            species=DefaultSpecies(
+                genome=DefaultGenome(
+                    num_inputs=3,
+                    num_outputs=1,
+                    max_nodes=50,
+                    max_conns=100,
+                    node_gene=DefaultNodeGene(
+                        activation_options=(Act.tanh,),
+                        activation_default=Act.tanh,
+                    ),
+                    output_transform=lambda out: Act.tanh(out)
+                    * 2,  # the action of pendulum is [-2, 2]
+                ),
+                pop_size=10000,
+                species_size=10,
+            ),
+        ),
+        problem=GymNaxEnv(
+            env_name="Pendulum-v1",
+        ),
+        generation_limit=10000,
+        fitness_target=-10,
+    )
+
+    # initialize state
+    state = pipeline.setup()
+    # print(state)
+    # run until termination
+    state, best = pipeline.auto_run(state)
--- a/examples/gymnax/reacher.py
+++ b/examples/gymnax/reacher.py
@@ -0,0 +1,33 @@
+import jax.numpy as jnp
+
+from pipeline import Pipeline
+from algorithm.neat import *
+
+from problem.rl_env import GymNaxEnv
+
+if __name__ == "__main__":
+    pipeline = Pipeline(
+        algorithm=NEAT(
+            species=DefaultSpecies(
+                genome=DefaultGenome(
+                    num_inputs=8,
+                    num_outputs=2,
+                    max_nodes=50,
+                    max_conns=100,
+                ),
+                pop_size=10000,
+                species_size=10,
+            ),
+        ),
+        problem=GymNaxEnv(
+            env_name="Reacher-misc",
+        ),
+        generation_limit=10000,
+        fitness_target=90,
+    )
+
+    # initialize state
+    state = pipeline.setup()
+    # print(state)
+    # run until termination
+    state, best = pipeline.auto_run(state)