add evox support
This commit is contained in:
@@ -1,21 +0,0 @@
|
|||||||
import jax, jax.numpy as jnp
|
|
||||||
|
|
||||||
from tensorneat.algorithm import NEAT
|
|
||||||
from tensorneat.genome import DefaultGenome, RecurrentGenome
|
|
||||||
|
|
||||||
# Walk through the basic TensorNEAT genome API: construct a genome,
# initialize it, run one forward pass, then dump and visualize it.
rng_key = jax.random.key(0)

genome = DefaultGenome(
    num_inputs=5,
    num_outputs=3,
    max_nodes=100,
    max_conns=500,
    init_hidden_layers=(1, 2, 3),
)

state = genome.setup()
nodes, conns = genome.initialize(state, rng_key)
print(genome.repr(state, nodes, conns))

# One forward pass on a dummy 5-element input vector.
sample_inputs = jnp.array([1, 2, 3, 4, 5])
transformed = genome.transform(state, nodes, conns)
outputs = genome.forward(state, transformed, sample_inputs)

print(outputs)

# Export the genome as a plain dict and render it.
network = genome.network_dict(state, nodes, conns)
print(network)

genome.visualize(network)
@@ -1,39 +0,0 @@
|
|||||||
import jax, jax.numpy as jnp
|
|
||||||
|
|
||||||
from tensorneat.pipeline import Pipeline
|
|
||||||
from tensorneat.algorithm.neat import NEAT
|
|
||||||
from tensorneat.genome import DefaultGenome, DefaultNode, DefaultMutation, BiasNode
|
|
||||||
from tensorneat.problem.func_fit import CustomFuncFit
|
|
||||||
from tensorneat.common import Act, Agg
|
|
||||||
|
|
||||||
|
|
||||||
def pagie_polynomial(inputs):
    """Pagie-1 polynomial, a standard symbolic-regression benchmark target.

        f(x, y) = 1 / (1 + x^-4) + 1 / (1 + y^-4)

    The previous body returned ``x + y``, which is not the Pagie polynomial
    the function (and this fitting example) is named after.

    Args:
        inputs: a 2-element sequence/array ``(x, y)``; works with Python
            floats and with jax arrays alike.

    Returns:
        The polynomial value.  Note x == 0 or y == 0 is outside the usual
        benchmark sampling grid and would divide by zero.
    """
    x, y = inputs
    return 1 / (1 + x ** -4) + 1 / (1 + y ** -4)
|
|
||||||
|
|
||||||
if __name__ == "__main__":
    # Minimal genome: 2 inputs -> 1 output, no hidden layers, and every
    # mutation rate zeroed so the topology stays fixed.
    genome = DefaultGenome(
        num_inputs=2,
        num_outputs=1,
        max_nodes=3,
        max_conns=2,
        init_hidden_layers=(),
        node_gene=BiasNode(
            activation_options=[Act.identity],
            aggregation_options=[Agg.sum],
        ),
        output_transform=Act.identity,
        mutation=DefaultMutation(
            node_add=0,
            node_delete=0,
            conn_add=0.0,
            conn_delete=0.0,
        ),
    )

    randkey = jax.random.PRNGKey(42)
    state = genome.setup()
    nodes, conns = genome.initialize(state, randkey)
    print(genome)
34
examples/with_evox/evox_algorithm_adaptor.py
Normal file
34
examples/with_evox/evox_algorithm_adaptor.py
Normal file
@@ -0,0 +1,34 @@
|
|||||||
|
import jax.numpy as jnp
|
||||||
|
|
||||||
|
from evox import Algorithm as EvoXAlgorithm, State as EvoXState, jit_class
|
||||||
|
|
||||||
|
from tensorneat.algorithm import BaseAlgorithm as TensorNEATAlgorithm
|
||||||
|
from tensorneat.common import State as TensorNEATState
|
||||||
|
|
||||||
|
|
||||||
|
@jit_class
class EvoXAlgorithmAdaptor(EvoXAlgorithm):
    """Adapts a TensorNEAT algorithm to EvoX's Algorithm interface.

    Translates between the two state models: the TensorNEAT state is kept
    under the ``alg_state`` field of the EvoX state, and the standard
    ask/tell loop is forwarded to the wrapped algorithm.
    """

    def __init__(self, algorithm: TensorNEATAlgorithm):
        self.algorithm = algorithm
        # Snapshot of the NEAT state taken in setup(); used by transform()
        # and forward(), which EvoX calls without passing a state.
        # NOTE(review): this snapshot is never refreshed after tell(), so
        # transform/forward always see the initial state — presumably the
        # parts they read are static; confirm against TensorNEAT internals.
        self.fixed_state = None

    def setup(self, key):
        # Build and initialize the TensorNEAT state from the PRNG key,
        # then wrap it in an EvoX state.
        neat_algorithm_state = TensorNEATState(randkey=key)
        neat_algorithm_state = self.algorithm.setup(neat_algorithm_state)
        self.fixed_state = neat_algorithm_state
        return EvoXState(alg_state=neat_algorithm_state)

    def ask(self, state: EvoXState):
        # Population of candidate genomes for this generation; the state
        # is returned unchanged (EvoX convention).
        population = self.algorithm.ask(state.alg_state)
        return population, state

    def tell(self, state: EvoXState, fitness):
        # Replace NaN fitnesses with -inf so broken rollouts can never
        # be selected as parents.
        fitness = jnp.where(jnp.isnan(fitness), -jnp.inf, fitness)
        neat_algorithm_state = self.algorithm.tell(state.alg_state, fitness)
        return state.replace(alg_state=neat_algorithm_state)

    def transform(self, individual):
        # Genome -> network representation consumable by forward().
        return self.algorithm.transform(self.fixed_state, individual)

    def forward(self, transformed, inputs):
        # Evaluate the transformed network on one input batch.
        return self.algorithm.forward(self.fixed_state, transformed, inputs)
65
examples/with_evox/example.py
Normal file
65
examples/with_evox/example.py
Normal file
@@ -0,0 +1,65 @@
|
|||||||
|
import jax
|
||||||
|
import jax.numpy as jnp
|
||||||
|
|
||||||
|
from evox import workflows, algorithms, problems
|
||||||
|
|
||||||
|
from tensorneat.examples.with_evox.evox_algorithm_adaptor import EvoXAlgorithmAdaptor
|
||||||
|
from tensorneat.examples.with_evox.tensorneat_monitor import TensorNEATMonitor
|
||||||
|
from tensorneat.algorithm import NEAT
|
||||||
|
from tensorneat.algorithm.neat import DefaultSpecies, DefaultGenome, DefaultNodeGene
|
||||||
|
from tensorneat.common import Act
|
||||||
|
|
||||||
|
# Train a NEAT controller for the Brax walker2d task through an EvoX
# workflow, using the adaptor and monitor defined alongside this example.
neat_algorithm = NEAT(
    species=DefaultSpecies(
        genome=DefaultGenome(
            num_inputs=17,
            num_outputs=6,
            max_nodes=200,
            max_conns=500,
            node_gene=DefaultNodeGene(
                activation_options=(Act.standard_tanh,),
                activation_default=Act.standard_tanh,
            ),
            output_transform=Act.tanh,
        ),
        pop_size=10000,
        species_size=10,
    ),
)
evox_algorithm = EvoXAlgorithmAdaptor(neat_algorithm)

key = jax.random.PRNGKey(42)
# NOTE(review): model_key is split off but never used below.
model_key, workflow_key = jax.random.split(key)

monitor = TensorNEATMonitor(neat_algorithm, is_save=False)
# Brax rollout problem; presumably 17 observations / 6 actions matches
# walker2d's spaces — confirm against the Brax env spec.
problem = problems.neuroevolution.Brax(
    env_name="walker2d",
    policy=evox_algorithm.forward,
    max_episode_length=1000,
    num_episodes=1,
    backend="mjx"
)

def nan2inf(x):
    # Map NaN fitness to -inf so failed rollouts rank last.
    return jnp.where(jnp.isnan(x), -jnp.inf, x)

# create a workflow
workflow = workflows.StdWorkflow(
    algorithm=evox_algorithm,
    problem=problem,
    # vmap the genome->network transform across the whole population.
    candidate_transforms=[jax.jit(jax.vmap(evox_algorithm.transform))],
    fitness_transforms=[nan2inf],
    monitors=[monitor],
    opt_direction="max",
)

# init the workflow
state = workflow.init(workflow_key)
# state = workflow.enable_multi_devices(state)
# run the workflow for 100 steps
import time

for i in range(100):
    # NOTE(review): tic is recorded but never read; per-generation timing
    # is reported by the monitor instead.
    tic = time.time()
    train_info, state = workflow.step(state)
    monitor.show()
@@ -1,6 +0,0 @@
|
|||||||
import ray

# Bring up Ray requesting two GPUs, then report what the cluster exposes.
ray.init(num_gpus=2)

resources = ray.available_resources()
print("Available resources:", resources)
||||||
133
examples/with_evox/tensorneat_monitor.py
Normal file
133
examples/with_evox/tensorneat_monitor.py
Normal file
@@ -0,0 +1,133 @@
|
|||||||
|
import warnings
|
||||||
|
import os
|
||||||
|
import time
|
||||||
|
import numpy as np
|
||||||
|
|
||||||
|
import jax
|
||||||
|
from jax.experimental import io_callback
|
||||||
|
from evox import Monitor
|
||||||
|
from evox import State as EvoXState
|
||||||
|
|
||||||
|
from tensorneat.algorithm import BaseAlgorithm as TensorNEATAlgorithm
|
||||||
|
from tensorneat.common import State as TensorNEATState
|
||||||
|
|
||||||
|
|
||||||
|
class TensorNEATMonitor(Monitor):
    """EvoX monitor that tracks and reports TensorNEAT population statistics.

    Hooks the workflow's ``pre_tell`` stage to capture the current NEAT
    algorithm state and the (transformed) fitness values, and exposes
    ``show()`` to print per-generation statistics and optionally save the
    best genome of each generation to disk.
    """

    def __init__(
        self,
        neat_algorithm: TensorNEATAlgorithm,
        save_dir: str = None,
        is_save: bool = False,
    ):
        super().__init__()
        self.neat_algorithm = neat_algorithm

        self.generation_timestamp = time.time()
        # Host-side copies filled in by store_info() each generation.
        self.alg_state: TensorNEATState = None
        self.fitness = None
        self.best_fitness = -np.inf
        self.best_genome = None

        self.is_save = is_save

        if is_save:
            if save_dir is None:
                # BUG FIX: `datetime` was referenced without ever being
                # imported, raising NameError whenever is_save=True and
                # no save_dir was supplied.  Imported locally so the fix
                # is self-contained.
                import datetime

                now = datetime.datetime.now().strftime("%Y%m%d%H%M%S")
                self.save_dir = f"./{self.__class__.__name__} {now}"
            else:
                self.save_dir = save_dir
            print(f"save to {self.save_dir}")
            if not os.path.exists(self.save_dir):
                os.makedirs(self.save_dir)
            self.genome_dir = os.path.join(self.save_dir, "genomes")
            if not os.path.exists(self.genome_dir):
                os.makedirs(self.genome_dir)

    def hooks(self):
        # Only pre_tell is needed: it observes the transformed fitness.
        return ["pre_tell"]

    def pre_tell(self, state: EvoXState, cand_sol, transformed_cand_sol, fitness, transformed_fitness):
        # io_callback lets us stash traced values on the Python side
        # from inside jitted workflow steps.
        io_callback(
            self.store_info,
            None,
            state,
            transformed_fitness,
        )

    def store_info(self, state: EvoXState, fitness):
        # Runs on the host (via io_callback); keep host-side copies for show().
        self.alg_state: TensorNEATState = state.query_state("algorithm").alg_state
        self.fitness = jax.device_get(fitness)

    def show(self):
        """Print statistics for the latest generation; save the best genome when enabled."""
        pop = self.neat_algorithm.ask(self.alg_state)
        # Drop -inf entries (NaN fitnesses were mapped to -inf upstream).
        valid_fitnesses = self.fitness[~np.isinf(self.fitness)]

        max_f, min_f, mean_f, std_f = (
            max(valid_fitnesses),
            min(valid_fitnesses),
            np.mean(valid_fitnesses),
            np.std(valid_fitnesses),
        )

        # Wall-clock time for the generation just finished.
        new_timestamp = time.time()
        cost_time = new_timestamp - self.generation_timestamp
        self.generation_timestamp = new_timestamp

        max_idx = np.argmax(self.fitness)
        if self.fitness[max_idx] > self.best_fitness:
            self.best_fitness = self.fitness[max_idx]
            self.best_genome = pop[0][max_idx], pop[1][max_idx]

        if self.is_save:
            # Save this generation's best (nodes, conns) pair as an .npz.
            best_genome = jax.device_get((pop[0][max_idx], pop[1][max_idx]))
            with open(
                os.path.join(
                    self.genome_dir,
                    f"{int(self.neat_algorithm.generation(self.alg_state))}.npz",
                ),
                "wb",
            ) as f:
                np.savez(
                    f,
                    nodes=best_genome[0],
                    conns=best_genome[1],
                    fitness=self.best_fitness,
                )

        # Sizes of non-empty species.
        member_count = jax.device_get(self.neat_algorithm.member_count(self.alg_state))
        species_sizes = [int(i) for i in member_count if i > 0]

        pop = jax.device_get(pop)
        pop_nodes, pop_conns = pop  # (P, N, NL), (P, C, CL)
        # NaN in column 0 marks an unused slot; count the occupied ones.
        nodes_cnt = (~np.isnan(pop_nodes[:, :, 0])).sum(axis=1)  # (P,)
        conns_cnt = (~np.isnan(pop_conns[:, :, 0])).sum(axis=1)  # (P,)

        max_node_cnt, min_node_cnt, mean_node_cnt = (
            max(nodes_cnt),
            min(nodes_cnt),
            np.mean(nodes_cnt),
        )

        max_conn_cnt, min_conn_cnt, mean_conn_cnt = (
            max(conns_cnt),
            min(conns_cnt),
            np.mean(conns_cnt),
        )

        print(
            f"Generation: {self.neat_algorithm.generation(self.alg_state)}, Cost time: {cost_time * 1000:.2f}ms\n",
            f"\tnode counts: max: {max_node_cnt}, min: {min_node_cnt}, mean: {mean_node_cnt:.2f}\n",
            f"\tconn counts: max: {max_conn_cnt}, min: {min_conn_cnt}, mean: {mean_conn_cnt:.2f}\n",
            f"\tspecies: {len(species_sizes)}, {species_sizes}\n",
            f"\tfitness: valid cnt: {len(valid_fitnesses)}, max: {max_f:.4f}, min: {min_f:.4f}, mean: {mean_f:.4f}, std: {std_f:.4f}\n",
        )

        # append log
        if self.is_save:
            with open(os.path.join(self.save_dir, "log.txt"), "a") as f:
                f.write(
                    f"{self.neat_algorithm.generation(self.alg_state)},{max_f},{min_f},{mean_f},{std_f},{cost_time}\n"
                )
|
||||||
Reference in New Issue
Block a user