Add RankNet NEAT test scripts, a masking-comparison demo, and an exploratory notebook
This commit is contained in:
140
test/ranknet.py
Normal file
140
test/ranknet.py
Normal file
@@ -0,0 +1,140 @@
|
||||
# import RankNet
|
||||
from tensorneat import algorithm, genome, common
|
||||
from tensorneat.pipeline import Pipeline
|
||||
from tensorneat.genome import BiasNode
|
||||
from tensorneat.genome.operations import mutation
|
||||
from tensorneat.common import ACT, AGG
|
||||
import jax, jax.numpy as jnp
|
||||
from tensorneat.problem import BaseProblem
|
||||
|
||||
# Number of samples in the synthetic dataset below.
data_num = 100
input_size = 768  # Each network (genome) should have input size 768


# The problem is to optimize a RankNet utilizing NEAT
||||
def binary_cross_entropy(prediction, target):
    """Element-wise binary cross-entropy loss.

    Args:
        prediction: predicted probabilities, expected in [0, 1].
        target: ground-truth labels (0/1 or boolean).

    Returns:
        Element-wise BCE with the broadcast shape of the inputs.
    """
    # Clamp away from exactly 0 and 1 so jnp.log never yields -inf
    # (0 * -inf would otherwise turn the loss into NaN).
    eps = 1e-7
    p = jnp.clip(prediction, eps, 1.0 - eps)
    return -(target * jnp.log(p) + (1 - target) * jnp.log(1 - p))
|
||||
|
||||
|
||||
# Create dataset (100 samples of vectors with 768 features).
# Use two independent PRNG keys: reusing the same key for both draws
# makes them come from the same random stream (a JAX anti-pattern).
input_key, label_key = jax.random.split(jax.random.PRNGKey(0))
INPUTS = jax.random.uniform(input_key, (data_num, input_size))  # the input data x
LABELS = jax.random.uniform(label_key, (data_num, 1))  # the annotated labels y

# Pairwise ordering targets: True (1) means label_i >= label_j.
# The comparison already yields a boolean array; no jnp.where needed.
pairwise_labels = (LABELS - LABELS.T) >= 0

print(f"{INPUTS.shape=}, {LABELS.shape=}")
|
||||
|
||||
|
||||
# Define the custom Problem
class CustomProblem(BaseProblem):
    """NEAT problem that optimizes a RankNet-style pairwise ranker.

    Fitness is the negative mean binary cross-entropy over all pairwise
    orderings of the module-level dataset (INPUTS / pairwise_labels).

    NOTE(review): the original body carried a dead ``else`` branch guarded
    by a constant flag that referenced the undefined name ``RankNet``
    (its import is commented out) — it would raise NameError if ever
    taken, so it has been removed.
    """

    jitable = True  # necessary

    def evaluate(self, state, randkey, act_func, params):
        """Return the fitness (negative pairwise BCE) of one genome.

        ``act_func(state, params, single_input)`` performs one network
        forward pass; jax.vmap batches it over all dataset rows.
        """
        # Batched forward for all inputs -> shape (data_num, 1).
        predict = jax.vmap(act_func, in_axes=(None, None, 0))(
            state, params, INPUTS
        )

        # Pairwise score differences, squashed to order probabilities.
        pairwise_predictions = predict - predict.T  # shape (100, 100)
        p = jax.nn.sigmoid(pairwise_predictions)  # shape (100, 100)

        # Mean BCE against the pairwise ordering targets.
        loss = binary_cross_entropy(p, pairwise_labels)  # shape (100, 100)
        loss = jnp.mean(loss)

        # TensorNEAT maximizes fitness, equivalent to minimizing loss.
        return -loss

    @property
    def input_shape(self):
        # the input shape that the act_func expects
        return (input_size,)

    @property
    def output_shape(self):
        # the output shape that the act_func returns
        return (1,)

    def show(self, state, randkey, act_func, params, *args, **kwargs):
        """Print every sample's target vs. prediction for one individual."""
        predict = jax.vmap(act_func, in_axes=(None, None, 0))(state, params, INPUTS)

        # NOTE(review): this reports MSE against the raw labels, not the
        # pairwise BCE used as fitness — presumably just for inspection.
        loss = jnp.mean(jnp.square(predict - LABELS))

        msg = ""
        for i in range(INPUTS.shape[0]):
            msg += f"input: {INPUTS[i]}, target: {LABELS[i]}, predict: {predict[i]}\n"
        msg += f"loss: {loss}\n"
        print(msg)
|
||||
|
||||
|
||||
algorithm1 = algorithm.NEAT(
    # setting values to be the same as default in python NEAT package to get same as paper authors
    # tried as best I could to follow this https://neat-python.readthedocs.io/en/latest/config_file.html
    pop_size=100,
    survival_threshold=0.2,
    min_species_size=2,
    species_number_calculate_by="fitness",  # either this or rank, but 'fitness' should be more in line with original paper on NEAT
    # species_size=10, #nothing specified for species_size, it remains default
    # modifying the values the authors explicitly mention
    compatibility_threshold=3.0,  # maybe need to consider this one in the future if weird results, default is 2.0
    species_elitism=2,  # is 2 per default
    genome=genome.DefaultGenome(
        num_inputs=768,
        num_outputs=1,
        max_nodes=769,  # must at least be same as inputs and outputs
        max_conns=768,  # must be 768 connections for the network to be fully connected
        # 0 hidden layers per default
        output_transform=common.ACT.sigmoid,
        mutation=mutation.DefaultMutation(
            # no allowing adding or deleting nodes
            node_add=0.0,
            node_delete=0.0,
            # set mutation rates for edges to 0.5
            conn_add=0.5,
            conn_delete=0.5,
        ),
        node_gene=BiasNode(),
    ),
)

problem = CustomProblem()

pipeline = Pipeline(
    algorithm1,
    problem,
    generation_limit=150,
    # NOTE(review): fitness is -BCE and therefore <= 0, so a target of 1
    # looks unreachable — the run presumably always hits the generation
    # limit; confirm this is intended.
    fitness_target=1,
    seed=42,
)
state = pipeline.setup()
# run until termination
state, best = pipeline.auto_run(state)
# show results
# pipeline.show(state, best)

# Extract the best individual's network structure for inspection.
network = algorithm1.genome.network_dict(state, *best)
|
||||
125
test/ranknet_neat.py
Normal file
125
test/ranknet_neat.py
Normal file
@@ -0,0 +1,125 @@
|
||||
###this code will throw a ValueError
|
||||
from tensorneat import algorithm, genome, common
|
||||
from tensorneat.pipeline import Pipeline
|
||||
from tensorneat.genome.gene.node import DefaultNode
|
||||
from tensorneat.genome.gene.conn import DefaultConn
|
||||
from tensorneat.genome.operations import mutation
|
||||
import jax, jax.numpy as jnp
|
||||
from tensorneat.problem import BaseProblem
|
||||
|
||||
def binary_cross_entropy(prediction, target):
    """Element-wise binary cross-entropy loss.

    Args:
        prediction: predicted probabilities, expected in [0, 1].
        target: ground-truth labels (0/1 or boolean).

    Returns:
        Element-wise BCE with the broadcast shape of the inputs.
    """
    # Clamp away from exactly 0 and 1 so jnp.log never yields -inf.
    # NaN inputs (the masked pairs) stay NaN through clip/log, so the
    # NaN-masking scheme used by the caller is unaffected.
    eps = 1e-7
    p = jnp.clip(prediction, eps, 1.0 - eps)
    return -(target * jnp.log(p) + (1 - target) * jnp.log(1 - p))
|
||||
|
||||
# Define the custom Problem
class CustomProblem(BaseProblem):
    """Pairwise-ranking problem for TensorNEAT.

    Only pairs whose label difference exceeds ``threshold`` contribute
    to the loss; every other pair is masked with NaN and skipped when
    the loss is reduced.
    """

    jitable = True  # necessary

    def __init__(self, inputs, labels, threshold):
        self.inputs = jnp.array(inputs)  # nb! already has shape (n, 768)
        self.labels = jnp.array(labels).reshape((-1, 1))  # nb! (n,) -> (n, 1)
        self.threshold = threshold

        # Everything derivable from the labels is precomputed at init.
        label_diffs = self.labels - self.labels.T
        self.pairs_to_keep = jnp.abs(label_diffs) > self.threshold
        # NaN (instead of -inf) marks discarded pairs: any arithmetic
        # involving NaN stays NaN, which makes filtering trivial later.
        masked_diffs = jnp.where(self.pairs_to_keep, label_diffs, jnp.nan)
        self.pairwise_labels = jnp.where(masked_diffs > 0, True, False)

    def evaluate(self, state, randkey, act_func, params):
        """Fitness of one genome: negative masked pairwise BCE."""
        # Batched forward pass for every input (jax.vmap) -> (n, 1).
        outputs = jax.vmap(act_func, in_axes=(None, None, 0))(
            state, params, self.inputs
        )

        # Pairwise score differences, masked identically to the labels.
        score_diffs = outputs - outputs.T  # shape (n, n)
        score_diffs = jnp.where(self.pairs_to_keep, score_diffs, jnp.nan)
        probs = jax.nn.sigmoid(score_diffs)

        # Per-pair loss; NaN entries are the discarded pairs.
        pair_loss = binary_cross_entropy(probs, self.pairwise_labels)
        # jax.debug.print("loss={}", pair_loss)
        # Reduce to a scalar, ignoring the NaN-masked pairs.
        mean_loss = jnp.mean(pair_loss, where=~jnp.isnan(pair_loss))
        # TensorNEAT maximizes fitness, equivalent to minimizing loss.
        return -mean_loss

    @property
    def input_shape(self):
        # the input shape that the act_func expects
        return (self.inputs.shape[1],)

    @property
    def output_shape(self):
        # the output shape that the act_func returns
        return (1,)

    def show(self, state, randkey, act_func, params, *args, **kwargs):
        """Print a small sample of predictions for one individual."""
        outputs = jax.vmap(act_func, in_axes=(None, None, 0))(
            state, params, self.inputs
        )

        mse = jnp.mean(jnp.square(outputs - self.labels))

        n_elements = min(5, len(self.inputs))

        msg = f"Looking at {n_elements} first elements of input\n"
        for i in range(n_elements):
            msg += f"for input i: {i}, target: {self.labels[i]}, predict: {outputs[i]}\n"
        msg += f"total loss: {mse}\n"
        print(msg)
|
||||
|
||||
# NOTE(review): the original bound this object to the name ``algorithm``,
# shadowing the imported ``tensorneat.algorithm`` module; renamed so the
# module remains usable after this statement.
neat_algorithm = algorithm.NEAT(
    pop_size=10,
    survival_threshold=0.2,
    min_species_size=2,
    compatibility_threshold=3.0,
    species_elitism=2,
    genome=genome.DefaultGenome(
        num_inputs=768,
        num_outputs=1,
        max_nodes=769,  # must at least be same as inputs and outputs
        max_conns=768,  # must be 768 connections for the network to be fully connected
        output_transform=common.ACT.sigmoid,
        mutation=mutation.DefaultMutation(
            # no allowing adding or deleting nodes
            node_add=0.0,
            node_delete=0.0,
            # set mutation rates for edges to 0.5
            conn_add=0.5,
            conn_delete=0.5,
        ),
        node_gene=DefaultNode(),
        conn_gene=DefaultConn(),
    ),
)


# Synthetic data: independent keys so inputs and labels are not drawn
# from the same PRNG stream.
input_key, label_key = jax.random.split(jax.random.PRNGKey(0))
INPUTS = jax.random.uniform(input_key, (100, 768))  # the input data x
LABELS = jax.random.uniform(label_key, (100,))  # the annotated labels y

problem = CustomProblem(INPUTS, LABELS, 0.25)

print("Setting up pipeline and running it")
print("-----------------------------------------------------------------------")
pipeline = Pipeline(
    neat_algorithm,
    problem,
    generation_limit=1,
    fitness_target=1,
    seed=42,
)

state = pipeline.setup()
# run until termination
state, best = pipeline.auto_run(state)
# show results
pipeline.show(state, best)
|
||||
118
test/test.ipynb
Normal file
118
test/test.ipynb
Normal file
@@ -0,0 +1,118 @@
|
||||
{
|
||||
"cells": [
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 2,
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"import jax, jax.numpy as jnp"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 4,
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"LABELS = jax.random.uniform(jax.random.PRNGKey(0), (5, 1)) # the annotated labels y"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 5,
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"pairwise_labels = LABELS - LABELS.T"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 7,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"(Array([[0.57450044],\n",
|
||||
" [0.09968603],\n",
|
||||
" [0.39316022],\n",
|
||||
" [0.8941783 ],\n",
|
||||
" [0.59656656]], dtype=float32),\n",
|
||||
" Array([[ 0. , 0.47481441, 0.18134022, -0.31967783, -0.02206612],\n",
|
||||
" [-0.47481441, 0. , -0.2934742 , -0.79449224, -0.49688053],\n",
|
||||
" [-0.18134022, 0.2934742 , 0. , -0.50101805, -0.20340633],\n",
|
||||
" [ 0.31967783, 0.79449224, 0.50101805, 0. , 0.2976117 ],\n",
|
||||
" [ 0.02206612, 0.49688053, 0.20340633, -0.2976117 , 0. ]], dtype=float32))"
|
||||
]
|
||||
},
|
||||
"execution_count": 7,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"LABELS, pairwise_labels"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 10,
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"def binary_cross_entropy(prediction, target):\n",
|
||||
" return -(target * jnp.log(prediction) + (1 - target) * jnp.log(1 - prediction))"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 11,
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"Array(0.6931472, dtype=float32, weak_type=True)"
|
||||
]
|
||||
},
|
||||
"execution_count": 11,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"binary_cross_entropy(0.5, 1)\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": []
|
||||
}
|
||||
],
|
||||
"metadata": {
|
||||
"kernelspec": {
|
||||
"display_name": "jax_env",
|
||||
"language": "python",
|
||||
"name": "python3"
|
||||
},
|
||||
"language_info": {
|
||||
"codemirror_mode": {
|
||||
"name": "ipython",
|
||||
"version": 3
|
||||
},
|
||||
"file_extension": ".py",
|
||||
"mimetype": "text/x-python",
|
||||
"name": "python",
|
||||
"nbconvert_exporter": "python",
|
||||
"pygments_lexer": "ipython3",
|
||||
"version": "3.10.14"
|
||||
}
|
||||
},
|
||||
"nbformat": 4,
|
||||
"nbformat_minor": 2
|
||||
}
|
||||
34
test/test.py
Normal file
34
test/test.py
Normal file
@@ -0,0 +1,34 @@
|
||||
### shows the difference in loss between using jnp.where() and boolean indexing

import jax
import jax.numpy as jnp


def binary_cross_entropy(prediction, target):
    """Element-wise binary cross-entropy."""
    return -(target * jnp.log(prediction) + (1 - target) * jnp.log(1 - prediction))


# Use two independent PRNG keys. With the original single reused key the
# two (100,)-shaped draws were byte-identical, making preds == LABELS and
# the comparison below degenerate.
pred_key, label_key = jax.random.split(jax.random.PRNGKey(0))
preds = jax.random.uniform(pred_key, (100,)).reshape((-1, 1))  # predictions
LABELS = jax.random.uniform(label_key, (100,)).reshape((-1, 1))  # the annotated labels y

pair_lab = LABELS - LABELS.T
pair_pred = preds - preds.T

# Keep only pairs whose label difference is large enough.
ptk = jnp.abs(pair_lab) > 0.25

# Approach 1: mask discarded pairs with NaN via jnp.where
# (the original used -jnp.nan, which is the very same NaN value).
pair_labw = jnp.where(ptk, pair_lab, jnp.nan)
# Approach 2: boolean indexing, which flattens to the kept pairs only.
pair_labm = pair_lab[ptk]

pair_labw = jnp.where(pair_labw > 0, True, False)
pair_labm = jnp.where(pair_labm > 0, True, False)

pair_predw = jnp.where(ptk, pair_pred, jnp.nan)
pair_predm = pair_pred[ptk]

pair_predw = jax.nn.sigmoid(pair_predw)
pair_predm = jax.nn.sigmoid(pair_predm)

lossw = binary_cross_entropy(pair_predw, pair_labw)
lossm = binary_cross_entropy(pair_predm, pair_labm)

# The NaN-aware mean over the where-masked matrix should equal the plain
# mean over the boolean-indexed vector.
print("loss using jnp.where()", jnp.mean(lossw, where=~jnp.isnan(lossw)))
print("loss using boolean indexing", jnp.mean(lossm, where=~jnp.isnan(lossm)))
|
||||
Reference in New Issue
Block a user