Example template for contributing new tasks
In [ ]:
"""Example template for contributing new tasks.""" # noqa: INP001
"""Example template for contributing new tasks.""" # noqa: INP001
In [ ]:
import numpy as np
In [ ]:
import neurogym as ngym
from neurogym import spaces
from neurogym.utils.logging import logger
In [ ]:
class YourTask(ngym.TrialEnv):
    def __init__(self, dt=100, rewards=None, timing=None, sigma=1) -> None:
        super().__init__(dt=dt)
        # Possible decisions at the end of the trial
        self.choices = [1, 2]  # e.g. [left, right]
        self.sigma = sigma / np.sqrt(self.dt)  # Input noise

        # Optional rewards dictionary
        self.rewards = {"abort": -0.1, "correct": +1.0, "fail": 0.0}
        if rewards:
            self.rewards.update(rewards)

        # Optional timing dictionary
        # If provided, self.add_period can infer timing directly
        self.timing = {"fixation": 100, "stimulus": 2000, "delay": 0, "decision": 100}
        if timing:
            self.timing.update(timing)

        # Similar to gymnasium envs, define observation_space and action_space
        # Optional annotation of the observation space
        name = {"fixation": 0, "stimulus": [1, 2]}
        self.observation_space = spaces.Box(
            -np.inf,
            np.inf,
            shape=(3,),
            dtype=np.float32,
            name=name,
        )
        # Optional annotation of the action space
        name = {"fixation": 0, "choice": [1, 2]}
        self.action_space = spaces.Discrete(3, name=name)

    def _new_trial(self, **kwargs):
        """Called internally to generate the next trial.

        Typically, you need to
            set trial: a dictionary of trial information
            run self.add_period():
                will add time periods to the trial,
                accessible through the dicts self.start_t and self.end_t
            run self.add_ob():
                will add observations to the np array self.ob
            run self.set_groundtruth():
                will set the ground truth in the np array self.gt

        Returns:
            trial: dictionary of trial information
        """
        # Setting trial information
        trial = {"ground_truth": self.rng.choice(self.choices)}
        trial.update(kwargs)  # allows wrappers to modify the trial
        ground_truth = trial["ground_truth"]

        # Adding periods sequentially
        self.add_period(["fixation", "stimulus", "delay", "decision"])

        # Setting observations, default all 0
        # Setting fixation cue to 1 before the decision period
        self.add_ob(1, where="fixation")
        self.set_ob(0, "decision", where="fixation")

        # Set the stimulus
        stim = [0, 0, 0]
        stim[ground_truth] = 1
        self.add_ob(stim, "stimulus")
        # Adding Gaussian noise to the stimulus with std = self.sigma
        self.add_randn(0, self.sigma, "stimulus", where="stimulus")

        # Setting the ground-truth value for supervised learning
        self.set_groundtruth(ground_truth, "decision")
        return trial

    def _step(self, action):
        """Called internally to process one step.

        Receives an action and returns:
            a new observation, obs
            the reward associated with the action, reward
            a boolean indicating whether the experiment has terminated, terminated
                (see https://gymnasium.farama.org/tutorials/gymnasium_basics/handling_time_limits/#termination)
            a boolean indicating whether the experiment has been truncated, truncated
                (see https://gymnasium.farama.org/tutorials/gymnasium_basics/handling_time_limits/#truncation)
            a dictionary with extra information:
                the ground-truth correct response, info['gt']
                a boolean indicating the end of the trial, info['new_trial']
        """
        terminated = False
        truncated = False
        # Rewards
        reward = 0
        gt = self.gt_now
        # Example structure
        if not self.in_period("decision"):
            if action != 0:  # fixation break
                reward = self.rewards["abort"]
        elif action != 0:
            terminated = True
            reward = self.rewards["correct"] if action == gt else self.rewards["fail"]
        return (
            self.ob_now,
            reward,
            terminated,
            truncated,
            {"new_trial": terminated, "gt": gt},
        )
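Because _new_trial merges its keyword arguments into the trial dictionary (trial.update(kwargs)), a wrapper, or you, can pin trial parameters instead of sampling them. A minimal sketch, assuming TrialEnv.new_trial forwards its keyword arguments to _new_trial:

In [ ]:

env = YourTask()
# Force the ground truth rather than sampling it from self.choices
trial = env.new_trial(ground_truth=2)
assert trial["ground_truth"] == 2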
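The same task can also be sampled in batches for supervised learning. A minimal sketch using ngym.Dataset, assuming it accepts an environment instance (it also accepts a registered task name):

In [ ]:

# Batch trials for supervised learning; arrays are (seq_len, batch_size, ...)
dataset = ngym.Dataset(YourTask(), batch_size=16, seq_len=100)
inputs, target = dataset()  # observations and ground-truth labels
logger.info(f"Batch input shape: {inputs.shape}, target shape: {target.shape}")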
In [ ]:
if __name__ == "__main__":
    # Instantiate the task
    env = YourTask()
    trial = env.new_trial()
    logger.info(f"Trial info: {trial}")
    logger.info(f"Trial observation shape: {env.ob.shape}")
    logger.info(f"Trial ground-truth shape: {env.gt.shape}")
    env.reset()
    ob, reward, terminated, truncated, info = env.step(env.action_space.sample())
    logger.info(f"Single time step observation shape: {ob.shape}")
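Before contributing a task, it helps to inspect a few trials visually. A minimal sketch, assuming the plot_env helper in neurogym.utils.plotting and its num_trials parameter:

In [ ]:

from neurogym.utils import plotting

# Run a random policy for two trials and plot observations, actions, and rewards
env = YourTask()
fig = plotting.plot_env(env, num_trials=2)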