sequoia/settings/sl/multi_task/setting.py

from dataclasses import dataclass
from typing import ClassVar, Type

from sequoia.settings.sl.task_incremental import TaskIncrementalSLSetting
from sequoia.utils import get_logger

# TODO: Playing around with this 'constant_property' idea as an alternative to the
# init=False of `constant` field.
from sequoia.utils.utils import constant_property

from ..task_incremental.setting import TaskIncrementalSLSetting
from ..traditional.setting import TraditionalSLSetting

logger = get_logger(__name__)


@dataclass
class MultiTaskSLSetting(TaskIncrementalSLSetting, TraditionalSLSetting):
    """IID version of the Task-Incremental Setting, where the data is shuffled.

    Can be used to estimate the upper bound performance of Task-Incremental CL Methods.
    """

    Results: ClassVar[Type[Results]] = TraditionalSLSetting.Results

    stationary_context: bool = constant_property(True)

    def __post_init__(self):
        super().__post_init__()
        # We reuse the training loop from Incremental, by modifying it so it
        # discriminates between "phases" and "tasks".

    @property
    def phases(self) -> int:
        return 1

    # def _make_train_dataset(self) -> Dataset:
    #     """ Returns the training dataset, which in this case will be shuffled.

    #     IDEA: We could probably do it the same way in both RL and SL:
    #     1. Create the 'datasets' for all the tasks;
    #     2. "concatenate"+"Shuffle" the "datasets":
    #         - in SL: ConcatDataset / shuffle the datasets
    #         - in RL: Create a true `MultiTaskEnvironment` that accepts a list of envs as
    #           an input and alternates between environments at each episode.
    #           (either round-robin style, or randomly)

    #     Returns
    #     -------
    #     Dataset
    #     """
    #     joined_dataset = concat(self.train_datasets)
    #     return shuffle(joined_dataset, seed=self.config.seed)

    # def _make_val_dataset(self) -> Dataset:
    #     joined_dataset = concat(self.val_datasets)
    #     return shuffle(joined_dataset, seed=self.config.seed)

    # def _make_test_dataset(self) -> Dataset:
    #     return concat(self.test_datasets)

    # def train_dataloader(
    #     self, batch_size: int = None, num_workers: int = None
    # ) -> PassiveEnvironment:
    #     """Returns a DataLoader for the training dataset.

    #     This dataloader will yield batches which will very likely contain data from
    #     multiple different tasks, and will contain task labels.

    #     Parameters
    #     ----------
    #     batch_size : int, optional
    #         Batch size to use. Defaults to None, in which case the value of
    #         `self.batch_size` is used.
    #     num_workers : int, optional
    #         Number of workers to use. Defaults to None, in which case the value of
    #         `self.num_workers` is used.

    #     Returns
    #     -------
    #     PassiveEnvironment
    #         A "Passive" Dataloader/gym.Env.
    #     """
    #     return super().train_dataloader(batch_size=batch_size, num_workers=num_workers)

    # def val_dataloader(
    #     self, batch_size: int = None, num_workers: int = None
    # ) -> PassiveEnvironment:
    #     """Returns a DataLoader for the validation dataset.

    #     This dataloader will yield batches which will very likely contain data from
    #     multiple different tasks, and will contain task labels.

    #     Parameters
    #     ----------
    #     batch_size : int, optional
    #         Batch size to use. Defaults to None, in which case the value of
    #         `self.batch_size` is used.
    #     num_workers : int, optional
    #         Number of workers to use. Defaults to None, in which case the value of
    #         `self.num_workers` is used.

    #     Returns
    #     -------
    #     PassiveEnvironment
    #         A "Passive" Dataloader/gym.Env.
    #     """
    #     return super().val_dataloader(batch_size=batch_size, num_workers=num_workers)

    # def test_dataloader(
    #     self, batch_size: int = None, num_workers: int = None
    # ) -> PassiveEnvironment:
    #     """Returns a DataLoader for the test dataset.

    #     This dataloader will yield batches which will very likely contain data from
    #     multiple different tasks, and will contain task labels.

    #     Unlike the train and validation environments, the test environment will not
    #     yield rewards until the action has been sent to it using either `send` (when
    #     iterating in the DataLoader-style) or `step` (when interacting with the
    #     environment in the gym.Env style). For more info, take a look at the
    #     `PassiveEnvironment` class.

    #     Parameters
    #     ----------
    #     batch_size : int, optional
    #         Batch size to use. Defaults to None, in which case the value of
    #         `self.batch_size` is used.
    #     num_workers : int, optional
    #         Number of workers to use. Defaults to None, in which case the value of
    #         `self.num_workers` is used.

    #     Returns
    #     -------
    #     PassiveEnvironment
    #         A "Passive" Dataloader/gym.Env.
    #     """
    #     return super().test_dataloader(batch_size=batch_size, num_workers=num_workers)

    # def test_loop(self, method: Method) -> "IncrementalAssumption.Results":
    #     """ Runs a multi-task test loop and returns the Results.
    #     """
    #     return super().test_loop(method)
    # # TODO:
    # test_env = self.test_dataloader()
    # try:
    #     # If the Method has `test` defined, use it.
    #     method.test(test_env)
    #     test_env.close()
    #     # Get the metrics from the test environment
    #     test_results: Results = test_env.get_results()
    #     print(f"Test results: {test_results}")
    #     return test_results

    # except NotImplementedError:
    #     logger.info(
    #         f"Will query the method for actions at each step, "
    #         f"since it doesn't implement a `test` method."
    #     )

    # obs = test_env.reset()

    # # TODO: Do we always have a maximum number of steps? or of episodes?
    # # Will it work the same for Supervised and Reinforcement learning?
    # max_steps: int = getattr(test_env, "step_limit", None)

    # # Reset on the last step is causing trouble, since the env is closed.
    # pbar = tqdm.tqdm(itertools.count(), total=max_steps, desc="Test")
    # episode = 0
    # for step in pbar:
    #     if test_env.is_closed():
    #         logger.debug(f"Env is closed")
    #         break
    #     # logger.debug(f"At step {step}")
    #     action = method.get_actions(obs, test_env.action_space)

    #     # logger.debug(f"action: {action}")
    #     # TODO: Remove this:
    #     if isinstance(action, Actions):
    #         action = action.y_pred
    #     if isinstance(action, Tensor):
    #         action = action.cpu().numpy()

    #     obs, reward, done, info = test_env.step(action)

    #     if done and not test_env.is_closed():
    #         # logger.debug(f"end of test episode {episode}")
    #         obs = test_env.reset()
    #         episode += 1

    # test_env.close()
    # test_results = test_env.get_results()

    # return test_results