dlc2action.project.project

Project interface
View Source
   1#
   2# Copyright 2020-2022 by A. Mathis Group and contributors. All rights reserved.
   3#
   4# This project and all its files are licensed under GNU AGPLv3 or later version. A copy is included in dlc2action/LICENSE.AGPL.
   5#
   6"""
   7Project interface
   8"""
   9import copy
  10from email.policy import default
  11import os
  12from re import search
  13from typing import Dict, List, Tuple, Union, Set, Iterable, Any, Optional
  14import shutil
  15
  16from numpy import ndarray
  17from ruamel.yaml import YAML
  18import pickle
  19import pandas as pd
  20from dlc2action.data.dataset import BehaviorDataset
  21from dlc2action.utils import apply_threshold
  22from collections.abc import Mapping
  23from collections import defaultdict
  24
  25from dlc2action.task.task_dispatcher import TaskDispatcher
  26import warnings
  27from copy import deepcopy, copy
  28import time
  29import numpy as np
  30from matplotlib import pyplot as plt
  31from matplotlib import cm
  32from itertools import product
  33from collections.abc import Iterable
  34import optuna
  35import plotly
  36import torch
  37from pathlib import Path
  38from dlc2action import options, __version__
  39from ruamel.yaml.comments import CommentedMap, CommentedSet
  40from tqdm import tqdm
  41from dlc2action.project.meta import (
  42    Searches,
  43    SavedStores,
  44    Run,
  45    SavedRuns,
  46    DecisionThresholds,
  47)
  48
  49
  50class Project:
  51    """
  52    A class to create and maintain the project files + keep track of experiments
  53    """
  54
  55    def __init__(
  56        self,
  57        name: str,
  58        data_type: str = None,
  59        annotation_type: str = "none",
  60        projects_path: str = None,
  61        data_path: Union[str, List] = None,
  62        annotation_path: Union[str, List] = None,
  63        copy: bool = False,
  64    ) -> None:
  65        """
  66        Parameters
  67        ----------
  68        name : str
  69            name of the project
  70        data_type : str, optional
  71            data type (run Project.data_types() to see available options; has to be provided if the project is being
  72            created)
  73        annotation_type : str, default 'none'
  74            annotation type (run Project.annotation_types() to see available options)
  75        projects_path : str, optional
  76            path to the projects folder (is filled with ~/DLC2Action by default)
  77        data_path : str, optional
  78            path to the folder containing input files for the project (has to be provided if the project is being
  79            created)
  80        annotation_path : str, optional
  81            path to the folder containing annotation files for the project
  82        copy : bool, default False
  83            if True, the files from annotation_path and data_path will be copied to the projects folder;
  84            otherwise they will be moved
  85        """
  86
  87        if projects_path is None:
  88            projects_path = os.path.join(str(Path.home()), "DLC2Action")
  89        if not os.path.exists(projects_path):
  90            os.mkdir(projects_path)
  91        self.project_path = os.path.join(projects_path, name)
  92        self.name = name
  93        self.data_type = data_type
  94        self.annotation_type = annotation_type
  95        self.data_path = data_path
  96        self.annotation_path = annotation_path
  97        if not os.path.exists(self.project_path):
  98            if data_type is None:
  99                raise ValueError(
 100                    "The data_type parameter is necessary when creating a new project!"
 101                )
 102            self._initialize_project(
 103                data_type, annotation_type, data_path, annotation_path, copy
 104            )
 105        else:
 106            self.annotation_type, self.data_type = self._read_types()
 107            if data_type != self.data_type and data_type is not None:
 108                raise ValueError(
 109                    f"The project has already been initialized with data_type={self.data_type}!"
 110                )
 111            if annotation_type != self.annotation_type and annotation_type != "none":
 112                raise ValueError(
 113                    f"The project has already been initialized with annotation_type={self.annotation_type}!"
 114                )
 115            self.annotation_path, data_path = self._read_paths()
 116            if self.data_path is None:
 117                self.data_path = data_path
 118            # if data_path != self.data_path and data_path is not None:
 119            #     raise ValueError(
 120            #         f"The project has already been initialized with data_path={self.data_path}!"
 121            #     )
 122            if annotation_path != self.annotation_path and annotation_path is not None:
 123                raise ValueError(
 124                    f"The project has already been initialized with annotation_path={self.annotation_path}!"
 125                )
 126        self._update_configs()
 127
 128    def _aggregate_predictions(
 129        self,
 130        prediction_name: str,
 131        episode_names: List,
 132        load_epochs: List = None,
 133        parameters_update: Dict = None,
 134        data_path: str = None,
 135        file_paths: Set = None,
 136        mode: str = "all",
 137        augment_n: int = 0,
 138        evaluate: bool = False,
 139        task: TaskDispatcher = None,
 140        embedding: bool = False,
 141    ) -> Tuple[TaskDispatcher, Dict, str, torch.Tensor]:
 142        """
 143        Generate a prediction
 144        """
 145
 146        if load_epochs is None:
 147            load_epochs = [None for _ in episode_names]
 148        prediction = defaultdict(lambda: defaultdict(lambda: defaultdict(lambda: 0)))
 149        cnt = defaultdict(lambda: defaultdict(lambda: defaultdict(lambda: 0)))
 150        behs = set(self.get_behavior_dictionary(episode_names[0]).values())
 151        if not all(
 152            [
 153                set(self.get_behavior_dictionary(x).values()) == behs
 154                for x in episode_names
 155            ]
 156        ):
 157            raise ValueError(f"The behavior sets are different in {episode_names}")
 158        behaviors = set()
 159        for i, episode_name in enumerate(episode_names):
 160            task, parameters, data_mode, new_pred, _ = self._make_prediction(
 161                prediction_name,
 162                episode_names=[episode_name],
 163                load_epochs=[load_epochs[i]],
 164                parameters_update=parameters_update,
 165                data_path=data_path,
 166                file_paths=file_paths,
 167                mode=mode,
 168                augment_n=augment_n,
 169                evaluate=evaluate,
 170                task=task,
 171                embedding=embedding,
 172            )
 173            new_pred = task.dataset(data_mode).generate_full_length_prediction(new_pred)
 174            beh_dict = task.behaviors_dict()
 175            for video_id, video_values in new_pred.items():
 176                for clip_id, clip_prediction in video_values.items():
 177                    for beh_i in range(clip_prediction.shape[0]):
 178                        prediction[video_id][clip_id][
 179                            beh_dict[beh_i]
 180                        ] += clip_prediction[beh_i, :].unsqueeze(0)
 181                        cnt[video_id][clip_id][beh_dict[beh_i]] += 1
 182                        behaviors.add(beh_dict[beh_i])
 183        output = defaultdict(lambda: {})
 184        # behaviors = sorted(behaviors)
 185        behavior_indices = sorted(
 186            [x for x in task.behaviors_dict().keys() if x != -100]
 187        )
 188        behaviors = [task.behaviors_dict()[key] for key in behavior_indices]
 189        for video_id, video_values in prediction.items():
 190            for clip_id, clip_values in video_values.items():
 191                pred = torch.cat(
 192                    [
 193                        clip_values[beh] / cnt[video_id][clip_id][beh]
 194                        for beh in behaviors
 195                    ],
 196                    0,
 197                )
 198                output[video_id][clip_id] = pred
 199        return task, parameters, data_mode, dict(output), None
 200
 201    def _make_prediction(
 202        self,
 203        prediction_name: str,
 204        episode_names: List,
 205        load_epochs: List = None,
 206        parameters_update: Dict = None,
 207        data_path: str = None,
 208        file_paths: Set = None,
 209        mode: str = "all",
 210        augment_n: int = 0,
 211        evaluate: bool = False,
 212        task: TaskDispatcher = None,
 213        embedding: bool = False,
 214    ) -> Tuple[TaskDispatcher, Dict, str, torch.Tensor]:
 215        """
 216        Generate a prediction
 217        """
 218
 219        names = []
 220        epochs = []
 221        if load_epochs is None:
 222            load_epochs = [None for _ in episode_names]
 223        if len(load_epochs) != len(episode_names):
 224            raise ValueError(
 225                f"The length of load_epochs and the length of episode_names should be the same!"
 226            )
 227        for i, episode_name in enumerate(episode_names):
 228            names += self._episodes().get_runs(episode_name)
 229            epochs.append(load_epochs[i])
 230        if len(names) == 0:
 231            warnings.warn(f"None of the episodes {episode_names} exist!")
 232            names = [None]
 233        episodes = self._episodes()
 234        lengths = [
 235            episodes.load_parameters(name)["general"]["len_segment"] for name in names
 236        ]
 237        overlaps = [
 238            episodes.load_parameters(name)["general"]["overlap"] for name in names
 239        ]
 240        if not all([x == lengths[0] for x in lengths]):
 241            raise ValueError(f"Episodes {episode_names} have different segment lengths")
 242        if not all([x == overlaps[0] for x in overlaps]):
 243            raise ValueError(f"Episodes {episode_names} have different overlaps")
 244        load_epochs = epochs
 245        prediction = None
 246        decision_thresholds = None
 247        time_total = 0
 248        behavior_dicts = [
 249            self.get_behavior_dictionary(episode_name) for episode_name in names
 250        ]
 251        if not all(
 252            [
 253                set(d.values()) == set(behavior_dicts[0].values())
 254                for d in behavior_dicts[1:]
 255            ]
 256        ):
 257            raise ValueError(
 258                f"Episodes {episode_names} have different sets of behaviors!"
 259            )
 260        behavior_indices = [x for x in behavior_dicts[0].keys() if x != -100]
 261        behaviors = [behavior_dicts[0][i] for i in behavior_indices]
 262        cnt = defaultdict(lambda: 0)
 263        behavior_probs = defaultdict(lambda: 0)
 264        for episode_name, load_epoch, behavior_dict in zip(
 265            names, load_epochs, behavior_dicts
 266        ):
 267            print(f"episode {episode_name}")
 268            task, parameters, data_mode = self._make_task_prediction(
 269                prediction_name=prediction_name,
 270                load_episode=episode_name,
 271                parameters_update=parameters_update,
 272                load_epoch=load_epoch,
 273                data_path=data_path,
 274                mode=mode,
 275                file_paths=file_paths,
 276                task=task,
 277                decision_thresholds=decision_thresholds,
 278            )
 279            behavior_indices_cur = [x for x in behavior_dict.keys() if x != -100]
 280            behaviors_cur = [behavior_dict[i] for i in behavior_indices_cur]
 281            # data_mode = "train" if mode == "all" else mode
 282            time_start = time.time()
 283            new_pred = task.predict(
 284                data_mode,
 285                raw_output=True,
 286                apply_primary_function=True,
 287                augment_n=augment_n,
 288                embedding=embedding,
 289            )
 290            for j, beh in enumerate(behaviors_cur):
 291                cnt[beh] += 1
 292                behavior_probs[beh] += new_pred[:, j, :].unsqueeze(1)
 293            # indices = [
 294            #     behaviors.index(behavior_dict[i]) for i in range(new_pred.shape[1])
 295            # ]
 296            # new_pred = new_pred[:, indices, :]
 297            time_end = time.time()
 298            time_total += time_end - time_start
 299            if evaluate:
 300                _, metrics = task.evaluate_prediction(new_pred, data=data_mode)
 301                if mode == "val":
 302                    self._update_episode_metrics(episode_name, metrics)
 303            # if prediction is None:
 304            #     prediction = new_pred
 305            # else:
 306            #     prediction += new_pred
 307            print("\n")
 308        prediction = torch.cat([behavior_probs[beh] / cnt[beh] for beh in behaviors], 1)
 309        hours = int(time_total // 3600)
 310        time_total -= hours * 3600
 311        minutes = int(time_total // 60)
 312        time_total -= minutes * 60
 313        seconds = int(time_total)
 314        inference_time = f"{hours}:{minutes:02}:{seconds:02}"
 315        # prediction /= len(names)
 316        return task, parameters, data_mode, prediction, inference_time
 317
 318    def _make_task_prediction(
 319        self,
 320        prediction_name: str,
 321        load_episode: str = None,
 322        parameters_update: Dict = None,
 323        load_epoch: int = None,
 324        data_path: str = None,
 325        mode: str = "val",
 326        file_paths: Set = None,
 327        decision_thresholds: List = None,
 328        task: TaskDispatcher = None,
 329    ) -> Tuple[TaskDispatcher, Dict, str]:
 330        """
 331        Make a `TaskDispatcher` object that will be used to generate a prediction
 332        """
 333
 334        if parameters_update is None:
 335            parameters_update = {}
 336        parameters_update_second = {}
 337        if mode == "all" or data_path is not None or file_paths is not None:
 338            parameters_update_second["training"] = {
 339                "val_frac": 0,
 340                "test_frac": 0,
 341                "partition_method": "random",
 342                "save_split": False,
 343                "split_path": None,
 344            }
 345            mode = "train"
 346        if decision_thresholds is not None:
 347            if (
 348                len(decision_thresholds)
 349                == self._episode(load_episode).get_num_classes()
 350            ):
 351                parameters_update_second["general"] = {
 352                    "threshold_value": decision_thresholds
 353                }
 354            else:
 355                raise ValueError(
 356                    f"The length of the decision thresholds {decision_thresholds} "
 357                    f"must be equal to the length of the behaviors dictionary "
 358                    f"{self._episode(load_episode).get_behaviors_dict()}"
 359                )
 360        data_param_update = {}
 361        if data_path is not None:
 362            data_param_update = {"data_path": data_path}
 363        if file_paths is not None:
 364            data_param_update = {"data_path": None, "file_paths": file_paths}
 365        parameters_update = self._update(parameters_update, {"data": data_param_update})
 366        if data_path is not None or file_paths is not None:
 367            general_update = {
 368                "annotation_type": "none",
 369                "only_load_annotated": False,
 370            }
 371        else:
 372            general_update = {}
 373        parameters_update = self._update(parameters_update, {"general": general_update})
 374        task, parameters = self._make_task(
 375            episode_name=prediction_name,
 376            load_episode=load_episode,
 377            parameters_update=parameters_update,
 378            parameters_update_second=parameters_update_second,
 379            load_epoch=load_epoch,
 380            purpose="prediction",
 381            task=task,
 382            behaviors=self.get_behavior_dictionary(load_episode),
 383        )
 384        # if data_path is not None or file_paths is not None:
 385        #     print('SETTING')
 386        #     task.set_behaviors(self.get_behavior_dictionary(load_episode))
 387        if mode is None:
 388            if task.exists("test"):
 389                mode = "test"
 390            elif task.exists("val"):
 391                mode = "val"
 392            else:
 393                mode = "train"
 394        return task, parameters, mode
 395
 396    def _make_task_training(
 397        self,
 398        episode_name: str,
 399        load_episode: str = None,
 400        parameters_update: Dict = None,
 401        load_epoch: int = None,
 402        load_search: str = None,
 403        load_parameters: list = None,
 404        round_to_binary: list = None,
 405        load_strict: bool = True,
 406        continuing: bool = False,
 407        task: TaskDispatcher = None,
 408        mask_name: str = None,
 409        throwaway: bool = False,
 410    ) -> Tuple[TaskDispatcher, Dict, str]:
 411        """
 412        Make a `TaskDispatcher` object that will be used to generate a prediction
 413        """
 414
 415        if parameters_update is None:
 416            parameters_update = {}
 417        if continuing:
 418            purpose = "continuing"
 419        else:
 420            purpose = "training"
 421        if mask_name is not None:
 422            mask_name = os.path.join(self._mask_path(), f"{mask_name}.pickle")
 423        parameters_update_second = {"data": {"real_lens": mask_name}}
 424        if throwaway:
 425            parameters_update = self._update(
 426                parameters_update, {"training": {"normalize": False, "device": "cpu"}}
 427            )
 428        return self._make_task(
 429            episode_name,
 430            load_episode,
 431            parameters_update,
 432            parameters_update_second,
 433            load_epoch,
 434            load_search,
 435            load_parameters,
 436            round_to_binary,
 437            purpose,
 438            task,
 439            load_strict=load_strict,
 440        )
 441
 442    def _make_parameters(
 443        self,
 444        episode_name: str,
 445        load_episode: str = None,
 446        parameters_update: Dict = None,
 447        parameters_update_second: Dict = None,
 448        load_epoch: int = None,
 449        load_search: str = None,
 450        load_parameters: list = None,
 451        round_to_binary: list = None,
 452        purpose: str = "train",
 453        load_strict: bool = True,
 454    ):
 455        """
 456        Construct a parameters dictionary
 457        """
 458
 459        if parameters_update is None:
 460            parameters_update = {}
 461        pars_update = deepcopy(parameters_update)
 462        if parameters_update_second is None:
 463            parameters_update_second = {}
 464        if purpose == "prediction" and "model" in pars_update.keys():
 465            raise ValueError("Cannot change model parameters after training!")
 466        if purpose in ["continuing", "prediction"] and load_episode is not None:
 467            read_parameters = self._read_parameters()
 468            parameters = self._episodes().load_parameters(load_episode)
 469            parameters["metrics"] = self._update(
 470                read_parameters["metrics"], parameters["metrics"]
 471            )
 472            parameters["ssl"] = self._update(
 473                read_parameters["ssl"], parameters.get("ssl", {})
 474            )
 475        else:
 476            parameters = self._read_parameters()
 477        if "model" in pars_update:
 478            model_params = pars_update.pop("model")
 479        else:
 480            model_params = None
 481        if "features" in pars_update:
 482            feat_params = pars_update.pop("features")
 483        else:
 484            feat_params = None
 485        if "augmentations" in pars_update:
 486            aug_params = pars_update.pop("augmentations")
 487        else:
 488            aug_params = None
 489        parameters = self._update(parameters, pars_update)
 490        if pars_update.get("general", {}).get("model_name") is not None:
 491            model_name = parameters["general"]["model_name"]
 492            parameters["model"] = self._open_yaml(
 493                os.path.join(self.project_path, "config", "model", f"{model_name}.yaml")
 494            )
 495        if pars_update.get("general", {}).get("feature_extraction") is not None:
 496            feat_name = parameters["general"]["feature_extraction"]
 497            parameters["features"] = self._open_yaml(
 498                os.path.join(
 499                    self.project_path, "config", "features", f"{feat_name}.yaml"
 500                )
 501            )
 502            aug_name = options.extractor_to_transformer[
 503                parameters["general"]["feature_extraction"]
 504            ]
 505            parameters["augmentations"] = self._open_yaml(
 506                os.path.join(
 507                    self.project_path, "config", "augmentations", f"{aug_name}.yaml"
 508                )
 509            )
 510        if model_params is not None:
 511            parameters["model"] = self._update(parameters["model"], model_params)
 512        if feat_params is not None:
 513            parameters["features"] = self._update(parameters["features"], feat_params)
 514        if aug_params is not None:
 515            parameters["augmentations"] = self._update(
 516                parameters["augmentations"], aug_params
 517            )
 518        if load_search is not None:
 519            parameters = self._update_with_search(
 520                parameters, load_search, load_parameters, round_to_binary
 521            )
 522        parameters = self._fill(
 523            parameters,
 524            episode_name,
 525            load_episode,
 526            load_epoch=load_epoch,
 527            load_strict=load_strict,
 528            only_load_model=(purpose != "continuing"),
 529            continuing=(purpose in ["prediction", "continuing"]),
 530            enforce_split_parameters=(purpose == "prediction"),
 531        )
 532        parameters = self._update(parameters, parameters_update_second)
 533        return parameters
 534
 535    def _make_task(
 536        self,
 537        episode_name: str,
 538        load_episode: str = None,
 539        parameters_update: Dict = None,
 540        parameters_update_second: Dict = None,
 541        load_epoch: int = None,
 542        load_search: str = None,
 543        load_parameters: list = None,
 544        round_to_binary: list = None,
 545        purpose: str = "train",
 546        task: TaskDispatcher = None,
 547        load_strict: bool = True,
 548        behaviors: Dict = None,
 549    ) -> Tuple[TaskDispatcher, Union[CommentedMap, dict]]:
 550        """
 551        Make a `TaskDispatcher` object
 552
 553        The task parameters are read from the config files and then updated with the
 554        parameters_update dictionary. The model can be either initialized from scratch or loaded from one of the
 555        previous experiments. All parameters and results are saved in the meta files and can be accessed with the
 556        list_episodes() function. The train/test/validation split is saved and loaded from a file whenever the
 557        same split parameters are used. The pre-computed datasets are also saved and loaded whenever the same
 558        data parameters are used.
 559
 560        Parameters
 561        ----------
 562        episode_name : str
 563            the name of the episode
 564        load_episode : str, optional
 565            the (previously run) episode name to load the model from
 566        parameters_update : dict, optional
 567            the dictionary used to update the parameters from the config
 568        parameters_update_second : dict, optional
 569            the dictionary used to update the parameters after the automatic fill-out
 570        load_epoch : int, optional
 571            the epoch to load (if load_episodes is not None); if not provided, the last epoch is used
 572        load_search : str, optional
 573            the hyperparameter search result to load
 574        load_parameters : list, optional
 575            a list of string names of the parameters to load from load_search (if not provided, all parameters
 576            are loaded)
 577        round_to_binary : list, optional
 578            a list of string names of the loaded parameters that should be rounded to the nearest power of two
 579        purpose : {"train", "continuing", "prediction"}
 580            the purpose of the task object (`"train"` for training from scratch, `"continuing"` for continuing
 581            the training of an interrupted episode, `"prediction"` for generating a prediction)
 582        task : TaskDispatcher, optional
 583            a pre-existing task; if provided, the method will update the task instead of creating a new one
 584            (this might save time, mainly on dataset loading)
 585
 586        Returns
 587        -------
 588        task : TaskDispatcher
 589            the `TaskDispatcher` instance
 590        parameters : dict
 591            the parameters dictionary that describes the task
 592        """
 593
 594        parameters = self._make_parameters(
 595            episode_name,
 596            load_episode,
 597            parameters_update,
 598            parameters_update_second,
 599            load_epoch,
 600            load_search,
 601            load_parameters,
 602            round_to_binary,
 603            purpose,
 604            load_strict=load_strict,
 605        )
 606        if parameters["data"].get("annotation_type", "none") == "none":
 607            parameters = self._update(
 608                parameters, {"data": {"behavior_dictionary": behaviors}}
 609            )
 610        if task is None:
 611            task = TaskDispatcher(parameters)
 612        else:
 613            task.update_task(parameters)
 614        self._save_stores(parameters)
 615        return task, parameters
 616
 617    def run_episode(
 618        self,
 619        episode_name: str,
 620        load_episode: str = None,
 621        parameters_update: Dict = None,
 622        task: TaskDispatcher = None,
 623        load_epoch: int = None,
 624        load_search: str = None,
 625        load_parameters: list = None,
 626        round_to_binary: list = None,
 627        load_strict: bool = True,
 628        n_seeds: int = 1,
 629        force: bool = False,
 630        suppress_name_check: bool = False,
 631        remove_saved_features: bool = False,
 632        mask_name: str = None,
 633        autostop_metric: str = None,
 634        autostop_interval: int = 50,
 635        autostop_threshold: float = 0.001,
 636        loading_bar: bool = False,
 637        trial: Tuple = None,
 638    ) -> TaskDispatcher:
 639        """
 640        Run an episode
 641
 642        The task parameters are read from the config files and then updated with the
 643        parameters_update dictionary. The model can be either initialized from scratch or loaded from one of the
 644        previous experiments. All parameters and results are saved in the meta files and can be accessed with the
 645        list_episodes() function. The train/test/validation split is saved and loaded from a file whenever the
 646        same split parameters are used. The pre-computed datasets are also saved and loaded whenever the same
 647        data parameters are used.
 648
 649        You can use the autostop parameters to finish training when the parameters are not improving. It will be
 650        stopped if the average value of `autostop_metric` over the last `autostop_interval` epochs is smaller than
 651        the average over the previous `autostop_interval` epochs + `autostop_threshold`. For example, if the
 652        current epoch is 120 and `autostop_interval` is 50, the averages over epochs 70-120 and 20-70 will be compared.
 653
 654        Parameters
 655        ----------
 656        episode_name : str
 657            the episode name
 658        load_episode : str, optional
 659            the (previously run) episode name to load the model from; if the episode has multiple runs,
 660            the new episode will have the same number of runs, each starting with one of the pre-trained models
 661        parameters_update : dict, optional
 662            the dictionary used to update the parameters from the config files
 663        task : TaskDispatcher, optional
 664            a pre-existing `TaskDispatcher` object (if provided, the method will update it instead of creating
 665            a new instance)
 666        load_epoch : int, optional
 667            the epoch to load (if load_episodes is not None); if not provided, the last epoch is used
 668        load_search : str, optional
 669            the hyperparameter search result to load
 670        load_parameters : list, optional
 671            a list of string names of the parameters to load from load_search (if not provided, all parameters
 672            are loaded)
 673        round_to_binary : list, optional
 674            a list of string names of the loaded parameters that should be rounded to the nearest power of two
 675        load_strict : bool, default True
 676            if `False`, matching weights will be loaded from `load_episode` and differences in parameter name lists and
 677            weight shapes will be ignored; otherwise mismatches will prompt a `RuntimeError`
 678        n_seeds : int, default 1
 679            the number of runs to perform with different random seeds; if `n_seeds > 1`, the episodes will be named
 680            `episode_name::seed_index`, e.g. `test_episode::0` and `test_episode::1`
 681        force : bool, default False
 682            if `True` and an episode with name `episode_name` already exists, it will be overwritten (use with caution!)
 683        suppress_name_check : bool, default False
 684            if `True`, episode names with a double colon are allowed (please don't use this option unless you understand
 685            why they are usually forbidden)
 686        remove_saved_features : bool, default False
 687            if `True`, the dataset will be deleted after training
 688        mask_name : str, optional
 689            the name of the real_lens to apply
 690        autostop_interval : int, default 50
 691            the number of epochs to average the autostop metric over
 692        autostop_threshold : float, default 0.001
 693            the autostop difference threshold
 694        autostop_metric : str, optional
 695            the autostop metric (can be any one of the tracked metrics of `'loss'`)
 696        """
 697
 698        if type(n_seeds) is not int or n_seeds < 1:
 699            raise ValueError(
 700                f"The n_seeds parameter has to be an integer larger than 0; got {n_seeds}"
 701            )
 702        if n_seeds > 1 and mask_name is not None:
 703            raise ValueError("Cannot apply a real_lens with n_seeds > 1")
 704        self._check_episode_validity(
 705            episode_name, allow_doublecolon=suppress_name_check, force=force
 706        )
 707        load_runs = self._episodes().get_runs(load_episode)
 708        if len(load_runs) > 1:
 709            task = self.run_episodes(
 710                episode_names=[
 711                    f'{episode_name}::{run.split("::")[-1]}' for run in load_runs
 712                ],
 713                load_episodes=load_runs,
 714                parameters_updates=[parameters_update for _ in load_runs],
 715                load_epochs=[load_epoch for _ in load_runs],
 716                load_searches=[load_search for _ in load_runs],
 717                load_parameters=[load_parameters for _ in load_runs],
 718                round_to_binary=[round_to_binary for _ in load_runs],
 719                load_strict=[load_strict for _ in load_runs],
 720                suppress_name_check=True,
 721                force=force,
 722                remove_saved_features=False,
 723            )
 724            if remove_saved_features:
 725                self._remove_stores(
 726                    {
 727                        "general": task.general_parameters,
 728                        "data": task.data_parameters,
 729                        "features": task.feature_parameters,
 730                    }
 731                )
 732            if n_seeds > 1:
 733                warnings.warn(
 734                    f"The n_seeds parameter is disregarded since load_episode={load_episode} has multiple runs"
 735                )
 736        elif n_seeds > 1:
 737            self.run_episodes(
 738                episode_names=[f"{episode_name}::{i}" for i in range(n_seeds)],
 739                load_episodes=[load_episode for _ in range(n_seeds)],
 740                parameters_updates=[parameters_update for _ in range(n_seeds)],
 741                load_epochs=[load_epoch for _ in range(n_seeds)],
 742                load_searches=[load_search for _ in range(n_seeds)],
 743                load_parameters=[load_parameters for _ in range(n_seeds)],
 744                round_to_binary=[round_to_binary for _ in range(n_seeds)],
 745                load_strict=[load_strict for _ in range(n_seeds)],
 746                suppress_name_check=True,
 747                force=force,
 748                remove_saved_features=remove_saved_features,
 749            )
 750        else:
 751            print(f"TRAINING {episode_name}")
 752            try:
 753                task, parameters = self._make_task_training(
 754                    episode_name,
 755                    load_episode,
 756                    parameters_update,
 757                    load_epoch,
 758                    load_search,
 759                    load_parameters,
 760                    round_to_binary,
 761                    continuing=False,
 762                    task=task,
 763                    mask_name=mask_name,
 764                    load_strict=load_strict,
 765                )
 766                self._save_episode(
 767                    episode_name,
 768                    parameters,
 769                    task.behaviors_dict(),
 770                    norm_stats=task.get_normalization_stats(),
 771                )
 772                time_start = time.time()
 773                if trial is not None:
 774                    trial, metric = trial
 775                else:
 776                    trial, metric = None, None
 777                logs = task.train(
 778                    autostop_metric=autostop_metric,
 779                    autostop_interval=autostop_interval,
 780                    autostop_threshold=autostop_threshold,
 781                    loading_bar=loading_bar,
 782                    trial=trial,
 783                    optimized_metric=metric,
 784                )
 785                time_end = time.time()
 786                time_total = time_end - time_start
 787                hours = int(time_total // 3600)
 788                time_total -= hours * 3600
 789                minutes = int(time_total // 60)
 790                time_total -= minutes * 60
 791                seconds = int(time_total)
 792                training_time = f"{hours}:{minutes:02}:{seconds:02}"
 793                self._update_episode_results(episode_name, logs, training_time)
 794                if remove_saved_features:
 795                    self._remove_stores(parameters)
 796                print("\n")
 797                return task
 798
 799            except Exception as e:
 800                if isinstance(e, optuna.exceptions.TrialPruned):
 801                    raise e
 802                else:
 803                    # if str(e) != f"The {episode_name} episode name is already in use!":
 804                    #     self.remove_episode(episode_name)
 805                    raise RuntimeError(f"Episode {episode_name} could not run")
 806
 807    def run_episodes(
 808        self,
 809        episode_names: List,
 810        load_episodes: List = None,
 811        parameters_updates: List = None,
 812        load_epochs: List = None,
 813        load_searches: List = None,
 814        load_parameters: List = None,
 815        round_to_binary: List = None,
 816        load_strict: List = None,
 817        force: bool = False,
 818        suppress_name_check: bool = False,
 819        remove_saved_features: bool = False,
 820    ) -> TaskDispatcher:
 821        """
 822        Run multiple episodes in sequence (and re-use previously loaded information)
 823
 824        For each episode, the task parameters are read from the config files and then updated with the
 825        parameter_update dictionary. The model can be either initialized from scratch or loaded from one of the
 826        previous experiments. All parameters and results are saved in the meta files and can be accessed with the
 827        list_episodes() function. The train/test/validation split is saved and loaded from a file whenever the
 828        same split parameters are used. The pre-computed datasets are also saved and loaded whenever the same
 829        data parameters are used.
 830
 831        Parameters
 832        ----------
 833        episode_names : list
 834            a list of strings of episode names
 835        load_episodes : list, optional
 836            a list of strings of (previously run) episode names to load the model from; if the episode has multiple runs,
 837            the new episode will have the same number of runs, each starting with one of the pre-trained models
 838        parameters_updates : list, optional
 839            a list of dictionaries used to update the parameters from the config
 840        load_epochs : list, optional
 841            a list of integers used to specify the epoch to load (if load_episodes is not None)
 842        load_searches : list, optional
 843            a list of strings of hyperparameter search results to load
 844        load_parameters : list, optional
 845            a list of lists of string names of the parameters to load from the searches
 846        round_to_binary : list, optional
 847            a list of string names of the loaded parameters that should be rounded to the nearest power of two
 848        load_strict : list, optional
 849            a list of boolean values specifying weight loading policy: if `False`, matching weights will be loaded from
 850            the corresponding episode and differences in parameter name lists and
 851            weight shapes will be ignored; otherwise mismatches will prompt a `RuntimeError` (by default `True` for
 852            every episode)
 853        force : bool, default False
 854            if `True` and an episode name is already taken, it will be overwritten (use with caution!)
 855        suppress_name_check : bool, default False
 856            if `True`, episode names with a double colon are allowed (please don't use this option unless you understand
 857            why they are usually forbidden)
 858        remove_saved_features : bool, default False
 859            if `True`, the dataset will be deleted after training
 860        """
 861
 862        task = None
 863        if load_searches is None:
 864            load_searches = [None for _ in episode_names]
 865        if load_episodes is None:
 866            load_episodes = [None for _ in episode_names]
 867        if parameters_updates is None:
 868            parameters_updates = [None for _ in episode_names]
 869        if load_parameters is None:
 870            load_parameters = [None for _ in episode_names]
 871        if load_epochs is None:
 872            load_epochs = [None for _ in episode_names]
 873        if load_strict is None:
 874            load_strict = [True for _ in episode_names]
 875        for (
 876            parameters_update,
 877            episode_name,
 878            load_episode,
 879            load_epoch,
 880            load_search,
 881            load_parameters_list,
 882            load_strict_value,
 883        ) in zip(
 884            parameters_updates,
 885            episode_names,
 886            load_episodes,
 887            load_epochs,
 888            load_searches,
 889            load_parameters,
 890            load_strict,
 891        ):
 892            task = self.run_episode(
 893                episode_name,
 894                load_episode,
 895                parameters_update,
 896                task,
 897                load_epoch,
 898                load_search,
 899                load_parameters_list,
 900                round_to_binary,
 901                load_strict_value,
 902                suppress_name_check=suppress_name_check,
 903                force=force,
 904                remove_saved_features=remove_saved_features,
 905            )
 906        return task
 907
 908    def continue_episode(
 909        self,
 910        episode_name: str,
 911        num_epochs: int = None,
 912        task: TaskDispatcher = None,
 913        n_seeds: int = 1,
 914        remove_saved_features: bool = False,
 915        device: str = "cuda",
 916        num_cpus: int = None,
 917    ) -> TaskDispatcher:
 918        """
 919        Load an older episode and continue running from the latest checkpoint
 920
 921        All parameters as well as the model and optimizer state dictionaries are loaded from the episode.
 922
 923        Parameters
 924        ----------
 925        episode_name : str
 926            the name of the episode to continue
 927        num_epochs : int, optional
 928            the new number of epochs
 929        task : TaskDispatcher, optional
 930            a pre-existing task; if provided, the method will update the task instead of creating a new one
 931            (this might save time, mainly on dataset loading)
 932        result_average_interval : int, default 5
 933            the metric are averaged over the last result_average_interval to be stored in the episodes meta file
 934            and displayed by list_episodes() function (the full log is still always available)
 935        n_seeds : int, default 1
 936            the number of runs to perform; if `n_seeds > 1`, the episodes will be named `episode_name::run_index`, e.g.
 937            `test_episode::0` and `test_episode::1`
 938        remove_saved_features : bool, default False
 939            if `True`, pre-computed features will be deleted after the run
 940        device : str, default "cuda"
 941            the torch device to use
 942        """
 943
 944        runs = self._episodes().get_runs(episode_name)
 945        for run in runs:
 946            print(f"TRAINING {run}")
 947            if num_epochs is None and not self._episode(run).unfinished():
 948                continue
 949            parameters_update = {
 950                "training": {
 951                    "num_epochs": num_epochs,
 952                    "device": device,
 953                },
 954                "general": {"num_cpus": num_cpus},
 955            }
 956            task, parameters = self._make_task_training(
 957                run,
 958                load_episode=run,
 959                parameters_update=parameters_update,
 960                continuing=True,
 961                task=task,
 962            )
 963            time_start = time.time()
 964            logs = task.train()
 965            time_end = time.time()
 966            old_time = self._training_time(run)
 967            if not np.isnan(old_time):
 968                time_end += old_time
 969                time_total = time_end - time_start
 970                hours = int(time_total // 3600)
 971                time_total -= hours * 3600
 972                minutes = int(time_total // 60)
 973                time_total -= minutes * 60
 974                seconds = int(time_total)
 975                training_time = f"{hours}:{minutes:02}:{seconds:02}"
 976            else:
 977                training_time = np.nan
 978            self._save_episode(
 979                run,
 980                parameters,
 981                task.behaviors_dict(),
 982                suppress_validation=True,
 983                training_time=training_time,
 984                norm_stats=task.get_normalization_stats(),
 985            )
 986            self._update_episode_results(run, logs)
 987            print("\n")
 988        if len(runs) < n_seeds:
 989            for i in range(len(runs), n_seeds):
 990                self.run_episode(
 991                    f"{episode_name}::{i}",
 992                    parameters_update=self._episodes().load_parameters(runs[0]),
 993                    task=task,
 994                    suppress_name_check=True,
 995                )
 996        if remove_saved_features:
 997            self._remove_stores(parameters)
 998        return task
 999
1000    def run_default_hyperparameter_search(
1001        self,
1002        search_name: str,
1003        model_name: str = None,
1004        metric: str = "f1",
1005        best_n: int = 3,
1006        direction: str = "maximize",
1007        load_episode: str = None,
1008        load_epoch: int = None,
1009        load_strict: bool = True,
1010        prune: bool = True,
1011        force: bool = False,
1012        remove_saved_features: bool = False,
1013        overlap: float = 0,
1014        num_epochs: int = 50,
1015        test_frac: float = 0,
1016        n_trials=150,
1017        device: str = None,
1018    ):
1019        """
1020        Run an optuna hyperparameter search with default parameters for a model
1021
1022        For the vast majority of cases, optimizing the default parameters should be enough.
1023        Check out `dlc2action.options.model_hyperparameters` for the lists of parameters.
1024        There are also options to set overlap, test fraction and number of epochs parameters for the search without
1025        modifying the project config files. However, if you want something more complex, look into
1026        `Project.run_hyperparameter_search`.
1027
1028        The task parameters are read from the config files and updated with the parameters_update dictionary.
1029        The model can be either initialized from scratch or loaded from a previously run episode.
1030        For each trial, the objective metric is averaged over a few best epochs.
1031
1032        Parameters
1033        ----------
1034        search_name : str
1035            the name of the search to store it in the meta files and load in run_episode
1036        model_name : str, optional
1037            the name of the model (by default loaded from the project settings, see `project.help('models')` for options)
1038        metric : str, default f1
1039            the metric to maximize/minimize (see direction); if the metric has an `"average"` parameter and it is set to
1040            `"none"` in the config files, it will be reset to `"macro"` for the search; see `project.help('metrics')` for options
1041        n_trials : int, default 20
1042            the number of optimization trials to run
1043        best_n : int, default 1
1044            the number of epochs to average the metric; if 0, the last value is taken
1045        parameters_update : dict, optional
1046            the parameters update dictionary
1047        direction : {'maximize', 'minimize'}
1048            optimization direction
1049        load_episode : str, optional
1050            the name of the episode to load the model from
1051        load_epoch : int, optional
1052            the epoch to load the model from (if not provided, the last checkpoint is used)
1053        prune : bool, default False
1054            if `True`, experiments where the optimized metric is improving too slowly will be terminated
1055            (with optuna HyperBand pruner)
1056        force : bool, default False
1057            if `True`, existing searches with the same name will be overwritten
1058        remove_saved_features : bool, default False
1059            if `True`, pre-computed features will be deleted after each run (if the data parameters change)
1060        device : str, optional
1061            cuda:{i} or cpu, if not given it is read from the default parameters
1062
1063        Returns
1064        -------
1065        dict
1066            a dictionary of best parameters
1067        """
1068
1069        if model_name is None:
1070            model_name = self._read_parameters()["general"]["model_name"]
1071        if model_name not in options.model_hyperparameters:
1072            raise ValueError(
1073                f"There is no default search space for {model_name}! Please choose from {options.model_hyperparameters.keys()} or try project.run_hyperparameter_search()"
1074            )
1075        pars = {
1076            "general": {
1077                "overlap": overlap,
1078                "model_name": model_name,
1079                "metric_functions": {metric},
1080            },
1081            "training": {"num_epochs": num_epochs},
1082        }
1083        if test_frac is not None:
1084            pars["training"]["test_frac"] = test_frac
1085        if not metric.split("_")[-1].isnumeric():
1086            project_pars = self._read_parameters()
1087            if project_pars["metrics"][metric].get("average") == "none":
1088                pars["metrics"] = {metric: {"average": "macro"}}
1089        if device is not None:
1090            pars["training"]["device"] = device
1091        return self.run_hyperparameter_search(
1092            search_name=search_name,
1093            search_space=options.model_hyperparameters[model_name],
1094            metric=metric,
1095            n_trials=n_trials,
1096            best_n=best_n,
1097            parameters_update=pars,
1098            direction=direction,
1099            load_episode=load_episode,
1100            load_epoch=load_epoch,
1101            load_strict=load_strict,
1102            prune=prune,
1103            force=force,
1104            remove_saved_features=remove_saved_features,
1105        )
1106
1107    def run_hyperparameter_search(
1108        self,
1109        search_name: str,
1110        search_space: Dict,
1111        metric: str = "f1",
1112        n_trials: int = 20,
1113        best_n: int = 1,
1114        parameters_update: Dict = None,
1115        direction: str = "maximize",
1116        load_episode: str = None,
1117        load_epoch: int = None,
1118        load_strict: bool = True,
1119        prune: bool = False,
1120        force: bool = False,
1121        remove_saved_features: bool = False,
1122    ) -> Dict:
1123        """
1124        Run an optuna hyperparameter search
1125
1126        For a simpler function that fits most use cases, check out `Project.run_default_hyperparameter_search()`.
1127
1128        To use a default search space with this method, import `dlc2action.options.model_hyperparameters`. It is
1129        a dictionary where keys are model names and values are default search spaces.
1130
1131        The task parameters are read from the config files and updated with the parameters_update dictionary.
1132        The model can be either initialized from scratch or loaded from a previously run episode.
1133        For each trial, the objective metric is averaged over a few best epochs.
1134
1135        Parameters
1136        ----------
1137        search_name : str
1138            the name of the search to store it in the meta files and load in run_episode
1139        search_space : dict
1140            a dictionary representing the search space; of this general structure:
1141            {'group/param_name': ('float/int/float_log/int_log', start, end),
1142            'group/param_name': ('categorical', [choices])}, e.g.
1143            {'data/overlap': ('int', 5, 100), 'training/lr': ('float_log', 1e-4, 1e-2),
1144            'data/feature_extraction': ('categorical', ['kinematic', 'bones'])};
1145        metric : str, default f1
1146            the metric to maximize/minimize (see direction)
1147        n_trials : int, default 20
1148            the number of optimization trials to run
1149        best_n : int, default 1
1150            the number of epochs to average the metric; if 0, the last value is taken
1151        parameters_update : dict, optional
1152            the parameters update dictionary
1153        direction : {'maximize', 'minimize'}
1154            optimization direction
1155        load_episode : str, optional
1156            the name of the episode to load the model from
1157        load_epoch : int, optional
1158            the epoch to load the model from (if not provided, the last checkpoint is used)
1159        prune : bool, default False
1160            if `True`, experiments where the optimized metric is improving too slowly will be terminated
1161            (with optuna HyperBand pruner)
1162        force : bool, default False
1163            if `True`, existing searches with the same name will be overwritten
1164        remove_saved_features : bool, default False
1165            if `True`, pre-computed features will be deleted after each run (if the data parameters change)
1166
1167        Returns
1168        -------
1169        dict
1170            a dictionary of best parameters
1171        """
1172
1173        self._check_search_validity(search_name, force=force)
1174        print(f"SEARCH {search_name}")
1175        self.remove_episode(f"_{search_name}")
1176        if parameters_update is None:
1177            parameters_update = {}
1178        parameters_update = self._update(
1179            parameters_update, {"general": {"metric_functions": {metric}}}
1180        )
1181        parameters = self._make_parameters(
1182            f"_{search_name}",
1183            load_episode,
1184            parameters_update,
1185            parameters_update_second={"training": {"model_save_path": None}},
1186            load_epoch=load_epoch,
1187            load_strict=load_strict,
1188        )
1189        task = None
1190
1191        if prune:
1192            pruner = optuna.pruners.HyperbandPruner()
1193        else:
1194            pruner = optuna.pruners.NopPruner()
1195        study = optuna.create_study(direction=direction, pruner=pruner)
1196        runner = _Runner(
1197            search_space=search_space,
1198            load_episode=load_episode,
1199            load_epoch=load_epoch,
1200            metric=metric,
1201            average=best_n,
1202            task=task,
1203            remove_saved_features=remove_saved_features,
1204            project=self,
1205            search_name=search_name,
1206        )
1207        study.optimize(lambda trial: runner.run(trial, parameters), n_trials=n_trials)
1208        search_path = self._search_path(search_name)
1209        os.mkdir(search_path)
1210        fig = optuna.visualization.plot_contour(study)
1211        plotly.offline.plot(
1212            fig, filename=os.path.join(search_path, f"{search_name}_contour.html")
1213        )
1214        fig = optuna.visualization.plot_param_importances(study)
1215        plotly.offline.plot(
1216            fig, filename=os.path.join(search_path, f"{search_name}_importances.html")
1217        )
1218        best_params = study.best_params
1219        best_value = study.best_value
1220        self._save_search(
1221            search_name,
1222            parameters,
1223            n_trials,
1224            best_params,
1225            best_value,
1226            metric,
1227            search_space,
1228        )
1229        self.remove_episode(f"_{search_name}")
1230        runner.clean()
1231        print(f"best parameters: {best_params}")
1232        print("\n")
1233        return best_params
1234
1235    def run_prediction(
1236        self,
1237        prediction_name: str,
1238        episode_names: List,
1239        load_epochs: List = None,
1240        parameters_update: Dict = None,
1241        augment_n: int = 10,
1242        data_path: str = None,
1243        mode: str = "all",
1244        file_paths: Set = None,
1245        remove_saved_features: bool = False,
1246        submission: bool = False,
1247        frame_number_map_file: str = None,
1248        force: bool = False,
1249        embedding: bool = False,
1250    ) -> None:
1251        """
1252        Load models from previously run episodes to generate a prediction
1253
1254        The probabilities predicted by the models are averaged.
1255        Unless `submission` is `True`, the prediction results are saved as a pickled dictionary in the project_name/results/predictions folder
1256        under the {episode_name}_{load_epoch}.pickle name. The file is a nested dictionary where the first-level
1257        keys are the video ids, the second-level keys are the clip ids (like individual names) and the values
1258        are the prediction arrays.
1259
1260        Parameters
1261        ----------
1262        prediction_name : str
1263            the name of the prediction
1264        episode_names : list
1265            a list of string episode names to load the models from
1266        load_epochs : list, optional
1267            a list of integer epoch indices to load the model from; if None, the last ones are used
1268        parameters_update : dict, optional
1269            a dictionary of parameter updates
1270        augment_n : int, default 10
1271            the number of augmentations to average over
1272        data_path : str, optional
1273            the data path to run the prediction for
1274        mode : {'all', 'test', 'val', 'train'}
1275            the subset of the data to make the prediction for (forced to 'all' if data_path is not None)
1276        file_paths : set, optional
1277            a set of string file paths (data with all prefixes + feature files, in any order) to run the prediction
1278            for
1279        remove_saved_features : bool, default False
1280            if `True`, pre-computed features will be deleted
1281        submission : bool, default False
1282            if `True`, a MABe-22 style submission file is generated
1283        frame_number_map_file : str, optional
1284            path to the frame number map file
1285        force : bool, default False
1286            if `True`, existing prediction with this name will be overwritten
1287        """
1288
1289        self._check_prediction_validity(prediction_name, force=force)
1290        print(f"PREDICTION {prediction_name}")
1291        if submission:
1292            task = ...
1293            # TODO: add submission option to _make_prediction
1294            predicted = task.generate_submission(
1295                frame_number_map_file=frame_number_map_file,
1296                dataset=mode,
1297                augment_n=augment_n,
1298            )
1299            folder = os.path.join(
1300                self.project_path,
1301                "results",
1302                "predictions",
1303                f"{prediction_name}",
1304            )
1305            filename = os.path.join(folder, f"{prediction_name}.npy")
1306            np.save(filename, predicted, allow_pickle=True)
1307        else:
1308            try:
1309                (
1310                    task,
1311                    parameters,
1312                    mode,
1313                    prediction,
1314                    inference_time,
1315                ) = self._make_prediction(
1316                    prediction_name,
1317                    episode_names,
1318                    load_epochs,
1319                    parameters_update,
1320                    data_path,
1321                    file_paths,
1322                    mode,
1323                    augment_n,
1324                    evaluate=False,
1325                    embedding=embedding,
1326                )
1327                predicted = task.dataset(mode).generate_full_length_prediction(
1328                    prediction
1329                )
1330            except ValueError:
1331                (
1332                    task,
1333                    parameters,
1334                    mode,
1335                    predicted,
1336                    inference_time,
1337                ) = self._aggregate_predictions(
1338                    prediction_name,
1339                    episode_names,
1340                    load_epochs,
1341                    parameters_update,
1342                    data_path,
1343                    file_paths,
1344                    mode,
1345                    augment_n,
1346                    evaluate=False,
1347                    embedding=embedding,
1348                )
1349            folder = self.prediction_path(prediction_name)
1350            os.mkdir(folder)
1351            for video_id, prediction in predicted.items():
1352                with open(
1353                    os.path.join(
1354                        folder, video_id + f"_{prediction_name}_prediction.pickle"
1355                    ),
1356                    "wb",
1357                ) as f:
1358                    prediction["min_frames"], prediction["max_frames"] = task.dataset(
1359                        mode
1360                    ).get_min_max_frames(video_id)
1361                    behavior_indices = sorted(
1362                        [key for key in task.behaviors_dict() if key != -100]
1363                    )
1364                    prediction["behaviors"] = [
1365                        task.behaviors_dict()[key] for key in behavior_indices
1366                    ]
1367                    pickle.dump(prediction, f)
1368        if remove_saved_features:
1369            self._remove_stores(parameters)
1370        self._save_prediction(
1371            prediction_name,
1372            parameters,
1373            task.behaviors_dict(),
1374            embedding,
1375            inference_time,
1376        )
1377        print("\n")
1378
1379    def evaluate_prediction(
1380        self,
1381        prediction_name: str,
1382        parameters_update: Dict = None,
1383        data_path: str = None,
1384        file_paths: Set = None,
1385        mode: str = None,
1386        remove_saved_features: bool = False,
1387    ) -> Tuple[float, dict]:
1388
1389        with open(
1390            os.path.join(
1391                self.project_path, "results", "predictions", f"{prediction_name}.pickle"
1392            ),
1393            "rb",
1394        ) as f:
1395            prediction = pickle.load(f)
1396        if parameters_update is None:
1397            parameters_update = {}
1398        parameters_update = self._update(
1399            self._predictions().load_parameters(prediction_name), parameters_update
1400        )
1401        parameters_update.pop("model")
1402        task, parameters, mode = self._make_task_prediction(
1403            "_",
1404            load_episode=None,
1405            parameters_update=parameters_update,
1406            data_path=data_path,
1407            file_paths=file_paths,
1408            mode=mode,
1409        )
1410        results = task.evaluate_prediction(prediction, data=mode)
1411        if remove_saved_features:
1412            self._remove_stores(parameters)
1413        print("\n")
1414        return results
1415
1416    def evaluate(
1417        self,
1418        episode_names: List,
1419        load_epochs: List = None,
1420        augment_n: int = 0,
1421        data_path: str = None,
1422        file_paths: Set = None,
1423        mode: str = None,
1424        parameters_update: Dict = None,
1425        multiple_episode_policy: str = "average",
1426        remove_saved_features: bool = False,
1427        skip_updating_meta: bool = True,
1428    ) -> Dict:
1429        """
1430        Load one or several models from previously run episodes to make an evaluation
1431
1432        By default it will run on the test (or validation, if there is no test) subset of the project dataset.
1433
1434        Parameters
1435        ----------
1436        episode_names : list
1437            a list of string episode names to load the models from
1438        load_epochs : list, optional
1439            a list of integer epoch indices to load the model from; if None, the last ones are used
1440        augment_n : int, default 0
1441            the number of augmentations to average over
1442        data_path : str, optional
1443            the data path to run the prediction for
1444        file_paths : set, optional
1445            a set of files to run the prediction for
1446        mode : {'test', 'val', 'train', 'all'}
1447            the subset of the data to make the prediction for (forced to 'all' if data_path is not None;
1448            by default 'test' if test subset is not empty and 'val' otherwise)
1449        parameters_update : dict, optional
1450            a dictionary with parameter updates (cannot change model parameters)
1451        remove_saved_features : bool, default False
1452            if `True`, the dataset will be deleted
1453
1454        Returns
1455        -------
1456        metric : dict
1457            a dictionary of average values of metric functions
1458        """
1459
1460        names = []
1461        for episode_name in episode_names:
1462            names += self._episodes().get_runs(episode_name)
1463        if len(set(episode_names)) == 1:
1464            print(f"EVALUATION {episode_names[0]}")
1465        else:
1466            print(f"EVALUATION {episode_names}")
1467        if len(names) > 1:
1468            evaluate = True
1469        else:
1470            evaluate = False
1471        if multiple_episode_policy == "average":
1472            try:
1473                (
1474                    task,
1475                    parameters,
1476                    mode,
1477                    prediction,
1478                    inference_time,
1479                ) = self._make_prediction(
1480                    "_",
1481                    episode_names,
1482                    load_epochs,
1483                    parameters_update,
1484                    mode=mode,
1485                    data_path=data_path,
1486                    file_paths=file_paths,
1487                    augment_n=augment_n,
1488                    evaluate=evaluate,
1489                )
1490            except:
1491                (
1492                    task,
1493                    parameters,
1494                    mode,
1495                    prediction,
1496                    inference_time,
1497                ) = self._aggregate_predictions(
1498                    "_",
1499                    episode_names,
1500                    load_epochs,
1501                    parameters_update,
1502                    mode=mode,
1503                    data_path=data_path,
1504                    file_paths=file_paths,
1505                    augment_n=augment_n,
1506                    evaluate=evaluate,
1507                )
1508            print("AGGREGATED:")
1509            _, results = task.evaluate_prediction(prediction, data=mode)
1510            if len(names) == 1 and mode == "val" and not skip_updating_meta:
1511                self._update_episode_metrics(names[0], results)
1512        elif multiple_episode_policy == "statistics":
1513            values = defaultdict(lambda: [])
1514            task = None
1515            for name in names:
1516                (
1517                    task,
1518                    parameters,
1519                    mode,
1520                    prediction,
1521                    inference_time,
1522                ) = self._make_prediction(
1523                    "_",
1524                    [name],
1525                    load_epochs,
1526                    parameters_update,
1527                    mode=mode,
1528                    data_path=data_path,
1529                    file_paths=file_paths,
1530                    augment_n=augment_n,
1531                    evaluate=evaluate,
1532                    task=task,
1533                )
1534                _, metrics = task.evaluate_prediction(prediction, data=mode)
1535                for name, value in metrics.items():
1536                    values[name].append(value)
1537                if mode == "val" and not skip_updating_meta:
1538                    self._update_episode_metrics(name, metrics)
1539            results = defaultdict(lambda: {})
1540            mean_string = ""
1541            std_string = ""
1542            for key, value_list in values.items():
1543                results[key]["mean"] = np.mean(value_list)
1544                results[key]["std"] = np.std(value_list)
1545                mean_string += f"{key} {np.mean(value_list):.3f}, "
1546                std_string += f"{key} {np.std(value_list):.3f}, "
1547            print("MEAN:")
1548            print(mean_string)
1549            print("STD:")
1550            print(std_string)
1551        else:
1552            raise ValueError(
1553                f"The {multiple_episode_policy} multiple episode policy is not recognized; please choose "
1554                f"from ['average', 'statistics']"
1555            )
1556        if len(names) > 0 and remove_saved_features:
1557            self._remove_stores(parameters)
1558        print(f"Inference time: {inference_time}")
1559        print("\n")
1560        return results
1561
1562    def _generate_similarity_score(
1563        self,
1564        prediction_name: str,
1565        target_video_id: str,
1566        target_clip: str,
1567        target_start: int,
1568        target_end: int,
1569    ) -> Dict:
1570        with open(
1571            os.path.join(
1572                self.project_path,
1573                "results",
1574                "predictions",
1575                f"{prediction_name}.pickle",
1576            ),
1577            "rb",
1578        ) as f:
1579            prediction = pickle.load(f)
1580        target = prediction[target_video_id][target_clip][:, target_start:target_end]
1581        score_dict = defaultdict(lambda: {})
1582        for video_id in prediction:
1583            for clip_id in prediction[video_id]:
1584                score_dict[video_id][clip_id] = torch.cdist(
1585                    target.T, prediction[video_id][score_dict].T
1586                ).min(0)
1587        return score_dict
1588
1589    def _suggest_intervals_from_dict(self, score_dict, min_length, n_intervals) -> Dict:
1590        interval_address = {}
1591        interval_value = {}
1592        s = 0
1593        n = 0
1594        for video_id, video_dict in score_dict.items():
1595            for clip_id, value in video_dict.items():
1596                s += value.mean()
1597                n += 1
1598        mean_value = s / n
1599        alpha = 1.75
1600        for it in range(10):
1601            id = 0
1602            interval_address = {}
1603            interval_value = {}
1604            for video_id, video_dict in score_dict.items():
1605                for clip_id, value in video_dict.items():
1606                    res_indices_start, res_indices_end = apply_threshold(
1607                        value,
1608                        threshold=(2 - alpha * (0.9**it)) * mean_value,
1609                        low=True,
1610                        error_mask=None,
1611                        min_frames=min_length,
1612                        smooth_interval=0,
1613                    )
1614                    for start, end in zip(res_indices_start, res_indices_end):
1615                        interval_address[id] = [video_id, clip_id, start, end]
1616                        interval_value[id] = score_dict[video_id][clip_id][
1617                            start:end
1618                        ].mean()
1619                        id += 1
1620            if len(interval_address) >= n_intervals:
1621                break
1622        if len(interval_address) < n_intervals:
1623            warnings.warn(
1624                f"Could not get {n_intervals} intervals from the data, saving the result with {len(interval_address)} intervals"
1625            )
1626        sorted_intervals = sorted(
1627            interval_value.items(), key=lambda x: x[1], reverse=True
1628        )
1629        output_intervals = [
1630            interval_address[x[0]]
1631            for x in sorted_intervals[: min(len(sorted_intervals), n_intervals)]
1632        ]
1633        output = defaultdict(lambda: [])
1634        for video_id, clip_id, start, end in output_intervals:
1635            output[video_id].append([start, end, clip_id])
1636        return output
1637
1638    def list_episodes(
1639        self,
1640        episode_names: List = None,
1641        value_filter: str = "",
1642        display_parameters: List = None,
1643        print_results: bool = True,
1644    ) -> pd.DataFrame:
1645        """
1646        Get a filtered pandas dataframe with episode metadata
1647
1648        Parameters
1649        ----------
1650        episode_names : list
1651            a list of strings of episode names
1652        value_filter : str
1653            a string of filters to apply; of this general structure:
1654            'group_name1/par_name1::(</>/<=/>=/=)value1,group_name2/par_name2::(</>/<=/>=/=)value2', e.g.
1655            'data/overlap::=50,results/recall::>0.5,data/feature_extraction::=kinematic,meta/training_time::>=00:00:10'
1656        display_parameters : list
1657            list of parameters to display (e.g. ['data/overlap', 'results/recall'])
1658        print_results : bool, default True
1659            if True, the result will be printed to standard output
1660
1661        Returns
1662        -------
1663        pd.DataFrame
1664            the filtered dataframe
1665        """
1666
1667        episodes = self._episodes().list_episodes(
1668            episode_names, value_filter, display_parameters
1669        )
1670        if print_results:
1671            print("TRAINING EPISODES")
1672            print(episodes)
1673            print("\n")
1674        return episodes
1675
1676    def list_predictions(
1677        self,
1678        episode_names: List = None,
1679        value_filter: str = "",
1680        display_parameters: List = None,
1681        print_results: bool = True,
1682    ) -> pd.DataFrame:
1683        """
1684        Get a filtered pandas dataframe with prediction metadata
1685
1686        Parameters
1687        ----------
1688        episode_names : list
1689            a list of strings of episode names
1690        value_filter : str
1691            a string of filters to apply; of this general structure:
1692            'group_name1/par_name1:(<>=)value1,group_name2/par_name2:(<>=)value2', e.g.
1693            'data/overlap:=50,results/recall:>0.5,data/feature_extraction:=kinematic'
1694        display_parameters : list
1695            list of parameters to display (e.g. ['data/overlap', 'results/recall'])
1696        print_results : bool, default True
1697            if True, the result will be printed to standard output
1698
1699        Returns
1700        -------
1701        pd.DataFrame
1702            the filtered dataframe
1703        """
1704
1705        predictions = self._predictions().list_episodes(
1706            episode_names, value_filter, display_parameters
1707        )
1708        if print_results:
1709            print("PREDICTIONS")
1710            print(predictions)
1711            print("\n")
1712        return predictions
1713
1714    def list_searches(
1715        self,
1716        search_names: List = None,
1717        value_filter: str = "",
1718        display_parameters: List = None,
1719        print_results: bool = True,
1720    ) -> pd.DataFrame:
1721        """
1722        Get a filtered pandas dataframe with hyperparameter search metadata
1723
1724        Parameters
1725        ----------
1726        search_names : list
1727            a list of strings of search names
1728        value_filter : str
1729            a string of filters to apply; of this general structure:
1730            'group_name1/par_name1:(<>=)value1,group_name2/par_name2:(<>=)value2', e.g.
1731            'data/overlap:=50,results/recall:>0.5,data/feature_extraction:=kinematic'
1732        display_parameters : list
1733            list of parameters to display (e.g. ['data/overlap', 'results/recall'])
1734        print_results : bool, default True
1735            if True, the result will be printed to standard output
1736
1737        Returns
1738        -------
1739        pd.DataFrame
1740            the filtered dataframe
1741        """
1742
1743        searches = self._searches().list_episodes(
1744            search_names, value_filter, display_parameters
1745        )
1746        if print_results:
1747            print("SEARCHES")
1748            print(searches)
1749            print("\n")
1750        return searches
1751
1752    def get_best_parameters(
1753        self,
1754        search_name: str,
1755        round_to_binary: List = None,
1756    ):
1757        params, model = self._searches().get_best_params(
1758            search_name, round_to_binary=round_to_binary
1759        )
1760        params = self._update(params, {"general": {"model_name": model}})
1761        return params
1762
1763    def list_best_parameters(
1764        self, search_name: str, print_results: bool = True
1765    ) -> Dict:
1766        """
1767        Get the raw dictionary of best parameters found by a search
1768
1769        Parameters
1770        ----------
1771        search_name : str
1772            the name of the search
1773        print_results : bool, default True
1774            if True, the result will be printed to standard output
1775
1776        Returns
1777        -------
1778        best_params : dict
1779            a dictionary of the best parameters where the keys are in '{group}/{name}' format
1780        """
1781
1782        params = self._searches().get_best_params_raw(search_name)
1783        if print_results:
1784            print(f"SEARCH RESULTS {search_name}")
1785            for k, v in params.items():
1786                print(f"{k}: {v}")
1787            print("\n")
1788        return params
1789
1790    def plot_episodes(
1791        self,
1792        episode_names: List,
1793        metrics: List,
1794        modes: List = None,
1795        title: str = None,
1796        episode_labels: List = None,
1797        save_path: str = None,
1798        add_hlines: List = None,
1799        epoch_limits: List = None,
1800        colors: List = None,
1801        add_highpoint_hlines: bool = False,
1802    ) -> None:
1803        """
1804        Plot episode training curves
1805
1806        Parameters
1807        ----------
1808        episode_names : list
1809            a list of episode names to plot; to plot to episodes in one line combine them in a list
1810            (e.g. ['episode1', ['episode2', 'episode3']] to plot episode2 and episode3 as one experiment)
1811        metrics : list
1812            a list of metric to plot
1813        modes : list, optional
1814            a list of modes to plot ('train' and/or 'val'; `['val']` by default)
1815        title : str, optional
1816            title for the plot
1817        episode_labels : list, optional
1818            a list of strings used to label the curves (has to be the same length as episode_names)
1819        save_path : str, optional
1820            the path to save the resulting plot
1821        add_hlines : list, optional
1822            a list of float values (or (value, label) tuples) to mark with horizontal lines
1823        colors: list, optional
1824            a list of matplotlib colors
1825        add_highpoint_hlines : bool, default False
1826            if `True`, horizontal lines will be added at the highest value of each episode
1827        """
1828
1829        if modes is None:
1830            modes = ["val"]
1831        if add_hlines is None:
1832            add_hlines = []
1833        logs = []
1834        epochs = []
1835        labels = []
1836        if episode_labels is not None:
1837            assert len(episode_labels) == len(episode_names)
1838        for name_i, name in enumerate(episode_names):
1839            log_params = product(metrics, modes)
1840            for metric, mode in log_params:
1841                if episode_labels is not None:
1842                    label = episode_labels[name_i]
1843                else:
1844                    label = deepcopy(name)
1845                if len(modes) != 1:
1846                    label += f"_{mode}"
1847                if len(metrics) != 1:
1848                    label += f"_{metric}"
1849                labels.append(label)
1850                if isinstance(name, Iterable) and not isinstance(name, str):
1851                    epoch_list = defaultdict(lambda: [])
1852                    multi_logs = defaultdict(lambda: [])
1853                    for i, n in enumerate(name):
1854                        runs = self._episodes().get_runs(n)
1855                        if len(runs) > 1:
1856                            for run in runs:
1857                                index = run.split("::")[-1]
1858                                if multi_logs[index] == []:
1859                                    if multi_logs["null"] is None:
1860                                        raise RuntimeError(
1861                                            "The run indices are not consistent across episodes!"
1862                                        )
1863                                    else:
1864                                        multi_logs[index] += multi_logs["null"]
1865                                multi_logs[index] += list(
1866                                    self._episode(run).get_metric_log(mode, metric)
1867                                )
1868                                start = (
1869                                    0
1870                                    if len(epoch_list[index]) == 0
1871                                    else epoch_list[index][-1]
1872                                )
1873                                epoch_list[index] += [
1874                                    x + start
1875                                    for x in self._episode(run).get_epoch_list(mode)
1876                                ]
1877                            multi_logs["null"] = None
1878                        else:
1879                            if len(multi_logs.keys()) > 1:
1880                                raise RuntimeError(
1881                                    "Cannot plot a single-run episode after a multi-run episode!"
1882                                )
1883                            multi_logs["null"] += list(
1884                                self._episode(n).get_metric_log(mode, metric)
1885                            )
1886                            start = (
1887                                0
1888                                if len(epoch_list["null"]) == 0
1889                                else epoch_list["null"][-1]
1890                            )
1891                            epoch_list["null"] += [
1892                                x + start for x in self._episode(n).get_epoch_list(mode)
1893                            ]
1894                    if len(multi_logs.keys()) == 1:
1895                        log = multi_logs["null"]
1896                        epochs.append(epoch_list["null"])
1897                    else:
1898                        log = tuple([v for k, v in multi_logs.items() if k != "null"])
1899                        epochs.append(
1900                            tuple([v for k, v in epoch_list.items() if k != "null"])
1901                        )
1902                else:
1903                    runs = self._episodes().get_runs(name)
1904                    if len(runs) > 1:
1905                        log = []
1906                        for run in runs:
1907                            tracked_metrics = self._episode(run).get_metrics()
1908                            if metric in tracked_metrics:
1909                                log.append(
1910                                    list(
1911                                        self._episode(run).get_metric_log(mode, metric)
1912                                    )
1913                                )
1914                            else:
1915                                relevant = []
1916                                for m in tracked_metrics:
1917                                    m_split = m.split("_")
1918                                    if (
1919                                        "_".join(m_split[:-1]) == metric
1920                                        and m_split[-1].isnumeric()
1921                                    ):
1922                                        relevant.append(m)
1923                                if len(relevant) == 0:
1924                                    raise ValueError(
1925                                        f"The {metric} metric was not tracked at {run}"
1926                                    )
1927                                arr = 0
1928                                for m in relevant:
1929                                    arr += self._episode(run).get_metric_log(mode, m)
1930                                arr /= len(relevant)
1931                                log.append(list(arr))
1932                        log = tuple(log)
1933                        epochs.append(
1934                            tuple(
1935                                [
1936                                    self._episode(run).get_epoch_list(mode)
1937                                    for run in runs
1938                                ]
1939                            )
1940                        )
1941                    else:
1942                        tracked_metrics = self._episode(name).get_metrics()
1943                        if metric in tracked_metrics:
1944                            log = list(self._episode(name).get_metric_log(mode, metric))
1945                        else:
1946                            relevant = []
1947                            for m in tracked_metrics:
1948                                m_split = m.split("_")
1949                                if (
1950                                    "_".join(m_split[:-1]) == metric
1951                                    and m_split[-1].isnumeric()
1952                                ):
1953                                    relevant.append(m)
1954                            if len(relevant) == 0:
1955                                raise ValueError(
1956                                    f"The {metric} metric was not tracked at {name}"
1957                                )
1958                            arr = 0
1959                            for m in relevant:
1960                                arr += self._episode(name).get_metric_log(mode, m)
1961                            arr /= len(relevant)
1962                            log = list(arr)
1963                        epochs.append(self._episode(name).get_epoch_list(mode))
1964                logs.append(log)
1965        # if episode_labels is not None:
1966        #     print(f'{len(episode_labels)=}, {len(logs)=}')
1967        #     if len(episode_labels) != len(logs):
1968
1969        #         raise ValueError(
1970        #             f"The length of episode_labels ({len(episode_labels)}) has to be equal to the length of "
1971        #             f"curves ({len(logs)})!"
1972        #         )
1973        #     else:
1974        #         labels = episode_labels
1975        if colors is None:
1976            colors = cm.rainbow(np.linspace(0, 1, len(logs)))
1977        if len(colors) != len(logs):
1978            raise ValueError(
1979                "The length of colors has to be equal to the length of curves (metrics * modes * episode_names)!"
1980            )
1981        plt.figure()
1982        length = 0
1983        for log, label, color, epoch_list in zip(logs, labels, colors, epochs):
1984            if type(log) is list:
1985                if len(log) > length:
1986                    length = len(log)
1987                plt.plot(
1988                    epoch_list,
1989                    log,
1990                    label=label,
1991                    color=color,
1992                )
1993                if add_highpoint_hlines:
1994                    plt.axhline(np.max(log), linestyle="dashed", color=color)
1995            else:
1996                for l, xx in zip(log, epoch_list):
1997                    if len(l) > length:
1998                        length = len(l)
1999                    plt.plot(
2000                        xx,
2001                        l,
2002                        color=color,
2003                        alpha=0.2,
2004                    )
2005                if not all([len(x) == len(log[0]) for x in log]):
2006                    warnings.warn(
2007                        f"Got logs with unequal lengths in parallel runs for {label}"
2008                    )
2009                    log = list(log)
2010                    epoch_list = list(epoch_list)
2011                    for i, x in enumerate(epoch_list):
2012                        to_remove = []
2013                        for j, y in enumerate(x[1:]):
2014                            if y <= x[j - 1]:
2015                                y_ind = x.index(y)
2016                                to_remove += list(range(y_ind, j))
2017                        epoch_list[i] = [
2018                            y for j, y in enumerate(x) if j not in to_remove
2019                        ]
2020                        log[i] = [y for j, y in enumerate(log[i]) if j not in to_remove]
2021                    length = min([len(x) for x in log])
2022                    for i in range(len(log)):
2023                        log[i] = log[i][:length]
2024                        epoch_list[i] = epoch_list[i][:length]
2025                    if not all([x == epoch_list[0] for x in epoch_list]):
2026                        raise RuntimeError(
2027                            f"Got different epoch indices in parallel runs for {label}"
2028                        )
2029                mean = np.array(log).mean(0)
2030                plt.plot(
2031                    epoch_list[0],
2032                    mean,
2033                    label=label,
2034                    color=color,
2035                )
2036                if add_highpoint_hlines:
2037                    plt.axhline(np.max(mean), linestyle="dashed", color=color)
2038        for x in add_hlines:
2039            label = None
2040            if isinstance(x, Iterable):
2041                x, label = x
2042            plt.axhline(x, label=label)
2043            plt.xlim((0, length))
2044
2045        plt.legend()
2046        plt.xlabel("epochs")
2047        if len(metrics) == 1:
2048            plt.ylabel(metrics[0])
2049        else:
2050            plt.ylabel("value")
2051        if title is None:
2052            if len(episode_names) == 1:
2053                title = episode_names[0]
2054            elif len(metrics) == 1:
2055                title = metrics[0]
2056        if epoch_limits is not None:
2057            plt.xlim(epoch_limits)
2058        if title is not None:
2059            plt.title(title)
2060        plt.show()
2061        if save_path is not None:
2062            plt.savefig(save_path)
2063
2064    def update_parameters(
2065        self,
2066        parameters_update: Dict = None,
2067        load_search: str = None,
2068        load_parameters: List = None,
2069        round_to_binary: List = None,
2070    ) -> None:
2071        """
2072        Update the parameters in the project config files
2073
2074        Parameters
2075        ----------
2076        parameters_update : dict, optional
2077            a dictionary of parameter updates
2078        load_search : str, optional
2079            the name of hyperparameter search results to load to config
2080        load_parameters : list, optional
2081            a list of lists of string names of the parameters to load from the searches
2082        round_to_binary : list, optional
2083            a list of string names of the loaded parameters that should be rounded to the nearest power of two
2084        """
2085
2086        keys = [
2087            "general",
2088            "losses",
2089            "metrics",
2090            "ssl",
2091            "training",
2092            "data",
2093        ]
2094        parameters = self._read_parameters(catch_blanks=False)
2095        if parameters_update is not None:
2096            if "model" in parameters_update:
2097                model_params = parameters_update.pop("model")
2098            else:
2099                model_params = None
2100            if "features" in parameters_update:
2101                feat_params = parameters_update.pop("features")
2102            else:
2103                feat_params = None
2104            if "augmentations" in parameters_update:
2105                aug_params = parameters_update.pop("augmentations")
2106            else:
2107                aug_params = None
2108            parameters = self._update(parameters, parameters_update)
2109            model_name = parameters["general"]["model_name"]
2110            parameters["model"] = self._open_yaml(
2111                os.path.join(self.project_path, "config", "model", f"{model_name}.yaml")
2112            )
2113            if model_params is not None:
2114                parameters["model"] = self._update(parameters["model"], model_params)
2115            feat_name = parameters["general"]["feature_extraction"]
2116            parameters["features"] = self._open_yaml(
2117                os.path.join(
2118                    self.project_path, "config", "features", f"{feat_name}.yaml"
2119                )
2120            )
2121            if feat_params is not None:
2122                parameters["features"] = self._update(
2123                    parameters["features"], feat_params
2124                )
2125            aug_name = options.extractor_to_transformer[
2126                parameters["general"]["feature_extraction"]
2127            ]
2128            parameters["augmentations"] = self._open_yaml(
2129                os.path.join(
2130                    self.project_path, "config", "augmentations", f"{aug_name}.yaml"
2131                )
2132            )
2133            if aug_params is not None:
2134                parameters["augmentations"] = self._update(
2135                    parameters["augmentations"], aug_params
2136                )
2137        if load_search is not None:
2138            parameters_update, model_name = self._searches().get_best_params(
2139                load_search, load_parameters, round_to_binary
2140            )
2141            parameters["general"]["model_name"] = model_name
2142            parameters["model"] = self._open_yaml(
2143                os.path.join(self.project_path, "config", "model", f"{model_name}.yaml")
2144            )
2145            parameters = self._update(parameters, parameters_update)
2146        for key in keys:
2147            with open(
2148                os.path.join(self.project_path, "config", f"{key}.yaml"), "w", encoding="utf-8"
2149            ) as f:
2150                YAML().dump(parameters[key], f)
2151        model_name = parameters["general"]["model_name"]
2152        model_path = os.path.join(
2153            self.project_path, "config", "model", f"{model_name}.yaml"
2154        )
2155        with open(model_path, "w", encoding="utf-8") as f:
2156            YAML().dump(parameters["model"], f)
2157        features_name = parameters["general"]["feature_extraction"]
2158        features_path = os.path.join(
2159            self.project_path, "config", "features", f"{features_name}.yaml"
2160        )
2161        with open(features_path, "w", encoding="utf-8") as f:
2162            YAML().dump(parameters["features"], f)
2163        aug_name = options.extractor_to_transformer[features_name]
2164        aug_path = os.path.join(
2165            self.project_path, "config", "augmentations", f"{aug_name}.yaml"
2166        )
2167        with open(aug_path, "w", encoding="utf-8") as f:
2168            YAML().dump(parameters["augmentations"], f)
2169
2170    def get_summary(
2171        self,
2172        episode_names: list,
2173        method: str = "last",
2174        average: int = 1,
2175        metrics: List = None,
2176    ) -> Dict:
2177        """
2178        Get a summary of episode statistics
2179
2180        If the episode has multiple runs, the statistics will be aggregated over all of them.
2181
2182        Parameters
2183        ----------
2184        episode_name : str
2185            the name of the episode
2186        method : ["best", "last"]
2187            the method for choosing the epochs
2188        average : int, default 1
2189            the number of epochs to average over (for each run)
2190        metrics : list, optional
2191            a list of metrics
2192
2193        Returns
2194        -------
2195        statistics : dict
2196            a nested dictionary where first-level keys are metric names and second-level keys are 'mean' for the mean
2197            and 'std' for the standard deviation
2198        """
2199
2200        runs = []
2201        for episode_name in episode_names:
2202            runs_ep = self._episodes().get_runs(episode_name)
2203            if len(runs_ep) == 0:
2204                raise RuntimeError(
2205                    f"There is no {episode_name} episode in the project memory"
2206                )
2207            runs += runs_ep
2208        if metrics is None:
2209            metrics = self._episode(runs[0]).get_metrics()
2210
2211        values = {m: [] for m in metrics}
2212        for run in runs:
2213            for m in metrics:
2214                log = self._episode(run).get_metric_log(mode="val", metric_name=m)
2215                if method == "best":
2216                    log = sorted(log)
2217                    values[m] += list(log[-average:])
2218                elif method == "last":
2219                    if len(log) == 0:
2220                        episodes = self._episodes().data
2221                        if average == 1 and ("results", m) in episodes.columns:
2222                            values[m] += [episodes.loc[run, ("results", m)]]
2223                        else:
2224                            raise RuntimeError(f"Did not find {m} metric for {run} run")
2225                    values[m] += list(log[-average:])
2226                elif method.startswith("epoch"):
2227                    epoch = int(method[5:]) - 1
2228                    pars = self._episodes().load_parameters(run)
2229                    step = int(pars["training"]["validation_interval"])
2230                    values[m] += [log[epoch // step]]
2231                else:
2232                    raise ValueError(
2233                        f"The {method} method is not recognized! Please choose from ['last', 'best', 'epoch...']"
2234                    )
2235        statistics = defaultdict(lambda: {})
2236        for m, v in values.items():
2237            statistics[m]["mean"] = np.mean(v)
2238            statistics[m]["std"] = np.std(v)
2239        print(f"SUMMARY {episode_names}")
2240        for m, v in statistics.items():
2241            print(f'{m}: mean {v["mean"]:.3f}, std {v["std"]:.3f}')
2242        print("\n")
2243        return dict(statistics)
2244
2245    @staticmethod
2246    def remove_project(name: str, projects_path: str = None) -> None:
2247        """
2248        Remove all project files and experiment records and results
2249        """
2250
2251        if projects_path is None:
2252            projects_path = os.path.join(str(Path.home()), "DLC2Action")
2253        project_path = os.path.join(projects_path, name)
2254        if os.path.exists(project_path):
2255            shutil.rmtree(project_path)
2256
2257    def remove_saved_features(
2258        self,
2259        dataset_names: List = None,
2260        exceptions: List = None,
2261        remove_active: bool = False,
2262    ) -> None:
2263        """
2264        Remove saved pre-computed dataset files
2265
2266        By default, all pre-computed features will be deleted.
2267        No essential information can get lost, storing them only saves time. Be careful with deleting datasets
2268        while training or inference is happening though.
2269
2270        Parameters
2271        ----------
2272        dataset_names : list, optional
2273            a list of dataset names to delete (by default all names are added)
2274        exceptions : list, optional
2275            a list of dataset names to not be deleted
2276        remove_active : bool, default False
2277            if `False`, datasets used by unfinished episodes will not be deleted
2278        """
2279
2280        print("Removing datasets...")
2281        if dataset_names is None:
2282            dataset_names = []
2283        if exceptions is None:
2284            exceptions = []
2285        if not remove_active:
2286            exceptions += self._episodes().get_active_datasets()
2287        dataset_path = os.path.join(self.project_path, "saved_datasets")
2288        if os.path.exists(dataset_path):
2289            if dataset_names == []:
2290                dataset_names = set([f.split(".")[0] for f in os.listdir(dataset_path)])
2291
2292            to_remove = [
2293                x
2294                for x in dataset_names
2295                if os.path.exists(os.path.join(dataset_path, x)) and x not in exceptions
2296            ]
2297            if len(to_remove) > 2:
2298                to_remove = tqdm(to_remove)
2299            for dataset in to_remove:
2300                shutil.rmtree(os.path.join(dataset_path, dataset))
2301            to_remove = [
2302                f"{x}.pickle"
2303                for x in dataset_names
2304                if os.path.exists(os.path.join(dataset_path, f"{x}.pickle"))
2305                and x not in exceptions
2306            ]
2307            for dataset in to_remove:
2308                os.remove(os.path.join(dataset_path, dataset))
2309            names = self._saved_datasets().dataset_names()
2310            self._saved_datasets().remove(names)
2311        print("\n")
2312
2313    def remove_extra_checkpoints(
2314        self, episode_names: List = None, exceptions: List = None
2315    ) -> None:
2316        """
2317        Remove intermediate model checkpoint files (only leave the results of the last epoch)
2318
2319        By default, all intermediate checkpoints will be deleted.
2320        Files in the model folder that are not associated with any record in the meta files are also deleted.
2321
2322        Parameters
2323        ----------
2324        episode_names : list, optional
2325            a list of episode names to clean (by default all names are added)
2326        exceptions : list, optional
2327            a list of episode names to not clean
2328        """
2329
2330        model_path = os.path.join(self.project_path, "results", "model")
2331        try:
2332            all_names = self._episodes().data.index
2333        except:
2334            all_names = os.listdir(model_path)
2335        if episode_names is None:
2336            episode_names = all_names
2337        if exceptions is None:
2338            exceptions = []
2339        to_remove = [x for x in episode_names if x not in exceptions]
2340        folders = os.listdir(model_path)
2341        for folder in folders:
2342            if folder not in all_names:
2343                shutil.rmtree(os.path.join(model_path, folder))
2344            elif folder in to_remove:
2345                files = os.listdir(os.path.join(model_path, folder))
2346                for file in sorted(files)[:-1]:
2347                    os.remove(os.path.join(model_path, folder, file))
2348
2349    def remove_search(self, search_name: str) -> None:
2350        """
2351        Remove a hyperparameter search record
2352
2353        Parameters
2354        ----------
2355        search_name : str
2356            the name of the search to remove
2357        """
2358
2359        self._searches().remove_episode(search_name)
2360        graph_path = os.path.join(self.project_path, "results", "searches", search_name)
2361        if os.path.exists(graph_path):
2362            shutil.rmtree(graph_path)
2363
2364    def remove_prediction(self, prediction_name: str) -> None:
2365        """
2366        Remove a prediction record
2367
2368        Parameters
2369        ----------
2370        prediction_name : str
2371            the name of the prediction to remove
2372        """
2373
2374        self._predictions().remove_episode(prediction_name)
2375        prediction_path = os.path.join(
2376            self.project_path, "results", "predictions", prediction_name
2377        )
2378        if os.path.exists(prediction_path):
2379            shutil.rmtree(prediction_path)
2380
2381    def remove_episode(self, episode_name: str) -> None:
2382        """
2383        Remove all model, logs and metafile records related to an episode
2384
2385        Parameters
2386        ----------
2387        episode_name : str
2388            the name of the episode to remove
2389        """
2390
2391        runs = self._episodes().get_runs(episode_name)
2392        runs.append(episode_name)
2393        for run in runs:
2394            self._episodes().remove_episode(run)
2395            model_path = os.path.join(self.project_path, "results", "model", run)
2396            if os.path.exists(model_path):
2397                shutil.rmtree(model_path)
2398            log_path = os.path.join(self.project_path, "results", "logs", f"{run}.txt")
2399            if os.path.exists(log_path):
2400                os.remove(log_path)
2401
2402    def prune_unfinished(self, exceptions: List = None) -> None:
2403        """
2404        Remove all interrupted episodes
2405
2406        Remove all episodes that either don't have a log file or have less epochs in the log file than in
2407        the training parameters or have a model folder but not a record. Note that it can remove episodes that are
2408        currently running!
2409
2410        Parameters
2411        ----------
2412        exceptions : list
2413            the episodes to keep even if they are interrupted
2414
2415        Returns
2416        -------
2417        pruned : list
2418            a list of the episode names that were pruned
2419        """
2420
2421        if exceptions is None:
2422            exceptions = []
2423        unfinished = self._episodes().unfinished_episodes()
2424        unfinished = [x for x in unfinished if x not in exceptions]
2425        model_folders = os.listdir(os.path.join(self.project_path, "results", "model"))
2426        unfinished += [
2427            x for x in model_folders if x not in self._episodes().list_episodes().index
2428        ]
2429        print(f"PRUNING {unfinished}")
2430        for episode_name in unfinished:
2431            self.remove_episode(episode_name)
2432        print(f"\n")
2433        return unfinished
2434
2435    def prediction_path(self, prediction_name: str) -> str:
2436        """
2437        Get the path where prediction files are saved
2438
2439        Parameters
2440        ----------
2441        prediction_name : str
2442            name of the prediction
2443
2444        Returns
2445        -------
2446        prediction_path : str
2447            the file path
2448        """
2449
2450        return os.path.join(
2451            self.project_path, "results", "predictions", f"{prediction_name}"
2452        )
2453
2454    @classmethod
2455    def print_data_types(cls):
2456        print("DATA TYPES:")
2457        for key, value in cls.data_types().items():
2458            print(f"{key}:")
2459            print(value.__doc__)
2460
2461    @classmethod
2462    def print_annotation_types(cls):
2463        print("ANNOTATION TYPES:")
2464        for key, value in cls.annotation_types().items():
2465            print(f"{key}:")
2466            print(value.__doc__)
2467
2468    @staticmethod
2469    def data_types() -> List:
2470        """
2471        Get available data types
2472
2473        Returns
2474        -------
2475        list
2476            available data types
2477        """
2478
2479        return options.input_stores
2480
2481    @staticmethod
2482    def annotation_types() -> List:
2483        """
2484        Get available annotation types
2485
2486        Returns
2487        -------
2488        list
2489            available annotation types
2490        """
2491
2492        return options.annotation_stores
2493
2494    def _save_mask(self, file: Dict, mask_name: str):
2495        """
2496        Save a mask file
2497        """
2498
2499        if not os.path.exists(self._mask_path()):
2500            os.mkdir(self._mask_path())
2501        with open(os.path.join(self._mask_path(), mask_name + ".pickle"), "wb") as f:
2502            pickle.dump(file, f)
2503
2504    def _load_mask(self, mask_name: str) -> Dict:
2505        """
2506        Load a mask file
2507        """
2508
2509        with open(os.path.join(self._mask_path(), mask_name + ".pickle"), "rb") as f:
2510            data = pickle.load(f)
2511        return data
2512
2513    def _thresholds(self) -> DecisionThresholds:
2514        """
2515        Get the decision thresholds meta object
2516        """
2517
2518        return DecisionThresholds(self._thresholds_path())
2519
2520    def _episodes(self) -> SavedRuns:
2521        """
2522        Get the episodes meta object
2523
2524        Returns
2525        -------
2526        episodes : SavedRuns
2527            the episodes meta object
2528        """
2529
2530        try:
2531            return SavedRuns(self._episodes_path(), self.project_path)
2532        except:
2533            self.load_metadata_backup()
2534            return SavedRuns(self._episodes_path(), self.project_path)
2535
2536    def _predictions(self) -> SavedRuns:
2537        """
2538        Get the predictions meta object
2539
2540        Returns
2541        -------
2542        predictions : SavedRuns
2543            the predictions meta object
2544        """
2545
2546        try:
2547            return SavedRuns(self._predictions_path(), self.project_path)
2548        except:
2549            self.load_metadata_backup()
2550            return SavedRuns(self._predictions_path(), self.project_path)
2551
2552    def _saved_datasets(self) -> SavedStores:
2553        """
2554        Get the datasets meta object
2555
2556        Returns
2557        -------
2558        datasets : SavedStores
2559            the datasets meta object
2560        """
2561
2562        try:
2563            return SavedStores(self._saved_datasets_path())
2564        except:
2565            self.load_metadata_backup()
2566            return SavedStores(self._saved_datasets_path())
2567
2568    def _prediction(self, name: str) -> Run:
2569        """
2570        Get a prediction meta object
2571
2572        Parameters
2573        ----------
2574        name : str
2575            episode name
2576
2577        Returns
2578        -------
2579        prediction : Run
2580            the prediction meta object
2581        """
2582
2583        try:
2584            return Run(name, self.project_path, meta_path=self._predictions_path())
2585        except:
2586            self.load_metadata_backup()
2587            return Run(name, self.project_path, meta_path=self._predictions_path())
2588
2589    def _episode(self, name: str) -> Run:
2590        """
2591        Get an episode meta object
2592
2593        Parameters
2594        ----------
2595        name : str
2596            episode name
2597
2598        Returns
2599        -------
2600        episode : Run
2601            the episode meta object
2602        """
2603
2604        try:
2605            return Run(name, self.project_path, meta_path=self._episodes_path())
2606        except:
2607            self.load_metadata_backup()
2608            return Run(name, self.project_path, meta_path=self._episodes_path())
2609
2610    def _searches(self) -> Searches:
2611        """
2612        Get the hyperparameter search meta object
2613
2614        Returns
2615        -------
2616        searches : Searches
2617            the searches meta object
2618        """
2619
2620        try:
2621            return Searches(self._searches_path(), self.project_path)
2622        except:
2623            self.load_metadata_backup()
2624            return Searches(self._searches_path(), self.project_path)
2625
2626    def _update_configs(self) -> None:
2627        """
2628        Update the project config files with newly added files and parameters
2629        """
2630
2631        self.update_parameters({"data": {"data_path": self.data_path}})
2632        folders = ["augmentations", "features", "model"]
2633        original_path = os.path.join(
2634            os.path.dirname(os.path.dirname(__file__)), "config"
2635        )
2636        project_path = os.path.join(self.project_path, "config")
2637        filenames = [x for x in os.listdir(original_path) if x.endswith("yaml")]
2638        for folder in folders:
2639            filenames += [
2640                os.path.join(folder, x)
2641                for x in os.listdir(os.path.join(original_path, folder))
2642            ]
2643        filenames.append(os.path.join("data", f"{self.data_type}.yaml"))
2644        if self.annotation_type != "none":
2645            filenames.append(os.path.join("annotation", f"{self.annotation_type}.yaml"))
2646        for file in filenames:
2647            filepath_original = os.path.join(original_path, file)
2648            if file.startswith("data") or file.startswith("annotation"):
2649                file = os.path.basename(file)
2650            filepath_project = os.path.join(project_path, file)
2651            if not os.path.exists(filepath_project):
2652                shutil.copy(filepath_original, filepath_project)
2653            else:
2654                original_pars = self._open_yaml(filepath_original)
2655                project_pars = self._open_yaml(filepath_project)
2656                to_remove = []
2657                for key, value in project_pars.items():
2658                    if key not in original_pars:
2659                        if key not in ["data_type", "annotation_type"]:
2660                            to_remove.append(key)
2661                for key in to_remove:
2662                    project_pars.pop(key)
2663                to_remove = []
2664                for key, value in original_pars.items():
2665                    if key in project_pars:
2666                        to_remove.append(key)
2667                for key in to_remove:
2668                    original_pars.pop(key)
2669                project_pars = self._update(project_pars, original_pars)
2670                with open(filepath_project, "w", encoding="utf-8") as f:
2671                    YAML().dump(project_pars, f)
2672
2673    def _update_project(self) -> None:
2674        """
2675        Update project files with the current version
2676        """
2677
2678        version_file = self._version_path()
2679        ok = True
2680        if not os.path.exists(version_file):
2681            ok = False
2682        else:
2683            with open(version_file) as f:
2684                project_version = f.read()
2685            if project_version < __version__:
2686                ok = False
2687            elif project_version > __version__:
2688                warnings.warn(
2689                    f"The project expects a higher dlc2action version ({project_version}), please update!"
2690                )
2691        if not ok:
2692            project_config_path = os.path.join(self.project_path, "config")
2693            config_path = os.path.join(
2694                os.path.dirname(os.path.dirname(__path__)), "config"
2695            )
2696            episodes = self._episodes()
2697            folders = ["annotation", "augmentations", "data", "features", "model"]
2698
2699            project_annotation_configs = os.listdir(
2700                os.path.join(project_config_path, "annotation")
2701            )
2702            annotation_configs = os.listdir(os.path.join(config_path, "annotation"))
2703            for ann_config in annotation_configs:
2704                if ann_config not in project_annotation_configs:
2705                    shutil.copytree(
2706                        os.path.join(config_path, "annotation", ann_config),
2707                        os.path.join(project_config_path, "annotation", ann_config),
2708                        dirs_exist_ok=True,
2709                    )
2710                else:
2711                    project_pars = self._open_yaml(
2712                        os.path.join(project_config_path, "annotation", ann_config)
2713                    )
2714                    pars = self._open_yaml(
2715                        os.path.join(config_path, "annotation", ann_config)
2716                    )
2717                    new_keys = set(pars.keys()) - set(project_pars.keys())
2718                    for key in new_keys:
2719                        project_pars[key] = pars[key]
2720                        c = self._get_comment(pars.ca.items.get(key))
2721                        project_pars.yaml_add_eol_comment(c, key=key)
2722                        episodes.update(
2723                            condition=f"general/annotation_type::={ann_config}",
2724                            update={f"data/{key}": pars[key]},
2725                        )
2726
2727    def _initialize_project(
2728        self,
2729        data_type: str,
2730        annotation_type: str = None,
2731        data_path: str = None,
2732        annotation_path: str = None,
2733        copy: bool = True,
2734    ) -> None:
2735        """
2736        Initialize a new project
2737        """
2738
2739        if data_type not in self.data_types():
2740            raise ValueError(
2741                f"The {data_type} data type is not available. "
2742                f"Please choose from {self.data_types()}"
2743            )
2744        if annotation_type not in self.annotation_types():
2745            raise ValueError(
2746                f"The {annotation_type} annotation type is not available. "
2747                f"Please choose from {self.annotation_types()}"
2748            )
2749        os.mkdir(self.project_path)
2750        folders = ["results", "saved_datasets", "meta", "config"]
2751        for f in folders:
2752            os.mkdir(os.path.join(self.project_path, f))
2753        results_subfolders = [
2754            "model",
2755            "logs",
2756            "predictions",
2757            "splits",
2758            "searches",
2759        ]
2760        for sf in results_subfolders:
2761            os.mkdir(os.path.join(self.project_path, "results", sf))
2762        if data_path is not None:
2763            if copy:
2764                os.mkdir(os.path.join(self.project_path, "data"))
2765                shutil.copytree(
2766                    data_path,
2767                    os.path.join(self.project_path, "data"),
2768                    dirs_exist_ok=True,
2769                )
2770                data_path = os.path.join(self.project_path, "data")
2771        if annotation_path is not None:
2772            if copy:
2773                os.mkdir(os.path.join(self.project_path, "annotation"))
2774                shutil.copytree(
2775                    annotation_path,
2776                    os.path.join(self.project_path, "annotation"),
2777                    dirs_exist_ok=True,
2778                )
2779                annotation_path = os.path.join(self.project_path, "annotation")
2780        self._generate_config(
2781            data_type,
2782            annotation_type,
2783            data_path=data_path,
2784            annotation_path=annotation_path,
2785        )
2786        self._generate_meta()
2787
2788    def _read_types(self) -> Tuple[str, str]:
2789        """
2790        Get data type and annotation type from existing project files
2791        """
2792
2793        config_path = os.path.join(self.project_path, "config", "general.yaml")
2794        with open(config_path) as f:
2795            pars = YAML().load(f)
2796        data_type = pars["data_type"]
2797        annotation_type = pars["annotation_type"]
2798        return annotation_type, data_type
2799
2800    def _read_paths(self) -> Tuple[str, str]:
2801        """
2802        Get data type and annotation type from existing project files
2803        """
2804
2805        config_path = os.path.join(self.project_path, "config", "data.yaml")
2806        with open(config_path) as f:
2807            pars = YAML().load(f)
2808        data_path = pars["data_path"]
2809        annotation_path = pars["annotation_path"]
2810        return annotation_path, data_path
2811
2812    def _generate_config(
2813        self, data_type: str, annotation_type: str, data_path: str, annotation_path: str
2814    ) -> None:
2815        """
2816        Initialize the config files
2817        """
2818
2819        default_path = os.path.join(
2820            os.path.dirname(os.path.dirname(__file__)), "config"
2821        )
2822        config_path = os.path.join(self.project_path, "config")
2823        files = ["losses", "metrics", "ssl", "training"]
2824        for f in files:
2825            shutil.copy(os.path.join(default_path, f"{f}.yaml"), config_path)
2826        shutil.copytree(
2827            os.path.join(default_path, "model"), os.path.join(config_path, "model")
2828        )
2829        shutil.copytree(
2830            os.path.join(default_path, "features"),
2831            os.path.join(config_path, "features"),
2832        )
2833        shutil.copytree(
2834            os.path.join(default_path, "augmentations"),
2835            os.path.join(config_path, "augmentations"),
2836        )
2837        yaml = YAML()
2838        data_param_path = os.path.join(default_path, "data", f"{data_type}.yaml")
2839        if os.path.exists(data_param_path):
2840            with open(data_param_path, encoding="utf-8") as f:
2841                data_params = yaml.load(f)
2842        if data_params is None:
2843            data_params = {}
2844        if annotation_type is None:
2845            ann_params = {}
2846        else:
2847            ann_param_path = os.path.join(
2848                default_path, "annotation", f"{annotation_type}.yaml"
2849            )
2850            if os.path.exists(ann_param_path):
2851                ann_params = self._open_yaml(ann_param_path)
2852            elif annotation_type == "none":
2853                ann_params = {}
2854            else:
2855                raise ValueError(
2856                    f"The {annotation_type} data type is not available. "
2857                    f"Please choose from {BehaviorDataset.annotation_types()}"
2858                )
2859        if ann_params is None:
2860            ann_params = {}
2861        data_params = self._update(data_params, ann_params)
2862        data_params["data_path"] = data_path
2863        data_params["annotation_path"] = annotation_path
2864        with open(os.path.join(config_path, "data.yaml"), "w", encoding="utf-8") as f:
2865            yaml.dump(data_params, f)
2866        with open(os.path.join(default_path, "general.yaml"), encoding="utf-8") as f:
2867            general_params = yaml.load(f)
2868        general_params["data_type"] = data_type
2869        general_params["annotation_type"] = annotation_type
2870        with open(os.path.join(config_path, "general.yaml"), "w", encoding="utf-8") as f:
2871            yaml.dump(general_params, f)
2872
2873    def _generate_meta(self) -> None:
2874        """
2875        Initialize the meta files
2876        """
2877
2878        config_file = os.path.join(self.project_path, "config")
2879        meta_fields = ["time"]
2880        columns = [("meta", field) for field in meta_fields]
2881        episodes = pd.DataFrame(columns=pd.MultiIndex.from_tuples(columns))
2882        episodes.to_pickle(self._episodes_path())
2883        meta_fields = ["time", "objective"]
2884        result_fields = ["best_params", "best_value"]
2885        columns = [("meta", field) for field in meta_fields] + [
2886            ("results", field) for field in result_fields
2887        ]
2888        searches = pd.DataFrame(columns=pd.MultiIndex.from_tuples(columns))
2889        searches.to_pickle(self._searches_path())
2890        meta_fields = ["time"]
2891        columns = [("meta", field) for field in meta_fields]
2892        predictions = pd.DataFrame(columns=pd.MultiIndex.from_tuples(columns))
2893        predictions.to_pickle(self._predictions_path())
2894        with open(os.path.join(config_file, "data.yaml")) as f:
2895            data_keys = list(YAML().load(f).keys())
2896        saved_data = pd.DataFrame(columns=data_keys)
2897        saved_data.to_pickle(self._saved_datasets_path())
2898        pd.DataFrame().to_pickle(self._thresholds_path())
2899        # with open(self._version_path()) as f:
2900        #     f.write(__version__)
2901
2902    def _open_yaml(self, path: str) -> CommentedMap:
2903        """
2904        Load a parameter dictionary from a .yaml file
2905        """
2906
2907        with open(path, encoding="utf-8") as f:
2908            data = YAML().load(f)
2909        if data is None:
2910            data = {}
2911        return data
2912
2913    def _compare(self, d: Dict, u: Dict, allow_diff: float = 1e-7):
2914        """
2915        Compare nested dictionaries with 'almost equal' condition
2916        """
2917
2918        ok = True
2919        if u.keys() != d.keys():
2920            ok = False
2921        else:
2922            for k, v in u.items():
2923                if isinstance(v, Mapping):
2924                    ok = self._compare(d[k], v, allow_diff=allow_diff)
2925                else:
2926                    if isinstance(v, float) or isinstance(d[k], float):
2927                        if not isinstance(d[k], float) and not isinstance(d[k], int):
2928                            ok = False
2929                        elif not isinstance(v, float) and not isinstance(v, int):
2930                            ok = False
2931                        elif np.abs(v - d[k]) > allow_diff:
2932                            ok = False
2933                    elif v != d[k]:
2934                        ok = False
2935        return ok
2936
2937    def _check_comment(self, comment_sequence: List) -> bool:
2938        """
2939        Check if a comment already exists in a ruamel.yaml comment sequence
2940        """
2941
2942        if comment_sequence is None:
2943            return False
2944        c = self._get_comment(comment_sequence)
2945        if c != "":
2946            return True
2947        else:
2948            return False
2949
2950    def _get_comment(self, comment_sequence: List, strip=True) -> str:
2951        """
2952        Get the comment string from a ruamel.yaml comment sequence
2953        """
2954
2955        if comment_sequence is None:
2956            return ""
2957        c = ""
2958        for cm in comment_sequence:
2959            if cm is not None:
2960                if isinstance(cm, Iterable):
2961                    for c in cm:
2962                        if c is not None:
2963                            c = c.value
2964                            break
2965                    break
2966                else:
2967                    c = cm.value
2968                    break
2969        if strip:
2970            c = c.strip()
2971        return c
2972
2973    def _update(self, d: Union[CommentedMap, Dict], u: Union[CommentedMap, Dict]):
2974        """
2975        Update a nested dictionary
2976        """
2977
2978        if "general" in u and "model_name" in u["general"] and "model" in d:
2979            model_name = u["general"]["model_name"]
2980            if d["general"]["model_name"] != model_name:
2981                d["model"] = self._open_yaml(
2982                    os.path.join(
2983                        self.project_path, "config", "model", f"{model_name}.yaml"
2984                    )
2985                )
2986        d_copied = deepcopy(d)
2987        for k, v in u.items():
2988            if (
2989                k in d_copied
2990                and isinstance(d_copied[k], list)
2991                and isinstance(v, Mapping)
2992                and all([isinstance(x, int) for x in v.keys()])
2993            ):
2994                for kk, vv in v.items():
2995                    d_copied[k][kk] = vv
2996            elif (
2997                isinstance(v, Mapping)
2998                and k in d_copied
2999                and isinstance(d_copied[k], Mapping)
3000            ):
3001                if d_copied[k] is None:
3002                    d_k = CommentedMap()
3003                else:
3004                    d_k = d_copied[k]
3005                d_copied[k] = self._update(d_k, v)
3006            else:
3007                d_copied[k] = v
3008                if isinstance(u, CommentedMap) and u.ca.items.get(k) is not None:
3009                    c = self._get_comment(u.ca.items.get(k), strip=False)
3010                    if isinstance(d_copied, CommentedMap) and not self._check_comment(
3011                        d_copied.ca.items.get(k)
3012                    ):
3013                        d_copied.yaml_add_eol_comment(c, key=k)
3014        return d_copied
3015
3016    def _update_with_search(
3017        self,
3018        d: Dict,
3019        search_name: str,
3020        load_parameters: list = None,
3021        round_to_binary: list = None,
3022    ):
3023        """
3024        Update a dictionary with best parameters from a hyperparameter search
3025        """
3026
3027        u, _ = self._searches().get_best_params(
3028            search_name, load_parameters, round_to_binary
3029        )
3030        return self._update(d, u)
3031
3032    def _read_parameters(self, catch_blanks=True) -> Dict:
3033        """
3034        Compose a parameter dictionary to create a task from the config files
3035        """
3036
3037        config_path = os.path.join(self.project_path, "config")
3038        keys = [
3039            "data",
3040            "general",
3041            "losses",
3042            "metrics",
3043            "ssl",
3044            "training",
3045        ]
3046        parameters = {}
3047        for key in keys:
3048            parameters[key] = self._open_yaml(os.path.join(config_path, f"{key}.yaml"))
3049        features = parameters["general"]["feature_extraction"]
3050        parameters["features"] = self._open_yaml(
3051            os.path.join(config_path, "features", f"{features}.yaml")
3052        )
3053        transformer = options.extractor_to_transformer[features]
3054        parameters["augmentations"] = self._open_yaml(
3055            os.path.join(config_path, "augmentations", f"{transformer}.yaml")
3056        )
3057        model = parameters["general"]["model_name"]
3058        parameters["model"] = self._open_yaml(
3059            os.path.join(config_path, "model", f"{model}.yaml")
3060        )
3061        # input = parameters["general"]["input"]
3062        # parameters["model"] = self._open_yaml(
3063        #     os.path.join(config_path, "model", f"{model}.yaml")
3064        # )
3065        if catch_blanks:
3066            blanks = self._get_blanks()
3067            if len(blanks) > 0:
3068                self.list_blanks()
3069                raise ValueError(
3070                    f"Please fill in all the blanks before running experiments"
3071                )
3072        return parameters
3073
3074    def set_main_parameters(self, model_name: str = None, metric_names: List = None):
3075        """
3076        Select the model and the metrics
3077
3078        Parameters
3079        ----------
3080        model_name : str, optional
3081            model name; run `project.help("model") to find out more
3082        metric_names : list, optional
3083            a list of metric function names; run `project.help("metrics") to find out more
3084        """
3085
3086        pars = {"general": {}}
3087        if model_name is not None:
3088            assert model_name in options.models
3089            pars["general"]["model_name"] = model_name
3090        if metric_names is not None:
3091            for metric in metric_names:
3092                assert metric in options.metrics
3093            pars["general"]["metric_functions"] = metric_names
3094        self.update_parameters(pars)
3095
3096    def help(self, keyword: str = None):
3097        """
3098        Get information on available options
3099
3100        Parameters
3101        ----------
3102        keyword : str, optional
3103            the keyword for options (run without arguments to see which keywords are available)
3104
3105        """
3106
3107        if keyword is None:
3108            print("AVAILABLE HELP FUNCTIONS:")
3109            print("- Try running `project.help(keyword)` with the following keywords:")
3110            print("    - model: to get more information on available models,")
3111            print(
3112                "    - features: to get more information on available feature extraction modes,"
3113            )
3114            print(
3115                "    - partition_method: to get more information on available train/test/val partitioning methods,"
3116            )
3117            print("    - metrics: to see a list of available metric functions.")
3118            print("    - data: to see help for expected data structure")
3119            print(
3120                "- To start working with this project, first run `project.list_blanks()` to check which parameters need to be filled in."
3121            )
3122            print(
3123                "- After a model and metrics are set, run `project.list_basic_parameters()` to see a list of the most important parameters that you might want to modify"
3124            )
3125            print(
3126                f"- If you want to dig deeper, get the full dictionary with project._read_parameters() (it is a `ruamel.yaml.comments.CommentedMap` instance)."
3127            )
3128        elif keyword == "model":
3129            print("MODELS:")
3130            for key, model in options.models.items():
3131                print(f"{key}:")
3132                print(model.__doc__)
3133        elif keyword == "features":
3134            print("FEATURE EXTRACTORS:")
3135            for key, extractor in options.feature_extractors.items():
3136                print(f"{key}:")
3137                print(extractor.__doc__)
3138        elif keyword == "partition_method":
3139            print("PARTITION METHODS:")
3140            print(
3141                BehaviorDataset.partition_train_test_val.__doc__.split(
3142                    "The partitioning method:"
3143                )[1].split("val_frac :")[0]
3144            )
3145        elif keyword == "metrics":
3146            print("METRICS:")
3147            for key, metric in options.metrics.items():
3148                print(f"{key}:")
3149                print(metric.__doc__)
3150        elif keyword == "data":
3151            print("DATA:")
3152            print(f"Video data: {self.data_type}")
3153            print(options.input_stores[self.data_type].__doc__)
3154            print(f"Annotation data: {self.annotation_type}")
3155            print(options.annotation_stores[self.annotation_type].__doc__)
3156            print(
3157                "Annotation path and data path don't have to be separate, you can keep everything in one folder."
3158            )
3159        else:
3160            raise ValueError(f"The {keyword} keyword is not recognized")
3161        print("\n")
3162
3163    def _process_value(self, value):
3164        if isinstance(value, str):
3165            value = f'"{value}"'
3166        elif isinstance(value, CommentedSet):
3167            value = {x for x in value}
3168        return value
3169
3170    def _get_blanks(self):
3171        caught = []
3172        parameters = self._read_parameters(catch_blanks=False)
3173        for big_key, big_value in parameters.items():
3174            for key, value in big_value.items():
3175                if value == "???":
3176                    caught.append(
3177                        (big_key, key, self._get_comment(big_value.ca.items.get(key)))
3178                    )
3179        return caught
3180
3181    def list_blanks(self, blanks=None):
3182        """
3183        List parameters that need to be filled in
3184
3185        Parameters
3186        ----------
3187        blanks : list, optional
3188            a list of the parameters to list, if already known
3189        """
3190
3191        if blanks is None:
3192            blanks = self._get_blanks()
3193        if len(blanks) > 0:
3194            to_update = defaultdict(lambda: [])
3195            for b, k, c in blanks:
3196                to_update[b].append((k, c))
3197            print("Before running experiments, please update all the blanks.")
3198            print("To do that, you can run this.")
3199            print("--------------------------------------------------------")
3200            print(f"project.update_parameters(")
3201            print(f"    {{")
3202            for big_key, keys in to_update.items():
3203                print(f'        "{big_key}": {{')
3204                for key, comment in keys:
3205                    print(f'            "{key}": ..., {comment}')
3206                print(f"        }},")
3207            print(f"    }}")
3208            print(")")
3209            print("--------------------------------------------------------")
3210            print("Replace ... with relevant values.")
3211        else:
3212            print("There is no blanks left!")
3213
3214    def list_basic_parameters(
3215        self,
3216    ):
3217        """
3218        Get a list of most relevant parameters and code to modify them
3219        """
3220
3221        parameters = self._read_parameters()
3222        print("BASIC PARAMETERS:")
3223        model_name = parameters["general"]["model_name"]
3224        metric_names = parameters["general"]["metric_functions"]
3225        loss_name = parameters["general"]["loss_function"]
3226        feature_extraction = parameters["general"]["feature_extraction"]
3227        print("Here is a list of current parameters.")
3228        print(
3229            "You can copy this code, change the parameters you want to set and run it to update the project config."
3230        )
3231        print("--------------------------------------------------------")
3232        print("project.update_parameters(")
3233        print("    {")
3234        for group in ["general", "data", "training"]:
3235            print(f'        "{group}": {{')
3236            for key in options.basic_parameters[group]:
3237                if key in parameters[group]:
3238                    print(
3239                        f'            "{key}": {self._process_value(parameters[group][key])}, {self._get_comment(parameters[group].ca.items.get(key))}'
3240                    )
3241            print("        },")
3242        print('        "losses": {')
3243        print(f'            "{loss_name}": {{')
3244        for key in options.basic_parameters["losses"][loss_name]:
3245            if key in parameters["losses"][loss_name]:
3246                print(
3247                    f'                "{key}": {self._process_value(parameters["losses"][loss_name][key])}, {self._get_comment(parameters["losses"][loss_name].ca.items.get(key))}'
3248                )
3249        print("            },")
3250        print("        },")
3251        print('        "metrics": {')
3252        for metric in metric_names:
3253            print(f'            "{metric}": {{')
3254            for key in parameters["metrics"][metric]:
3255                print(
3256                    f'                "{key}": {self._process_value(parameters["metrics"][metric][key])}, {self._get_comment(parameters["metrics"][metric].ca.items.get(key))}'
3257                )
3258            print("            },")
3259        print("        },")
3260        print('        "model": {')
3261        for key in options.basic_parameters["model"][model_name]:
3262            if key in parameters["model"]:
3263                print(
3264                    f'            "{key}": {self._process_value(parameters["model"][key])}, {self._get_comment(parameters["model"].ca.items.get(key))}'
3265                )
3266
3267        print("        },")
3268        print('        "features": {')
3269        for key in options.basic_parameters["features"][feature_extraction]:
3270            if key in parameters["features"]:
3271                print(
3272                    f'            "{key}": {self._process_value(parameters["features"][key])}, {self._get_comment(parameters["features"].ca.items.get(key))}'
3273                )
3274
3275        print("        },")
3276        print('        "augmentations": {')
3277        for key in options.basic_parameters["augmentations"][feature_extraction]:
3278            if key in parameters["augmentations"]:
3279                print(
3280                    f'            "{key}": {self._process_value(parameters["augmentations"][key])}, {self._get_comment(parameters["augmentations"].ca.items.get(key))}'
3281                )
3282        print("        },")
3283        print("    },")
3284        print(")")
3285        print("--------------------------------------------------------")
3286        print("\n")
3287
3288    def _create_record(
3289        self,
3290        episode_name: str,
3291        behaviors_dict: Dict,
3292        load_episode: str = None,
3293        parameters_update: Dict = None,
3294        task: TaskDispatcher = None,
3295        load_epoch: int = None,
3296        load_search: str = None,
3297        load_parameters: list = None,
3298        round_to_binary: list = None,
3299        load_strict: bool = True,
3300        n_seeds: int = 1,
3301    ) -> TaskDispatcher:
3302        """
3303        Create a meta data episode record
3304        """
3305
3306        if episode_name in self._episodes().data.index:
3307            return
3308        if type(n_seeds) is not int or n_seeds < 1:
3309            raise ValueError(
3310                f"The n_seeds parameter has to be an integer larger than 0; got {n_seeds}"
3311            )
3312        if parameters_update is None:
3313            parameters_update = {}
3314        parameters = self._read_parameters()
3315        parameters = self._update(parameters, parameters_update)
3316        if load_search is not None:
3317            parameters = self._update_with_search(
3318                parameters, load_search, load_parameters, round_to_binary
3319            )
3320        parameters = self._fill(
3321            parameters,
3322            episode_name,
3323            load_episode,
3324            load_epoch=load_epoch,
3325            only_load_model=True,
3326            load_strict=load_strict,
3327            continuing=True,
3328        )
3329        self._save_episode(episode_name, parameters, behaviors_dict)
3330        return task
3331
3332    def _save_thresholds(
3333        self,
3334        episode_names: List,
3335        metric_name: str,
3336        parameters: Dict,
3337        thresholds: List,
3338        load_epochs: List,
3339    ):
3340        """
3341        Save optimal decision thresholds in the meta records
3342        """
3343
3344        metric_parameters = parameters["metrics"][metric_name]
3345        self._thresholds().save_thresholds(
3346            episode_names, load_epochs, metric_name, metric_parameters, thresholds
3347        )
3348
3349    def _save_episode(
3350        self,
3351        episode_name: str,
3352        parameters: Dict,
3353        behaviors_dict: Dict,
3354        suppress_validation: bool = False,
3355        training_time: str = None,
3356        norm_stats: Dict = None,
3357    ) -> None:
3358        """
3359        Save an episode in the meta files
3360        """
3361
3362        try:
3363            split_info = self._split_info_from_filename(
3364                parameters["training"]["split_path"]
3365            )
3366            parameters["training"]["partition_method"] = split_info["partition_method"]
3367        except:
3368            pass
3369        if norm_stats is not None:
3370            norm_stats = dict(norm_stats)
3371        parameters["training"]["stats"] = norm_stats
3372        self._episodes().save_episode(
3373            episode_name,
3374            parameters,
3375            behaviors_dict,
3376            suppress_validation=suppress_validation,
3377            training_time=training_time,
3378        )
3379
3380    def _update_episode_results(
3381        self,
3382        episode_name: str,
3383        logs: Tuple,
3384        training_time: str = None,
3385    ) -> None:
3386        """
3387        Save the results of a run in the meta files
3388        """
3389
3390        self._episodes().update_episode_results(episode_name, logs, training_time)
3391
3392    def _save_prediction(
3393        self,
3394        episode_name: str,
3395        parameters: Dict,
3396        behaviors_dict: Dict,
3397        embedding: bool = False,
3398        inference_time: str = None,
3399    ) -> None:
3400        """
3401        Save a prediction in the meta files
3402        """
3403
3404        parameters = self._update(
3405            parameters,
3406            {"meta": {"embedding": embedding, "inference_time": inference_time}},
3407        )
3408        self._predictions().save_episode(episode_name, parameters, behaviors_dict)
3409
3410    def _save_search(
3411        self,
3412        search_name: str,
3413        parameters: Dict,
3414        n_trials: int,
3415        best_params: Dict,
3416        best_value: float,
3417        metric: str,
3418        search_space: Dict,
3419    ) -> None:
3420        """
3421        Save a hyperparameter search in the meta files
3422        """
3423
3424        self._searches().save_search(
3425            search_name,
3426            parameters,
3427            n_trials,
3428            best_params,
3429            best_value,
3430            metric,
3431            search_space,
3432        )
3433
3434    def _save_stores(self, parameters: Dict) -> None:
3435        """
3436        Save a pickled dataset in the meta files
3437        """
3438
3439        name = os.path.basename(parameters["data"]["feature_save_path"])
3440        self._saved_datasets().save_store(name, self._get_data_pars(parameters))
3441        self.create_metadata_backup()
3442
3443    def _remove_stores(self, parameters: Dict, remove_active: bool = False) -> None:
3444        """
3445        Remove the pre-computed features folder
3446        """
3447
3448        name = os.path.basename(parameters["data"]["feature_save_path"])
3449        if remove_active or name not in self._episodes().get_active_datasets():
3450            self.remove_saved_features([name])
3451
3452    def _check_episode_validity(
3453        self, episode_name: str, allow_doublecolon: bool = False, force: bool = False
3454    ) -> None:
3455        """
3456        Check whether the episode name is valid
3457        """
3458
3459        if episode_name.startswith("_"):
3460            raise ValueError(
3461                "Names starting with an underscore are reserved by dlc2action and cannot be used!"
3462            )
3463        elif "." in episode_name:
3464            raise ValueError("Names containing '.' cannot be used!")
3465        if not allow_doublecolon and "::" in episode_name:
3466            raise ValueError(
3467                "Names containing '::' are reserved by dlc2action and cannot be used!"
3468            )
3469        if force:
3470            self.remove_episode(episode_name)
3471        elif not self._episodes().check_name_validity(episode_name):
3472            raise ValueError(
3473                f"The {episode_name} name is already taken! Set force=True to overwrite."
3474            )
3475
3476    def _check_search_validity(self, search_name: str, force: bool = False) -> None:
3477        """
3478        Check whether the search name is valid
3479        """
3480
3481        if search_name.startswith("_"):
3482            raise ValueError(
3483                "Names starting with an underscore are reserved by dlc2action and cannot be used!"
3484            )
3485        elif "." in search_name:
3486            raise ValueError("Names containing '.' cannot be used!")
3487        if force:
3488            self.remove_search(search_name)
3489        elif not self._searches().check_name_validity(search_name):
3490            raise ValueError(f"The {search_name} name is already taken!")
3491
3492    def _check_prediction_validity(
3493        self, prediction_name: str, force: bool = False
3494    ) -> None:
3495        """
3496        Check whether the prediction name is valid
3497        """
3498
3499        if prediction_name.startswith("_"):
3500            raise ValueError(
3501                "Names starting with an underscore are reserved by dlc2action and cannot be used!"
3502            )
3503        elif "." in prediction_name:
3504            raise ValueError("Names containing '.' cannot be used!")
3505        if force:
3506            self.remove_prediction(prediction_name)
3507        elif not self._predictions().check_name_validity(prediction_name):
3508            raise ValueError(f"The {prediction_name} name is already taken!")
3509
3510    def _training_time(self, episode_name: str) -> int:
3511        """
3512        Get the training time of an episode in seconds
3513        """
3514
3515        return self._episode(episode_name).training_time()
3516
3517    def _mask_path(self) -> str:
3518        """
3519        Get the path to the masks folder
3520        """
3521
3522        return os.path.join(self.project_path, "results", "masks")
3523
3524    def _thresholds_path(self) -> str:
3525        """
3526        Get the path to the thresholds meta file
3527        """
3528
3529        return os.path.join(self.project_path, "meta", "thresholds.pickle")
3530
3531    def _episodes_path(self) -> str:
3532        """
3533        Get the path to the episodes meta file
3534        """
3535
3536        return os.path.join(self.project_path, "meta", "episodes.pickle")
3537
3538    def _saved_datasets_path(self) -> str:
3539        """
3540        Get the path to the datasets meta file
3541        """
3542
3543        return os.path.join(self.project_path, "meta", "saved_datasets.pickle")
3544
3545    def _predictions_path(self) -> str:
3546        """
3547        Get the path to the predictions meta file
3548        """
3549
3550        return os.path.join(self.project_path, "meta", "predictions.pickle")
3551
3552    def _dataset_store_path(self, name: str) -> str:
3553        """
3554        Get the path to a specific pickled dataset
3555        """
3556
3557        return os.path.join(self.project_path, "saved_datasets", f"{name}.pickle")
3558
3559    def _searches_path(self) -> str:
3560        """
3561        Get the path to the hyperparameter search meta file
3562        """
3563
3564        return os.path.join(self.project_path, "meta", "searches.pickle")
3565
3566    def _search_path(self, name: str) -> str:
3567        """
3568        Get the default path to the graph folder for a specific hyperparameter search
3569        """
3570
3571        return os.path.join(self.project_path, "results", "searches", name)
3572
3573    def _version_path(self) -> str:
3574        """
3575        Get the path to the version file
3576        """
3577
3578        return os.path.join(self.project_path, "meta", "version.txt")
3579
3580    def _default_split_file(self, split_info: Dict) -> Optional[str]:
3581        """
3582        Generate a path to a split file from split parameters
3583        """
3584
3585        if split_info["partition_method"].startswith("time"):
3586            return None
3587        val_frac = split_info["val_frac"]
3588        test_frac = split_info["test_frac"]
3589        split_name = f'{split_info["partition_method"]}_val{val_frac * 100}%_test{test_frac * 100}%_len{split_info["len_segment"]}_overlap{split_info["overlap"]}'
3590        if not split_info["only_load_annotated"]:
3591            split_name += "_all"
3592        split_name += ".txt"
3593        return os.path.join(self.project_path, "results", "splits", split_name)
3594
3595    def _split_info_from_filename(self, split_name: str) -> Dict:
3596        """
3597        Get split parameters from default path to a split file
3598        """
3599
3600        if split_name is None:
3601            return {}
3602        try:
3603            name = os.path.basename(split_name)[:-4]
3604            split = name.split("_")
3605            if len(split) == 6:
3606                only_load_annotated = False
3607            else:
3608                only_load_annotated = True
3609            len_segment = int(split[3][3:])
3610            overlap = int(split[4][7:])
3611            method, val, test = split[:3]
3612            val = float(val[3:-1]) / 100
3613            test = float(test[4:-1]) / 100
3614            return {
3615                "partition_method": method,
3616                "val_frac": val,
3617                "test_frac": test,
3618                "only_load_annotated": only_load_annotated,
3619                "len_segment": len_segment,
3620                "overlap": overlap,
3621            }
3622        except:
3623            return {"partition_method": "file"}
3624
3625    def _fill(
3626        self,
3627        parameters: Dict,
3628        episode_name: str,
3629        load_experiment: str = None,
3630        load_epoch: int = None,
3631        load_strict: bool = True,
3632        only_load_model: bool = False,
3633        continuing: bool = False,
3634        enforce_split_parameters: bool = False,
3635    ) -> Dict:
3636        """
3637        Update the parameters from the config files with project specific information
3638
3639        Fill in the constant file path parameters and generate a unique log file and a model folder.
3640        Fill in the split file if the same split has been run before in the project and change partition method to
3641        from_file.
3642        Fill in saved data path if a dataset with the same data parameters already exists in the project.
3643        If load_experiment is not None, fill in the checkpoint path as well.
3644        The only_load_model training parameter is defined by the corresponding argument.
3645        If continuing is True, new files are not created and all information is loaded from load_experiment.
3646        If prediction is True, log and model files are not created.
3647        The enforce_split_parameters parameter is used to resolve conflicts
3648        between split file path and split parameters when they arise.
3649        """
3650
3651        pars = deepcopy(parameters)
3652        if episode_name == "_":
3653            self.remove_episode("_")
3654        log = os.path.join(self.project_path, "results", "logs", f"{episode_name}.txt")
3655        model_save_path = os.path.join(
3656            self.project_path, "results", "model", episode_name
3657        )
3658        if not continuing and (os.path.exists(log) or os.path.exists(model_save_path)):
3659            raise ValueError(
3660                f"The {episode_name} episode name is already in use! Set force=True to overwrite."
3661            )
3662        keys = ["val_frac", "test_frac", "partition_method"]
3663        if "len_segment" not in pars["general"] and "len_segment" in pars["data"]:
3664            pars["general"]["len_segment"] = pars["data"]["len_segment"]
3665        if "overlap" not in pars["general"] and "overlap" in pars["data"]:
3666            pars["general"]["overlap"] = pars["data"]["overlap"]
3667        if "len_segment" in pars["data"]:
3668            pars["data"].pop("len_segment")
3669        if "overlap" in pars["data"]:
3670            pars["data"].pop("overlap")
3671        split_info = {k: pars["training"][k] for k in keys}
3672        split_info["only_load_annotated"] = pars["general"]["only_load_annotated"]
3673        split_info["len_segment"] = pars["general"]["len_segment"]
3674        split_info["overlap"] = pars["general"]["overlap"]
3675        pars["training"]["log_file"] = log
3676        if not os.path.exists(model_save_path):
3677            os.mkdir(model_save_path)
3678        pars["training"]["model_save_path"] = model_save_path
3679        if load_experiment is not None:
3680            if load_experiment not in self._episodes().data.index:
3681                raise ValueError(f"The {load_experiment} episode does not exist!")
3682            old_episode = self._episode(load_experiment)
3683            old_file = old_episode.split_file()
3684            old_info = self._split_info_from_filename(old_file)
3685            if len(old_info) == 0:
3686                old_info = old_episode.split_info()
3687            if enforce_split_parameters:
3688                if split_info["partition_method"] != "file":
3689                    pars["training"]["split_path"] = self._default_split_file(
3690                        split_info
3691                    )
3692            else:
3693                equal = True
3694                if old_info["partition_method"] != split_info["partition_method"]:
3695                    equal = False
3696                if old_info["partition_method"] != "file":
3697                    if (
3698                        old_info["val_frac"] != split_info["val_frac"]
3699                        or old_info["test_frac"] != split_info["test_frac"]
3700                    ):
3701                        equal = False
3702                if not continuing and not equal:
3703                    warnings.warn(
3704                        f"The partitioning parameters in the loaded experiment ({old_info}) "
3705                        f"are not equal to the current partitioning parameters ({split_info}). "
3706                        f"The current parameters are replaced."
3707                    )
3708                pars["training"]["split_path"] = old_file
3709            pars["training"]["checkpoint_path"] = old_episode.model_file(load_epoch)
3710            pars["training"]["load_strict"] = load_strict
3711        else:
3712            pars["training"]["checkpoint_path"] = None
3713            if pars["training"]["partition_method"] == "file":
3714                if (
3715                    "split_path" not in pars["training"]
3716                    or pars["training"]["split_path"] is None
3717                ):
3718                    raise ValueError(
3719                        "The partition_method parameter is set to file but the "
3720                        "split_path parameter is not set!"
3721                    )
3722                elif not os.path.exists(pars["training"]["split_path"]):
3723                    raise ValueError(
3724                        f'The {pars["training"]["split_path"]} split file does not exist'
3725                    )
3726            else:
3727                pars["training"]["split_path"] = self._default_split_file(split_info)
3728        pars["training"]["only_load_model"] = only_load_model
3729        pars["data"]["saved_data_path"] = None
3730        pars["data"]["feature_save_path"] = None
3731        pars_data_copy = self._get_data_pars(pars)
3732        saved_data_name = self._saved_datasets().find_name(pars_data_copy)
3733        if saved_data_name is not None:
3734            pars["data"]["saved_data_path"] = self._dataset_store_path(saved_data_name)
3735            pars["data"]["feature_save_path"] = self._dataset_store_path(
3736                saved_data_name
3737            ).split(".")[0]
3738        else:
3739            dataset_path = self._dataset_store_path(episode_name)
3740            if os.path.exists(dataset_path):
3741                name, ext = dataset_path.split(".")
3742                i = 0
3743                while os.path.exists(f"{name}_{i}.{ext}"):
3744                    i += 1
3745                dataset_path = f"{name}_{i}.{ext}"
3746            pars["data"]["saved_data_path"] = dataset_path
3747            pars["data"]["feature_save_path"] = dataset_path.split(".")[0]
3748        split_split = pars["training"]["partition_method"].split(":")
3749        random = True
3750        for partition_method in options.partition_methods["fixed"]:
3751            method_split = partition_method.split(":")
3752            if len(split_split) != len(method_split):
3753                continue
3754            equal = True
3755            for x, y in zip(split_split, method_split):
3756                if y.startswith("{"):
3757                    continue
3758                if x != y:
3759                    equal = False
3760                    break
3761            if equal:
3762                random = False
3763                break
3764        if random and os.path.exists(pars["training"]["split_path"]):
3765            pars["training"]["partition_method"] = "file"
3766        pars["general"]["save_dataset"] = True
3767        return pars
3768
3769    def _get_data_pars(self, pars: Dict) -> Dict:
3770        """
3771        Get a complete description of the data from a general parameters dictionary
3772        """
3773
3774        pars_data_copy = deepcopy(pars["data"])
3775        for par in [
3776            "only_load_annotated",
3777            "exclusive",
3778            "feature_extraction",
3779            "ignored_clips",
3780            "len_segment",
3781            "overlap",
3782        ]:
3783            pars_data_copy[par] = pars["general"].get(par, None)
3784        pars_data_copy.update(pars["features"])
3785        return pars_data_copy
3786
3787    def count_classes(
3788        self,
3789        load_episode: str = None,
3790        parameters_update: Dict = None,
3791        remove_saved_features: bool = False,
3792        bouts: bool = True,
3793    ) -> Dict:
3794        """
3795        Get a dictionary of class counts in different modes
3796
3797        Parameters
3798        ----------
3799        load_episode : str, optional
3800            the episode settings to load
3801        parameters_update : dict, optional
3802            a dictionary of parameter updates (only for "data" and "general" categories)
3803        remove_saved_features : bool, default False
3804            if `True`, the dataset that is used for computation is then deleted
3805        bouts : bool, default False
3806            if `True`, instead of frame counts segment counts are returned
3807
3808        Returns
3809        -------
3810        class_counts : dict
3811            a dictionary where first-level keys are "train", "val" and "test", second-level keys are
3812            class names and values are class counts (in frames)
3813        """
3814
3815        if load_episode is None:
3816            task, parameters = self._make_task_training(
3817                episode_name="_", parameters_update=parameters_update, throwaway=True
3818            )
3819        else:
3820            task, parameters, _ = self._make_task_prediction(
3821                "_",
3822                load_episode=load_episode,
3823                parameters_update=parameters_update,
3824            )
3825        class_counts = task.count_classes(bouts=bouts)
3826        behaviors = task.behaviors_dict()
3827        class_counts = {
3828            kk: {behaviors.get(k, "unknown"): v for k, v in vv.items()}
3829            for kk, vv in class_counts.items()
3830        }
3831        if remove_saved_features:
3832            self._remove_stores(parameters)
3833        return class_counts
3834
3835    def plot_class_distribution(
3836        self,
3837        parameters_update: Dict = None,
3838        frame_cutoff: int = 1,
3839        bout_cutoff: int = 1,
3840        print_full: bool = False,
3841        remove_saved_features: bool = False,
3842    ) -> None:
3843        """
3844        Make a class distribution plot
3845
3846        You can either specify the parameters, choose an existing dataset or do neither (in that case a dataset
3847        is created or laoded for the computation with the default parameters).
3848
3849        Parameters
3850        ----------
3851        parameters_update : dict, optional
3852            a dictionary of parameter updates (only for "data" and "general" categories)
3853        remove_saved_features : bool, default False
3854            if `True`, the dataset that is used for computation is then deleted
3855        """
3856
3857        task, parameters = self._make_task_training(
3858            episode_name="_", parameters_update=parameters_update, throwaway=True
3859        )
3860        cutoff = {True: bout_cutoff, False: frame_cutoff}
3861        for bouts in [True, False]:
3862            class_counts = task.count_classes(bouts=bouts)
3863            if print_full:
3864                print("Bouts:" if bouts else "Frames:")
3865                for k, v in class_counts.items():
3866                    if sum(v.values()) != 0:
3867                        print(f"  {k}:")
3868                        values, keys = zip(
3869                            *[
3870                                x
3871                                for x in sorted(zip(v.values(), v.keys()), reverse=True)
3872                                if x[-1] != -100
3873                            ]
3874                        )
3875                        for kk, vv in zip(keys, values):
3876                            print(f"    {task.behaviors_dict()[kk]}: {vv}")
3877            class_counts = {
3878                kk: {k: v for k, v in vv.items() if v >= cutoff[bouts]}
3879                for kk, vv in class_counts.items()
3880            }
3881            for key, d in class_counts.items():
3882                if sum(d.values()) != 0:
3883                    values, keys = zip(
3884                        *[x for x in sorted(zip(d.values(), d.keys())) if x[-1] != -100]
3885                    )
3886                    keys = [task.behaviors_dict()[x] for x in keys]
3887                    plt.bar(keys, values)
3888                    plt.title(key)
3889                    plt.xticks(rotation=45, ha="right")
3890                    if bouts:
3891                        plt.ylabel("bouts")
3892                    else:
3893                        plt.ylabel("frames")
3894                    plt.tight_layout()
3895                    plt.show()
3896        if remove_saved_features:
3897            self._remove_stores(parameters)
3898
3899    def _generate_mask(
3900        self,
3901        mask_name: str,
3902        perc_annotated: float = 0.1,
3903        parameters_update: Dict = None,
3904        remove_saved_features: bool = False,
3905    ) -> None:
3906        """
3907        Generate a real_lens for active learning simulation
3908
3909        Parameters
3910        ----------
3911        mask_name : str
3912            the name of the real_lens
3913        """
3914
3915        print(f"GENERATING {mask_name}")
3916        task, parameters = self._make_task_training(
3917            f"_{mask_name}", parameters_update=parameters_update, throwaway=True
3918        )
3919        val_intervals, val_ids = task.dataset("val").get_intervals()  # 1
3920        unannotated_intervals = task.dataset("train").get_unannotated_intervals()  # 2
3921        unannotated_intervals = task.dataset("val").get_unannotated_intervals(
3922            first_intervals=unannotated_intervals
3923        )
3924        ids = task.dataset("train").get_ids()
3925        mask = {video_id: {} for video_id in ids}
3926        total_all = 0
3927        total_masked = 0
3928        for video_id, clip_ids in ids.items():
3929            for clip_id in clip_ids:
3930                frames = np.ones(task.dataset("train").get_len(video_id, clip_id))
3931                if clip_id in val_intervals[video_id]:
3932                    for start, end in val_intervals[video_id][clip_id]:
3933                        frames[start:end] = 0
3934                if clip_id in unannotated_intervals[video_id]:
3935                    for start, end in unannotated_intervals[video_id][clip_id]:
3936                        frames[start:end] = 0
3937                annotated = np.where(frames)[0]
3938                total_all += len(annotated)
3939                masked = annotated[-int(len(annotated) * (1 - perc_annotated)) :]
3940                total_masked += len(masked)
3941                mask[video_id][clip_id] = self._get_intervals(masked)
3942        file = {
3943            "masked": mask,
3944            "val_intervals": val_intervals,
3945            "val_ids": val_ids,
3946            "unannotated": unannotated_intervals,
3947        }
3948        self._save_mask(file, mask_name)
3949        if remove_saved_features:
3950            self._remove_stores(parameters)
3951        print("\n")
3952        # print(f'Unmasked: {sum([(vv == 0).sum() for v in real_lens.values() for vv in v.values()])} frames')
3953
3954    def _get_intervals(self, frame_indices: np.ndarray):
3955        """
3956        Get a list of intervals from a list of frame indices
3957
3958        Example: `[0, 1, 2, 5, 6, 8] -> [[0, 3], [5, 7], [8, 9]]`.
3959
3960        Parameters
3961        ----------
3962        frame_indices : np.ndarray
3963            a list of frame indices
3964
3965        Returns
3966        -------
3967        intervals : list
3968            a list of interval boundaries
3969        """
3970
3971        masked_intervals = []
3972        if len(frame_indices) > 0:
3973            breaks = np.where(np.diff(frame_indices) != 1)[0]
3974            start = frame_indices[0]
3975            for k in breaks:
3976                masked_intervals.append([start, frame_indices[k] + 1])
3977                start = frame_indices[k + 1]
3978            masked_intervals.append([start, frame_indices[-1] + 1])
3979        return masked_intervals
3980
3981    def _update_mask_with_uncertainty(
3982        self,
3983        mask_name: str,
3984        episode_name: Union[str, None],
3985        classes: List,
3986        load_epoch: int = None,
3987        n_frames: int = 10000,
3988        method: str = "least_confidence",
3989        min_length: int = 30,
3990        augment_n: int = 0,
3991        parameters_update: Dict = None,
3992    ):
3993        """
3994        Update real_lens with frame-wise uncertainty scores for active learning
3995
3996        Parameters
3997        ----------
3998        mask_name : str
3999            the name of the real_lens
4000        episode_name : str
4001            the name of the episode to load
4002        classes : list
4003            a list of class names or indices; their uncertainty scores will be computed separately and stacked
4004        n_frames : int, default 10000
4005            the number of frames to "annotate"
4006        method : {"least_confidence", "entropy"}
4007            the method used to calculate the scores from the probability predictions (`"least_confidence"`: `1 - p_i` if
4008            `p_i > 0.5` or `p_i` if `p_i < 0.5`; `"entropy"`: `- p_i * log(p_i) - (1 - p_i) * log(1 - p_i)`)
4009        min_length : int
4010            the minimum length (in frames) of the annotated intervals
4011        augment_n : int, default 0
4012            the number of augmentations to average over
4013        parameters_update : dict, optional
4014            the dictionary used to update the parameters from the config
4015
4016        Returns
4017        -------
4018        score_dicts : dict
4019            a nested dictionary where first level keys are video ids, second level keys are clip ids and values
4020            are score tensors
4021        """
4022
4023        print(f"UPDATING {mask_name}")
4024        task, parameters, _ = self._make_task_prediction(
4025            prediction_name=mask_name,
4026            load_episode=episode_name,
4027            parameters_update=parameters_update,
4028            load_epoch=load_epoch,
4029            mode="train",
4030        )
4031        score_tensors = task.generate_uncertainty_score(classes, augment_n, method)
4032        self._update_mask(task, mask_name, score_tensors, n_frames, min_length)
4033        print("\n")
4034
4035    def _update_mask_with_BALD(
4036        self,
4037        mask_name: str,
4038        episode_name: str,
4039        classes: List,
4040        load_epoch: int = None,
4041        augment_n: int = 0,
4042        n_frames: int = 10000,
4043        num_models: int = 10,
4044        kernel_size: int = 11,
4045        min_length: int = 30,
4046        parameters_update: Dict = None,
4047    ):
4048        """
4049        Update real_lens with frame-wise Bayesian Active Learning by Disagreement scores for active learning
4050
4051        Parameters
4052        ----------
4053        mask_name : str
4054            the name of the real_lens
4055        episode_name : str
4056            the name of the episode to load
4057        classes : list
4058            a list of class names or indices; their uncertainty scores will be computed separately and stacked
4059        augment_n : int, default 0
4060            the number of augmentations to average over
4061        n_frames : int, default 10000
4062            the number of frames to "annotate"
4063        num_models : int, default 10
4064            the number of dropout masks to apply
4065        kernel_size : int, default 11
4066            the size of the smoothing gaussian kernel
4067        min_length : int
4068            the minimum length (in frames) of the annotated intervals
4069        parameters_update : dict, optional
4070            the dictionary used to update the parameters from the config
4071
4072        Returns
4073        -------
4074        score_dicts : dict
4075            a nested dictionary where first level keys are video ids, second level keys are clip ids and values
4076            are score tensors
4077        """
4078
4079        print(f"UPDATING {mask_name}")
4080        task, parameters, mode = self._make_task_prediction(
4081            mask_name,
4082            load_episode=episode_name,
4083            parameters_update=parameters_update,
4084            load_epoch=load_epoch,
4085        )
4086        score_tensors = task.generate_bald_score(
4087            classes, augment_n, num_models, kernel_size
4088        )
4089        self._update_mask(task, mask_name, score_tensors, n_frames, min_length)
4090        print("\n")
4091
    def _suggest_intervals(
        self,
        dataset: BehaviorDataset,
        score_tensors: Dict,
        n_frames: int,
        min_length: int,
    ) -> Dict:
        """
        Suggest intervals with highest score of total length `n_frames`

        The frames that are already annotated are excluded from the suggestions. Note that `score_tensors`
        is modified in place: the scores inside the annotated intervals are set to -10.

        Parameters
        ----------
        dataset : BehaviorDataset
            the dataset
        score_tensors : dict
            a nested dictionary where first-level keys are video ids, second-level keys are clip ids and
            values are framewise score tensors indexed as `[score_index, frame]`
        n_frames : int
            the number of frames to "annotate"
        min_length : int
            the minimum length of a suggested interval (passed to `dataset.find_valleys` as `min_frames`)

        Returns
        -------
        active_learning_intervals : Dict
            active learning dictionary with suggested intervals: keys are video ids and values are lists of
            `[start, end, clip_id]` entries
        """

        video_intervals, _ = dataset.get_intervals()
        # taken[video_id][clip_id] is a framewise tensor: 1 = annotated or already suggested, 0 = free
        taken = {
            video_id: defaultdict(lambda: {}) for video_id in video_intervals.keys()
        }
        annotated = dataset.get_annotated_intervals()
        for video_id in video_intervals:
            for clip_id in video_intervals[video_id]:
                taken[video_id][clip_id] = torch.zeros(
                    dataset.get_len(video_id, clip_id)
                )
                if video_id in annotated and clip_id in annotated[video_id]:
                    for start, end in annotated[video_id][clip_id]:
                        # annotated frames get a negative score (in place) and are marked as taken
                        score_tensors[video_id][clip_id][:, start:end] = -10
                        taken[video_id][clip_id][int(start) : int(end)] = 1
        # from here on n_frames is the target total: already annotated frames + requested frames
        n_frames = (
            sum([(vv == 1).sum() for v in taken.values() for vv in v.values()])
            + n_frames
        )
        factor = 1
        # initial threshold: mean over videos of the mean over clips of the mean positive score
        # NOTE(review): a clip without any positive score presumably yields NaN here, which would
        # propagate into the threshold - confirm how `find_valleys` handles that
        threshold_start = float(
            torch.mean(
                torch.tensor(
                    [
                        torch.mean(
                            torch.tensor([torch.mean(y[y > 0]) for y in x.values()])
                        )
                        for x in score_tensors.values()
                    ]
                )
            )
        )
        # keep lowering the threshold until enough frames are taken
        while (
            sum([(vv == 1).sum() for v in taken.values() for vv in v.values()])
            < n_frames
        ):
            threshold = threshold_start * factor
            intervals = []
            interval_scores = []
            # the number of score rows is read from the first clip of the first video
            key1 = list(score_tensors.keys())[0]
            key2 = list(score_tensors[key1].keys())[0]
            num_scores = score_tensors[key1][key2].shape[0]
            for i in range(num_scores):
                v_dict = dataset.find_valleys(
                    predicted=score_tensors,
                    threshold=threshold,
                    min_frames=min_length,
                    main_class=i,
                    low=False,
                )
                for v_id, interval_list in v_dict.items():
                    # every candidate becomes [start, end, clip_id, video_id]
                    intervals += [x + [v_id] for x in interval_list]
                    interval_scores += [
                        float(torch.mean(score_tensors[v_id][clip_id][i, start:end]))
                        for start, end, clip_id in interval_list
                    ]
            # candidates sorted by mean score, best first
            # NOTE(review): the rows mix numbers and ids, so the array is presumably not numeric,
            # which would explain the int() casts below - confirm
            intervals = np.array(intervals)[np.argsort(interval_scores)[::-1]]
            i = 0
            # take whole candidates until the target is reached or the candidates run out
            while sum(
                [(vv == 1).sum() for v in taken.values() for vv in v.values()]
            ) < n_frames and i < len(intervals):
                start, end, clip_id, video_id = intervals[i]
                i += 1
                taken[video_id][clip_id][int(start) : int(end)] = 1
            # lower the threshold by 10% for the next round; give up below 5% of the initial value
            factor *= 0.9
            if factor < 0.05:
                warnings.warn(f"Could not find enough frames!")
                break
        active_learning_intervals = {video_id: [] for video_id in video_intervals}
        for video_id in taken:
            for clip_id in taken[video_id]:
                # the annotated frames are removed again, so that only new suggestions remain
                if video_id in annotated and clip_id in annotated[video_id]:
                    for start, end in annotated[video_id][clip_id]:
                        taken[video_id][clip_id][int(start) : int(end)] = 0
                if (taken[video_id][clip_id] == 1).sum() == 0:
                    continue
                indices = np.where(taken[video_id][clip_id].numpy())[0]
                boundaries = self._get_intervals(indices)
                active_learning_intervals[video_id] += [
                    [start, end, clip_id] for start, end in boundaries
                ]
        return active_learning_intervals
4199
4200    def _update_mask(
4201        self,
4202        task: TaskDispatcher,
4203        mask_name: str,
4204        score_tensors: Dict,
4205        n_frames: int,
4206        min_length: int,
4207    ) -> None:
4208        """
4209        Update the real_lens with intervals with the highest score of total length `n_frames`
4210
4211        Parameters
4212        ----------
4213        mask_name : str
4214            the name of the real_lens
4215        score_tensors : dict
4216            a dictionary where keys are clip ids and values are framewise score tensors
4217        n_frames : int
4218            the number of frames to "annotate"
4219        min_length : int
4220            the minimum length of the annotated intervals
4221        """
4222
4223        mask = self._load_mask(mask_name)
4224        video_intervals, _ = task.dataset("train").get_intervals()
4225        masked = {
4226            video_id: defaultdict(lambda: {}) for video_id in video_intervals.keys()
4227        }
4228        total_masked = 0
4229        total_all = 0
4230        for video_id in video_intervals:
4231            for clip_id in video_intervals[video_id]:
4232                masked[video_id][clip_id] = torch.zeros(
4233                    task.dataset("train").get_len(video_id, clip_id)
4234                )
4235                if (
4236                    video_id in mask["unannotated"]
4237                    and clip_id in mask["unannotated"][video_id]
4238                ):
4239                    for start, end in mask["unannotated"][video_id][clip_id]:
4240                        score_tensors[video_id][clip_id][:, start:end] = -10
4241                        masked[video_id][clip_id][int(start) : int(end)] = 1
4242                if (
4243                    video_id in mask["val_intervals"]
4244                    and clip_id in mask["val_intervals"][video_id]
4245                ):
4246                    for start, end in mask["val_intervals"][video_id][clip_id]:
4247                        score_tensors[video_id][clip_id][:, start:end] = -10
4248                        masked[video_id][clip_id][int(start) : int(end)] = 1
4249                total_all += torch.sum(masked[video_id][clip_id] == 0)
4250                if video_id in mask["masked"] and clip_id in mask["masked"][video_id]:
4251                    # print(f'{real_lens["masked"][video_id][clip_id]=}')
4252                    for start, end in mask["masked"][video_id][clip_id]:
4253                        masked[video_id][clip_id][int(start) : int(end)] = 1
4254                        total_masked += end - start
4255        old_n_frames = sum(
4256            [(vv == 0).sum() for v in masked.values() for vv in v.values()]
4257        )
4258        n_frames = old_n_frames + n_frames
4259        factor = 1
4260        while (
4261            sum([(vv == 0).sum() for v in masked.values() for vv in v.values()])
4262            < n_frames
4263        ):
4264            threshold = float(
4265                torch.mean(
4266                    torch.tensor(
4267                        [
4268                            torch.mean(
4269                                torch.tensor([torch.mean(y[y > 0]) for y in x.values()])
4270                            )
4271                            for x in score_tensors.values()
4272                        ]
4273                    )
4274                )
4275            )
4276            threshold = threshold * factor
4277            intervals = []
4278            interval_scores = []
4279            key1 = list(score_tensors.keys())[0]
4280            key2 = list(score_tensors[key1].keys())[0]
4281            num_scores = score_tensors[key1][key2].shape[0]
4282            for i in range(num_scores):
4283                v_dict = task.dataset("train").find_valleys(
4284                    predicted=score_tensors,
4285                    threshold=threshold,
4286                    min_frames=min_length,
4287                    main_class=i,
4288                    low=False,
4289                )
4290                for v_id, interval_list in v_dict.items():
4291                    intervals += [x + [v_id] for x in interval_list]
4292                    interval_scores += [
4293                        float(torch.mean(score_tensors[v_id][clip_id][i, start:end]))
4294                        for start, end, clip_id in interval_list
4295                    ]
4296            intervals = np.array(intervals)[np.argsort(interval_scores)[::-1]]
4297            i = 0
4298            while sum(
4299                [(vv == 0).sum() for v in masked.values() for vv in v.values()]
4300            ) < n_frames and i < len(intervals):
4301                start, end, clip_id, video_id = intervals[i]
4302                i += 1
4303                masked[video_id][clip_id][int(start) : int(end)] = 0
4304            factor *= 0.9
4305            if factor < 0.05:
4306                warnings.warn(f"Could not find enough frames!")
4307                break
4308        mask["masked"] = {video_id: {} for video_id in video_intervals}
4309        total_masked_new = 0
4310        for video_id in masked:
4311            for clip_id in masked[video_id]:
4312                if (
4313                    video_id in mask["unannotated"]
4314                    and clip_id in mask["unannotated"][video_id]
4315                ):
4316                    for start, end in mask["unannotated"][video_id][clip_id]:
4317                        masked[video_id][clip_id][int(start) : int(end)] = 0
4318                if (
4319                    video_id in mask["val_intervals"]
4320                    and clip_id in mask["val_intervals"][video_id]
4321                ):
4322                    for start, end in mask["val_intervals"][video_id][clip_id]:
4323                        masked[video_id][clip_id][int(start) : int(end)] = 0
4324                indices = np.where(masked[video_id][clip_id].numpy())[0]
4325                mask["masked"][video_id][clip_id] = self._get_intervals(indices)
4326        for video_id in mask["masked"]:
4327            for clip_id in mask["masked"][video_id]:
4328                for start, end in mask["masked"][video_id][clip_id]:
4329                    total_masked_new += end - start
4330        self._save_mask(mask, mask_name)
4331        with open(
4332            os.path.join(self.project_path, "results", f"{mask_name}.txt"), "a"
4333        ) as f:
4334            f.write(f"from {total_masked} to {total_masked_new} / {total_all}" + "\n")
4335        print(f"Unmasked from {total_masked} to {total_masked_new} / {total_all}")
4336
4337    def plot_confusion_matrix(
4338        self,
4339        episode_name: str,
4340        load_epoch: int = None,
4341        parameters_update: Dict = None,
4342        type: str = "recall",
4343        mode: str = "val",
4344        remove_saved_features: bool = False,
4345    ) -> Tuple[ndarray, Iterable]:
4346        """
4347        Make a confusion matrix plot and return the data
4348
4349        If the annotation is non-exclusive, only false positive labels are considered.
4350
4351        Parameters
4352        ----------
4353        episode_name : str
4354            the name of the episode to load
4355        load_epoch : int, optional
4356            the index of the epoch to load (by default the last one is loaded)
4357        parameters_update : dict, optional
4358            a dictionary of parameter updates (only for "data" and "general" categories)
4359        mode : {'val', 'all', 'test', 'train'}
4360            the subset of the data to make the prediction for (forced to 'all' if data_path is not None)
4361        type : {"recall", "precision"}
4362            for datasets with non-exclusive annotation, if `type` is `"recall"`, only false positives are taken
4363            into account, and if `type` is `"precision"`, only false negatives
4364        remove_saved_features : bool, default False
4365            if `True`, the dataset that is used for computation is then deleted
4366
4367        Returns
4368        -------
4369        confusion_matrix : np.ndarray
4370            a confusion matrix of shape `(#classes, #classes)` where `A[i, j] = F_ij/N_i`, `F_ij` is the number of
4371            frames that have the i-th label in the ground truth and a false positive j-th label in the prediction,
4372            `N_i` is the number of frames that have the i-th label in the ground truth
4373        classes : list
4374            a list of labels
4375        """
4376
4377        task, parameters, mode = self._make_task_prediction(
4378            "_",
4379            load_episode=episode_name,
4380            load_epoch=load_epoch,
4381            parameters_update=parameters_update,
4382            mode=mode,
4383        )
4384        dataset = task.dataset(mode)
4385        prediction = task.predict(dataset, raw_output=True)
4386        confusion_matrix, classes, type = dataset.get_confusion_matrix(prediction, type)
4387        if remove_saved_features:
4388            self._remove_stores(parameters)
4389        fig, ax = plt.subplots(figsize=(len(classes), len(classes)))
4390        ax.imshow(confusion_matrix)
4391        # Show all ticks and label them with the respective list entries
4392        ax.set_xticks(np.arange(len(classes)))
4393        ax.set_xticklabels(classes)
4394        ax.set_yticks(np.arange(len(classes)))
4395        ax.set_yticklabels(classes)
4396        # Rotate the tick labels and set their alignment.
4397        plt.setp(ax.get_xticklabels(), rotation=45, ha="right", rotation_mode="anchor")
4398        # Loop over data dimensions and create text annotations.
4399        for i in range(len(classes)):
4400            for j in range(len(classes)):
4401                ax.text(
4402                    j,
4403                    i,
4404                    np.round(confusion_matrix[i, j], 2),
4405                    ha="center",
4406                    va="center",
4407                    color="w",
4408                )
4409        if type is not None:
4410            ax.set_title(f"{type} {episode_name}")
4411        else:
4412            ax.set_title(episode_name)
4413        fig.tight_layout()
4414        plt.show()
4415        return confusion_matrix, classes
4416
4417    def plot_predictions(
4418        self,
4419        episode_name: str,
4420        load_epoch: int = None,
4421        parameters_update: Dict = None,
4422        add_legend: bool = True,
4423        ground_truth: bool = True,
4424        colormap: str = "viridis",
4425        hide_axes: bool = False,
4426        min_classes: int = 1,
4427        width: float = 10,
4428        whole_video: bool = False,
4429        transparent: bool = False,
4430        drop_classes: Set = None,
4431        search_classes: Set = None,
4432        num_plots: int = 1,
4433        remove_saved_features: bool = False,
4434        smooth_interval_prediction: int = 0,
4435        data_path: str = None,
4436        file_paths: Set = None,
4437        mode: str = "val",
4438        behavior_name: str = None,
4439    ) -> None:
4440        """
4441        Visualize random predictions
4442
4443        Parameters
4444        ----------
4445        episode_name : str
4446            the name of the episode to load
4447        load_epoch : int, optional
4448            the epoch to load (by default last)
4449        parameters_update : dict, optional
4450            parameter update dictionary
4451        add_legend : bool, default True
4452            if True, legend will be added to the plot
4453        ground_truth : bool, default True
4454            if True, ground truth will be added to the plot
4455        colormap : str, default 'Accent'
4456            the `matplotlib` colormap to use
4457        hide_axes : bool, default True
4458            if `True`, the axes will be hidden on the plot
4459        min_classes : int, default 1
4460            the minimum number of classes in a displayed interval
4461        width : float, default 10
4462            the width of the plot
4463        whole_video : bool, default False
4464            if `True`, whole videos are plotted instead of segments
4465        transparent : bool, default False
4466            if `True`, the background on the plot is transparent
4467        drop_classes : set, optional
4468            a set of class names to not be displayed
4469        search_classes : set, optional
4470            if given, only intervals where at least one of the classes is in ground truth will be shown
4471        num_plots : int, default 1
4472            the number of plots to make
4473        remove_saved_features : bool, default False
4474            if `True`, the dataset will be deleted after computation
4475        smooth_interval_prediction : int, default 0
4476            if >0, predictions shorter than this number of frames are removed (filled with prediction for the previous frame)
4477        data_path : str, optional
4478            the data path to run the prediction for
4479        mode : {'all', 'test', 'val', 'train'}
4480            the subset of the data to make the prediction for (forced to 'all' if data_path is not None)
4481        file_paths : set, optional
4482            a set of string file paths (data with all prefixes + feature files, in any order) to run the prediction
4483            for
4484        behavior_name : str, optional
4485            for non-exclusive classificaton datasets, choose which behavior to visualize (by default first in list)
4486        """
4487
4488        other_path = os.path.join(self.project_path, "results", "other")
4489        task, parameters, mode = self._make_task_prediction(
4490            "_",
4491            load_episode=episode_name,
4492            parameters_update=parameters_update,
4493            load_epoch=load_epoch,
4494            data_path=data_path,
4495            file_paths=file_paths,
4496            mode=mode,
4497        )
4498        if not os.path.exists(other_path):
4499            os.mkdir(other_path)
4500        for i in range(num_plots):
4501            task.visualize_results(
4502                save_path=os.path.join(
4503                    other_path, f"{episode_name}_prediction_{i}.jpg"
4504                ),
4505                add_legend=add_legend,
4506                ground_truth=ground_truth,
4507                colormap=colormap,
4508                hide_axes=hide_axes,
4509                min_classes=min_classes,
4510                whole_video=whole_video,
4511                transparent=transparent,
4512                dataset=mode,
4513                drop_classes=drop_classes,
4514                search_classes=search_classes,
4515                width=width,
4516                smooth_interval_prediction=smooth_interval_prediction,
4517                behavior_name=behavior_name,
4518            )
4519        if remove_saved_features:
4520            self._remove_stores(parameters)
4521
4522    def create_metadata_backup(self) -> None:
4523        """
4524        Create a copy of the meta files
4525        """
4526
4527        meta_copy_path = os.path.join(self.project_path, "meta", "backup")
4528        meta_path = os.path.join(self.project_path, "meta")
4529        if os.path.exists(meta_copy_path):
4530            shutil.rmtree(meta_copy_path)
4531        os.mkdir(meta_copy_path)
4532        for file in os.listdir(meta_path):
4533            if file == "backup":
4534                continue
4535            shutil.copy(
4536                os.path.join(meta_path, file), os.path.join(meta_copy_path, file)
4537            )
4538
4539    def load_metadata_backup(self) -> None:
4540        """
4541        Load from previously created meta data backup (in case of corruption)
4542        """
4543
4544        meta_copy_path = os.path.join(self.project_path, "meta", "backup")
4545        meta_path = os.path.join(self.project_path, "meta")
4546        for file in os.listdir(meta_copy_path):
4547            shutil.copy(
4548                os.path.join(meta_copy_path, file), os.path.join(meta_path, file)
4549            )
4550
4551    def get_behavior_dictionary(self, episode_name: str) -> Dict:
4552        """
4553        Get the behavior dictionary for an episode
4554
4555        Parameters
4556        ----------
4557        episode_name : str
4558            the name of the episode
4559
4560        Returns
4561        -------
4562        behaviors_dictionary : dict
4563            a dictionary where keys are label indices and values are label names
4564        """
4565
4566        run = self._episodes().get_runs(episode_name)[0]
4567        return self._episode(run).get_behaviors_dict()
4568
4569    def import_episodes(
4570        self,
4571        episodes_directory: str,
4572        name_map: Dict = None,
4573        repeat_policy: str = "error",
4574    ) -> None:
4575        """
4576        Import episodes exported with `Project.export_episodes`
4577
4578        Parameters
4579        ----------
4580        episodes_directory : str
4581            the path to the exported episodes directory
4582        name_map : dict
4583            a name change dictionary for the episodes: keys are old names, values are new names
4584        """
4585
4586        if name_map is None:
4587            name_map = {}
4588        episodes = pd.read_pickle(os.path.join(episodes_directory, "episodes.pickle"))
4589        to_remove = []
4590        import_string = "Imported episodes: "
4591        for episode_name in episodes.index:
4592            if episode_name in name_map:
4593                import_string += f"{episode_name} "
4594                episode_name = name_map[episode_name]
4595                import_string += f"({episode_name}), "
4596            else:
4597                import_string += f"{episode_name}, "
4598            try:
4599                self._check_episode_validity(episode_name, allow_doublecolon=True)
4600            except ValueError as e:
4601                if str(e).endswith("is already taken!"):
4602                    if repeat_policy == "skip":
4603                        to_remove.append(episode_name)
4604                    elif repeat_policy == "force":
4605                        self.remove_episode(episode_name)
4606                    elif repeat_policy == "error":
4607                        raise ValueError(
4608                            f"The {episode_name} episode name is already taken; please use the name_map parameter to rename it"
4609                        )
4610                    else:
4611                        raise ValueError(
4612                            f"The {repeat_policy} repeat policy is not recognized; please choose from ['skip', 'force' ans 'error']"
4613                        )
4614        episodes = episodes.drop(index=to_remove)
4615        self._episodes().update(
4616            episodes,
4617            name_map=name_map,
4618            force=(repeat_policy == "force"),
4619            data_path=self.data_path,
4620            annotation_path=self.annotation_path,
4621        )
4622        for episode_name in episodes.index:
4623            if episode_name in name_map:
4624                new_episode_name = name_map[episode_name]
4625            else:
4626                new_episode_name = episode_name
4627            model_dir = os.path.join(
4628                self.project_path, "results", "model", new_episode_name
4629            )
4630            old_model_dir = os.path.join(episodes_directory, "model", episode_name)
4631            if os.path.exists(model_dir):
4632                shutil.rmtree(model_dir)
4633            os.mkdir(model_dir)
4634            for file in os.listdir(old_model_dir):
4635                shutil.copyfile(
4636                    os.path.join(old_model_dir, file), os.path.join(model_dir, file)
4637                )
4638            log_file = os.path.join(
4639                self.project_path, "results", "logs", f"{new_episode_name}.txt"
4640            )
4641            old_log_file = os.path.join(
4642                episodes_directory, "logs", f"{episode_name}.txt"
4643            )
4644            shutil.copyfile(old_log_file, log_file)
4645        print(import_string)
4646        print("\n")
4647
4648    def export_episodes(
4649        self, episode_names: List, output_directory: str, name: str = None
4650    ) -> None:
4651        """
4652        Save selected episodes as a file that can be imported into another project with `Project.import_episodes`
4653
4654        Parameters
4655        ----------
4656        episode_names : list
4657            a list of string episode names
4658        output_directory : str
4659            the path to the directory where the episodes will be saved
4660        name : str, optional
4661            the name of the episodes directory (by default `exported_episodes`)
4662        """
4663
4664        if name is None:
4665            name = "exported_episodes"
4666        if os.path.exists(
4667            os.path.join(output_directory, name + ".zip")
4668        ) or os.path.exists(os.path.join(output_directory, name)):
4669            i = 1
4670            while os.path.exists(
4671                os.path.join(output_directory, name + f"_{i}.zip")
4672            ) or os.path.exists(os.path.join(output_directory, name + f"_{i}")):
4673                i += 1
4674            name = name + f"_{i}"
4675        dest_dir = os.path.join(output_directory, name)
4676        os.mkdir(dest_dir)
4677        os.mkdir(os.path.join(dest_dir, "model"))
4678        os.mkdir(os.path.join(dest_dir, "logs"))
4679        runs = []
4680        for episode in episode_names:
4681            runs += self._episodes().get_runs(episode)
4682        for run in runs:
4683            shutil.copytree(
4684                os.path.join(self.project_path, "results", "model", run),
4685                os.path.join(dest_dir, "model", run),
4686            )
4687            shutil.copyfile(
4688                os.path.join(self.project_path, "results", "logs", f"{run}.txt"),
4689                os.path.join(dest_dir, "logs", f"{run}.txt"),
4690            )
4691        data = self._episodes().get_subset(runs)
4692        data.to_pickle(os.path.join(dest_dir, "episodes.pickle"))
4693
4694    def get_results_table(
4695        self,
4696        episode_names: List,
4697        metrics: List = None,
4698        include_std: bool = False,
4699        classes: List = None,
4700    ):
4701        """
4702        Genererate a `pandas` dataframe with a summary of episode results
4703
4704        Parameters
4705        ----------
4706        episode_names : list
4707            a list of names of episodes to include
4708        metrics : list, optional
4709            a list of metric names to include
4710        include_std : bool, default False
4711            if `True`, for episodes with multiple runs the mean and standard deviation will be displayed;
4712            otherwise only mean
4713        classes : list, optional
4714            a list of names of classes to include (by default all are included)
4715
4716        Returns
4717        -------
4718        results : pd.DataFrame
4719            a table with the results
4720        """
4721
4722        run_names = []
4723        for episode in episode_names:
4724            run_names += self._episodes().get_runs(episode)
4725        episodes = self.list_episodes(run_names, print_results=False)
4726        metric_columns = [x for x in episodes.columns if x[0] == "results"]
4727        results_df = pd.DataFrame()
4728        if metrics is not None:
4729            metric_columns = [
4730                x for x in metric_columns if x[1].split("_")[0] in metrics
4731            ]
4732        for episode in episode_names:
4733            results = []
4734            metric_set = set()
4735            for run in self._episodes().get_runs(episode):
4736                beh_dict = self.get_behavior_dictionary(run)
4737                res_dict = defaultdict(lambda: {})
4738                for column in metric_columns:
4739                    if np.isnan(episodes.loc[run, column]):
4740                        continue
4741                    split = column[1].split("_")
4742                    if split[-1].isnumeric():
4743                        beh_ind = int(split[-1])
4744                        metric_name = "_".join(split[:-1])
4745                        beh = beh_dict[beh_ind]
4746                    else:
4747                        beh = "average"
4748                        metric_name = column[1]
4749                    res_dict[beh][metric_name] = episodes.loc[run, column]
4750                    metric_set.add(metric_name)
4751                if "average" not in res_dict:
4752                    res_dict["average"] = {}
4753                for metric in metric_set:
4754                    if metric not in res_dict["average"]:
4755                        arr = [
4756                            res_dict[beh][metric]
4757                            for beh in res_dict
4758                            if metric in res_dict[beh]
4759                        ]
4760                        res_dict["average"][metric] = np.mean(arr)
4761                results.append(res_dict)
4762            episode_results = {}
4763            for metric in metric_set:
4764                for beh in results[0].keys():
4765                    if classes is not None and beh not in classes:
4766                        continue
4767                    arr = []
4768                    for res_dict in results:
4769                        if metric in res_dict[beh]:
4770                            arr.append(res_dict[beh][metric])
4771                    if len(arr) > 0:
4772                        if include_std:
4773                            episode_results[
4774                                (beh, f"{episode} {metric} mean")
4775                            ] = np.mean(arr)
4776                            episode_results[(beh, f"{episode} {metric} std")] = np.std(
4777                                arr
4778                            )
4779                        else:
4780                            episode_results[(beh, f"{episode} {metric}")] = np.mean(arr)
4781            for key, value in episode_results.items():
4782                results_df.loc[key[0], key[1]] = value
4783        print(f"RESULTS:")
4784        print(results_df)
4785        print("\n")
4786        return results_df
4787
4788    def episode_exists(self, episode_name: str) -> bool:
4789        """
4790        Check if an episode already exists
4791
4792        Parameters
4793        ----------
4794        episode_name : str
4795            the episode name
4796
4797        Returns
4798        -------
4799        exists : bool
4800            `True` if the episode exists
4801        """
4802
4803        return self._episodes().check_name_validity(episode_name)
4804
4805    def search_exists(self, search_name: str) -> bool:
4806        """
4807        Check if a search already exists
4808
4809        Parameters
4810        ----------
4811        search_name : str
4812            the search name
4813
4814        Returns
4815        -------
4816        exists : bool
4817            `True` if the search exists
4818        """
4819
4820        return self._searches().check_name_validity(search_name)
4821
4822    def prediction_exists(self, prediction_name: str) -> bool:
4823        """
4824        Check if a prediction already exists
4825
4826        Parameters
4827        ----------
4828        prediction_name : str
4829            the prediction name
4830
4831        Returns
4832        -------
4833        exists : bool
4834            `True` if the prediction exists
4835        """
4836
4837        return self._predictions().check_name_validity(prediction_name)
4838
4839    @staticmethod
4840    def project_name_available(projects_path: str, project_name: str):
4841        if projects_path is None:
4842            projects_path = os.path.join(str(Path.home()), "DLC2Action")
4843        return not os.path.exists(os.path.join(projects_path, project_name))
4844
4845    def _update_episode_metrics(self, episode_name: str, metrics: Dict):
4846        """
4847        Update meta data with evaluation results
4848        """
4849
4850        self._episodes().update_episode_metrics(episode_name, metrics)
4851
4852    def rename_episode(self, episode_name: str, new_episode_name: str):
4853        shutil.move(
4854            os.path.join(self.project_path, "results", "model", episode_name),
4855            os.path.join(self.project_path, "results", "model", new_episode_name),
4856        )
4857        shutil.move(
4858            os.path.join(self.project_path, "results", "logs", f"{episode_name}.txt"),
4859            os.path.join(
4860                self.project_path, "results", "logs", f"{new_episode_name}.txt"
4861            ),
4862        )
4863        self._episodes().rename_episode(episode_name, new_episode_name)
4864
4865
4866class _Runner:
4867    """
4868    A helper class for running hyperparameter searches
4869    """
4870
4871    def __init__(
4872        self,
4873        search_name,
4874        search_space: Dict,
4875        load_episode: str,
4876        load_epoch: int,
4877        metric: str,
4878        average: int,
4879        task: Union[TaskDispatcher, None],
4880        remove_saved_features: bool,
4881        project: Project,
4882    ):
4883        """
4884        Parameters
4885        ----------
4886        search_space : dict
4887            a dictionary representing the search space; of this general structure:
4888            {'group/param_name': ('float/int/float_log/int_log', start, end),
4889            'group/param_name': ('categorical', [choices])}, e.g.
4890            {'data/overlap': ('int', 5, 100), 'training/lr': ('float_log', 1e-4, 1e-2),
4891            'data/feature_extraction': ('categorical', ['kinematic', 'bones'])}
4892        load_episode : str
4893            the name of the episode to load the model from
4894        load_epoch : int
4895            the epoch to load the model from (if not provided, the last checkpoint is used)
4896        metric : str
4897            the metric to maximize/minimize (see direction)
4898        average : int
4899            the number of epochs to average the metric; if 0, the last value is taken
4900        remove_saved_features : bool
4901            if `True`, the old datasets will be deleted when data parameters change
4902        project : Project
4903            the parent `Project` instance
4904        """
4905
4906        self.search_space = search_space
4907        self.load_episode = load_episode
4908        self.load_epoch = load_epoch
4909        self.metric = metric
4910        self.average = average
4911        self.feature_save_path = None
4912        self.remove_saved_featuress = remove_saved_features
4913        self.save_stores = project._save_stores
4914        self.remove_datasets = project.remove_saved_features
4915        self.task = task
4916        self.search_name = search_name
4917        self.update = project._update
4918        self.remove_episode = project.remove_episode
4919        self.fill = project._fill
4920
4921    def clean(self):
4922        """
4923        Remove datasets if needed
4924        """
4925
4926        if self.remove_saved_featuress:
4927            self.remove_datasets([os.path.basename(self.feature_save_path)])
4928
4929    def run(self, trial, parameters):
4930        """
4931        Make a trial run
4932        """
4933
4934        params = deepcopy(parameters)
4935        param_update = defaultdict(
4936            lambda: defaultdict(lambda: defaultdict(lambda: defaultdict(lambda: {})))
4937        )
4938        for full_name, space in self.search_space.items():
4939            group, param_name = full_name.split("/")[0], "/".join(
4940                full_name.split("/")[1:]
4941            )
4942            log = space[0][-3:] == "log"
4943            if space[0].startswith("int"):
4944                value = trial.suggest_int(full_name, space[1], space[2], log=log)
4945            elif space[0].startswith("float"):
4946                value = trial.suggest_float(full_name, space[1], space[2], log=log)
4947            elif space[0] == "categorical":
4948                value = trial.suggest_categorical(full_name, space[1])
4949            else:
4950                raise ValueError(
4951                    "The search space has to be formatted as either "
4952                    '("float"/"int"/"float_log"/"int_log", start, end) '
4953                    f'or ("categorical", [choices]); got {space} for {group}/{param_name}'
4954                )
4955            if len(param_name.split("/")) == 1:
4956                param_update[group][param_name] = value
4957            else:
4958                pars = param_name.split("/")
4959                pars = [int(x) if x.isnumeric() else x for x in pars]
4960                if len(pars) == 2:
4961                    param_update[group][pars[0]][pars[1]] = value
4962                elif len(pars) == 3:
4963                    param_update[group][pars[0]][pars[1]][pars[2]] = value
4964                elif len(pars) == 4:
4965                    param_update[group][pars[0]][pars[1]][pars[2]][pars[3]] = value
4966        params = self.update(params, param_update)
4967        self.remove_episode(f"_{self.search_name}")
4968        params = self.fill(
4969            params,
4970            f"_{self.search_name}",
4971            self.load_episode,
4972            load_epoch=self.load_epoch,
4973            only_load_model=True,
4974        )
4975        if self.feature_save_path != params["data"]["feature_save_path"]:
4976            if self.feature_save_path is not None:
4977                self.clean()
4978            self.feature_save_path = params["data"]["feature_save_path"]
4979        self.save_stores(params)
4980        if self.task is None:
4981            self.task = TaskDispatcher(deepcopy(params))
4982        else:
4983            self.task.update_task(params)
4984
4985        _, metrics_log = self.task.train(trial, self.metric)
4986        metric_values = metrics_log["val"][self.metric]
4987        if self.average > 0:
4988            value = np.mean(sorted(metric_values)[-self.average :])
4989        else:
4990            value = metric_values[-1]
4991        return value