From 2c8ae72d0001d9a8f9e7d4abad489074bed749a1 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Mon, 10 Nov 2025 14:55:42 +0100
Subject: [PATCH 01/15] first pretrained models support prototype

---
 element_deeplabcut/model.py | 605 ++++++++++++++++++++++++++++++------
 1 file changed, 518 insertions(+), 87 deletions(-)

diff --git a/element_deeplabcut/model.py b/element_deeplabcut/model.py
index bde24b9..e35d174 100644
--- a/element_deeplabcut/model.py
+++ b/element_deeplabcut/model.py
@@ -296,6 +296,125 @@ def insert_from_config(
             )
 
 
+@schema
+class PretrainedModel(dj.Lookup):
+    """Pretrained DeepLabCut models available for use.
+
+    Attributes:
+        pretrained_model_name ( varchar(64) ): Name of the pretrained model (e.g., "superanimal_quadruped").
+        version ( varchar(32) ): Optional. Version of the pretrained model.
+        species ( varchar(64) ): Optional. Species this model was trained on.
+        source ( varchar(128) ): Source of the pretrained model (e.g., "DLC Model Zoo",
+            "SuperAnimal", "ResNet", etc.).
+        backbone_model_name ( varchar(64) ): Optional. Backbone model name (e.g., "hrnet_w32").
+        detector_name ( varchar(128) ): Optional. Detector name (e.g., "fasterrcnn_resnet50_fpn_v2").
+        default_params (longblob): Optional. Default inference parameters (dict-like, e.g.,
+            {"video_adapt": False, "scale": 0.4, "batchsize": 8}).
+        weights_path ( varchar(255) ): Optional. Path to model weights file/URI (if applicable).
+        description ( varchar(1000) ): Optional. Description of the pretrained model.
+    """
+
+    definition = """
+    pretrained_model_name : varchar(64)  # Name of the pretrained model (e.g., "superanimal_quadruped")
+    ---
+    version=''            : varchar(32)  # Version of the pretrained model
+    species=''            : varchar(64)   # Species this model was trained on
+    source=''             : varchar(128)  # Source (e.g., "DLC Model Zoo", "SuperAnimal", "ResNet")
+    backbone_model_name='' : varchar(64)  # Optional. Backbone model name (e.g., "hrnet_w32")
+    detector_name=''       : varchar(128) # Optional. Detector name (e.g., "fasterrcnn_resnet50_fpn_v2")
+    default_params=null   : longblob      # Optional. Default inference parameters (dict-like)
+    weights_path=''       : varchar(255)  # Optional. Path to model weights file (if applicable)
+    description=''        : varchar(1000) # Description of the pretrained model
+    """
+
+    @classmethod
+    def is_pretrained(cls, pretrained_model_name: str) -> bool:
+        """Check if a pretrained model name exists in the lookup table.
+        
+        Args:
+            pretrained_model_name: Name of the pretrained model to check.
+            
+        Returns:
+            bool: True if the model exists in the lookup table, False otherwise.
+        """
+        return bool(cls & {"pretrained_model_name": pretrained_model_name})
+
+    @classmethod
+    def add(
+        cls,
+        pretrained_model_name: str,
+        source: str = "",
+        version: str = "",
+        species: str = "",
+        backbone_model_name: str = "",
+        detector_name: str = "",
+        weights_path: str = "",
+        default_params: dict = None,
+        description: str = "",
+        auto_insert: bool = False,
+    ):
+        """Add a pretrained model to the lookup table.
+        
+        If the model doesn't exist and auto_insert is True, it will be added
+        with the provided parameters. If auto_insert is False and the model
+        doesn't exist, raises a ValueError.
+        
+        Args:
+            pretrained_model_name: Name of the pretrained model (e.g., "superanimal_quadruped").
+            source: Optional. Source of the pretrained model.
+            version: Optional. Version of the pretrained model.
+            species: Optional. Species this model was trained on.
+            backbone_model_name: Optional. Backbone model name (e.g., "hrnet_w32").
+            detector_name: Optional. Detector name (e.g., "fasterrcnn_resnet50_fpn_v2").
+            weights_path: Optional. Path to model weights file/URI (if applicable).
+            default_params: Optional. Default inference parameters (dict-like, e.g.,
+                {"video_adapt": False, "scale": 0.4, "batchsize": 8}).
+            description: Optional. Description of the pretrained model.
+            auto_insert: If True, automatically insert if missing. If False, raise error.
+                Default False to force explicit registration.
+            
+        Returns:
+            bool: True if model exists (or was inserted). This is a success flag only.
+            
+        Raises:
+            ValueError: If model doesn't exist and auto_insert=False.
+        """
+        if cls.is_pretrained(pretrained_model_name):
+            return True
+        
+        if not auto_insert:
+            raise ValueError(
+                f"Pretrained model '{pretrained_model_name}' not found in "
+                "PretrainedModel lookup table. Use auto_insert=True to add it automatically, "
+                "or register it explicitly using PretrainedModel.insert1()."
+            )
+        
+        # Auto-insert with provided parameters
+        # Warn if auto-creating without meaningful configuration
+        if not weights_path and not default_params:
+            logger.warning(
+                f"Auto-inserting pretrained model '{pretrained_model_name}' without "
+                "weights_path or default_params. Consider registering explicitly with "
+                "proper configuration."
+            )
+        
+        cls.insert1(
+            {
+                "pretrained_model_name": pretrained_model_name,
+                "version": version,
+                "species": species,
+                "source": source,
+                "backbone_model_name": backbone_model_name,
+                "detector_name": detector_name,
+                "weights_path": weights_path,
+                "default_params": default_params,
+                "description": description,
+            },
+            skip_duplicates=True,
+        )
+        return True
+
+
 @schema
 class Model(dj.Manual):
     """DeepLabCut Models applied to generate pose estimations.
@@ -437,7 +556,7 @@ def insert_new_model(
                 modelprefix=model_prefix,
             )
         else:
-            raise ValueError(f"Unknow engine type {engine}")
+            raise ValueError(f"Unknown engine type {engine}")
 
         if dlc_config["snapshotindex"] == -1:
             dlc_scorer = "".join(dlc_scorer.split("_")[:-1])
@@ -491,6 +610,126 @@ def _do_insert():
             with cls.connection.transaction:
                 _do_insert()
 
+    @classmethod
+    def insert_pretrained_model(
+        cls,
+        model_name: str,
+        pretrained_model_name: str,
+        *,
+        model_description="",
+        model_prefix="",
+        prompt=True,
+        config_overrides: dict = None,
+    ):
+        """Insert a pretrained model into the dlc.Model table.
+
+        This method can only be used if the pretrained_model_name exists in the
+        PretrainedModel lookup table. It handles config paths and training-related
+        columns differently (set to NULL / "pretrained" as appropriate).
+
+        Args:
+            model_name (str): User-friendly name for this model instance.
+            pretrained_model_name (str): Name from PretrainedModel lookup table.
+            model_description (str): Optional. Description of this model.
+            model_prefix (str): Optional. Filename prefix used across DLC project.
+            prompt (bool): Optional. Prompt the user with all info before inserting.
+            config_overrides (dict): Optional. Dict of config items to override defaults.
+        """
+        # Check if pretrained model exists in lookup - return if not found
+        if not PretrainedModel.is_pretrained(pretrained_model_name):
+            logger.warning(
+                f"Pretrained model '{pretrained_model_name}' not found in "
+                "PretrainedModel lookup table. Cannot insert model. "
+                "Please add it to PretrainedModel first."
+            )
+            return
+        
+        pretrained_info = (PretrainedModel & {"pretrained_model_name": pretrained_model_name}).fetch1()
+
+        # Load default config from pretrained model
+        default_params = pretrained_info.get("default_params") or {}
+        if config_overrides:
+            default_params.update(config_overrides)
+
+        # Build config template - use defaults from pretrained model
+        dlc_config = default_params.copy()
+        
+        # Set required fields for pretrained models
+        # For pretrained models, we use placeholder values for training-related fields
+        dlc_config.setdefault("Task", f"pretrained_{pretrained_model_name}")
+        dlc_config.setdefault("date", "pretrained")
+        dlc_config.setdefault("iteration", 0)
+        dlc_config.setdefault("snapshotindex", -1)
+        dlc_config.setdefault("TrainingFraction", [1.0])  # Placeholder
+        
+        engine = dlc_config.get("engine", "tensorflow")
+        if engine is None:
+            logger.warning(
+                "DLC engine not specified. Defaulting to TensorFlow."
+            )
+            engine = "tensorflow"
+
+        # For pretrained models, scorer is based on the pretrained model name
+        scorer = f"{pretrained_model_name}_pretrained"
+
+        # Mark as pretrained in config_template for detection
+        # Convention: _pretrained_model_name in config_template identifies pretrained models
+        # This allows detection without modifying the Model table schema
+        dlc_config["_is_pretrained"] = True
+        dlc_config["_pretrained_model_name"] = pretrained_model_name
+        
+        # Build model dict - set training-related fields appropriately
+        # For pretrained models: no project_path, minimal config_template
+        model_dict = {
+            "model_name": model_name,
+            "model_description": model_description,
+            "scorer": scorer,
+            "task": dlc_config["Task"],
+            "date": dlc_config["date"],
+            "iteration": dlc_config["iteration"],
+            "snapshotindex": dlc_config["snapshotindex"],
+            "shuffle": 0,  # Not applicable for pretrained
+            "trainingsetindex": 0,  # Not applicable for pretrained
+            "engine": engine,
+            "project_path": "",  # Empty for pretrained models
+            "model_prefix": model_prefix,
+            "paramset_idx": None,  # No training param set for pretrained
+            "config_template": dlc_config,
+        }
+
+        # -- prompt for confirmation --
+        if prompt:
+            print("--- Pretrained DLC Model specification to be inserted ---")
+            for k, v in model_dict.items():
+                if k != "config_template":
+                    print("\t{}: {}".format(k, v))
+                else:
+                    print("\t-- Template/Contents of config.yaml --")
+                    for k, v in model_dict["config_template"].items():
+                        print("\t\t{}: {}".format(k, v))
+
+        if (
+            prompt
+            and dj.utils.user_choice("Proceed with pretrained DLC model insert?") != "yes"
+        ):
+            print("Canceled insert.")
+            return
+
+        def _do_insert():
+            cls.insert1(model_dict)
+            # Extract body parts from config if available
+            if "bodyparts" in dlc_config:
+                if BodyPart.extract_new_body_parts(dlc_config, verbose=False).size > 0:
+                    BodyPart.insert_from_config(dlc_config, prompt=prompt)
+                cls.BodyPart.insert((model_name, bp) for bp in dlc_config["bodyparts"])
+
+        # ____ Insert into table ----
+        if cls.connection.in_transaction:
+            _do_insert()
+        else:
+            with cls.connection.transaction:
+                _do_insert()
+
 
 @schema
 class ModelEvaluation(dj.Computed):
@@ -725,8 +964,215 @@ class BodyPartPosition(dj.Part):
         likelihood  : longblob
         """
 
+    @classmethod
+    def _do_pretrained_inference(
+        cls,
+        pretrained_model_name: str,
+        video_filepaths: list,
+        output_dir: Path,
+        inference_params: dict = None,
+    ):
+        """Run pretrained (SuperAnimal / Model Zoo) inference on videos.
+
+        This uses the PretrainedModel lookup as the single source of truth for:
+        - which pretrained model to call
+        - default inference parameters
+        - optional backbone/detector names, etc.
+
+        It supports DLC's `video_inference_superanimal` API when available,
+        and falls back to `video_inference` if exposed by the installed DLC version.
+
+        Args:
+            pretrained_model_name: Name of the pretrained model (e.g., "superanimal_quadruped").
+            video_filepaths: List of full paths to video files.
+            output_dir: Directory to save output files.
+            inference_params: Optional. Parameters for inference function (overrides defaults).
+        """
+        import inspect
+        import deeplabcut
+
+        # --- Fetch pretrained model metadata from lookup ---
+        try:
+            pm = (PretrainedModel & {"pretrained_model_name": pretrained_model_name}).fetch1()
+        except dj.DataJointError:
+            raise ValueError(
+                f"Pretrained model '{pretrained_model_name}' is not registered in PretrainedModel. "
+                "Please insert it before running pretrained inference."
+            )
+
+        default_params = pm.get("default_params") or {}
+        # Merge: explicit inference_params override defaults
+        merged_params = {**default_params, **(inference_params or {})}
+
+        # Get optional fields if they exist in the table
+        backbone_model_name = pm.get("backbone_model_name") or None
+        detector_name = pm.get("detector_name") or None
+
+        # Ensure output_dir exists and is a string for DLC
+        output_dir = Path(output_dir)
+        output_dir.mkdir(parents=True, exist_ok=True)
+        destfolder_str = str(output_dir)
+
+        # --- Prefer SuperAnimal-style API if available ---
+        if hasattr(deeplabcut, "video_inference_superanimal"):
+            inference_func = deeplabcut.video_inference_superanimal
+            sig = inspect.signature(inference_func)
+
+            # Base kwargs from merged_params, filtered by supported args
+            kwargs = {
+                k: v
+                for k, v in merged_params.items()
+                if k in sig.parameters
+            }
+
+            # Map known optional fields if accepted by the function
+            if "model_name" in sig.parameters and backbone_model_name:
+                kwargs.setdefault("model_name", backbone_model_name)
+            if "detector_name" in sig.parameters and detector_name:
+                kwargs.setdefault("detector_name", detector_name)
+            if "destfolder" in sig.parameters:
+                kwargs.setdefault("destfolder", destfolder_str)
+
+            # Call: video_inference_superanimal(video_list, superanimal_name, **kwargs)
+            return inference_func(
+                video_filepaths,
+                pretrained_model_name,
+                **kwargs,
+            )
+
+        # --- Fallback: generic video_inference API, if present ---
+        if hasattr(deeplabcut, "video_inference"):
+            inference_func = deeplabcut.video_inference
+            sig = inspect.signature(inference_func)
+
+            kwargs = {
+                k: v
+                for k, v in merged_params.items()
+                if k in sig.parameters
+            }
+
+            # Try to inject known fields if supported
+            if "model_name" in sig.parameters and backbone_model_name:
+                kwargs.setdefault("model_name", backbone_model_name)
+            if "detector_name" in sig.parameters and detector_name:
+                kwargs.setdefault("detector_name", detector_name)
+            if "destfolder" in sig.parameters:
+                kwargs.setdefault("destfolder", destfolder_str)
+
+            # Some versions may expect (videos, model_name, ...) or similar;
+            # we always pass video_filepaths as first arg and rely on kwargs for the rest.
+            return inference_func(
+                video_filepaths,
+                **kwargs,
+            )
+
+        # --- No compatible API found ---
+        raise NotImplementedError(
+            "No compatible pretrained inference function found in the installed DeepLabCut. "
+            "Expected `video_inference_superanimal` or `video_inference`."
+        )
+
+    @classmethod
+    def do_trained(
+        cls,
+        project_path: Path,
+        video_filepaths: list,
+        output_dir: Path,
+        dlc_config: dict,
+        dlc_model_: dict,
+        analyze_video_params: dict = None,
+    ):
+        """Run trained model inference on videos.
+        
+        Args:
+            project_path: Full path to the directory containing the trained model.
+            video_filepaths: List of full paths to video files.
+            output_dir: Directory to save output files.
+            dlc_config: DeepLabCut config dictionary.
+            dlc_model_: Model record dictionary.
+            analyze_video_params: Optional. Parameters for analyze_videos function.
+        """
+        import inspect
+        
+        # Validate project_path is not empty for trained models
+        if not project_path or str(project_path).strip() == "":
+            raise ValueError(
+                "project_path cannot be empty for trained models. "
+                "Trained models require a valid project directory path."
+            )
+        
+        if analyze_video_params is None:
+            analyze_video_params = {}
+        
+        engine = dlc_model_.get("engine")
+        if engine is None:
+            logger.warning(
+                "DLC engine not specified in config file. Defaulting to TensorFlow."
+            )
+            engine = "tensorflow"
+        if engine == "pytorch":
+            from deeplabcut.pose_estimation_pytorch import analyze_videos
+        elif engine == "tensorflow":
+            from deeplabcut.pose_estimation_tensorflow import analyze_videos
+        else:
+            raise ValueError(f"Unknown engine type {engine}")
+
+        # ---- Build and save DLC configuration (yaml) file ----
+        dlc_project_path = Path(project_path)
+        dlc_config["project_path"] = dlc_project_path.as_posix()
+
+        # ---- Special handling for "cropping" ----
+        # `analyze_videos` behavior:
+        #   i) if is None, use the "cropping" from the config file
+        #   ii) if defined, use the specified "cropping" values but not updating the config file
+        # new behavior: if defined as "False", overwrite "cropping" to False in config file
+        cropping = analyze_video_params.get("cropping", None)
+        if cropping is not None:
+            if cropping:
+                dlc_config["cropping"] = True
+                (
+                    dlc_config["x1"],
+                    dlc_config["x2"],
+                    dlc_config["y1"],
+                    dlc_config["y2"],
+                ) = cropping
+            else:  # cropping is False
+                dlc_config["cropping"] = False
+
+        # ---- Write config files ----
+        config_filename = f"dj_dlc_config_{datetime.now(tz=timezone.utc).strftime('%Y%m%d_%H%M%S')}.yaml"
+        # To output dir: Important for loading/parsing output in datajoint
+        _ = dlc_reader.save_yaml(output_dir, dlc_config)
+        # To project dir: Required by DLC to run the analyze_videos
+        if dlc_project_path != output_dir:
+            config_filepath = dlc_reader.save_yaml(
+                dlc_project_path,
+                dlc_config,
+                filename=config_filename,
+            )
+        else:
+            config_filepath = output_dir / config_filename
+
+        # ---- Take valid parameters for analyze_videos ----
+        kwargs = {
+            k: v
+            for k, v in analyze_video_params.items()
+            if k in inspect.signature(analyze_videos).parameters
+        }
+
+        # ---- Trigger DLC prediction job ----
+        analyze_videos(
+            config=config_filepath,
+            videos=video_filepaths,
+            shuffle=dlc_model_["shuffle"],
+            trainingsetindex=dlc_model_["trainingsetindex"],
+            destfolder=output_dir,
+            modelprefix=dlc_model_.get("model_prefix", ""),
+            **kwargs,
+        )
+
     def make(self, key):
-        """.populate() method will launch training for each PoseEstimationTask"""
+        """.populate() method will launch pose estimation inference for each PoseEstimationTask"""
         # ID model and directories
         dlc_model_ = (Model & key).fetch1()
         task_mode, output_dir = (PoseEstimationTask & key).fetch1(
@@ -753,13 +1199,6 @@ def make(self, key):
 
         # Trigger PoseEstimation
         if task_mode == "trigger":
-            # Triggering dlc for pose estimation required:
-            # - project_path: full path to the directory containing the trained model
-            # - video_filepaths: full paths to the video files for inference
-            # - analyze_video_params: optional parameters to analyze video
-            project_path = find_full_path(
-                get_dlc_root_data_dir(), dlc_model_["project_path"]
-            )
             video_relpaths = list((VideoRecording.File & key).fetch("file_path"))
             video_filepaths = [
                 find_full_path(get_dlc_root_data_dir(), fp).as_posix()
@@ -769,90 +1208,82 @@ def make(self, key):
                 "pose_estimation_params"
             ) or {}
 
-            # expect a nested dictionary with "analyze_videos" params
-            # if not, assume "pose_estimation_params" as a flat dictionary that include relevant "analyze_videos" params
-            analyze_video_params = (
-                pose_estimation_params.get("analyze_videos") or pose_estimation_params
-            )
-
-            @memoized_result(
-                uniqueness_dict={
-                    **analyze_video_params,
-                    "project_path": dlc_model_["project_path"],
-                    "shuffle": dlc_model_["shuffle"],
-                    "trainingsetindex": dlc_model_["trainingsetindex"],
-                    "video_filepaths": video_relpaths,
-                },
-                output_directory=output_dir,
-            )
-            def do_analyze_videos():
-                engine = dlc_model_.get("engine")
-                if engine is None:
-                    logger.warning(
-                        "DLC engine not specified in config file. Defaulting to TensorFlow."
+            # Check if this is a pretrained model by looking in config_template
+            config_template = dlc_model_.get("config_template", {})
+            pretrained_model_name = config_template.get("_pretrained_model_name")
+            is_pretrained = pretrained_model_name is not None
+
+            # Handle pretrained models differently
+            if is_pretrained:
+                # Ensure the pretrained model exists in lookup - require explicit registration
+                if not PretrainedModel.is_pretrained(pretrained_model_name):
+                    raise ValueError(
+                        f"Pretrained model '{pretrained_model_name}' must be registered "
+                        "in PretrainedModel lookup table before use. "
+                        "Please add it using PretrainedModel.insert1() or PretrainedModel.add()."
                     )
-                    engine = "tensorflow"
-                if engine == "pytorch":
-                    from deeplabcut.pose_estimation_pytorch import analyze_videos
-                elif engine == "tensorflow":
-                    from deeplabcut.pose_estimation_tensorflow import analyze_videos
-                else:
-                    raise ValueError(f"Unknow engine type {engine}")
-
-                # ---- Build and save DLC configuration (yaml) file ----
-                dlc_config = dlc_model_["config_template"]
-                dlc_project_path = Path(project_path)
-                dlc_config["project_path"] = dlc_project_path.as_posix()
-
-                # ---- Special handling for "cropping" ----
-                # `analyze_videos` behavior:
-                #   i) if is None, use the "cropping" from the config file
-                #   ii) if defined, use the specified "cropping" values but not updating the config file
-                # new behavior: if defined as "False", overwrite "cropping" to False in config file
-                cropping = analyze_video_params.get("cropping", None)
-                if cropping is not None:
-                    if cropping:
-                        dlc_config["cropping"] = True
-                        (
-                            dlc_config["x1"],
-                            dlc_config["x2"],
-                            dlc_config["y1"],
-                            dlc_config["y2"],
-                        ) = cropping
-                    else:  # cropping is False
-                        dlc_config["cropping"] = False
-
-                # ---- Write config files ----
-                config_filename = f"dj_dlc_config_{datetime.now(tz=timezone.utc).strftime('%Y%m%d_%H%M%S')}.yaml"
-                # To output dir: Important for loading/parsing output in datajoint
-                _ = dlc_reader.save_yaml(output_dir, dlc_config)
-                # To project dir: Required by DLC to run the analyze_videos
-                if dlc_project_path != output_dir:
-                    config_filepath = dlc_reader.save_yaml(
-                        dlc_project_path,
-                        dlc_config,
-                        filename=config_filename,
+                
+                # Build inference_params from pose_estimation_params
+                # (default_params will be merged inside _do_pretrained_inference)
+                pose_inference_params = (
+                    pose_estimation_params.get("video_inference") or pose_estimation_params
+                )
+
+                @memoized_result(
+                    uniqueness_dict={
+                        **pose_inference_params,
+                        "pretrained_model_name": pretrained_model_name,
+                        "video_filepaths": video_relpaths,
+                    },
+                    output_directory=output_dir,
+                )
+                def _do_pretrained_inference():
+                    PoseEstimation._do_pretrained_inference(
+                        pretrained_model_name=pretrained_model_name,
+                        video_filepaths=video_filepaths,
+                        output_dir=output_dir,
+                        inference_params=pose_inference_params,
                     )
+                
+                _do_pretrained_inference()
+            else:
+                # Original trained model path
+                # Triggering dlc for pose estimation required:
+                # - project_path: full path to the directory containing the trained model
+                # - video_filepaths: full paths to the video files for inference
+                # - analyze_video_params: optional parameters to analyze video
+                project_path = find_full_path(
+                    get_dlc_root_data_dir(), dlc_model_["project_path"]
+                )
 
-                # ---- Take valid parameters for analyze_videos ----
-                kwargs = {
-                    k: v
-                    for k, v in analyze_video_params.items()
-                    if k in inspect.signature(analyze_videos).parameters
-                }
+                # expect a nested dictionary with "analyze_videos" params
+                # if not, assume "pose_estimation_params" as a flat dictionary that include relevant "analyze_videos" params
+                analyze_video_params = (
+                    pose_estimation_params.get("analyze_videos") or pose_estimation_params
+                )
 
-                # ---- Trigger DLC prediction job ----
-                analyze_videos(
-                    config=config_filepath,
-                    videos=video_filepaths,
-                    shuffle=dlc_model_["shuffle"],
-                    trainingsetindex=dlc_model_["trainingsetindex"],
-                    destfolder=output_dir,
-                    modelprefix=dlc_model_["model_prefix"],
-                    **kwargs,
+                @memoized_result(
+                    uniqueness_dict={
+                        **analyze_video_params,
+                        "project_path": dlc_model_["project_path"],
+                        "shuffle": dlc_model_["shuffle"],
+                        "trainingsetindex": dlc_model_["trainingsetindex"],
+                        "video_filepaths": video_relpaths,
+                    },
+                    output_directory=output_dir,
                 )
+                def _do_trained_inference():
+                    dlc_config = dlc_model_["config_template"].copy()
+                    PoseEstimation.do_trained(
+                        project_path=project_path,
+                        video_filepaths=video_filepaths,
+                        output_dir=output_dir,
+                        dlc_config=dlc_config,
+                        dlc_model_=dlc_model_,
+                        analyze_video_params=analyze_video_params,
+                    )
 
-            do_analyze_videos()
+                _do_trained_inference()
 
         dlc_result = dlc_reader.PoseEstimation(output_dir)
         creation_time = datetime.fromtimestamp(dlc_result.creation_time).strftime(

From 5099255b1e630cc42254db2ec2c76018f9ad3bd1 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Wed, 26 Nov 2025 08:29:24 +0100
Subject: [PATCH 02/15] docs

---
 docs/mkdocs.yaml      |   3 +
 docs/src/concepts.md  |   7 +-
 docs/src/docker.md    | 239 +++++++++++++++++++++++++++++
 docs/src/index.md     |   8 +-
 docs/src/testing.md   | 342 ++++++++++++++++++++++++++++++++++++++++++
 docs/src/workflows.md | 333 ++++++++++++++++++++++++++++++++++++++++
 6 files changed, 929 insertions(+), 3 deletions(-)
 create mode 100644 docs/src/docker.md
 create mode 100644 docs/src/testing.md
 create mode 100644 docs/src/workflows.md

diff --git a/docs/mkdocs.yaml b/docs/mkdocs.yaml
index 8c7e7f4..10b8bfe 100644
--- a/docs/mkdocs.yaml
+++ b/docs/mkdocs.yaml
@@ -7,6 +7,7 @@ repo_name: datajoint/element-deeplabcut
 nav:
   - Element DeepLabCut: index.md
   - Concepts: concepts.md
+  - Workflows: workflows.md
   - Tutorials:
       - Overview: tutorials/index.md
       - Data Download: tutorials/00-DataDownload_Optional.ipynb
@@ -17,6 +18,8 @@ nav:
       - Visualization: tutorials/05-Visualization_Optional.ipynb
       - Drop Schemas: tutorials/06-Drop_Optional.ipynb
       - Alternate Dataset: tutorials/09-AlternateDataset.ipynb
+  - Docker: docker.md
+  - Testing: testing.md
   - Citation: citation.md
   - API: api/ # defer to gen-files + literate-nav
   - Changelog: changelog.md
diff --git a/docs/src/concepts.md b/docs/src/concepts.md
index 936091d..53829c6 100644
--- a/docs/src/concepts.md
+++ b/docs/src/concepts.md
@@ -74,13 +74,16 @@ Development of the Element began with an
 by the Mathis team. We further identified common needs across our respective
 partnerships to offer the following features for single-camera 2D models:
 
-- Manage training data and configuration parameters
-- Launch model training
+- Support for both **trained models** (custom models you train) and **pretrained models** (ready-to-use models from the DLC Model Zoo)
+- Manage training data and configuration parameters (for trained models)
+- Launch model training (for trained models)
 - Evaluate models automatically and directly compare models
 - Manage model metadata
 - Launch inference video analysis
 - Capture pose estimation output for each session
 
+See the [Workflows page](./workflows.md) for details on the two workflow modes.
+
 ## Element Architecture
 
 Each node in the following diagram represents the analysis code in the workflow and the
diff --git a/docs/src/docker.md b/docs/src/docker.md
new file mode 100644
index 0000000..90a9a79
--- /dev/null
+++ b/docs/src/docker.md
@@ -0,0 +1,239 @@
+# Docker Setup
+
+Element DeepLabCut provides Docker support for running tests and development in a containerized environment. This is particularly useful for:
+
+- Running functional tests without setting up a local environment
+- Ensuring consistent development environments across different machines
+- CI/CD pipeline integration
+- Quick testing of new features
+
+## Prerequisites
+
+- Docker and Docker Compose installed
+- Test video files in `./test_videos/` directory (optional, for testing)
+
+## Quick Start
+
+### Start Services
+
+Start the database and client containers:
+
+```console
+docker compose up -d
+```
+
+Or use the Makefile:
+
+```console
+make up
+```
+
+This starts:
+- **Database service** (`db`): MySQL 8.0 database with health checks
+- **Client service** (`client`): Development/test container with DeepLabCut pre-installed
+
+### Run Tests
+
+Run the functional test suite. There are two test scripts:
+
+**1. Trained Model Workflow Test** (`test_trained_inference.py`):
+Tests the complete trained model workflow (project creation → training → inference):
+
+```console
+docker compose run --rm client python test_trained_inference.py
+```
+
+Or use the Makefile:
+
+```console
+make test-trained
+```
+
+**2. Pretrained Model Workflow Test** (`test_video_inference.py`):
+Tests pretrained model inference (SuperAnimal models):
+
+```console
+docker compose run --rm client python test_video_inference.py superanimal_quadruped
+```
+
+Or use the Makefile:
+
+```console
+make test-pretrained
+```
+
+See [Testing Guide](./testing.md) for details on both test scripts.
+
+### Interactive Shell
+
+Get an interactive shell in the container:
+
+```console
+docker compose run --rm client bash
+```
+
+Or use the Makefile:
+
+```console
+make shell
+```
+
+## Configuration
+
+### Environment Variables
+
+You can customize the setup using environment variables:
+
+```console
+# Database password
+export DJ_PASS=your_password
+
+# Database port (default: 3306)
+export DB_PORT=3307
+
+# Database prefix (default: test_)
+export DATABASE_PREFIX=test_
+
+# MySQL version (default: 8.0)
+export MYSQL_VER=8.0
+```
+
+Or create a `.env` file in the project root:
+
+```env
+DJ_PASS=datajoint
+DB_PORT=3306
+DATABASE_PREFIX=test_
+MYSQL_VER=8.0
+```
+
+### Database Configuration
+
+The container automatically connects to the `db` service. You can also use an external database by setting:
+
+```console
+export DJ_HOST=your_database_host
+export DJ_USER=your_username
+export DJ_PASS=your_password
+```
+
+The container will look for database configuration in this order:
+
+1. Environment variables (`DJ_HOST`, `DJ_USER`, `DJ_PASS`)
+2. `dj_local_conf.json` file (if mounted)
+3. Default DataJoint configuration
+
+## Volumes
+
+The following directories are mounted as volumes:
+
+- `.` → `/app` - Project directory (includes `./test_videos` at `/app/test_videos`)
+- `./test_videos` → `/app/data` - Test video files (also accessible at `/app/test_videos` from project mount)
+- `./dj_local_conf.json` → `/app/dj_local_conf.json` - Database configuration (read-only)
+
+**Note**: Test scripts automatically detect Docker and use `/app/test_videos` (from project mount).
+
+
+## Usage Examples
+
+See [Testing Guide](./testing.md) for detailed test usage examples. Quick reference:
+
+```console
+# Run trained model test
+make test-trained
+
+# Run pretrained model test  
+make test-pretrained
+
+# Interactive shell
+make shell
+```
+
+### Development Workflow
+
+For development, the project directory is mounted as a volume, so code changes are immediately available. However, if you install new dependencies, you'll need to rebuild:
+
+```console
+docker compose build
+```
+
+## Makefile Commands
+
+The included Makefile provides convenient shortcuts:
+
+| Command | Description |
+|---------|-------------|
+| `make build` | Build Docker image |
+| `make up` | Start services in background |
+| `make down` | Stop and remove containers |
+| `make shell` | Interactive shell in container |
+| `make test-trained` | Run `test_trained_inference.py` |
+| `make test-pretrained` | Run `test_video_inference.py` |
+| `make clean` | Remove containers and volumes |
+
+## Troubleshooting
+
+### Database Connection Issues
+
+If you see database connection errors:
+
+1. Check that the database is healthy:
+
+   ```console
+   docker compose ps
+   ```
+
+2. Verify environment variables:
+
+   ```console
+   docker compose run --rm client env | grep DJ_
+   ```
+
+3. Test database connection manually:
+
+   ```console
+   docker compose run --rm client python -c "import datajoint as dj; dj.config.load('/app/dj_local_conf.json'); print('Connected:', dj.conn())"
+   ```
+
+### Permission Issues
+
+If you encounter permission issues with mounted volumes:
+
+```console
+# Fix permissions for test_videos
+sudo chown -R $USER:$USER test_videos/
+```
+
+### Rebuild After Code Changes
+
+If you modify dependencies or the Dockerfile:
+
+```console
+docker compose build --no-cache
+```
+
+### Clean Up
+
+Remove containers and volumes:
+
+```console
+# Stop and remove containers
+docker compose down
+
+# Remove volumes (WARNING: deletes database data)
+docker compose down -v
+```
+
+## Docker Image Details
+
+- **Base image**: `deeplabcut/deeplabcut:latest-jupyter`
+- **Pre-installed**: DeepLabCut 3.x (PyTorch), Python 3.11, all dependencies
+- **No conda setup needed**: Base image provides the environment
+
+## Next Steps
+
+- See [Workflows](./workflows.md) for trained vs pretrained model modes
+- See [Testing Guide](./testing.md) for details on running functional tests
+- See [Tutorials](./tutorials/) for workflow examples
+- See [Concepts](./concepts.md) for architecture details
+
diff --git a/docs/src/index.md b/docs/src/index.md
index 5732762..bdb6ab4 100644
--- a/docs/src/index.md
+++ b/docs/src/index.md
@@ -12,10 +12,16 @@ Element DeepLabCut runs DeepLabCut which uses image recognition machine learning
 to generate animal position estimates from consumer grade video equipment.  The Element
 is composed of two schemas for storing data and running analysis:
 
-- `train` - Manages model training
+- `train` - Manages model training (for trained models only)
   
 - `model` - Manages models and launches pose estimation
 
+The Element supports two workflow modes:
+
+- **Trained Models**: Custom models you train yourself using your own labeled data
+- **Pretrained Models**: Ready-to-use models from the DLC Model Zoo (e.g., SuperAnimal models)
+
+Visit the [Workflows page](./workflows.md) to learn about both modes and when to use each.
 Visit the [Concepts page](./concepts.md) for more information on pose estimation and
 Element DeepLabCut.  To get started with building your data pipeline visit the
 [Tutorials page](./tutorials/).
diff --git a/docs/src/testing.md b/docs/src/testing.md
new file mode 100644
index 0000000..be44348
--- /dev/null
+++ b/docs/src/testing.md
@@ -0,0 +1,342 @@
+# Testing Guide
+
+Element DeepLabCut includes **functional/integration test scripts** to verify the end-to-end workflow with DeepLabCut 3.x (PyTorch) and DataJoint integration. These tests are designed as **smoke tests** that validate the complete pipeline without requiring heavy computation or real model training.
+
+**Test Type**: These are **functional/integration tests**, not unit tests. They test the entire pipeline end-to-end, including:
+- Database interactions (DataJoint schemas and tables)
+- File system operations (DLC project creation, file I/O)
+- DeepLabCut API calls (project creation, training dataset creation, inference)
+- DataJoint table population (Model, PoseEstimation, etc.)
+- Cross-component integration (how all pieces work together)
+
+While they use mocking to avoid actual model training (which would take hours/days), they still exercise the full workflow and integration between components. This makes them **functional smoke tests** - they verify the pipeline works correctly without heavy computation.
+
+## Unit Tests
+
+You also have **unit tests** in the `tests/` directory that test individual functions in isolation:
+
+- **`tests/test_pretrained_workflow.py`**: Unit tests for pretrained model logic
+  - `test_pretrained_model_registration` - Tests model registration
+  - `test_insert_pretrained_model` - Tests inserting pretrained models
+  - `test_pretrained_vs_trained_detection` - Tests detection logic
+  - `test_pretrained_model_validation` - Tests validation
+  - `test_parameter_merging` - Tests parameter merging
+
+- **`tests/test_pipeline.py`**: Unit tests for trained model logic
+  - `test_generate_pipeline` - Tests schema structure
+  - `test_recording_info` - Tests recording data retrieval
+  - `test_pose_estimation` - Tests pose estimation data
+
+**Run unit tests:**
+```console
+# Run all unit tests
+pytest tests/
+
+# Run only pretrained workflow unit tests
+pytest tests/test_pretrained_workflow.py
+
+# Run only trained workflow unit tests
+pytest tests/test_pipeline.py
+```
+
+**Unit tests vs Functional tests:**
+- **Unit tests** (`tests/`): Fast (< 1 min), no DLC required, test individual functions
+- **Functional tests** (`test_*.py`): Slower, require DLC, test full end-to-end workflows
+
+The tests cover both workflow modes:
+- **Trained Models**: Complete workflow from project creation to trained inference
+- **Pretrained Models**: Quick inference using pre-built models from the DLC Model Zoo
+
+See [Workflows](./workflows.md) for details on the differences between these modes.
+
+## Test Scripts
+
+### `test_trained_inference.py` - Trained Model Workflow
+
+This script tests the **trained model workflow** (see [Workflows](./workflows.md#trained-models-workflow) for details):
+
+1. ✅ Creates or reuses a DLC project
+2. ✅ Generates mock labeled data (no manual labeling required)
+3. ✅ Creates mock training dataset compatible with DLC 3.x
+4. ✅ Runs mocked training (creates fake snapshot files + `pytorch_config.yaml`)
+5. ✅ Inserts model into `element_deeplabcut.model.Model` table
+6. ✅ Runs trained inference with `PoseEstimation` pipeline
+7. ✅ Stores pose results into DataJoint tables
+
+**Usage:**
+
+```console
+# Full workflow: create project, train, infer
+python test_trained_inference.py
+
+# Use existing trained model (skip training)
+python test_trained_inference.py --skip-training
+
+# Only train, don't infer
+python test_trained_inference.py --skip-inference
+
+# Custom model name
+python test_trained_inference.py --model-name my_model
+```
+
+**In Docker:**
+
+```console
+docker compose run --rm client python test_trained_inference.py
+# Or: make test-trained
+```
+
+### `test_video_inference.py` - Pretrained Model Inference
+
+This script tests the **pretrained model workflow** (see [Workflows](./workflows.md#pretrained-models-workflow) for details):
+
+1. ✅ Tests pretrained model inference (SuperAnimal quadruped, topviewmouse, etc.)
+2. ✅ Handles video file discovery and processing
+3. ✅ Database cleanup and model verification
+4. ✅ Docker-aware path handling
+
+**Usage:**
+
+```console
+# Test with SuperAnimal quadruped model
+python test_video_inference.py superanimal_quadruped
+
+# Test with SuperAnimal topviewmouse model
+python test_video_inference.py superanimal_topviewmouse
+```
+
+**In Docker:**
+
+```console
+docker compose run --rm client python test_video_inference.py superanimal_quadruped
+# Or: make test-pretrained
+```
+
+## Test Types Explained
+
+### Functional/Integration Tests (These Scripts)
+
+`test_trained_inference.py` and `test_video_inference.py` are **functional/integration tests**:
+
+- ✅ Test the **entire end-to-end workflow** (project creation → training → inference → database storage)
+- ✅ Test **integration between components** (DataJoint, DeepLabCut, file system)
+- ✅ Use **mocking** to avoid heavy computation (no real training, but real DLC API calls)
+- ✅ Verify **data flow** through the entire pipeline
+- ✅ Suitable for **CI/CD** to catch integration issues
+
+**Why not unit tests?** Unit tests test individual functions in isolation. These tests verify that all components work together correctly, which is integration testing.
+
+### Unit Tests (Separate)
+
+For true unit tests (testing individual functions), see:
+- `tests/test_pretrained_workflow.py` - Unit tests for pretrained model logic
+- `tests/test_pipeline.py` - Unit tests for trained model logic
+
+These unit tests:
+- Test individual functions/methods in isolation
+- Don't require DLC installation
+- Run very fast (< 1 minute)
+- Use mocks extensively to isolate components
+
+## Prerequisites
+
+### Local Setup
+
+1. **Conda Environment** (recommended):
+
+   ```console
+   conda env create -f environment.yml
+   conda activate element-deeplabcut
+   pip install -e .
+   ```
+
+   See [Conda Environment Setup](../CONDA_ENV_SETUP.md) for details.
+
+2. **Database Configuration**:
+
+   Create `dj_local_conf.json` in the project root:
+
+   ```json
+   {
+     "database.host": "localhost",
+     "database.user": "root",
+     "database.password": "your_password",
+     "database.port": 3306,
+     "custom": {
+       "database.prefix": "test_"
+     }
+   }
+   ```
+
+3. **Test Videos** (optional):
+
+   Place test video files in `./test_videos/` directory. Supported formats: `.mp4`, `.avi`, `.mov`
+
+### Docker Setup
+
+See [Docker Setup](./docker.md) for complete Docker installation and configuration.
+
+## Test Features
+
+### Mock Training
+
+The tests use **mocked training** to avoid heavy computation:
+
+- Creates fake snapshot files: `snapshot-1000.index`, `.meta`, `.data-00000-of-00001`, `.pth`
+- Generates minimal valid `pytorch_config.yaml` with required keys
+- Converts `dlc-models` paths to `dlc-models-pytorch` for PyTorch
+- Sets `snapshotindex = 0` and `engine = "pytorch"` in config
+
+**No real training occurs** - this is a functional test to verify the workflow.
+
+### Mock Inference
+
+The tests use **mocked inference** to avoid GPU requirements:
+
+- Patches `get_scorer_name` to return dummy strings
+- Patches `get_model_snapshots` to create mock snapshots if missing
+- Patches `load_state_dict` to use `strict=False` for mock state dicts
+- Lenient pickle validation for mock models
+
+**Results are not accurate** (mock model weights), but the workflow is validated.
+
+### Database Cleanup
+
+Both test scripts include comprehensive database cleanup at the start:
+
+- Deletes `PoseEstimation` and `PoseEstimationTask` entries
+- Removes test models (names starting with `test_`)
+- Removes `ModelTraining` entries
+- Ensures test repeatability
+
+### Docker-Aware Path Handling
+
+The test scripts automatically detect Docker environment and adjust paths:
+
+- **Docker**: Uses `/app/test_videos` (from project mount)
+- **Local**: Uses `./test_videos`
+- Can be overridden with `DLC_ROOT_DATA_DIR` environment variable
+
+## Running Tests
+
+### Local Execution
+
+```console
+# Activate conda environment
+conda activate element-deeplabcut
+
+# Run trained model test
+python test_trained_inference.py
+
+# Run pretrained model test
+python test_video_inference.py superanimal_quadruped
+```
+
+### Docker Execution
+
+```console
+# Start services
+docker compose up -d
+
+# Run tests
+docker compose run --rm client python test_trained_inference.py
+docker compose run --rm client python test_video_inference.py superanimal_quadruped
+
+# Or use Makefile
+make test-trained
+make test-pretrained
+```
+
+## Test Output
+
+The test scripts provide detailed status output:
+
+```
+============================================================
+Testing Trained Model Workflow (Training + Inference)
+============================================================
+
+[1/12] ✓ Checking database connection
+   ✓ Database connection successful
+
+[2/12] ✓ Cleaning up database (removing test data from previous runs)
+   🗑️ Deleted 5 PoseEstimation entry/entries
+   🗑️ Deleted 3 PoseEstimationTask entry/entries
+   ✅ Total: 8 entry/entries cleaned
+
+[3/12] ✓ Finding video files
+   📹 Found 2 video file(s)
+   ...
+
+[12/12] ✓ Running inference
+   ✅ Inference completed!
+```
+
+## Troubleshooting
+
+### Database Connection Errors
+
+**Error**: `pymysql.err.OperationalError: (1045, "Access denied")`
+
+**Solution**: Check your `dj_local_conf.json` password matches your database password. For Docker, use `datajoint` (default).
+
+### No Video Files Found
+
+**Error**: `No video files found in ./test_videos`
+
+**Solution**:
+- Ensure video files are in `./test_videos/` directory
+- Check file formats (supported: `.mp4`, `.avi`, `.mov`)
+- In Docker, videos are automatically available at `/app/test_videos` (from project mount)
+
+### DLC 3.x Compatibility Issues
+
+The tests include workarounds for known DLC 3.x issues:
+
+- **Labeled data format**: Fixed DataFrame index to be string paths
+- **Snapshot discovery**: Mocks `get_model_snapshots` to always find/create snapshots
+- **State dict loading**: Uses `strict=False` for mock state dicts
+- **Metadata validation**: Lenient handling of pickle metadata mismatches
+
+If you encounter other issues, check the test script comments for additional workarounds.
+
+### Task Length Errors
+
+**Error**: `pymysql.err.DataError: (1406, "Data too long for column 'task'")`
+
+**Solution**: The test scripts automatically truncate task names to 32 characters. If you see this error, check that truncation is happening early in the script.
+
+## CI/CD Integration
+
+These tests are suitable for CI/CD pipelines:
+
+- **Fast execution**: No real training or GPU required
+- **Deterministic**: Mocked components ensure consistent results
+- **Isolated**: Database cleanup ensures clean state
+- **Docker-ready**: Can run in containerized environments
+
+**Example GitHub Actions workflow:**
+
+```yaml
+name: Test
+
+on: [push, pull_request]
+
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v3
+      - name: Start services
+        run: docker compose up -d
+      - name: Run tests
+        run: docker compose run --rm client python test_trained_inference.py
+```
+
+## Next Steps
+
+- See [Docker Setup](./docker.md) for Docker configuration
+- See [Tutorials](./tutorials/) for workflow examples
+- See [Concepts](./concepts.md) for architecture details
+- See [Environment Setup](../tests/ENVIRONMENT_SETUP.md) for detailed setup instructions
+
diff --git a/docs/src/workflows.md b/docs/src/workflows.md
new file mode 100644
index 0000000..90870f1
--- /dev/null
+++ b/docs/src/workflows.md
@@ -0,0 +1,333 @@
+# Workflow Modes
+
+Element DeepLabCut supports two distinct workflow modes for pose estimation:
+
+1. **Trained Models**: Models you train yourself using your own labeled data
+2. **Pretrained Models**: Pre-built models from the DLC Model Zoo (e.g., SuperAnimal models)
+
+This guide explains when to use each mode, how they differ, and how to implement them.
+
+## Trained Models Workflow
+
+### Overview
+
+Trained models are custom models that you create by:
+
+1. Creating a DeepLabCut project
+2. Labeling training data (manually or programmatically)
+3. Training the model on your labeled data
+4. Using the trained model for inference
+
+This workflow gives you maximum control and customization but requires more setup and time.
+
+### When to Use Trained Models
+
+Use trained models when:
+
+- ✅ You need high accuracy for a specific experimental setup
+- ✅ Your videos have unique characteristics (lighting, camera angle, species, etc.)
+- ✅ You want to track specific body parts not covered by pretrained models
+- ✅ You have time and resources for data labeling and training
+- ✅ You need to fine-tune a model for your specific use case
+
+### Workflow Steps
+
+#### 1. Create DLC Project
+
+Create a DeepLabCut project with your video data:
+
+```python
+import deeplabcut
+
+# Create a new project
+config_path = deeplabcut.create_new_project(
+    "MyProject",
+    "experimenter",
+    videos=["path/to/video1.mp4", "path/to/video2.mp4"],
+    working_directory="./dlc_projects",
+    copy_videos=True,
+)
+```
+
+#### 2. Label Training Data
+
+Label frames in your videos to create training data:
+
+```python
+# Extract frames for labeling
+deeplabcut.extract_frames(config_path, mode='automatic', algo='kmeans', numframes2pick=20)
+
+# Label frames (opens GUI)
+deeplabcut.label_frames(config_path)
+
+# Or use programmatic labeling (see test_trained_inference.py for examples)
+```
+
+#### 3. Create Training Dataset
+
+Generate the training dataset from labeled data:
+
+```python
+deeplabcut.create_training_dataset(config_path)
+```
+
+#### 4. Train Model
+
+Train the model (or mock training for testing):
+
+```python
+# Real training (requires GPU, takes hours/days)
+deeplabcut.train_network(config_path)
+
+# Or use element-deeplabcut's ModelTraining table
+from element_deeplabcut import train
+
+# Insert training task
+train.TrainingTask.insert1({
+    "paramset_idx": 1,
+    "video_set_id": 1,
+})
+
+# Populate to start training
+train.ModelTraining.populate()
+```
+
+#### 5. Insert Model into Database
+
+Once training is complete, insert the model:
+
+```python
+from element_deeplabcut import model
+import deeplabcut
+
+# Load config
+dlc_config = deeplabcut.auxiliaryfunctions.read_config(config_path)
+
+# Insert model
+model.Model.insert_new_model(
+    model_name="my_trained_model",
+    dlc_config=dlc_config,
+    shuffle=1,
+    trainingsetindex=0,
+    model_description="Model trained on my experimental setup",
+)
+```
+
+#### 6. Run Inference
+
+Use the trained model for pose estimation:
+
+```python
+# Create pose estimation task
+model.PoseEstimationTask.insert1({
+    "recording_id": 1,
+    "model_name": "my_trained_model",
+    "task_mode": None,  # Fresh run
+})
+
+# Populate to run inference
+model.PoseEstimation.populate()
+```
+
+### Key Characteristics
+
+- **Project Path**: Required - points to your DLC project directory
+- **Training Data**: Required - labeled frames in your project
+- **Model Snapshots**: Required - trained model weights (`.pth` files for PyTorch)
+- **Config File**: Required - `config.yaml` from your DLC project
+- **Training Time**: Hours to days (depending on dataset size and hardware)
+- **Accuracy**: High for your specific setup
+- **Flexibility**: Full control over body parts, training parameters, etc.
+
+### Database Tables Used
+
+- `train.VideoSet`: Training video sets
+- `train.TrainingParamSet`: Training parameters
+- `train.TrainingTask`: Training tasks
+- `train.ModelTraining`: Training execution records
+- `model.Model`: Model metadata (with `project_path` and training info)
+- `model.PoseEstimationTask`: Inference tasks
+- `model.PoseEstimation`: Inference results
+
+## Pretrained Models Workflow
+
+### Overview
+
+Pretrained models are ready-to-use models from the DeepLabCut Model Zoo (e.g., SuperAnimal models) that can be used directly without any training. These models are trained on large, diverse datasets and work well for many common experimental setups.
+
+### When to Use Pretrained Models
+
+Use pretrained models when:
+
+- ✅ You want to get started quickly without training
+- ✅ Your experimental setup matches common scenarios (e.g., top-view mouse, quadruped animals)
+- ✅ You don't have time/resources for data labeling and training
+- ✅ You want to test pose estimation before committing to training
+- ✅ Your videos are similar to the pretrained model's training data
+
+### Available Pretrained Models
+
+Common pretrained models include:
+
+- **`superanimal_quadruped`**: For quadruped animals (mice, rats, etc.)
+- **`superanimal_topviewmouse`**: For top-view mouse pose estimation
+- **Other SuperAnimal models**: Various species and camera angles
+
+See the [DLC Model Zoo](http://www.mackenziemathislab.org/dlc-modelzoo) for the full list.
+
+### Workflow Steps
+
+#### 1. Register Pretrained Model
+
+First, register the pretrained model in the database:
+
+```python
+from element_deeplabcut import model
+
+# Populate common pretrained models
+model.PretrainedModel.populate_common_models()
+
+# Or add a custom pretrained model
+model.PretrainedModel.add(
+    pretrained_model_name="superanimal_quadruped",
+    source="SuperAnimal",
+    version="1.0",
+    species="quadruped",
+    backbone_model_name="hrnet_w32",
+    detector_name="fasterrcnn_resnet50_fpn_v2",
+    default_params={
+        "video_adapt": False,
+        "scale": 0.4,
+        "batchsize": 8,
+    },
+    description="SuperAnimal model for quadruped animals",
+)
+```
+
+#### 2. Insert Model into Database
+
+Insert the pretrained model as a usable model:
+
+```python
+model.Model.insert_pretrained_model(
+    model_name="my_pretrained_model",
+    pretrained_model_name="superanimal_quadruped",
+    model_description="Using SuperAnimal quadruped model",
+)
+```
+
+#### 3. Run Inference
+
+Use the pretrained model for pose estimation:
+
+```python
+# Create pose estimation task
+model.PoseEstimationTask.insert1({
+    "recording_id": 1,
+    "model_name": "my_pretrained_model",
+    "task_mode": None,  # Fresh run
+})
+
+# Populate to run inference
+model.PoseEstimation.populate()
+```
+
+### Key Characteristics
+
+- **Project Path**: Not required - pretrained models don't use DLC projects
+- **Training Data**: Not required - model is already trained
+- **Model Snapshots**: Not required - weights are downloaded automatically by DLC
+- **Config File**: Minimal - only inference parameters needed
+- **Training Time**: Zero - model is ready to use
+- **Accuracy**: Good for common scenarios, may need fine-tuning for specific setups
+- **Flexibility**: Limited to predefined body parts and configurations
+
+### Database Tables Used
+
+- `model.PretrainedModel`: Lookup table of available pretrained models
+- `model.Model`: Model metadata (with `project_path=""` and `_pretrained_model_name`)
+- `model.PoseEstimationTask`: Inference tasks
+- `model.PoseEstimation`: Inference results
+
+**Note**: The `train` schema is **not used** for pretrained models.
+
+## Comparison Table
+
+| Feature | Trained Models | Pretrained Models |
+|---------|---------------|-------------------|
+| **Setup Time** | Days to weeks | Minutes |
+| **Training Required** | Yes (hours to days) | No |
+| **Data Labeling** | Required | Not required |
+| **DLC Project** | Required | Not required |
+| **Project Path** | Required in database | Empty string |
+| **Model Snapshots** | Required (`.pth` files) | Downloaded automatically |
+| **Accuracy** | High (for your setup) | Good (for common setups) |
+| **Customization** | Full control | Limited to model's design |
+| **Body Parts** | You define them | Model defines them |
+| **Best For** | Specific experimental setups | Quick testing, common scenarios |
+| **Database Tables** | `train` + `model` schemas | `model` schema only |
+
+## Choosing the Right Mode
+
+### Start with Pretrained Models
+
+If you're new to pose estimation or want to test quickly:
+
+1. Try a pretrained model that matches your setup
+2. Run inference on a few test videos
+3. Evaluate the results
+4. If results are good enough → continue with pretrained models
+5. If results need improvement → consider training a custom model
+
+### Use Trained Models When
+
+- Pretrained models don't match your experimental setup
+- You need specific body parts not in pretrained models
+- You need higher accuracy for your specific videos
+- You have time and resources for training
+
+### Hybrid Approach
+
+You can use both modes in the same pipeline:
+
+- Use pretrained models for initial exploration and quick results
+- Train custom models for production use with higher accuracy
+- Compare results from both approaches
+
+## Code Examples
+
+### Complete Trained Model Workflow
+
+See `test_trained_inference.py` for a complete example of the trained model workflow, including:
+
+- Project creation
+- Mock labeled data generation
+- Training dataset creation
+- Model training (mocked for testing)
+- Model insertion
+- Inference execution
+
+### Complete Pretrained Model Workflow
+
+See `test_video_inference.py` for a complete example of the pretrained model workflow, including:
+
+- Pretrained model registration
+- Model insertion
+- Inference execution
+
+## Testing
+
+Both workflow modes have dedicated test scripts:
+
+- **Trained models**: `test_trained_inference.py`
+- **Pretrained models**: `test_video_inference.py`
+
+See the [Testing Guide](./testing.md) for details on running these tests.
+
+## Next Steps
+
+- See [Tutorials](./tutorials/) for step-by-step examples
+- See [Concepts](./concepts.md) for architecture details
+- See [Docker Setup](./docker.md) for containerized development
+- See [Testing Guide](./testing.md) for functional tests
+

From 855e259b8cb5034b95f6c34d64b5bce898b26b72 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Wed, 26 Nov 2025 08:29:57 +0100
Subject: [PATCH 03/15] final models support version

---
 element_deeplabcut/model.py              |  712 ++++++++++++--
 element_deeplabcut/readers/dlc_reader.py |  505 ++++++++--
 element_deeplabcut/train.py              | 1097 +++++++++++++++-------
 3 files changed, 1802 insertions(+), 512 deletions(-)

diff --git a/element_deeplabcut/model.py b/element_deeplabcut/model.py
index e35d174..843cdf5 100644
--- a/element_deeplabcut/model.py
+++ b/element_deeplabcut/model.py
@@ -85,12 +85,18 @@ def get_dlc_root_data_dir() -> list:
     string or list of strings for possible root data directories.
     """
     root_directories = _linking_module.get_dlc_root_data_dir()
+    
+    # Handle None case
+    if root_directories is None:
+        return []
+    
     if isinstance(root_directories, (str, Path)):
         root_directories = [root_directories]
 
     if (
         hasattr(_linking_module, "get_dlc_processed_data_dir")
-        and get_dlc_processed_data_dir() not in root_directories
+        and _linking_module.get_dlc_processed_data_dir() is not None
+        and _linking_module.get_dlc_processed_data_dir() not in root_directories
     ):
         root_directories.append(_linking_module.get_dlc_processed_data_dir())
 
@@ -195,8 +201,18 @@ def make(self, key):
                 int(cap.get(cv2.CAP_PROP_FPS)),
             )
             if px_height is not None:
-                assert (px_height, px_width, fps) == info
-            px_height, px_width, fps = info
+                # Allow different dimensions, but warn if they differ
+                if (px_height, px_width, fps) != info:
+                    logger.warning(
+                        f"Video files in recording have different properties. "
+                        f"First video: {px_width}x{px_height} @ {fps} fps, "
+                        f"Current video ({Path(file_path).name}): {info[1]}x{info[0]} @ {info[2]} fps. "
+                        f"Using first video's properties for metadata."
+                    )
+                # Use first video's properties, but still count frames from all videos
+            else:
+                # First video - set as reference
+                px_height, px_width, fps = info
             nframes += int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
             cap.release()
 
@@ -251,8 +267,8 @@ def extract_new_body_parts(cls, dlc_config: dict, verbose: bool = True):
         tracked_body_parts = cls.fetch("body_part")
         new_body_parts = np.setdiff1d(dlc_config["bodyparts"], tracked_body_parts)
         if verbose:  # Added to silence duplicate prompt during `insert_new_model`
-            print(f"Existing body parts: {tracked_body_parts}")
-            print(f"New body parts: {new_body_parts}")
+            logger.info(f"Existing body parts: {tracked_body_parts}")
+            logger.info(f"New body parts: {new_body_parts}")
         return new_body_parts
 
     @classmethod
@@ -275,7 +291,7 @@ def insert_from_config(
                     "Descriptions list does not match "
                     + " the number of new_body_parts"
                 )
-                print(f"New descriptions: {descriptions}")
+                logger.info(f"New descriptions: {descriptions}")
             if descriptions is None:
                 descriptions = ["" for x in range(len(new_body_parts))]
 
@@ -286,7 +302,7 @@ def insert_from_config(
                 )
                 != "yes"
             ):
-                print("Canceled insert.")
+                logger.info("Canceled insert.")
                 return
             cls.insert(
                 [
@@ -351,17 +367,17 @@ def add(
         weights_path: str = "",
         default_params: dict = None,
         description: str = "",
-        auto_insert: bool = False,
     ):
-        """Add a pretrained model to the lookup table.
+        """Register a pretrained model in the lookup table.
         
-        If the model doesn't exist and auto_insert is True, it will be added
-        with the provided parameters. If auto_insert is False and the model
-        doesn't exist, raises a ValueError.
+        This is a convenience method that inserts a pretrained model if it doesn't
+        already exist. For Lookup tables, models should be explicitly registered
+        with proper configuration.
         
         Args:
             pretrained_model_name: Name of the pretrained model (e.g., "superanimal_quadruped").
-            source: Optional. Source of the pretrained model.
+            source: Source of the pretrained model (e.g., "SuperAnimal", "DLC Model Zoo").
+                Recommended for proper model identification.
             version: Optional. Version of the pretrained model.
             species: Optional. Species this model was trained on.
             backbone_model_name: Optional. Backbone model name (e.g., "hrnet_w32").
@@ -370,32 +386,23 @@ def add(
             default_params: Optional. Default inference parameters (dict-like, e.g.,
                 {"video_adapt": False, "scale": 0.4, "batchsize": 8}).
             description: Optional. Description of the pretrained model.
-            auto_insert: If True, automatically insert if missing. If False, raise error.
-                Default False to force explicit registration.
             
         Returns:
-            bool: True if model exists (or was inserted). This is a success flag only.
+            bool: True if model exists or was successfully inserted.
             
         Raises:
-            ValueError: If model doesn't exist and auto_insert=False.
+            ValueError: If model doesn't exist and essential information is missing.
         """
         if cls.is_pretrained(pretrained_model_name):
             return True
         
-        if not auto_insert:
+        # Validate that essential information is provided
+        # At minimum, should have source or default_params for meaningful registration
+        if not source and not default_params and not weights_path:
             raise ValueError(
-                f"Pretrained model '{pretrained_model_name}' not found in "
-                "PretrainedModel lookup table. Use auto_insert=True to add it automatically, "
-                "or register it explicitly using PretrainedModel.insert1()."
-            )
-        
-        # Auto-insert with provided parameters
-        # Warn if auto-creating without meaningful configuration
-        if not weights_path and not default_params:
-            logger.warning(
-                f"Auto-inserting pretrained model '{pretrained_model_name}' without "
-                "weights_path or default_params. Consider registering explicitly with "
-                "proper configuration."
+                f"Cannot register pretrained model '{pretrained_model_name}' without "
+                "essential information. Please provide at least one of: "
+                "source, default_params, or weights_path."
             )
         
         cls.insert1(
@@ -414,6 +421,94 @@ def add(
         )
         return True
 
+    @classmethod
+    def populate_common_models(cls, models: list = None):
+        """Populate the lookup table with common pretrained models.
+        
+        This method registers well-known pretrained models (e.g., SuperAnimal models)
+        with their default configurations. Models are only inserted if they don't
+        already exist in the table.
+        
+        Args:
+            models: Optional. List of model names to populate. If None, populates all
+                common models. Valid options: "superanimal_quadruped", "superanimal_topviewmouse".
+                
+        Returns:
+            dict: Summary of registration results with keys 'inserted', 'skipped', 'failed'.
+        """
+        # Define common models with their configurations
+        # Only include models that are valid SuperAnimal identifiers in DeepLabCut
+        common_models = {
+            "superanimal_quadruped": {
+                "pretrained_model_name": "superanimal_quadruped",
+                "source": "SuperAnimal",
+                "version": "1.0",
+                "species": "quadruped",
+                "backbone_model_name": "hrnet_w32",
+                "detector_name": "fasterrcnn_resnet50_fpn_v2",
+                "default_params": {
+                    "video_adapt": False,
+                    "scale": 0.4,
+                    "batchsize": 8,
+                },
+                "description": "SuperAnimal model for quadruped animals (mice, rats, etc.)",
+            },
+            "superanimal_topviewmouse": {
+                "pretrained_model_name": "superanimal_topviewmouse",
+                "source": "SuperAnimal",
+                "version": "1.0",
+                "species": "mouse",
+                "backbone_model_name": "hrnet_w32",
+                "detector_name": "fasterrcnn_resnet50_fpn_v2",
+                "default_params": {
+                    "video_adapt": False,
+                    "scale": 0.4,
+                    "batchsize": 8,
+                },
+                "description": "SuperAnimal model for top-view mouse pose estimation",
+            },
+        }
+        
+        # Determine which models to populate
+        if models is None:
+            models_to_populate = list(common_models.keys())
+        else:
+            models_to_populate = models if isinstance(models, list) else [models]
+        
+        # Validate model names
+        invalid_models = [m for m in models_to_populate if m not in common_models]
+        if invalid_models:
+            raise ValueError(
+                f"Unknown model names: {invalid_models}. "
+                f"Valid options: {list(common_models.keys())}"
+            )
+        
+        # Register models
+        results = {"inserted": [], "skipped": [], "failed": []}
+        
+        for model_name in models_to_populate:
+            model_config = common_models[model_name]
+            
+            try:
+                if cls.is_pretrained(model_name):
+                    results["skipped"].append(model_name)
+                    logger.info(f"Model '{model_name}' already exists, skipping.")
+                else:
+                    cls.insert1(model_config, skip_duplicates=True)
+                    results["inserted"].append(model_name)
+                    logger.info(f"Registered pretrained model: '{model_name}'")
+            except Exception as e:
+                results["failed"].append((model_name, str(e)))
+                logger.error(f"Failed to register '{model_name}': {e}")
+        
+        # Log summary
+        logger.info(
+            f"Populate summary: {len(results['inserted'])} inserted, "
+            f"{len(results['skipped'])} skipped, {len(results['failed'])} failed"
+        )
+        
+        return results
+
 
 @schema
 class Model(dj.Manual):
@@ -496,7 +591,7 @@ def insert_new_model(
             model_description (str): Optional. Description of this model.
             model_prefix (str): Optional. Filename prefix used across DLC project
             paramset_idx (int): Optional. Index from the TrainingParamSet table
-            prompt (bool): Optional. Prompt the user with all info before inserting.
+            prompt (bool): Optional, default True. Prompt the user with all info before inserting.
             params (dict): Optional. If dlc_config is path, dict of override items
         """
         # handle dlc_config being a yaml file
@@ -580,20 +675,20 @@ def insert_new_model(
 
         # -- prompt for confirmation --
         if prompt:
-            print("--- DLC Model specification to be inserted ---")
+            logger.info("--- DLC Model specification to be inserted ---")
             for k, v in model_dict.items():
                 if k != "config_template":
-                    print("\t{}: {}".format(k, v))
+                    logger.info("\t{}: {}".format(k, v))
                 else:
-                    print("\t-- Template/Contents of config.yaml --")
+                    logger.info("\t-- Template/Contents of config.yaml --")
                     for k, v in model_dict["config_template"].items():
-                        print("\t\t{}: {}".format(k, v))
+                        logger.info("\t\t{}: {}".format(k, v))
 
         if (
             prompt
             and dj.utils.user_choice("Proceed with new DLC model insert?") != "yes"
         ):
-            print("Canceled insert.")
+            logger.info("Canceled insert.")
             return
 
         def _do_insert():
@@ -632,7 +727,7 @@ def insert_pretrained_model(
             pretrained_model_name (str): Name from PretrainedModel lookup table.
             model_description (str): Optional. Description of this model.
             model_prefix (str): Optional. Filename prefix used across DLC project.
-            prompt (bool): Optional. Prompt the user with all info before inserting.
+            prompt (bool): Optional, default True. Prompt the user with all info before inserting.
             config_overrides (dict): Optional. Dict of config items to override defaults.
         """
         # Check if pretrained model exists in lookup - return if not found
@@ -656,18 +751,27 @@ def insert_pretrained_model(
         
         # Set required fields for pretrained models
         # For pretrained models, we use placeholder values for training-related fields
-        dlc_config.setdefault("Task", f"pretrained_{pretrained_model_name}")
+        # Include model_name in task to ensure uniqueness across different model instances
+        # This prevents duplicate key errors when inserting multiple instances of the same pretrained model
+        # Task field is varchar(32), so we need to keep it short
+        # Use a hash or shortened version of model_name to ensure uniqueness while staying within limit
+        import hashlib
+        model_name_hash = hashlib.md5(model_name.encode()).hexdigest()[:8]  # First 8 chars of hash
+        task_value = f"pt_{pretrained_model_name[:10]}_{model_name_hash}"  # Keep under 32 chars
+        # Ensure it's exactly 32 chars or less
+        task_value = task_value[:32]
+        dlc_config.setdefault("Task", task_value)
         dlc_config.setdefault("date", "pretrained")
         dlc_config.setdefault("iteration", 0)
         dlc_config.setdefault("snapshotindex", -1)
         dlc_config.setdefault("TrainingFraction", [1.0])  # Placeholder
         
-        engine = dlc_config.get("engine", "tensorflow")
+        engine = dlc_config.get("engine", "pytorch")
         if engine is None:
             logger.warning(
-                "DLC engine not specified. Defaulting to TensorFlow."
+                "DLC engine not specified. Defaulting to PyTorch."
             )
-            engine = "tensorflow"
+            engine = "pytorch"
 
         # For pretrained models, scorer is based on the pretrained model name
         scorer = f"{pretrained_model_name}_pretrained"
@@ -699,20 +803,20 @@ def insert_pretrained_model(
 
         # -- prompt for confirmation --
         if prompt:
-            print("--- Pretrained DLC Model specification to be inserted ---")
+            logger.info("--- Pretrained DLC Model specification to be inserted ---")
             for k, v in model_dict.items():
                 if k != "config_template":
-                    print("\t{}: {}".format(k, v))
+                    logger.info("\t{}: {}".format(k, v))
                 else:
-                    print("\t-- Template/Contents of config.yaml --")
+                    logger.info("\t-- Template/Contents of config.yaml --")
                     for k, v in model_dict["config_template"].items():
-                        print("\t\t{}: {}".format(k, v))
+                        logger.info("\t\t{}: {}".format(k, v))
 
         if (
             prompt
             and dj.utils.user_choice("Proceed with pretrained DLC model insert?") != "yes"
         ):
-            print("Canceled insert.")
+            logger.info("Canceled insert.")
             return
 
         def _do_insert():
@@ -847,11 +951,34 @@ def infer_output_dir(cls, key: dict, relative: bool = False, mkdir: bool = False
             relative (bool): Report directory relative to get_dlc_processed_data_dir().
             mkdir (bool): Default False. Make directory if it doesn't exist.
         """
+        root_dirs = get_dlc_root_data_dir()
+        if not root_dirs:
+            raise ValueError(
+                "DLC_ROOT_DATA_DIR is not configured. "
+                "Please set DLC_ROOT_DATA_DIR environment variable or configure it in dj_local_conf.json"
+            )
+        
         video_filepath = find_full_path(
-            get_dlc_root_data_dir(),
+            root_dirs,
             (VideoRecording.File & key).fetch("file_path", limit=1)[0],
         )
-        root_dir = find_root_directory(get_dlc_root_data_dir(), video_filepath.parent)
+        
+        # Ensure video_filepath is an absolute Path
+        video_filepath = Path(video_filepath).resolve()
+        
+        # Handle case where video is directly in root directory
+        video_parent = video_filepath.parent
+        root_dir = None
+        # Check if parent is one of the root directories
+        for root in root_dirs:
+            root_path = Path(root).resolve()
+            if video_parent == root_path:
+                root_dir = root_path
+                break
+        
+        # If not found, use find_root_directory (for nested paths)
+        if root_dir is None:
+            root_dir = Path(find_root_directory(root_dirs, video_filepath.parent)).resolve()
         recording_key = VideoRecording & key
         device = "-".join(
             str(v)
@@ -896,20 +1023,78 @@ def generate(
                 videotype, gputouse, save_as_csv, batchsize, cropping, TFGPUinference,
                 dynamic, robust_nframes, allow_growth, use_shelve
         """
-        processed_dir = get_dlc_processed_data_dir()
         output_dir = cls.infer_output_dir(
             {**video_recording_key, "model_name": model_name},
             relative=False,
             mkdir=True,
         )
+        
+        # Get processed_dir for relative path calculation
+        processed_dir = get_dlc_processed_data_dir()
+        if processed_dir is None or processed_dir == "":
+            # If no processed_dir, use root_dir (same logic as infer_output_dir)
+            root_dirs = get_dlc_root_data_dir()
+            if not root_dirs:
+                raise ValueError(
+                    "DLC_ROOT_DATA_DIR is not configured. "
+                    "Please set DLC_ROOT_DATA_DIR environment variable or configure it in dj_local_conf.json"
+                )
+            video_filepath = find_full_path(
+                root_dirs,
+                (VideoRecording.File & {**video_recording_key}).fetch("file_path", limit=1)[0],
+            )
+            video_filepath = Path(video_filepath).resolve()
+            video_parent = video_filepath.parent
+            processed_dir = None
+            for root in root_dirs:
+                root_path = Path(root).resolve()
+                if video_parent == root_path:
+                    processed_dir = root_path
+                    break
+            if processed_dir is None:
+                root_dir_result = find_root_directory(root_dirs, video_filepath.parent)
+                if root_dir_result is None:
+                    raise ValueError(
+                        f"Could not determine root directory for video file: {video_filepath}"
+                    )
+                processed_dir = Path(root_dir_result).resolve()
+        else:
+            processed_dir = Path(processed_dir)
+        
+        # Ensure processed_dir is not None before using it
+        if processed_dir is None:
+            raise ValueError(
+                "Could not determine processed data directory. "
+                "Please configure DLC_PROCESSED_DATA_DIR or ensure DLC_ROOT_DATA_DIR is set correctly."
+        )
 
         if task_mode is None:
-            try:
-                _ = dlc_reader.PoseEstimation(output_dir)
-            except FileNotFoundError:
-                task_mode = "trigger"
-            else:
-                task_mode = "load"
+            # Check if results exist by looking for result files directly (more reliable)
+            output_path = Path(output_dir)
+            results_exist = False
+            if output_path.exists():
+                # Check for result files (H5, pickle, or JSON)
+                h5_files = list(output_path.glob("*.h5"))
+                pickle_files = list(output_path.glob("*.pickle"))
+                json_files = list(output_path.glob("*.json"))
+                if h5_files or pickle_files or json_files:
+                    results_exist = True
+                    logger.info(
+                        f"Found existing results in {output_dir}: "
+                        f"{len(h5_files)} H5, {len(pickle_files)} pickle, {len(json_files)} JSON files"
+                    )
+            
+            # Also try the reader as a fallback
+            if not results_exist:
+                try:
+                    _ = dlc_reader.PoseEstimation(output_dir)
+                    results_exist = True
+                    logger.info(f"Found existing results via dlc_reader in {output_dir}")
+                except (FileNotFoundError, Exception) as e:
+                    logger.debug(f"No results found via dlc_reader in {output_dir}: {e}")
+            
+            task_mode = "load" if results_exist else "trigger"
+            logger.info(f"Auto-detected task_mode='{task_mode}' for {video_recording_key} (output_dir: {output_dir})")
 
         cls.insert1(
             {
@@ -920,7 +1105,8 @@ def generate(
                 "pose_estimation_output_dir": output_dir.relative_to(
                     processed_dir
                 ).as_posix(),
-            }
+            },
+            skip_duplicates=True,
         )
 
     insert_estimation_task = generate
@@ -941,6 +1127,23 @@ class PoseEstimation(dj.Computed):
     pose_estimation_time: datetime  # time of generation of this set of DLC results
     """
 
+    class Individual(dj.Part):
+        """Individuals/animals tracked in this pose estimation.
+        
+        For single-animal data, this table will be empty.
+        For multi-animal data, each individual is tracked separately.
+        
+        Attributes:
+            PoseEstimation (foreign key): Pose Estimation key.
+            individual_id (varchar): Individual/animal identifier (e.g., 'animal0', 'animal1').
+        """
+        
+        definition = """
+        -> master
+        ---
+        individual_id : varchar(32)  # Individual/animal identifier (e.g., 'animal0', 'animal1')
+    """
+
     class BodyPartPosition(dj.Part):
         """Position of individual body parts by frame index
 
@@ -963,6 +1166,26 @@ class BodyPartPosition(dj.Part):
         z_pos=null  : longblob
         likelihood  : longblob
         """
+    
+    class IndividualMapping(dj.Part):
+        """Maps body part positions to individuals for multi-animal tracking.
+        
+        For single-animal data, this table will be empty.
+        For multi-animal data, links BodyPartPosition entries to individuals.
+        Note: In multi-animal data, each individual has separate position data,
+        so we encode the individual in a unique identifier.
+        
+        Attributes:
+            PoseEstimation (foreign key): Pose Estimation key.
+            body_part (varchar): Body part name (from BodyPartPosition, via Model.BodyPart).
+            individual_id (varchar): Individual identifier (must match Individual.individual_id).
+        """
+        
+        definition = """
+        -> master
+        body_part: varchar(32)  # Body part name (must match BodyPartPosition.body_part)
+        individual_id: varchar(32)  # Individual identifier (must match Individual.individual_id)
+        """
 
     @classmethod
     def _do_pretrained_inference(
@@ -1001,14 +1224,11 @@ def _do_pretrained_inference(
             )
 
         default_params = pm.get("default_params") or {}
-        # Merge: explicit inference_params override defaults
         merged_params = {**default_params, **(inference_params or {})}
 
-        # Get optional fields if they exist in the table
         backbone_model_name = pm.get("backbone_model_name") or None
         detector_name = pm.get("detector_name") or None
 
-        # Ensure output_dir exists and is a string for DLC
         output_dir = Path(output_dir)
         output_dir.mkdir(parents=True, exist_ok=True)
         destfolder_str = str(output_dir)
@@ -1017,30 +1237,68 @@ def _do_pretrained_inference(
         if hasattr(deeplabcut, "video_inference_superanimal"):
             inference_func = deeplabcut.video_inference_superanimal
             sig = inspect.signature(inference_func)
+            param_names = list(sig.parameters.keys())
 
-            # Base kwargs from merged_params, filtered by supported args
             kwargs = {
                 k: v
                 for k, v in merged_params.items()
                 if k in sig.parameters
             }
 
-            # Map known optional fields if accepted by the function
-            if "model_name" in sig.parameters and backbone_model_name:
-                kwargs.setdefault("model_name", backbone_model_name)
-            if "detector_name" in sig.parameters and detector_name:
-                kwargs.setdefault("detector_name", detector_name)
-            if "destfolder" in sig.parameters:
+            # Set dest_folder (note: DLC 3.x uses dest_folder, not destfolder)
+            if "dest_folder" in sig.parameters:
+                kwargs.setdefault("dest_folder", destfolder_str)
+            elif "destfolder" in sig.parameters:
                 kwargs.setdefault("destfolder", destfolder_str)
 
-            # Call: video_inference_superanimal(video_list, superanimal_name, **kwargs)
-            return inference_func(
+            # DLC 3.x signature: video_inference_superanimal(videos, superanimal_name, model_name, ...)
+            # model_name is required, so we need to provide it
+            if not backbone_model_name:
+                # If no backbone_model_name in metadata, use a default or raise error
+                logger.warning(
+                    f"No backbone_model_name found for pretrained model '{pretrained_model_name}'. "
+                    "Using default 'superanimal' model name."
+                )
+                backbone_model_name = "superanimal"
+
+            # Set detector_name if available
+            if detector_name and "detector_name" in sig.parameters:
+                kwargs.setdefault("detector_name", detector_name)
+
+            logger.info(
+                f"Running video_inference_superanimal with "
+                f"superanimal_name={pretrained_model_name}, "
+                f"model_name={backbone_model_name}, "
+                f"{len(video_filepaths)} videos, "
+                f"dest_folder={destfolder_str}, "
+                f"kwargs={kwargs}"
+            )
+            
+            # Verify output directory exists and is unique
+            if not Path(destfolder_str).exists():
+                logger.warning(f"Output directory does not exist, creating: {destfolder_str}")
+                Path(destfolder_str).mkdir(parents=True, exist_ok=True)
+            logger.info(f"Output will be saved to: {destfolder_str}")
+
+            # Call with correct signature: videos, superanimal_name, model_name, **kwargs
+            result = inference_func(
                 video_filepaths,
-                pretrained_model_name,
+                pretrained_model_name,  # superanimal_name (positional, required)
+                backbone_model_name,    # model_name (positional, required)
                 **kwargs,
             )
 
-        # --- Fallback: generic video_inference API, if present ---
+            # Verify files were saved to the correct location
+            output_path = Path(destfolder_str)
+            if output_path.exists():
+                saved_files = list(output_path.glob("*.h5")) + list(output_path.glob("*.pickle"))
+                logger.info(f"Saved {len(saved_files)} result file(s) to {destfolder_str}")
+            else:
+                logger.warning(f"Output directory {destfolder_str} does not exist after inference!")
+            
+            return result
+
+        # --- Fallback: our own generic video_inference API, if present ---
         if hasattr(deeplabcut, "video_inference"):
             inference_func = deeplabcut.video_inference
             sig = inspect.signature(inference_func)
@@ -1051,7 +1309,6 @@ def _do_pretrained_inference(
                 if k in sig.parameters
             }
 
-            # Try to inject known fields if supported
             if "model_name" in sig.parameters and backbone_model_name:
                 kwargs.setdefault("model_name", backbone_model_name)
             if "detector_name" in sig.parameters and detector_name:
@@ -1059,17 +1316,19 @@ def _do_pretrained_inference(
             if "destfolder" in sig.parameters:
                 kwargs.setdefault("destfolder", destfolder_str)
 
-            # Some versions may expect (videos, model_name, ...) or similar;
-            # we always pass video_filepaths as first arg and rely on kwargs for the rest.
+            logger.info(
+                f"Running video_inference (fallback) with pretrained_model_name={pretrained_model_name}, "
+                f"{len(video_filepaths)} videos, kwargs={kwargs}"
+            )
+
             return inference_func(
                 video_filepaths,
                 **kwargs,
             )
 
-        # --- No compatible API found ---
         raise NotImplementedError(
             "No compatible pretrained inference function found in the installed DeepLabCut. "
-            "Expected `video_inference_superanimal` or `video_inference`."
+            "Expected `video_inference_superanimal` or a compatible `video_inference` wrapper."
         )
 
     @classmethod
@@ -1197,13 +1456,22 @@ def make(self, key):
             else:
                 raise e
 
-        # Trigger PoseEstimation
+        # Trigger PoseEstimation only if in "trigger" mode
+        # If results already exist, task_mode should be "load" to avoid re-running inference
         if task_mode == "trigger":
+            # Log the key being used to debug video grouping
+            logger.info(f"PoseEstimation.make() called with key: {key}")
+            logger.info(f"Output directory: {output_dir}")
+            
+            # Get videos for THIS specific recording only
             video_relpaths = list((VideoRecording.File & key).fetch("file_path"))
+            logger.info(f"Found {len(video_relpaths)} video file(s) for key {key}: {video_relpaths}")
+            
             video_filepaths = [
                 find_full_path(get_dlc_root_data_dir(), fp).as_posix()
                 for fp in video_relpaths
             ]
+            logger.info(f"Resolved video filepaths: {video_filepaths}")
             pose_estimation_params = (PoseEstimationTask & key).fetch1(
                 "pose_estimation_params"
             ) or {}
@@ -1290,21 +1558,299 @@ def _do_trained_inference():
             "%Y-%m-%d %H:%M:%S"
         )
 
-        body_parts = [
-            {
+        # Handle different data structures (DLC 2.x vs 3.x, single vs multi-animal)
+        body_parts = []
+        
+        # Check if this is multi-animal format (keys like 'animal0', 'animal1', etc.)
+        # Single-animal format: keys are body part names (e.g., 'nose', 'tail')
+        # Multi-animal format: keys contain 'animal' or 'individual' (e.g., 'animal0_nose', 'animal0_superanimal_...')
+        data_keys = list(dlc_result.data.keys()) if dlc_result.data else []
+        is_multi_animal = any(k.startswith('animal') or k.startswith('individual') for k in data_keys)
+        
+        if is_multi_animal:
+            # Multi-animal format: each key is an animal, and each animal has body parts
+            logger.info(
+                f"Multi-animal format detected (keys: {data_keys[:5]}...). "
+                "Extracting body parts from all animals."
+            )
+            
+            # Helper function to extract base individual name (e.g., "animal0" from "animal0_superanimal_...")
+            def extract_individual_id(full_key: str) -> str:
+                """Extract base individual ID from full key name.
+                
+                Examples:
+                    "animal0_superanimal_..." -> "animal0"
+                    "animal1_model_name" -> "animal1"
+                    "individual0" -> "individual0"
+                """
+                # Try to match pattern: animal<number> or individual<number>
+                import re
+                match = re.match(r'^(animal\d+|individual\d+)', full_key)
+                if match:
+                    return match.group(1)
+                # Fallback: return first part before underscore
+                return full_key.split('_')[0] if '_' in full_key else full_key
+            
+            # The structure from reformat_rawdata() should be: "individual_bodypart" -> {x, y, likelihood}
+            # But if body parts extraction failed, keys might be just individual names
+            # Check if keys already contain body parts (format: "individual_bodypart")
+            # or if they're just individual names that need to be processed differently
+            
+            # First, check if keys already have x/y data directly (format: "individual_bodypart")
+            keys_with_xy = [k for k in data_keys if isinstance(dlc_result.data.get(k), dict) 
+                           and "x" in dlc_result.data[k] and "y" in dlc_result.data[k]]
+            
+            if keys_with_xy:
+                # Keys are already in "individual_bodypart" format with x/y data
+                logger.info(f"Found {len(keys_with_xy)} keys with direct x/y data. Processing as 'individual_bodypart' format.")
+                for full_key in keys_with_xy:
+                    key_data = dlc_result.data[full_key]
+                    if isinstance(key_data, dict) and "x" in key_data and "y" in key_data:
+                        # Extract individual and body part from key
+                        # Format: "animal0_superanimal_..._bodypart" or "animal0_bodypart"
+                        individual_id = extract_individual_id(full_key)
+                        # Try to extract body part name (usually the last meaningful part)
+                        # Remove the individual prefix and scorer/model suffix
+                        parts = full_key.split('_')
+                        # Find body part name (usually a short word at the end, not a model/scorer term)
+                        # Common body part names and model terms to exclude
+                        model_terms = {'superanimal', 'hrnet', 'fasterrcnn', 'resnet', 'fpn', 'v2', 'w32', 'w48', 'w64', 
+                                      'resnet50', 'resnet101', 'mobilenet', 'efficientnet', 'densenet', 'inception'}
+                        # Common body part names to prioritize (if found, use them)
+                        common_body_parts = {'nose', 'head', 'eye', 'ear', 'neck', 'shoulder', 'elbow', 'wrist', 'hand', 
+                                           'hip', 'knee', 'ankle', 'foot', 'toe', 'tail', 'back', 'belly', 'chest'}
+                        body_part_name = None
+                        
+                        # First, check if any part matches common body part names
+                        for part in reversed(parts):
+                            if part.lower() in common_body_parts:
+                                body_part_name = part.lower()
+                                break
+                        
+                        # If no common body part found, look for any non-model term
+                        if not body_part_name:
+                            for part in reversed(parts):
+                                if (part != individual_id and len(part) > 2 and 
+                                    part.lower() not in model_terms and 
+                                    not part.isdigit() and
+                                    not part.lower().startswith('animal') and
+                                    not part.lower().startswith('individual')):
+                                    body_part_name = part.lower()
+                                    break
+                        
+                        if body_part_name:
+                            encoded_body_part = f"{individual_id}_{body_part_name}"
+                            body_parts.append({
                 **key,
-                "body_part": k,
+                                "body_part": encoded_body_part,
+                                "frame_index": np.arange(dlc_result.nframes),
+                                "x_pos": key_data["x"],
+                                "y_pos": key_data["y"],
+                                "z_pos": key_data.get("z"),
+                                "likelihood": key_data.get("likelihood", np.ones(dlc_result.nframes)),
+                                "_individual_id": individual_id,
+                                "_clean_body_part": body_part_name,
+                            })
+                        else:
+                            logger.warning(f"Could not extract body part name from key '{full_key}'. Using key as body part name.")
+                            # Fallback: use a sanitized version of the key
+                            body_part_name = full_key.replace(f"{individual_id}_", "").replace("_", " ").title().replace(" ", "")
+                            encoded_body_part = f"{individual_id}_{body_part_name}"
+                            body_parts.append({
+                                **key,
+                                "body_part": encoded_body_part,
+                                "frame_index": np.arange(dlc_result.nframes),
+                                "x_pos": key_data["x"],
+                                "y_pos": key_data["y"],
+                                "z_pos": key_data.get("z"),
+                                "likelihood": key_data.get("likelihood", np.ones(dlc_result.nframes)),
+                                "_individual_id": individual_id,
+                                "_clean_body_part": body_part_name,
+                            })
+            else:
+                # Keys are just individual names, need to look for nested structure
+                logger.info(f"Keys appear to be individual names only. Checking for nested body part structure...")
+                for animal_key_full in data_keys:
+                    animal_data = dlc_result.data[animal_key_full]
+                    individual_id = extract_individual_id(animal_key_full)
+                    
+                    if isinstance(animal_data, dict):
+                        # Check if this dict contains body parts directly
+                        animal_dict_keys = list(animal_data.keys())
+                        logger.debug(f"Individual '{individual_id}' (key: '{animal_key_full}') has {len(animal_dict_keys)} sub-key(s): {animal_dict_keys[:10]}")
+                        
+                        for sub_key, sub_data in animal_data.items():
+                            if isinstance(sub_data, dict) and "x" in sub_data and "y" in sub_data:
+                                # sub_key is the body part name
+                                body_part_name = sub_key
+                                encoded_body_part = f"{individual_id}_{body_part_name}"
+                                body_parts.append({
+                                    **key,
+                                    "body_part": encoded_body_part,
+                                    "frame_index": np.arange(dlc_result.nframes),
+                                    "x_pos": sub_data["x"],
+                                    "y_pos": sub_data["y"],
+                                    "z_pos": sub_data.get("z"),
+                                    "likelihood": sub_data.get("likelihood", np.ones(dlc_result.nframes)),
+                                    "_individual_id": individual_id,
+                                    "_clean_body_part": body_part_name,
+                                })
+                            elif isinstance(sub_data, dict):
+                                # Nested further - sub_data might contain body parts
+                                logger.debug(f"Sub-key '{sub_key}' is a dict but doesn't have x/y. Keys: {list(sub_data.keys())[:5]}")
+                    else:
+                        logger.debug(f"Key '{animal_key_full}' data is not a dict (type: {type(animal_data)})")
+        else:
+            # Single-animal format: keys are body parts
+            for k, v in dlc_result.data.items():
+                # Check if v is a dict with expected keys
+                if isinstance(v, dict):
+                    # DLC 2.x format: dict with 'x', 'y', 'likelihood' keys
+                    if "x" in v and "y" in v:
+                        body_parts.append({
+                            **key,
+                            "body_part": k,  # Single-animal format
+                            # No individual_id - will be NULL (single-animal)
                 "frame_index": np.arange(dlc_result.nframes),
                 "x_pos": v["x"],
                 "y_pos": v["y"],
                 "z_pos": v.get("z"),
-                "likelihood": v["likelihood"],
-            }
-            for k, v in dlc_result.data.items()
-        ]
+                            "likelihood": v.get("likelihood", np.ones(dlc_result.nframes)),  # Default to 1.0 if missing
+                        })
+                    else:
+                        logger.warning(
+                            f"Body part '{k}' data structure unexpected. Keys: {list(v.keys())}. "
+                            "Skipping this body part."
+                        )
+                else:
+                    logger.warning(
+                        f"Body part '{k}' data is not a dict (type: {type(v)}). Skipping."
+                    )
+        
+        if len(body_parts) == 0:
+            # Instead of raising an error, log a warning and skip this recording
+            logger.error(
+                f"No valid body part data found in results for key {key}. "
+                f"Data structure: {data_keys}. "
+                f"First item structure: {type(list(dlc_result.data.values())[0]) if dlc_result.data else 'N/A'}. "
+                "Skipping this recording and continuing with next."
+            )
+            # Return early without inserting - this will skip this key
+            return
+
+        # Extract unique body part names, clean names, and individuals from the results
+        unique_body_parts_encoded = set()  # Encoded names like "animal0_nose"
+        unique_body_parts_clean = set()  # Clean names like "nose"
+        unique_individuals = set()
+        individual_mappings = []  # Store mappings for IndividualMapping table
+        
+        for bp in body_parts:
+            encoded_name = bp["body_part"]
+            unique_body_parts_encoded.add(encoded_name)
+            
+            # Extract individual and clean body part name
+            individual_id = bp.pop("_individual_id", None)
+            clean_body_part = bp.pop("_clean_body_part", None)
+            
+            if individual_id:
+                unique_individuals.add(individual_id)
+                if clean_body_part:
+                    unique_body_parts_clean.add(clean_body_part)
+                    # Store mapping for IndividualMapping table
+                    individual_mappings.append({
+                        **key,
+                        "body_part": encoded_name,  # The encoded name in BodyPartPosition
+                        "individual_id": individual_id
+                    })
+            else:
+                # Single-animal: encoded name is the clean name
+                unique_body_parts_clean.add(encoded_name)
+        
+        # Register body part names in global BodyPart table
+        # For multi-animal: register both clean names (e.g., "nose") and encoded names (e.g., "animal0_nose")
+        # For single-animal: register clean names only (encoded = clean)
+        model_name = key["model_name"]
+        
+        # Register clean body part names
+        for clean_body_part in unique_body_parts_clean:
+            if not (BodyPart & {"body_part": clean_body_part}):
+                BodyPart.insert1(
+                    {"body_part": clean_body_part, "body_part_description": ""},
+                    skip_duplicates=True
+                )
+                logger.info(f"Registered new body part: {clean_body_part}")
+        
+        # Register encoded body part names (for multi-animal support)
+        # These are different from clean names and need to be registered separately
+        for encoded_body_part in unique_body_parts_encoded:
+            # Only register if it's different from clean names (multi-animal case)
+            if encoded_body_part not in unique_body_parts_clean:
+                if not (BodyPart & {"body_part": encoded_body_part}):
+                    BodyPart.insert1(
+                        {"body_part": encoded_body_part, "body_part_description": ""},
+                        skip_duplicates=True
+                    )
+                    logger.debug(f"Registered encoded body part: {encoded_body_part}")
+        
+        # Link body parts to model in Model.BodyPart
+        # Use encoded names for multi-animal, clean names for single-animal
+        for encoded_body_part in unique_body_parts_encoded:
+            if not (Model.BodyPart & {"model_name": model_name, "body_part": encoded_body_part}):
+                Model.BodyPart.insert1(
+                    {"model_name": model_name, "body_part": encoded_body_part},
+                    skip_duplicates=True
+                )
+                logger.debug(f"Linked body part {encoded_body_part} to model {model_name}")
 
+        # Insert master row FIRST (required before inserting into Part tables)
         self.insert1({**key, "pose_estimation_time": creation_time})
+        
+        # Now insert into Part tables (they require the master row to exist)
         self.BodyPartPosition.insert(body_parts)
+        
+        # Register individuals (for multi-animal data) - must be after master row is inserted
+        if unique_individuals:
+            individuals_to_insert = [
+                {**key, "individual_id": ind_id}
+                for ind_id in unique_individuals
+            ]
+            self.Individual.insert(individuals_to_insert, skip_duplicates=True)
+            logger.info(f"Registered {len(unique_individuals)} individual(s): {sorted(unique_individuals)}")
+        
+        # Insert individual mappings if this is multi-animal data
+        if individual_mappings:
+            for mapping in individual_mappings:
+                # IndividualMapping needs: master key (PoseEstimation) + body_part + Individual key
+                # PoseEstimation key: subject, session_datetime, recording_id, model_name
+                # body_part: from BodyPartPosition (via Model.BodyPart)
+                # Individual key: subject, session_datetime, recording_id, model_name, individual_id
+                mapping_key = {
+                    **key,  # subject, session_datetime, recording_id, model_name (from master)
+                    "body_part": mapping["body_part"],  # from BodyPartPosition
+                    "individual_id": mapping["individual_id"]  # from Individual
+                }
+                
+                # Verify both BodyPartPosition and Individual exist
+                bp_key = {**key, "body_part": mapping["body_part"]}
+                ind_key = {**key, "individual_id": mapping["individual_id"]}
+                
+                bp_exists = bool(self.BodyPartPosition & bp_key)
+                ind_exists = bool(self.Individual & ind_key)
+                
+                if bp_exists and ind_exists:
+                    try:
+                        self.IndividualMapping.insert1(
+                            mapping_key,
+                            skip_duplicates=True
+                        )
+                        logger.debug(f"Created mapping: {mapping_key}")
+                    except Exception as e:
+                        logger.warning(f"Could not insert mapping for {mapping_key}: {e}")
+                else:
+                    logger.debug(
+                        f"Could not create mapping: bp_key={bp_key} (exists: {bp_exists}), "
+                        f"ind_key={ind_key} (exists: {ind_exists})"
+                    )
 
     @classmethod
     def get_trajectory(cls, key: dict, body_parts: list = "all") -> pd.DataFrame:
diff --git a/element_deeplabcut/readers/dlc_reader.py b/element_deeplabcut/readers/dlc_reader.py
index 7eaff22..f50c01e 100644
--- a/element_deeplabcut/readers/dlc_reader.py
+++ b/element_deeplabcut/readers/dlc_reader.py
@@ -33,14 +33,47 @@ def __init__(
                 raise FileNotFoundError(f"Unable to find {dlc_dir}")
 
         # meta file: pkl - info about this DLC run (input video, configuration, etc.)
+        # DLC 2.x uses *meta.pickle, DLC 3.x uses *_results.pickle or UUID-prefixed .pickle files
         if pkl_path is None:
+            # Try DLC 2.x format first
             self.pkl_paths = sorted(
                 self.dlc_dir.rglob(f"{filename_prefix}*meta.pickle")
             )
+            # If not found, try DLC 3.x formats
             if not len(self.pkl_paths) > 0:
-                raise FileNotFoundError(
-                    f"No meta file (.pickle) found in: {self.dlc_dir}"
+                # Try *_results.pickle pattern
+                self.pkl_paths = sorted(
+                    self.dlc_dir.rglob(f"{filename_prefix}*_results.pickle")
                 )
+            if not len(self.pkl_paths) > 0:
+                # Try any .pickle file (DLC 3.x may use UUID prefixes)
+                all_pickle = sorted(self.dlc_dir.rglob(f"{filename_prefix}*.pickle"))
+                # Filter out non-meta files (prefer files with 'meta' or 'results' in name)
+                meta_pickle = [p for p in all_pickle if 'meta' in p.name.lower() or 'results' in p.name.lower()]
+                if meta_pickle:
+                    self.pkl_paths = meta_pickle
+                elif all_pickle:
+                    # Fallback: use any pickle file if no meta/results found
+                    self.pkl_paths = all_pickle
+            
+            # Check if we have H5 files - if so, pickle is optional (DLC 3.x may not create it)
+            h5_files_exist = len(list(self.dlc_dir.glob(f"{filename_prefix}*.h5"))) > 0
+            
+            if not len(self.pkl_paths) > 0:
+                if h5_files_exist:
+                    # H5 files exist but no pickle - this is OK for DLC 3.x pretrained models
+                    logger.warning(
+                        f"No meta file (.pickle) found in: {self.dlc_dir}, "
+                        "but H5 files are present. This is common for DLC 3.x pretrained models. "
+                        "Will extract metadata from H5 files."
+                    )
+                    self.pkl_paths = []  # Empty list - we'll handle this in the pkl property
+                else:
+                    # No pickle AND no H5 files - this is an error
+                    raise FileNotFoundError(
+                        f"No meta file (.pickle) or H5 files found in: {self.dlc_dir}. "
+                        f"Looked for: *meta.pickle, *_results.pickle, *.pickle, and *.h5"
+                    )
         else:
             pkl_path = Path(pkl_path)
             if not pkl_path.exists():
@@ -61,54 +94,111 @@ def __init__(
             self.h5_paths = [h5_path]
 
         # validate number of files
-        assert len(self.h5_paths) == len(
-            self.pkl_paths
-        ), f"Unequal number of .h5 files ({len(self.h5_paths)}) and .pickle files ({len(self.pkl_paths)})"
+        # DLC 3.x might have different number of pickle vs h5 files (pickle might be empty/placeholder)
+        # So we allow mismatch but warn
+        if len(self.h5_paths) != len(self.pkl_paths):
+            logger.warning(
+                f"Unequal number of .h5 files ({len(self.h5_paths)}) and .pickle files ({len(self.pkl_paths)}). "
+                "This is common with DLC 3.x. Will extract metadata from H5 files if needed."
+            )
 
-        assert (
-            self.pkl_paths[0].stem == self.h5_paths[0].stem + "_meta"
-        ), f"Mismatching h5 ({self.h5_paths[0].stem}) and pickle {self.pkl_paths[0].stem}"
+        # DLC 2.x: pickle stem should match h5 stem + "_meta"
+        # DLC 3.x: naming might be different, so we make this check more lenient
+        if len(self.pkl_paths) > 0 and len(self.h5_paths) > 0:
+            h5_stem = self.h5_paths[0].stem
+            pkl_stem = self.pkl_paths[0].stem
+            # Check if they match DLC 2.x pattern or if it's DLC 3.x (different naming)
+            if not (pkl_stem == h5_stem + "_meta" or pkl_stem.endswith("_results") or "_" in pkl_stem):
+                logger.warning(
+                    f"Pickle file name ({pkl_stem}) doesn't match expected pattern for H5 file ({h5_stem}). "
+                    "This might be DLC 3.x format with different naming convention."
+                )
 
         # config file: yaml - configuration for invoking the DLC post estimation step
+        # Note: DLC 3.x pretrained models may not create a YAML file in the output directory
         if yml_path is None:
             yml_paths = list(self.dlc_dir.glob(f"{filename_prefix}*.y*ml"))
             # If multiple, defer to the one we save.
             if len(yml_paths) > 1:
                 yml_paths = [val for val in yml_paths if val.stem == "dj_dlc_config"]
-            if len(yml_paths) != 1:
+            if len(yml_paths) == 0:
+                # No YAML file found - this is common for DLC 3.x pretrained models
+                # We can still read the results from H5/pickle files
+                logger.warning(
+                    f"No YAML file found in {self.dlc_dir}. "
+                    "This is common for DLC 3.x pretrained model outputs. "
+                    "Will proceed without config file."
+                )
+                self.yml_path = None
+            elif len(yml_paths) == 1:
+                self.yml_path = yml_paths[0]
+            else:
                 raise FileNotFoundError(
-                    f"Unable to find one unique .yaml file in: {dlc_dir} - Found: {len(yml_paths)}"
+                    f"Unable to find one unique .yaml file in: {self.dlc_dir} - Found: {len(yml_paths)}"
                 )
-            self.yml_path = yml_paths[0]
         else:
             self.yml_path = Path(yml_path)
             if not self.yml_path.exists():
-                raise FileNotFoundError(f"{self.yml_path} not found")
+                logger.warning(f"YAML path specified but not found: {self.yml_path}. Proceeding without it.")
+                self.yml_path = None
 
         self._pkl = None
         self._rawdata = None
         self._yml = None
         self._data = None
 
-        train_idx = np.where(
-            (np.array(self.yml["TrainingFraction"]) * 100).astype(int)
-            == int(self.pkl["training set fraction"] * 100)
-        )[0][0]
-        train_iter = int(self.pkl["Scorer"].split("_")[-1])
-
-        self.model = {
-            "Scorer": self.pkl["Scorer"],
-            "Task": self.yml["Task"],
-            "date": self.yml["date"],
-            "iteration": self.pkl["iteration (active-learning)"],
-            "shuffle": int(re.search(r"shuffle(\d+)", self.pkl["Scorer"]).groups()[0]),
-            "snapshotindex": self.yml["snapshotindex"],
-            "trainingsetindex": train_idx,
-            "training_iteration": train_iter,
-        }
-
-        self.fps = self.pkl["fps"]
-        self.nframes = self.pkl["nframes"]
+        # Handle case where YAML is missing (common for DLC 3.x pretrained models)
+        if not self.yml or len(self.yml) == 0:
+            # For pretrained models, we may not have all the metadata
+            # Use defaults or extract from pickle/H5 files
+            logger.warning("YAML config is empty - using defaults for pretrained model metadata")
+            
+            # Try to extract what we can from pickle
+            scorer = self.pkl.get("Scorer", "unknown")
+            try:
+                shuffle_match = re.search(r"shuffle(\d+)", scorer)
+                shuffle = int(shuffle_match.groups()[0]) if shuffle_match else 0
+            except (AttributeError, IndexError):
+                shuffle = 0
+            
+            try:
+                train_iter = int(scorer.split("_")[-1])
+            except (ValueError, IndexError):
+                train_iter = 0
+            
+            self.model = {
+                "Scorer": scorer,
+                "Task": self.pkl.get("Task", "pretrained"),
+                "date": self.pkl.get("date", "unknown"),
+                "iteration": self.pkl.get("iteration (active-learning)", 0),
+                "shuffle": shuffle,
+                "snapshotindex": -1,  # Default for pretrained models
+                "trainingsetindex": 0,  # Default for pretrained models
+                "training_iteration": train_iter,
+            }
+        else:
+            # Original logic for trained models with YAML
+            train_idx = np.where(
+                (np.array(self.yml["TrainingFraction"]) * 100).astype(int)
+                == int(self.pkl["training set fraction"] * 100)
+            )[0][0]
+            train_iter = int(self.pkl["Scorer"].split("_")[-1])
+
+            self.model = {
+                "Scorer": self.pkl["Scorer"],
+                "Task": self.yml["Task"],
+                "date": self.yml["date"],
+                "iteration": self.pkl["iteration (active-learning)"],
+                "shuffle": int(re.search(r"shuffle(\d+)", self.pkl["Scorer"]).groups()[0]),
+                "snapshotindex": self.yml["snapshotindex"],
+                "trainingsetindex": train_idx,
+                "training_iteration": train_iter,
+            }
+
+        # Get fps and nframes from pickle if available, otherwise from H5
+        pkl_data = self.pkl  # This will extract from H5 if pickle is missing
+        self.fps = pkl_data.get("fps", 30)  # Default to 30 fps if not found
+        self.nframes = pkl_data.get("nframes", len(self.rawdata) if hasattr(self, 'rawdata') else 0)
         self.creation_time = self.h5_paths[0].stat().st_mtime
 
     @property
@@ -117,24 +207,88 @@ def pkl(self):
         if self._pkl is None:
             nframes = 0
             meta_hash = None
+            valid_meta = None
+            
             for fp in self.pkl_paths:
-                with open(fp, "rb") as f:
-                    meta = pickle.load(f)
-                nframes += meta["data"].pop("nframes")
-
-                # remove variable fields
-                for k in ("start", "stop", "run_duration"):
-                    meta["data"].pop(k)
-
-                # confirm identical setting in all .pickle files
-                if meta_hash is None:
-                    meta_hash = dict_to_uuid(meta)
-                else:
-                    assert meta_hash == dict_to_uuid(
-                        meta
-                    ), f"Inconsistent DLC-model-config file used: {fp}"
-
-            self._pkl = meta["data"]
+                try:
+                    # Check if file is too small (likely empty or placeholder)
+                    if fp.stat().st_size < 100:  # Less than 100 bytes
+                        logger.warning(
+                            f"Pickle file {fp} is very small ({fp.stat().st_size} bytes), "
+                            "may be empty or placeholder. Trying to extract metadata from H5 files."
+                        )
+                        continue
+                    
+                    with open(fp, "rb") as f:
+                        meta = pickle.load(f)
+                    
+                    # DLC 2.x format: meta["data"] contains the actual metadata
+                    # DLC 3.x might have different structure
+                    if isinstance(meta, dict) and "data" in meta:
+                        meta_data = meta["data"]
+                        nframes += meta_data.pop("nframes", 0)
+                        
+                        # remove variable fields
+                        for k in ("start", "stop", "run_duration"):
+                            meta_data.pop(k, None)
+                        
+                        # confirm identical setting in all .pickle files
+                        if meta_hash is None:
+                            meta_hash = dict_to_uuid(meta)
+                            valid_meta = meta_data
+                        else:
+                            assert meta_hash == dict_to_uuid(
+                                meta
+                            ), f"Inconsistent DLC-model-config file used: {fp}"
+                    else:
+                        # DLC 3.x might have different structure
+                        logger.warning(f"Unexpected pickle structure in {fp}, trying to extract from H5")
+                        continue
+                        
+                except (EOFError, pickle.UnpicklingError, KeyError) as e:
+                    logger.warning(
+                        f"Could not read pickle file {fp}: {e}. "
+                        "Trying to extract metadata from H5 files."
+                    )
+                    continue
+            
+            # If no valid pickle metadata found, try to extract from H5 files
+            if valid_meta is None:
+                logger.warning(
+                    "No valid pickle metadata found. Extracting metadata from H5 files."
+                )
+                # Extract nframes from H5 files
+                nframes = sum(len(pd.read_hdf(fp)) for fp in self.h5_paths)
+                
+                # Create minimal metadata structure
+                # Try to get fps from yml config if available
+                try:
+                    fps = self.yml.get("fps", 30)
+                except (AttributeError, NameError):
+                    # yml not initialized yet, use default
+                    fps = 30
+                
+                # Try to extract scorer/model info from H5 file structure or filename
+                scorer = "DLC_3.x"
+                if self.h5_paths:
+                    # Try to extract from filename
+                    h5_name = self.h5_paths[0].stem
+                    # DLC 3.x filenames often contain model info
+                    if "superanimal" in h5_name:
+                        scorer = f"DLC_superanimal_{h5_name.split('superanimal')[1].split('_')[0]}"
+                
+                valid_meta = {
+                    "nframes": nframes,
+                    "fps": fps,
+                    "Scorer": scorer,
+                    "iteration (active-learning)": 0,
+                    "training set fraction": 1.0,
+                }
+                logger.info(
+                    f"Created minimal metadata: nframes={nframes}, fps={fps}, scorer={scorer}"
+                )
+            
+            self._pkl = valid_meta
             self._pkl["nframes"] = nframes
         return self._pkl
 
@@ -142,9 +296,15 @@ def pkl(self):
     def yml(self):
         """json-structured config.yaml file contents"""
         if self._yml is None:
-            with open(self.yml_path, "rb") as f:
-                yaml = YAML(typ="safe", pure=True)
-                self._yml = yaml.load(f)
+            if self.yml_path is None:
+                # No YAML file available (common for DLC 3.x pretrained models)
+                # Return an empty dict as fallback
+                logger.warning("No YAML file available, returning empty config dict")
+                self._yml = {}
+            else:
+                with open(self.yml_path, "rb") as f:
+                    yaml = YAML(typ="safe", pure=True)
+                    self._yml = yaml.load(f)
         return self._yml
 
     @property
@@ -174,18 +334,210 @@ def body_parts(self):
 
     def reformat_rawdata(self):
         """Transform raw h5 data into dict"""
-        error_message = (
-            f"Total frames from .h5 file ({len(self.rawdata)}) differs "
-            + f'from .pickle ({self.pkl["nframes"]})'
-        )
-        assert len(self.rawdata) == self.pkl["nframes"], error_message
+        # For DLC 3.x, nframes might not be in pickle, so use len(rawdata) as fallback
+        expected_nframes = self.pkl.get("nframes", len(self.rawdata))
+        if len(self.rawdata) != expected_nframes:
+            logger.warning(
+                f"Total frames from .h5 file ({len(self.rawdata)}) differs "
+                f'from .pickle ({expected_nframes}). Using H5 file count.'
+            )
 
         body_parts_position = {}
-        for body_part in self.body_parts:
-            body_parts_position[body_part] = {
-                c: self.df.get(body_part).get(c).values
-                for c in self.df.get(body_part).columns
-            }
+        
+        # Check if this is DLC 2.x format (MultiIndex columns) or DLC 3.x format
+        if isinstance(self.rawdata.columns, pd.MultiIndex):
+            # Check the number of levels in the MultiIndex
+            n_levels = self.rawdata.columns.nlevels
+            
+            if n_levels == 4:
+                # DLC 3.x multi-animal format: (scorer, individuals, bodyparts, coords)
+                # Structure: scorer -> individuals (animal0, animal1, ...) -> bodyparts -> coords (x, y, likelihood)
+                logger.info("Detected DLC 3.x multi-animal format (4-level MultiIndex)")
+                
+                # Get the scorer (first level)
+                scorer = self.rawdata.columns.levels[0][0]
+                
+                # Get all individuals (second level)
+                individuals = self.rawdata.columns.levels[1]
+                logger.debug(f"Found {len(individuals)} individual(s): {list(individuals)[:5]}")
+                
+                # For each individual, extract body parts
+                for individual in individuals:
+                    # Get data for this individual
+                    try:
+                        individual_data = self.rawdata.xs(individual, level=1, axis=1)
+                    except KeyError:
+                        logger.warning(f"Could not extract data for individual {individual} at level 1")
+                        continue
+                    
+                    # After xs(level=1), we should have a 2-level MultiIndex: (bodypart, coords)
+                    # Get body parts for this individual (third level, now first level after xs)
+                    if isinstance(individual_data.columns, pd.MultiIndex):
+                        # After xs(level=1), remaining levels should be (bodypart, coord)
+                        # Body parts are at level 0 (was level 2 in original)
+                        bodyparts = individual_data.columns.levels[0]
+                        logger.debug(f"Individual {individual}: found {len(bodyparts)} body part(s) at level 0: {list(bodyparts)[:10]}")
+                    else:
+                        # Not a MultiIndex - try to infer body parts from column names
+                        logger.warning(f"Individual {individual} data columns are not MultiIndex after xs. "
+                                     f"Column type: {type(individual_data.columns)}, "
+                                     f"Columns: {list(individual_data.columns[:10])}")
+                        # Try to extract body parts from column names
+                        # Columns might be like "bodypart_x", "bodypart_y", etc.
+                        bodyparts = set()
+                        for col in individual_data.columns:
+                            # Try to extract body part name (first part before underscore)
+                            if '_' in str(col):
+                                bp_name = str(col).split('_')[0]
+                                bodyparts.add(bp_name)
+                        logger.debug(f"Extracted {len(bodyparts)} body part(s) from column names: {list(bodyparts)[:10]}")
+                    
+                    if len(bodyparts) == 0:
+                        logger.error(f"No body parts found for individual {individual}. "
+                                   f"Column structure: {type(individual_data.columns)}, "
+                                   f"Number of columns: {len(individual_data.columns)}, "
+                                   f"Sample columns: {list(individual_data.columns[:10])}")
+                        # Don't create empty entry - skip this individual
+                        continue
+                    
+                    for bodypart in bodyparts:
+                        # Get coordinates for this body part
+                        # After xs(level=1), bodypart is now at level=0 (was level=2)
+                        try:
+                            if isinstance(individual_data.columns, pd.MultiIndex):
+                                bodypart_data = individual_data.xs(bodypart, level=0, axis=1)
+                            else:
+                                # Not MultiIndex - try to find columns matching this body part
+                                bodypart_cols = [col for col in individual_data.columns if str(col).startswith(f"{bodypart}_")]
+                                if bodypart_cols:
+                                    bodypart_data = individual_data[bodypart_cols]
+                                else:
+                                    bodypart_data = None
+                        except (KeyError, IndexError) as e:
+                            logger.debug(f"Body part {bodypart} not found for individual {individual}: {e}")
+                            bodypart_data = None
+                        
+                        if bodypart_data is not None and len(bodypart_data.columns) > 0:
+                            # Create key: individual_bodypart (e.g., "animal0_nose")
+                            key = f"{individual}_{bodypart}"
+                            
+                            # Extract x, y, likelihood from bodypart_data
+                            # If MultiIndex, coords are at level 1 (was level 3)
+                            # If not, columns are like "bodypart_x", "bodypart_y", etc.
+                            if isinstance(bodypart_data.columns, pd.MultiIndex):
+                                x_data = bodypart_data.xs("x", level=1, axis=1).values.flatten() if "x" in bodypart_data.columns.levels[1] else None
+                                y_data = bodypart_data.xs("y", level=1, axis=1).values.flatten() if "y" in bodypart_data.columns.levels[1] else None
+                                likelihood_data = bodypart_data.xs("likelihood", level=1, axis=1).values.flatten() if "likelihood" in bodypart_data.columns.levels[1] else np.ones(len(bodypart_data))
+                                z_data = bodypart_data.xs("z", level=1, axis=1).values.flatten() if "z" in bodypart_data.columns.levels[1] else None
+                            else:
+                                # Flat columns
+                                x_col = [c for c in bodypart_data.columns if 'x' in str(c).lower() and 'likelihood' not in str(c).lower()]
+                                y_col = [c for c in bodypart_data.columns if 'y' in str(c).lower() and 'likelihood' not in str(c).lower()]
+                                likelihood_col = [c for c in bodypart_data.columns if 'likelihood' in str(c).lower()]
+                                z_col = [c for c in bodypart_data.columns if 'z' in str(c).lower()]
+                                
+                                x_data = bodypart_data[x_col[0]].values if x_col else None
+                                y_data = bodypart_data[y_col[0]].values if y_col else None
+                                likelihood_data = bodypart_data[likelihood_col[0]].values if likelihood_col else np.ones(len(bodypart_data))
+                                z_data = bodypart_data[z_col[0]].values if z_col else None
+                            
+                            if x_data is not None and y_data is not None:
+                                body_parts_position[key] = {
+                                    "x": x_data,
+                                    "y": y_data,
+                                    "likelihood": likelihood_data,
+                                }
+                                if z_data is not None:
+                                    body_parts_position[key]["z"] = z_data
+                                logger.debug(f"Successfully extracted {bodypart} for {individual}: {len(x_data)} frames")
+                            else:
+                                logger.warning(f"Could not extract x/y coordinates for {individual}_{bodypart}")
+                        else:
+                            logger.warning(f"Could not extract data for body part {bodypart} of individual {individual}")
+                
+            elif n_levels == 3:
+                # DLC 2.x format: MultiIndex columns like (scorer, bodypart, coords)
+                logger.info("Detected DLC 2.x format (3-level MultiIndex)")
+                for body_part in self.body_parts:
+                    body_parts_position[body_part] = {
+                        c: self.df.get(body_part).get(c).values
+                        for c in self.df.get(body_part).columns
+                    }
+            else:
+                logger.warning(f"Unexpected MultiIndex depth: {n_levels} levels")
+                # Try to handle as 3-level (DLC 2.x)
+                for body_part in self.body_parts:
+                    body_parts_position[body_part] = {
+                        c: self.df.get(body_part).get(c).values
+                        for c in self.df.get(body_part).columns
+                    }
+        else:
+            # DLC 3.x format: might have different structure
+            # Try to infer structure from column names
+            logger.info(f"DLC 3.x format detected. Columns: {list(self.rawdata.columns[:10])}")
+            
+            # Common patterns: columns might be like "bodypart_x", "bodypart_y", "bodypart_likelihood"
+            # or MultiIndex but flattened
+            if len(self.rawdata.columns) > 0:
+                # Try to extract body parts from column names
+                body_parts_set = set()
+                coord_types = set()
+                
+                for col in self.rawdata.columns:
+                    # Pattern: "scorer_bodypart_coord" or "bodypart_coord"
+                    parts = str(col).split('_')
+                    if len(parts) >= 2:
+                        # Last part is usually the coordinate type (x, y, likelihood)
+                        coord = parts[-1].lower()
+                        if coord in ['x', 'y', 'z', 'likelihood']:
+                            coord_types.add(coord)
+                            # Everything before the last part is the body part name
+                            body_part = '_'.join(parts[:-1])
+                            body_parts_set.add(body_part)
+                
+                # If we found body parts, structure the data
+                if body_parts_set and coord_types:
+                    for body_part in body_parts_set:
+                        body_parts_position[body_part] = {}
+                        for coord in ['x', 'y', 'likelihood']:
+                            # Try different column name patterns
+                            possible_cols = [
+                                f"{body_part}_{coord}",
+                                f"DLC_{body_part}_{coord}",
+                                f"DLC_superanimal_{body_part}_{coord}",
+                            ]
+                            found_col = None
+                            for col_name in possible_cols:
+                                if col_name in self.rawdata.columns:
+                                    found_col = col_name
+                                    break
+                            
+                            if found_col:
+                                body_parts_position[body_part][coord] = self.rawdata[found_col].values
+                            elif coord == 'z':  # z is optional
+                                body_parts_position[body_part][coord] = None
+                            else:
+                                logger.warning(f"Could not find column for {body_part}_{coord}")
+                else:
+                    # Fallback: try to use MultiIndex structure even if not detected
+                    logger.warning("Could not parse DLC 3.x column structure, trying MultiIndex fallback")
+                    try:
+                        # Try to access as if it's MultiIndex
+                        top_level = self.rawdata.columns.levels[0][0] if hasattr(self.rawdata.columns, 'levels') else None
+                        if top_level:
+                            df = self.rawdata.get(top_level)
+                            for body_part in df.columns.levels[0] if hasattr(df.columns, 'levels') else []:
+                                body_parts_position[body_part] = {
+                                    c: df.get(body_part).get(c).values
+                                    for c in df.get(body_part).columns
+                                }
+                    except Exception as e:
+                        logger.error(f"Failed to parse H5 file structure: {e}")
+                        raise ValueError(
+                            f"Could not parse H5 file structure. "
+                            f"Columns: {list(self.rawdata.columns[:20])}. "
+                            f"Please check the file format."
+                        )
 
         return body_parts_position
 
@@ -202,9 +554,22 @@ def read_yaml(fullpath: str, filename: str = "*") -> tuple:
     """
     from deeplabcut.utils.auxiliaryfunctions import read_config
 
+    fullpath = Path(fullpath)
+    
+    # Ensure it's a directory, not a file
+    if fullpath.is_file():
+        fullpath = fullpath.parent
+        logger.warning(f"read_yaml received a file path, using parent directory: {fullpath}")
+    
+    if not fullpath.exists():
+        raise FileNotFoundError(f"Directory does not exist: {fullpath}")
+    
+    if not fullpath.is_dir():
+        raise ValueError(f"Path is not a directory: {fullpath}")
+
     # Take the DJ-saved if there. If not, return list of available
-    yml_paths = list(Path(fullpath).glob("dj_dlc_config.yaml")) or sorted(
-        list(Path(fullpath).glob(f"{filename}.y*ml"))
+    yml_paths = list(fullpath.glob("dj_dlc_config.yaml")) or sorted(
+        list(fullpath.glob(f"{filename}.y*ml"))
     )
 
     assert (  # If more than 1 and not DJ-saved,
@@ -223,7 +588,7 @@ def save_yaml(
     """Save config_dict to output_path as filename.yaml. By default, preserves original.
 
     Args:
-        output_dir (str): where to save yaml file
+        output_dir (str): where to save yaml file (directory path)
         config_dict (str): dict of config params or element-deeplabcut model.Model dict
         filename (str, optional): default 'dj_dlc_config' or preserve original 'config'
             Set to 'config' to overwrite original file.
@@ -237,12 +602,20 @@ def save_yaml(
 
     if "config_template" in config_dict:  # if passed full model.Model dict
         config_dict = config_dict["config_template"]
+    
+    output_dir = Path(output_dir)
+    
+    # Ensure it's a directory, not a file
+    if output_dir.is_file():
+        output_dir = output_dir.parent
+        logger.warning(f"save_yaml received a file path, using parent directory: {output_dir}")
+    
     if mkdir:
-        Path(output_dir).mkdir(exist_ok=True)
+        output_dir.mkdir(exist_ok=True)
     if "." in filename:  # if user provided extension, remove
         filename = filename.split(".")[0]
 
-    output_filepath = Path(output_dir) / f"{filename}.yaml"
+    output_filepath = output_dir / f"{filename}.yaml"
     write_config(output_filepath, config_dict)
     return str(output_filepath)
 
diff --git a/element_deeplabcut/train.py b/element_deeplabcut/train.py
index 1c78045..68957ae 100644
--- a/element_deeplabcut/train.py
+++ b/element_deeplabcut/train.py
@@ -1,363 +1,734 @@
-"""
-Code adapted from the Mathis Lab
-MIT License Copyright (c) 2022 Mackenzie Mathis
-DataJoint Schema for DeepLabCut 2.x, Supports 2D and 3D DLC via triangulation.
-"""
-
-import datajoint as dj
-import inspect
-import importlib
-import re
-from pathlib import Path
-import yaml
-
-from element_interface.utils import find_full_path, dict_to_uuid
-from .readers import dlc_reader
-
-schema = dj.schema()
-_linking_module = None
-
-
-def activate(
-    train_schema_name: str,
-    *,
-    create_schema: bool = True,
-    create_tables: bool = True,
-    linking_module: str = None,
-):
-    """Activate this schema.
-
-    Args:
-        train_schema_name (str): schema name on the database server
-        create_schema (bool): when True (default), create schema in the database if it
-                            does not yet exist.
-        create_tables (bool): when True (default), create schema tables in the database
-                             if they do not yet exist.
-        linking_module (str): a module (or name) containing the required dependencies.
-
-    Dependencies:
-    Functions:
-        get_dlc_root_data_dir(): Returns absolute path for root data director(y/ies)
-                                 with all behavioral recordings, as (list of) string(s).
-        get_dlc_processed_data_dir(): Optional. Returns absolute path for processed
-                                      data. Defaults to session video subfolder.
-    """
-
-    if isinstance(linking_module, str):
-        linking_module = importlib.import_module(linking_module)
-    assert inspect.ismodule(
-        linking_module
-    ), "The argument 'dependency' must be a module's name or a module"
-    assert hasattr(
-        linking_module, "get_dlc_root_data_dir"
-    ), "The linking module must specify a lookup function for a root data directory"
-
-    global _linking_module
-    _linking_module = linking_module
-
-    # activate
-    schema.activate(
-        train_schema_name,
-        create_schema=create_schema,
-        create_tables=create_tables,
-        add_objects=_linking_module.__dict__,
-    )
-
-
-# -------------- Functions required by element-deeplabcut ---------------
-
-
-def get_dlc_root_data_dir() -> list:
-    """Pulls relevant func from parent namespace to specify root data dir(s).
-
-    It is recommended that all paths in DataJoint Elements stored as relative
-    paths, with respect to some user-configured "root" director(y/ies). The
-    root(s) may vary between data modalities and user machines. Returns a full path
-    string or list of strings for possible root data directories.
-    """
-    root_directories = _linking_module.get_dlc_root_data_dir()
-    if isinstance(root_directories, (str, Path)):
-        root_directories = [root_directories]
-
-    if (
-        hasattr(_linking_module, "get_dlc_processed_data_dir")
-        and get_dlc_processed_data_dir() not in root_directories
-    ):
-        root_directories.append(_linking_module.get_dlc_processed_data_dir())
-
-    return root_directories
-
-
-def get_dlc_processed_data_dir() -> str:
-    """Pulls relevant func from parent namespace. Defaults to DLC's project /videos/.
-
-    Method in parent namespace should provide a string to a directory where DLC output
-    files will be stored. If unspecified, output files will be stored in the
-    session directory 'videos' folder, per DeepLabCut default.
-    """
-    if hasattr(_linking_module, "get_dlc_processed_data_dir"):
-        return _linking_module.get_dlc_processed_data_dir()
-    else:
-        return get_dlc_root_data_dir()[0]
-
-
-# ----------------------------- Table declarations ----------------------
-
-
-@schema
-class VideoSet(dj.Manual):
-    """Collection of videos included in a given training set.
-
-    Attributes:
-        video_set_id (int): Unique ID for collection of videos."""
-
-    definition = """ # Set of vids in training set
-    video_set_id: int
-    """
-
-    class File(dj.Part):
-        """File IDs and paths in a given VideoSet
-
-        Attributes:
-            VideoSet (foreign key): VideoSet key.
-            file_path ( varchar(255) ): Path to file on disk relative to root."""
-
-        definition = """ # Paths of training files (e.g., labeled pngs, CSV or video)
-        -> master
-        file_id: int
-        ---
-        file_path: varchar(255)
-        """
-
-
-@schema
-class TrainingParamSet(dj.Lookup):
-    """Parameters used to train a model
-
-    Attributes:
-        paramset_idx (smallint): Index uniqely identifying paramset.
-        paramset_desc ( varchar(128) ): Description of paramset.
-        param_set_hash (uuid): Hash identifying this paramset.
-        params (longblob): Dictionary of all applicable parameters.
-        Note: param_set_hash must be unique."""
-
-    definition = """
-    # Parameters to specify a DLC model training instance
-    # For DLC ≤ v2.0, include scorer_legacy = True in params
-    paramset_idx                  : smallint
-    ---
-    paramset_desc: varchar(128)
-    param_set_hash                : uuid      # hash identifying this parameterset
-    unique index (param_set_hash)
-    params                        : longblob  # dictionary of all applicable parameters
-    """
-
-    required_parameters = ("shuffle", "trainingsetindex")
-    skipped_parameters = ("project_path", "video_sets")
-
-    @classmethod
-    def insert_new_params(
-        cls, paramset_desc: str, params: dict, paramset_idx: int = None
-    ):
-        """
-        Insert a new set of training parameters into dlc.TrainingParamSet.
-
-        Args:
-            paramset_desc (str): Description of parameter set to be inserted
-            params (dict): Dictionary including all settings to specify model training.
-                        Must include shuffle & trainingsetindex b/c not in config.yaml.
-                        project_path and video_sets will be overwritten by config.yaml.
-                        Note that trainingsetindex is 0-indexed
-            paramset_idx (int): optional, integer to represent parameters.
-        """
-
-        for required_param in cls.required_parameters:
-            assert required_param in params, (
-                "Missing required parameter: " + required_param
-            )
-        for skipped_param in cls.skipped_parameters:
-            if skipped_param in params:
-                params.pop(skipped_param)
-
-        if paramset_idx is None:
-            paramset_idx = (
-                dj.U().aggr(cls, n="max(paramset_idx)").fetch1("n") or 0
-            ) + 1
-
-        param_dict = {
-            "paramset_idx": paramset_idx,
-            "paramset_desc": paramset_desc,
-            "params": params,
-            "param_set_hash": dict_to_uuid(params),
-        }
-        param_query = cls & {"param_set_hash": param_dict["param_set_hash"]}
-        # If the specified param-set already exists
-        if param_query:
-            existing_paramset_idx = param_query.fetch1("paramset_idx")
-            if existing_paramset_idx == int(paramset_idx):  # If existing_idx same:
-                return  # job done
-        else:
-            cls.insert1(param_dict)  # if duplicate, will raise duplicate error
-
-
-@schema
-class TrainingTask(dj.Manual):
-    """Staging table for pairing videosets and training parameter sets
-
-    Attributes:
-        VideoSet (foreign key): VideoSet Key.
-        TrainingParamSet (foreign key): TrainingParamSet key.
-        training_id (int): Unique ID for training task.
-        model_prefix ( varchar(32) ): Optional. Prefix for model files.
-        project_path ( varchar(255) ): Optional. DLC's project_path in config relative
-                                       to get_dlc_root_data_dir
-    """
-
-    definition = """      # Specification for a DLC model training instance
-    -> VideoSet           # labeled video(s) for training
-    -> TrainingParamSet
-    training_id     : int
-    ---
-    model_prefix='' : varchar(32)
-    project_path='' : varchar(255) # DLC's project_path in config relative to root
-    """
-
-
-@schema
-class ModelTraining(dj.Computed):
-    """Automated Model training information.
-
-    Attributes:
-        TrainingTask (foreign key): TrainingTask key.
-        latest_snapshot (int unsigned): Latest exact snapshot index (i.e., never -1).
-        config_template (longblob): Stored full config file."""
-
-    definition = """
-    -> TrainingTask
-    ---
-    latest_snapshot: int unsigned # latest exact snapshot index (i.e., never -1)
-    config_template: longblob     # stored full config file
-    """
-
-    # To continue from previous training snapshot, devs suggest editing pose_cfg.yml
-    # https://github.com/DeepLabCut/DeepLabCut/issues/70
-
-    def make(self, key):
-        import deeplabcut
-
-        try:
-            from deeplabcut.utils.auxiliaryfunctions import (
-                get_model_folder,
-                edit_config,
-            )  # isort:skip
-        except ImportError:
-            from deeplabcut.utils.auxiliaryfunctions import (
-                GetModelFolder as get_model_folder,
-            )  # isort:skip
-
-        """Launch training for each train.TrainingTask training_id via `.populate()`."""
-        project_path, model_prefix = (TrainingTask & key).fetch1(
-            "project_path", "model_prefix"
-        )
-
-        project_path = find_full_path(get_dlc_root_data_dir(), project_path)
-
-        # ---- Build and save DLC configuration (yaml) file ----
-        _, dlc_config = dlc_reader.read_yaml(project_path)  # load existing
-        dlc_config.update((TrainingParamSet & key).fetch1("params"))
-        dlc_config.update(
-            {
-                "project_path": project_path.as_posix(),
-                "modelprefix": model_prefix,
-                "train_fraction": dlc_config["TrainingFraction"][
-                    int(dlc_config["trainingsetindex"])
-                ],
-                "training_filelist_datajoint": [  # don't overwrite origin video_sets
-                    find_full_path(get_dlc_root_data_dir(), fp).as_posix()
-                    for fp in (VideoSet.File & key).fetch("file_path")
-                ],
-            }
-        )
-        # Write dlc config file to base project folder
-        dlc_cfg_filepath = dlc_reader.save_yaml(project_path, dlc_config)
-
-        # ---- Update the project path in the DLC pose configuration (yaml) files ----
-        model_folder = get_model_folder(
-            trainFraction=dlc_config["train_fraction"],
-            shuffle=dlc_config["shuffle"],
-            cfg=dlc_config,
-            modelprefix=dlc_config["modelprefix"],
-        )
-        model_train_folder = project_path / model_folder / "train"
-
-        # update path of the init_weight
-        with open(model_train_folder / "pose_cfg.yaml", "r") as f:
-            pose_cfg = yaml.safe_load(f)
-        init_weights_path = Path(pose_cfg["init_weights"])
-
-        if (
-            "pose_estimation_tensorflow/models/pretrained"
-            in init_weights_path.as_posix()
-        ):
-            # this is the res_net models, construct new path here
-            init_weights_path = (
-                Path(deeplabcut.__path__[0])
-                / "pose_estimation_tensorflow/models/pretrained"
-                / init_weights_path.name
-            )
-        else:
-            # this is existing snapshot weights, update path here
-            init_weights_path = model_train_folder / init_weights_path.name
-
-        edit_config(
-            model_train_folder / "pose_cfg.yaml",
-            {
-                "project_path": project_path.as_posix(),
-                "init_weights": init_weights_path.as_posix(),
-                "dataset": Path(pose_cfg["dataset"]).as_posix(),
-                "metadataset": Path(pose_cfg["metadataset"]).as_posix(),
-            },
-        )
-
-        # ---- Trigger DLC model training job ----
-        train_network_input_args = list(
-            inspect.signature(deeplabcut.train_network).parameters
-        )
-        train_network_kwargs = {
-            k: int(v) if k in ("shuffle", "trainingsetindex", "maxiters") else v
-            for k, v in dlc_config.items()
-            if k in train_network_input_args
-        }
-        for k in ["shuffle", "trainingsetindex", "maxiters"]:
-            train_network_kwargs[k] = int(train_network_kwargs[k])
-
-        try:
-            deeplabcut.train_network(dlc_cfg_filepath, **train_network_kwargs)
-        except KeyboardInterrupt:  # Instructions indicate to train until interrupt
-            print("DLC training stopped via Keyboard Interrupt")
-
-        # DLC goes by snapshot magnitude when judging 'latest' for evaluation
-        # Here, we mean most recently generated
-        snapshots = sorted(model_train_folder.glob("snapshot*.index"))
-        max_modified_time = 0
-        for snapshot in snapshots:
-            modified_time = snapshot.stat().st_mtime
-            if modified_time > max_modified_time:
-                latest_snapshot_file = snapshot
-                latest_snapshot = int(
-                    re.search(r"(\d+)\.index", latest_snapshot_file.name).group(1)
-                )
-                max_modified_time = modified_time
-
-        # update snapshotindex in the config
-        snapshotindex = snapshots.index(latest_snapshot_file)
-
-        dlc_config["snapshotindex"] = snapshotindex
-        edit_config(
-            dlc_cfg_filepath,
-            {"snapshotindex": snapshotindex},
-        )
-
-        self.insert1(
-            {**key, "latest_snapshot": latest_snapshot, "config_template": dlc_config}
-        )
+"""
+Code adapted from the Mathis Lab
+MIT License Copyright (c) 2022 Mackenzie Mathis
+DataJoint Schema for DeepLabCut 2.x, Supports 2D and 3D DLC via triangulation.
+"""
+
+import datajoint as dj
+import inspect
+import importlib
+import re
+import logging
+from pathlib import Path
+import yaml
+
+from element_interface.utils import find_full_path, dict_to_uuid
+from .readers import dlc_reader
+
+logger = logging.getLogger(__name__)
+
+schema = dj.schema()
+_linking_module = None
+
+
+def activate(
+    train_schema_name: str,
+    *,
+    create_schema: bool = True,
+    create_tables: bool = True,
+    linking_module: str = None,
+):
+    """Activate this schema.
+
+    Args:
+        train_schema_name (str): schema name on the database server
+        create_schema (bool): when True (default), create schema in the database if it
+                            does not yet exist.
+        create_tables (bool): when True (default), create schema tables in the database
+                             if they do not yet exist.
+        linking_module (str): a module (or name) containing the required dependencies.
+
+    Dependencies:
+    Functions:
+        get_dlc_root_data_dir(): Returns absolute path for root data director(y/ies)
+                                 with all behavioral recordings, as (list of) string(s).
+        get_dlc_processed_data_dir(): Optional. Returns absolute path for processed
+                                      data. Defaults to session video subfolder.
+    """
+
+    if isinstance(linking_module, str):
+        linking_module = importlib.import_module(linking_module)
+    assert inspect.ismodule(
+        linking_module
+    ), "The argument 'dependency' must be a module's name or a module"
+    assert hasattr(
+        linking_module, "get_dlc_root_data_dir"
+    ), "The linking module must specify a lookup function for a root data directory"
+
+    global _linking_module
+    _linking_module = linking_module
+
+    # activate
+    schema.activate(
+        train_schema_name,
+        create_schema=create_schema,
+        create_tables=create_tables,
+        add_objects=_linking_module.__dict__,
+    )
+
+
+# -------------- Functions required by element-deeplabcut ---------------
+
+
+def get_dlc_root_data_dir() -> list:
+    """Pulls relevant func from parent namespace to specify root data dir(s).
+
+    It is recommended that all paths in DataJoint Elements stored as relative
+    paths, with respect to some user-configured "root" director(y/ies). The
+    root(s) may vary between data modalities and user machines. Returns a full path
+    string or list of strings for possible root data directories.
+    """
+    root_directories = _linking_module.get_dlc_root_data_dir()
+    if isinstance(root_directories, (str, Path)):
+        root_directories = [root_directories]
+
+    if (
+        hasattr(_linking_module, "get_dlc_processed_data_dir")
+        and get_dlc_processed_data_dir() not in root_directories
+    ):
+        root_directories.append(_linking_module.get_dlc_processed_data_dir())
+
+    return root_directories
+
+
+def get_dlc_processed_data_dir() -> str:
+    """Pulls relevant func from parent namespace. Defaults to DLC's project /videos/.
+
+    Method in parent namespace should provide a string to a directory where DLC output
+    files will be stored. If unspecified, output files will be stored in the
+    session directory 'videos' folder, per DeepLabCut default.
+    """
+    if hasattr(_linking_module, "get_dlc_processed_data_dir"):
+        return _linking_module.get_dlc_processed_data_dir()
+    else:
+        return get_dlc_root_data_dir()[0]
+
+
+# ----------------------------- Table declarations ----------------------
+
+
+@schema
+class VideoSet(dj.Manual):
+    """Collection of videos included in a given training set.
+
+    Attributes:
+        video_set_id (int): Unique ID for collection of videos."""
+
+    definition = """ # Set of vids in training set
+    video_set_id: int
+    """
+
+    class File(dj.Part):
+        """File IDs and paths in a given VideoSet
+
+        Attributes:
+            VideoSet (foreign key): VideoSet key.
+            file_path ( varchar(255) ): Path to file on disk relative to root."""
+
+        definition = """ # Paths of training files (e.g., labeled pngs, CSV or video)
+        -> master
+        file_id: int
+        ---
+        file_path: varchar(255)
+        """
+
+
+@schema
+class TrainingParamSet(dj.Lookup):
+    """Parameters used to train a model
+
+    Attributes:
+        paramset_idx (smallint): Index uniqely identifying paramset.
+        paramset_desc ( varchar(128) ): Description of paramset.
+        param_set_hash (uuid): Hash identifying this paramset.
+        params (longblob): Dictionary of all applicable parameters.
+        Note: param_set_hash must be unique."""
+
+    definition = """
+    # Parameters to specify a DLC model training instance
+    # For DLC ≤ v2.0, include scorer_legacy = True in params
+    paramset_idx                  : smallint
+    ---
+    paramset_desc: varchar(128)
+    param_set_hash                : uuid      # hash identifying this parameterset
+    unique index (param_set_hash)
+    params                        : longblob  # dictionary of all applicable parameters
+    """
+
+    required_parameters = ("shuffle", "trainingsetindex")
+    skipped_parameters = ("project_path", "video_sets")
+
+    @classmethod
+    def insert_new_params(
+        cls, paramset_desc: str, params: dict, paramset_idx: int = None
+    ):
+        """
+        Insert a new set of training parameters into dlc.TrainingParamSet.
+
+        Args:
+            paramset_desc (str): Description of parameter set to be inserted
+            params (dict): Dictionary including all settings to specify model training.
+                        Must include shuffle & trainingsetindex b/c not in config.yaml.
+                        project_path and video_sets will be overwritten by config.yaml.
+                        Note that trainingsetindex is 0-indexed
+            paramset_idx (int): optional, integer to represent parameters.
+        """
+
+        for required_param in cls.required_parameters:
+            assert required_param in params, (
+                "Missing required parameter: " + required_param
+            )
+        for skipped_param in cls.skipped_parameters:
+            if skipped_param in params:
+                params.pop(skipped_param)
+
+        if paramset_idx is None:
+            paramset_idx = (
+                dj.U().aggr(cls, n="max(paramset_idx)").fetch1("n") or 0
+            ) + 1
+
+        param_dict = {
+            "paramset_idx": paramset_idx,
+            "paramset_desc": paramset_desc,
+            "params": params,
+            "param_set_hash": dict_to_uuid(params),
+        }
+        param_query = cls & {"param_set_hash": param_dict["param_set_hash"]}
+        # If the specified param-set already exists
+        if param_query:
+            existing_paramset_idx = param_query.fetch1("paramset_idx")
+            if existing_paramset_idx == int(paramset_idx):  # If existing_idx same:
+                return  # job done
+        else:
+            cls.insert1(param_dict)  # if duplicate, will raise duplicate error
+
+
+@schema
+class TrainingTask(dj.Manual):
+    """Staging table for pairing videosets and training parameter sets
+
+    Attributes:
+        VideoSet (foreign key): VideoSet Key.
+        TrainingParamSet (foreign key): TrainingParamSet key.
+        training_id (int): Unique ID for training task.
+        model_prefix ( varchar(32) ): Optional. Prefix for model files.
+        project_path ( varchar(255) ): Optional. DLC's project_path in config relative
+                                       to get_dlc_root_data_dir
+    """
+
+    definition = """      # Specification for a DLC model training instance
+    -> VideoSet           # labeled video(s) for training
+    -> TrainingParamSet
+    training_id     : int
+    ---
+    model_prefix='' : varchar(32)
+    project_path='' : varchar(255) # DLC's project_path in config relative to root
+    """
+
+
+@schema
+class ModelTraining(dj.Computed):
+    """Automated Model training information.
+
+    Attributes:
+        TrainingTask (foreign key): TrainingTask key.
+        latest_snapshot (int unsigned): Latest exact snapshot index (i.e., never -1).
+        config_template (longblob): Stored full config file."""
+
+    definition = """
+    -> TrainingTask
+    ---
+    latest_snapshot: int unsigned # latest exact snapshot index (i.e., never -1)
+    config_template: longblob     # stored full config file
+    """
+
+    # To continue from previous training snapshot, devs suggest editing pose_cfg.yml
+    # https://github.com/DeepLabCut/DeepLabCut/issues/70
+
+    def make(self, key):
+        import deeplabcut
+
+        try:
+            from deeplabcut.utils.auxiliaryfunctions import (
+                get_model_folder,
+                edit_config,
+            )  # isort:skip
+        except ImportError:
+            from deeplabcut.utils.auxiliaryfunctions import (
+                GetModelFolder as get_model_folder,
+            )  # isort:skip
+
+        """Launch training for each train.TrainingTask training_id via `.populate()`."""
+        project_path, model_prefix = (TrainingTask & key).fetch1(
+            "project_path", "model_prefix"
+        )
+
+        project_path = find_full_path(get_dlc_root_data_dir(), project_path)
+        
+        # Ensure project_path is a directory, not a file
+        project_path = Path(project_path)
+        if project_path.is_file():
+            project_path = project_path.parent
+        elif not project_path.is_dir():
+            raise ValueError(f"project_path is neither a file nor a directory: {project_path}")
+
+        # ---- Build and save DLC configuration (yaml) file ----
+        _, dlc_config = dlc_reader.read_yaml(project_path)  # load existing
+        training_params = (TrainingParamSet & key).fetch1("params")
+        
+        # Ensure shuffle and trainingsetindex from TrainingParamSet override config values
+        # This is critical - the config file might have different values
+        shuffle = training_params.get("shuffle", dlc_config.get("shuffle", 1))
+        trainingsetindex = training_params.get("trainingsetindex", dlc_config.get("trainingsetindex", 0))
+        
+        # Explicitly set these values in config (they must match the training dataset)
+        dlc_config["shuffle"] = int(shuffle)
+        dlc_config["trainingsetindex"] = int(trainingsetindex)
+        
+        logger.info(f"Training parameters: shuffle={dlc_config['shuffle']}, trainingsetindex={dlc_config['trainingsetindex']}")
+        
+        # Update other params (but shuffle and trainingsetindex are already set above)
+        other_params = {k: v for k, v in training_params.items() if k not in ["shuffle", "trainingsetindex"]}
+        dlc_config.update(other_params)
+        
+        # Get engine from config
+        # Note: DLC 3.x may have issues with engine setting for training
+        # Try to detect or default appropriately
+        engine = dlc_config.get("engine")
+        
+        # If no engine specified, don't set one - let DLC use default
+        # DLC 3.x training may work better without explicit engine setting
+        if engine is None:
+            # Don't set engine - will use DLC's default behavior
+            engine = None
+        elif engine not in ["tensorflow", "pytorch"]:
+            # Invalid engine, reset to None
+            logger.warning(f"Invalid engine '{engine}', using DLC default")
+            engine = None
+            if "engine" in dlc_config:
+                del dlc_config["engine"]
+        # Ensure trainingsetindex is used correctly for train_fraction
+        # Use the value we just set, not from config (which might be wrong)
+        train_fraction = dlc_config["TrainingFraction"][int(trainingsetindex)]
+        
+        dlc_config.update(
+            {
+                "project_path": project_path.as_posix(),
+                "modelprefix": model_prefix,
+                "train_fraction": train_fraction,
+                "training_filelist_datajoint": [  # don't overwrite origin video_sets
+                    find_full_path(get_dlc_root_data_dir(), fp).as_posix()
+                    for fp in (VideoSet.File & key).fetch("file_path")
+                ],
+            }
+        )
+        # Write dlc config file to base project folder with correct values
+        dlc_cfg_filepath = dlc_reader.save_yaml(project_path, dlc_config)
+        
+        # Verify the saved config has correct values (re-read to confirm)
+        _, saved_config = dlc_reader.read_yaml(project_path)
+        saved_shuffle = saved_config.get("shuffle", shuffle)
+        saved_trainingsetindex = saved_config.get("trainingsetindex", trainingsetindex)
+        
+        logger.info(f"Saved config verification: shuffle={saved_shuffle}, trainingsetindex={saved_trainingsetindex}")
+        logger.info(f"Expected values: shuffle={shuffle}, trainingsetindex={trainingsetindex}")
+        
+        # If there's a mismatch, fix it
+        if saved_trainingsetindex != trainingsetindex or saved_shuffle != shuffle:
+            logger.warning(f"Config file mismatch detected! Fixing...")
+            saved_config["shuffle"] = shuffle
+            saved_config["trainingsetindex"] = trainingsetindex
+            dlc_reader.save_yaml(project_path, saved_config, filename="config")
+            # Use the corrected values
+            dlc_config["shuffle"] = shuffle
+            dlc_config["trainingsetindex"] = trainingsetindex
+        else:
+            # Use the verified values from saved config
+            dlc_config["shuffle"] = saved_shuffle
+            dlc_config["trainingsetindex"] = saved_trainingsetindex
+
+        # ---- Update the project path in the DLC pose configuration (yaml) files ----
+        model_folder = get_model_folder(
+            trainFraction=dlc_config["train_fraction"],
+            shuffle=dlc_config["shuffle"],
+            cfg=dlc_config,
+            modelprefix=dlc_config["modelprefix"],
+        )
+        model_train_folder = project_path / model_folder / "train"
+
+        # Ensure model_train_folder exists (it's created when training starts)
+        model_train_folder.mkdir(parents=True, exist_ok=True)
+        
+        # Check if pose_cfg.yaml exists, if not, it will be created by DLC during training
+        pose_cfg_path = model_train_folder / "pose_cfg.yaml"
+        if not pose_cfg_path.exists():
+            # pose_cfg.yaml will be created by DLC's train_network function
+            # Skip init_weights update for now - it will be handled by DLC
+            logger.warning(
+                f"pose_cfg.yaml not found at {pose_cfg_path}. "
+                "It will be created by DLC during training. Skipping init_weights update."
+            )
+            init_weights_path = None
+            pose_cfg = {}
+        else:
+            # update path of the init_weight
+            with open(pose_cfg_path, "r") as f:
+                pose_cfg = yaml.safe_load(f)
+            init_weights_path = Path(pose_cfg["init_weights"])
+
+            if (
+                "pose_estimation_tensorflow/models/pretrained"
+                in init_weights_path.as_posix()
+            ):
+                # this is the res_net models, construct new path here
+                init_weights_path = (
+                    Path(deeplabcut.__path__[0])
+                    / "pose_estimation_tensorflow/models/pretrained"
+                    / init_weights_path.name
+                )
+            else:
+                # this is existing snapshot weights, update path here
+                init_weights_path = model_train_folder / init_weights_path.name
+
+            edit_config(
+                model_train_folder / "pose_cfg.yaml",
+                {
+                    "project_path": project_path.as_posix(),
+                    "init_weights": init_weights_path.as_posix(),
+                    "dataset": Path(pose_cfg["dataset"]).as_posix(),
+                    "metadataset": Path(pose_cfg["metadataset"]).as_posix(),
+                },
+            )
+
+        # ---- Trigger DLC model training job ----
+        # DLC 3.x: The compat layer checks engine from config file
+        # Ensure engine is explicitly set in the config before training
+        # The compat layer reads engine from the config file, not from the function call
+        
+        # DLC 3.x compat layer reads engine from metadata file, not config
+        # Ensure engine is set correctly in config (needed for metadata updates)
+        # Don't remove it - DLC needs it in the config to determine the correct engine
+        if "engine" not in dlc_config:
+            dlc_config["engine"] = engine or "pytorch"
+            logger.info(f"Added engine='{dlc_config['engine']}' to config")
+        
+        # Ensure config has correct engine before saving
+        if dlc_config.get("engine") != engine:
+            dlc_config["engine"] = engine or "pytorch"
+            logger.info(f"Updated engine in config to '{dlc_config['engine']}'")
+        
+        # Save config with correct engine
+        dlc_reader.save_yaml(project_path, dlc_config, filename="config")
+        logger.info(f"Saved config with engine='{dlc_config.get('engine')}'")
+        
+        # CRITICAL: DLC 3.x doesn't implement train_network for TensorFlow
+        # We MUST use the PyTorch-specific function directly to bypass the compat layer
+        # The compat layer will try to use TensorFlow if it detects engine=tensorflow in metadata/config
+        
+        # Force engine to pytorch if not already set
+        if engine != "pytorch":
+            logger.warning(f"Engine was '{engine}', forcing to 'pytorch' (DLC 3.x doesn't support TensorFlow training)")
+            engine = "pytorch"
+            dlc_config["engine"] = "pytorch"
+            dlc_reader.save_yaml(project_path, dlc_config, filename="config")
+            logger.info("Updated config to use engine=pytorch")
+        
+        # Use PyTorch-specific training function directly (bypasses compat layer)
+        try:
+            from deeplabcut.pose_estimation_pytorch import train_network as train_func_pytorch
+            train_func = train_func_pytorch
+            logger.info("Using PyTorch-specific train_network function (bypassing compat layer)")
+        except (ImportError, AttributeError) as e:
+            logger.error(f"PyTorch training function not available: {e}")
+            logger.error("Falling back to generic train_network (may fail if engine is not pytorch)")
+            train_func = deeplabcut.train_network
+        
+        train_network_input_args = list(inspect.signature(train_func).parameters)
+        
+        # Build kwargs from config, but explicitly override shuffle and trainingsetindex
+        # to ensure they match what we set (DLC reads from config file, so we need to be explicit)
+        train_network_kwargs = {
+            k: int(v) if k in ("shuffle", "trainingsetindex", "maxiters") else v
+            for k, v in dlc_config.items()
+            if k in train_network_input_args
+        }
+        
+        # CRITICAL: Explicitly set shuffle and trainingsetindex to match TrainingParamSet
+        # These must match the training dataset that was created
+        train_network_kwargs["shuffle"] = int(shuffle)
+        train_network_kwargs["trainingsetindex"] = int(trainingsetindex)
+        
+        # Ensure other numeric params are integers
+        for k in ["maxiters", "displayiters", "saveiters"]:
+            if k in train_network_kwargs:
+                train_network_kwargs[k] = int(train_network_kwargs[k])
+        
+        logger.info(f"Training with kwargs: shuffle={train_network_kwargs.get('shuffle')}, trainingsetindex={train_network_kwargs.get('trainingsetindex')}")
+        
+        # Final verification: re-read config one more time right before training
+        # DLC reads from the file, so we need to ensure it's correct
+        _, final_config = dlc_reader.read_yaml(project_path)
+        final_trainingsetindex = final_config.get("trainingsetindex")
+        final_shuffle = final_config.get("shuffle")
+        
+        # CRITICAL: Ensure engine is in final_config (needed for metadata update)
+        if "engine" not in final_config:
+            final_config["engine"] = engine or "pytorch"
+        elif final_config.get("engine") != (engine or "pytorch"):
+            final_config["engine"] = engine or "pytorch"
+        
+        logger.info(f"Final config check before training: shuffle={final_shuffle}, trainingsetindex={final_trainingsetindex}")
+        logger.info(f"Expected values: shuffle={shuffle}, trainingsetindex={trainingsetindex}")
+        
+        # Also verify metadata file has correct structure before training
+        try:
+            import yaml
+            training_datasets_dir = Path(project_path) / "training-datasets"
+            metadata_files = list(training_datasets_dir.rglob("metadata.yaml"))
+            if metadata_files:
+                metadata_file = metadata_files[0]
+                with open(metadata_file, 'r') as f:
+                    metadata = yaml.safe_load(f)
+                
+                shuffle_key = int(shuffle)
+                trainingset_key = int(trainingsetindex)
+                shuffle_data = metadata.get("shuffles", {}).get(shuffle_key, {})
+                trainingset_data = shuffle_data.get(trainingset_key, {})
+                
+                if "train_fraction" not in trainingset_data:
+                    logger.warning(f"Metadata missing train_fraction! Fixing now...")
+                    train_fraction = float(final_config.get("TrainingFraction", [0.95])[trainingsetindex])
+                    if shuffle_key not in metadata.get("shuffles", {}):
+                        metadata.setdefault("shuffles", {})[shuffle_key] = {}
+                    metadata["shuffles"][shuffle_key][trainingset_key] = {
+                        "train_fraction": train_fraction,
+                        "shuffle": shuffle_key
+                    }
+                    with open(metadata_file, 'w') as f:
+                        yaml.dump(metadata, f, default_flow_style=False, sort_keys=False)
+                    logger.info(f"Fixed metadata file: {metadata_file}")
+        except Exception as e:
+            logger.warning(f"Could not verify/fix metadata file: {e}")
+        
+        if final_trainingsetindex != trainingsetindex or final_shuffle != shuffle:
+            logger.error(
+                f"CRITICAL: Config file mismatch! "
+                f"Expected shuffle={shuffle}, trainingsetindex={trainingsetindex}, "
+                f"but found shuffle={final_shuffle}, trainingsetindex={final_trainingsetindex}. "
+                f"Fixing now..."
+            )
+            final_config["trainingsetindex"] = int(trainingsetindex)
+            final_config["shuffle"] = int(shuffle)
+            dlc_reader.save_yaml(project_path, final_config, filename="config")
+            # Update the filepath to point to the newly saved config
+            dlc_cfg_filepath = dlc_reader.save_yaml(project_path, final_config, filename="config")
+            
+            # Verify one more time
+            _, verify_config = dlc_reader.read_yaml(project_path)
+            logger.info(f"After fix: shuffle={verify_config.get('shuffle')}, trainingsetindex={verify_config.get('trainingsetindex')}")
+            
+            # Update dlc_config to match
+            dlc_config["trainingsetindex"] = int(trainingsetindex)
+            dlc_config["shuffle"] = int(shuffle)
+
+        # Final check: verify metadata one more time right before training
+        # DLC reads metadata when train_network is called, so we need to ensure it's correct
+        try:
+            import yaml
+            training_datasets_dir = Path(project_path) / "training-datasets"
+            metadata_files = list(training_datasets_dir.rglob("metadata.yaml"))
+            if metadata_files:
+                metadata_file = metadata_files[0]
+                with open(metadata_file, 'r') as f:
+                    metadata = yaml.safe_load(f)
+                
+                shuffle_key = int(shuffle)
+                trainingset_key = int(trainingsetindex)
+                
+                # DLC 3.x expects: shuffles[shuffle] = {train_fraction, index, engine}
+                # NOT nested by trainingsetindex!
+                if "shuffles" not in metadata:
+                    metadata["shuffles"] = {}
+                
+                shuffle_data = metadata.get("shuffles", {}).get(shuffle_key, {})
+                
+                # Check if it's old structure (nested) or new structure (flat)
+                if isinstance(shuffle_data, dict) and any(isinstance(v, dict) for v in shuffle_data.values() if isinstance(v, dict)):
+                    # Old structure: shuffles[shuffle][trainingsetindex] = {...}
+                    logger.warning("Found old metadata structure (nested by trainingsetindex)! Converting to DLC 3.x format...")
+                    trainingset_data = shuffle_data.get(trainingset_key, {})
+                    train_fraction = float(trainingset_data.get("train_fraction", final_config.get("TrainingFraction", [0.95])[trainingsetindex]))
+                    # CRITICAL: Use the engine variable directly, not from config (which might be wrong)
+                    correct_engine = engine or "pytorch"
+                    # Convert to new structure
+                    # IMPORTANT: index is the SHUFFLE number, not trainingsetindex!
+                    metadata["shuffles"][shuffle_key] = {
+                        "train_fraction": train_fraction,
+                        "index": shuffle_key,  # This is the SHUFFLE number, not trainingsetindex!
+                        "engine": correct_engine,  # Use correct engine
+                    }
+                    with open(metadata_file, 'w') as f:
+                        yaml.dump(metadata, f, default_flow_style=False, sort_keys=False)
+                    logger.info(f"Converted metadata to DLC 3.x format: {metadata_file}")
+                else:
+                    # New structure: shuffles[shuffle] = {train_fraction, index, engine}
+                    # IMPORTANT: index is the SHUFFLE number, not trainingsetindex!
+                    if shuffle_key not in metadata["shuffles"]:
+                        metadata["shuffles"][shuffle_key] = {}
+                    
+                    shuffle_data = metadata["shuffles"][shuffle_key]
+                    
+                    # CRITICAL: Use the engine variable directly, not from config
+                    correct_engine = engine or "pytorch"
+                    
+                    # Ensure train_fraction exists
+                    if "train_fraction" not in shuffle_data:
+                        train_fraction = float(final_config.get("TrainingFraction", [0.95])[trainingsetindex])
+                        shuffle_data["train_fraction"] = train_fraction
+                        shuffle_data["index"] = shuffle_key  # This is the SHUFFLE number, not trainingsetindex!
+                        shuffle_data["engine"] = correct_engine
+                        with open(metadata_file, 'w') as f:
+                            yaml.dump(metadata, f, default_flow_style=False, sort_keys=False)
+                        logger.info(f"CRITICAL FIX: Added train_fraction to metadata right before training: {metadata_file}")
+                        logger.info(f"Metadata structure: {metadata}")
+                    else:
+                        # Verify index matches shuffle number (not trainingsetindex!)
+                        needs_update = False
+                        if shuffle_data.get("index") != shuffle_key:
+                            shuffle_data["index"] = shuffle_key
+                            needs_update = True
+                            logger.info(f"Fixed index mismatch (expected {shuffle_key}, found {shuffle_data.get('index')})")
+                        
+                        # CRITICAL: Ensure engine matches (DLC reads engine from metadata!)
+                        current_engine = shuffle_data.get("engine")
+                        if current_engine != correct_engine:
+                            logger.warning(f"CRITICAL: Engine mismatch in metadata! Expected {correct_engine}, found {current_engine}. Fixing NOW...")
+                            shuffle_data["engine"] = correct_engine
+                            needs_update = True
+                            logger.info(f"Updated engine in metadata from {current_engine} to {correct_engine}")
+                        
+                        if needs_update:
+                            with open(metadata_file, 'w') as f:
+                                yaml.dump(metadata, f, default_flow_style=False, sort_keys=False)
+                            logger.info(f"Updated metadata file: {metadata_file}")
+                        
+                        logger.info(f"Metadata verified: train_fraction={shuffle_data.get('train_fraction')}, index={shuffle_data.get('index')} (shuffle number), engine={shuffle_data.get('engine')}")
+        except Exception as e:
+            logger.error(f"CRITICAL: Could not verify/fix metadata before training: {e}")
+            import traceback
+            logger.error(traceback.format_exc())
+        
+        try:
+            # Log the exact metadata structure right before training
+            logger.info("=" * 80)
+            logger.info("FINAL METADATA CHECK BEFORE TRAINING")
+            logger.info("=" * 80)
+            training_datasets_dir = Path(project_path) / "training-datasets"
+            metadata_files = list(training_datasets_dir.rglob("metadata.yaml"))
+            if metadata_files:
+                metadata_file = metadata_files[0]
+                logger.info(f"Metadata file: {metadata_file}")
+                with open(metadata_file, 'r') as f:
+                    metadata = yaml.safe_load(f)
+                logger.info(f"Full metadata structure: {metadata}")
+                logger.info(f"Shuffles: {metadata.get('shuffles', {})}")
+                shuffle_key = int(shuffle)
+                
+                # DLC 3.x uses flat structure: shuffles[shuffle] = {train_fraction, index, engine}
+                if shuffle_key in metadata.get('shuffles', {}):
+                    shuffle_data = metadata['shuffles'][shuffle_key]
+                    logger.info(f"Shuffle {shuffle_key} exists: {shuffle_data}")
+                    
+                    needs_update = False
+                    
+                    # CRITICAL: Ensure train_fraction exists and is the right type
+                    if "train_fraction" not in shuffle_data:
+                        train_fraction = float(final_config.get("TrainingFraction", [0.95])[trainingsetindex])
+                        shuffle_data["train_fraction"] = train_fraction
+                        needs_update = True
+                        logger.warning(f"CRITICAL: train_fraction was missing! Adding it now: {train_fraction}")
+                    else:
+                        # Ensure it's a float, not int
+                        shuffle_data["train_fraction"] = float(shuffle_data["train_fraction"])
+                        logger.info(f"train_fraction exists: {shuffle_data['train_fraction']} (type: {type(shuffle_data['train_fraction'])})")
+                    
+                    # CRITICAL: Ensure index matches shuffle number
+                    if shuffle_data.get("index") != shuffle_key:
+                        shuffle_data["index"] = shuffle_key
+                        needs_update = True
+                        logger.warning(f"CRITICAL: index mismatch! Expected {shuffle_key}, found {shuffle_data.get('index')}. Fixing...")
+                    
+                    # CRITICAL: Ensure engine matches config (DLC reads engine from metadata!)
+                    # Use the engine from the variable, not from final_config (which might be wrong)
+                    expected_engine = engine or final_config.get("engine", "pytorch")
+                    current_engine = shuffle_data.get("engine")
+                    if current_engine != expected_engine:
+                        logger.warning(f"CRITICAL: Engine mismatch! Expected {expected_engine}, found {current_engine}. Fixing...")
+                        shuffle_data["engine"] = expected_engine
+                        needs_update = True
+                        logger.info(f"Updated engine in metadata from {current_engine} to {expected_engine}")
+                    
+                    if needs_update:
+                        # Write the fixed metadata back immediately
+                        with open(metadata_file, 'w') as f:
+                            yaml.dump(metadata, f, default_flow_style=False, sort_keys=False)
+                        logger.info(f"Wrote fixed metadata to: {metadata_file}")
+                        
+                        # Verify it was written correctly
+                        with open(metadata_file, 'r') as f:
+                            verify_meta = yaml.safe_load(f)
+                            verify_data = verify_meta['shuffles'][shuffle_key]
+                            logger.info(f"Verification: train_fraction={verify_data.get('train_fraction')}, index={verify_data.get('index')}, engine={verify_data.get('engine')}")
+                    else:
+                        logger.info(f"Metadata verified: train_fraction={shuffle_data.get('train_fraction')}, index={shuffle_data.get('index')}, engine={shuffle_data.get('engine')}")
+            logger.info("=" * 80)
+            
+            train_func(dlc_cfg_filepath, **train_network_kwargs)
+        except KeyError as e:
+            if "train_fraction" in str(e):
+                logger.error(f"CRITICAL: DLC still can't find train_fraction! Error: {e}")
+                logger.error("This suggests DLC is reading metadata from a different source or format.")
+                logger.error("Please check DLC documentation or create an issue on GitHub.")
+                raise
+            else:
+                raise
+        except KeyboardInterrupt:  # Instructions indicate to train until interrupt
+            print("DLC training stopped via Keyboard Interrupt")
+
+        # DLC goes by snapshot magnitude when judging 'latest' for evaluation
+        # Here, we mean most recently generated
+        snapshots = sorted(model_train_folder.glob("snapshot*.index"))
+        if not snapshots:
+            raise FileNotFoundError(
+                f"No snapshot files found in {model_train_folder}. "
+                "Training may have failed or not generated any snapshots."
+            )
+        
+        max_modified_time = 0
+        latest_snapshot_file = None
+        latest_snapshot = None
+        
+        for snapshot in snapshots:
+            modified_time = snapshot.stat().st_mtime
+            if modified_time > max_modified_time:
+                latest_snapshot_file = snapshot
+                latest_snapshot = int(
+                    re.search(r"(\d+)\.index", latest_snapshot_file.name).group(1)
+                )
+                max_modified_time = modified_time
+
+        if latest_snapshot_file is None:
+            raise ValueError("Failed to determine latest snapshot file")
+        
+        # update snapshotindex in the config
+        snapshotindex = snapshots.index(latest_snapshot_file)
+
+        dlc_config["snapshotindex"] = snapshotindex
+        edit_config(
+            dlc_cfg_filepath,
+            {"snapshotindex": snapshotindex},
+        )
+
+        self.insert1(
+            {**key, "latest_snapshot": latest_snapshot, "config_template": dlc_config}
+        )

From 65a3868ff410aaa6f9bcdae9504eb524274e5a1c Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Wed, 26 Nov 2025 08:30:48 +0100
Subject: [PATCH 04/15] config

---
 .dockerignore   | 63 +++++++++++++++++++++++++++++++++++++++++++++++++
 environment.yml | 25 ++++++++++++++++++++
 setup.py        |  7 +++---
 3 files changed, 92 insertions(+), 3 deletions(-)
 create mode 100644 .dockerignore
 create mode 100644 environment.yml

diff --git a/.dockerignore b/.dockerignore
new file mode 100644
index 0000000..a14d467
--- /dev/null
+++ b/.dockerignore
@@ -0,0 +1,63 @@
+# Docker ignore file
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+
+# Virtual environments
+venv/
+env/
+ENV/
+
+# IDE
+.vscode/
+.idea/
+*.swp
+*.swo
+*~
+
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+.tox/
+
+# Documentation
+docs/_build/
+
+# Git
+.git/
+.gitignore
+
+# Docker
+Dockerfile
+docker-compose*.yaml
+.dockerignore
+
+# Test data (will be mounted as volume)
+test_videos/
+
+# Local config (will be mounted as volume)
+dj_local_conf.json
+
+# OS
+.DS_Store
+Thumbs.db
+
+
diff --git a/environment.yml b/environment.yml
new file mode 100644
index 0000000..15ccadc
--- /dev/null
+++ b/environment.yml
@@ -0,0 +1,25 @@
+name: element-deeplabcut
+channels:
+  - conda-forge
+  - defaults
+dependencies:
+  - python=3.10  # DeepLabCut 3.x requires Python 3.10+ (uses modern type hints)
+  - pip
+  - graphviz
+  - ffmpeg
+  - pip:
+    - datajoint>=0.14.0
+    - pydot
+    - ipykernel
+    - ipywidgets
+    - pytest
+    - pytest-cov
+    - opencv-python  # Required for video metadata extraction
+    - element-lab @ git+https://github.com/datajoint/element-lab.git
+    - element-animal @ git+https://github.com/datajoint/element-animal.git
+    - element-session @ git+https://github.com/datajoint/element-session.git
+    - element-interface @ git+https://github.com/datajoint/element-interface.git
+    # DeepLabCut for inference (optional - comment out if not needed)
+    - deeplabcut[superanimal]==3.0.0rc13  # For pretrained SuperAnimal models and inference (DLC 3.x)
+    # Alternative: - deeplabcut[tf] @ git+https://github.com/DeepLabCut/DeepLabCut.git  # For TensorFlow backend only
+
diff --git a/setup.py b/setup.py
index 44aed0a..cee590d 100644
--- a/setup.py
+++ b/setup.py
@@ -21,6 +21,7 @@
     license="MIT",
     url=f'https://github.com/datajoint/{pkg_name.replace("_", "-")}',
     keywords="neuroscience behavior deeplabcut pose-estimation science datajoint",
+    python_requires=">=3.10",  # DeepLabCut 3.x requires Python 3.10+
     packages=find_packages(exclude=["contrib", "docs", "tests*"]),
     scripts=[],
     install_requires=[
@@ -32,16 +33,16 @@
     ],
     extras_require={
         "dlc_default": [
-            "deeplabcut[tf] @ git+https://github.com/DeepLabCut/DeepLabCut.git"
+            "deeplabcut[superanimal]==3.0.0rc13"
         ],
         "dlc_apple_mchips": [
             "tensorflow-macos==2.12.0",
             "tensorflow-metal",
             "tables==3.7.0",
-            "deeplabcut",
+            "deeplabcut[superanimal]==3.0.0rc13",
         ],
         "dlc_gui": [
-            "deeplabcut[gui] @ git+https://github.com/DeepLabCut/DeepLabCut.git"
+            "deeplabcut[gui]==3.0.0rc13"
         ],
         "elements": [
             "element-lab @ git+https://github.com/datajoint/element-lab.git",

From 5cdb15644d28f9760dc01f09d847a4160f4766b2 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Wed, 26 Nov 2025 08:31:10 +0100
Subject: [PATCH 05/15] env docs

---
 CONDA_ENV_SETUP.md     |  41 +++++++++++++++++
 tests/TESTING_GUIDE.md | 100 +++++++++++++++++++++++++++++++++++++++++
 2 files changed, 141 insertions(+)
 create mode 100644 CONDA_ENV_SETUP.md
 create mode 100644 tests/TESTING_GUIDE.md

diff --git a/CONDA_ENV_SETUP.md b/CONDA_ENV_SETUP.md
new file mode 100644
index 0000000..14b504b
--- /dev/null
+++ b/CONDA_ENV_SETUP.md
@@ -0,0 +1,41 @@
+# Conda Environment Setup Guide
+
+## Quick Start
+
+```bash
+# Create environment (Python 3.10+ required for DeepLabCut 3.x)
+conda create -n element-deeplabcut python=3.10
+conda activate element-deeplabcut
+
+# Install system dependencies
+conda install -c conda-forge graphviz
+
+# Install package
+pip install -e ".[elements,tests]"
+```
+
+## With DeepLabCut
+
+```bash
+# Full setup with DeepLabCut
+pip install -e ".[elements,dlc_default,tests]"
+```
+
+## Verify Installation
+
+```bash
+python -c "import element_deeplabcut; print('✅ Package installed')"
+python -c "import datajoint as dj; print('✅ DataJoint available')"
+```
+
+## Troubleshooting
+
+| Issue | Solution |
+|-------|----------|
+| Package conflicts | `conda env remove -n element-deeplabcut` and recreate |
+| Graphviz not found | `conda install -c conda-forge graphviz` |
+
+## Next Steps
+
+1. Configure database: See `tests/ENVIRONMENT_SETUP.md`
+2. Run tests: `pytest tests/ -v`
diff --git a/tests/TESTING_GUIDE.md b/tests/TESTING_GUIDE.md
new file mode 100644
index 0000000..542b1dd
--- /dev/null
+++ b/tests/TESTING_GUIDE.md
@@ -0,0 +1,100 @@
+# Testing Guide
+
+## Setup
+
+See [CONDA_ENV_SETUP.md](../CONDA_ENV_SETUP.md) for environment setup.
+
+### Database
+
+```bash
+docker compose -f docker-compose-db.yaml up -d
+```
+
+Create `dj_local_conf.json`:
+
+```json
+{
+  "database.host": "localhost",
+  "database.user": "root",
+  "database.password": "simple",
+  "database.port": 3306
+}
+```
+
+## Running Tests
+
+### Unit Tests (No DLC needed)
+
+```bash
+pytest tests/test_pretrained_workflow.py -v
+pytest tests/test_pipeline.py -v
+```
+
+### Inference Tests (Requires DLC + videos)
+
+```bash
+# Install DLC
+pip install -e ".[elements,dlc_default,tests]"
+
+# Set video directory
+export DLC_ROOT_DATA_DIR=./test_videos
+export DLC_PROCESSED_DATA_DIR=./test_videos/output
+
+# Run
+pytest tests/test_pretrained_workflow.py::test_pretrained_inference_workflow -v
+```
+
+## Quick Examples
+
+### Pretrained Workflow
+
+```python
+from element_deeplabcut import model
+
+# 1. Register model
+model.PretrainedModel.populate_common_models(["superanimal_quadruped"])
+
+# 2. Insert model
+model.Model.insert_pretrained_model(
+    model_name="my_model",
+    pretrained_model_name="superanimal_quadruped",
+    prompt=False,
+)
+
+# 3. Create task
+model.PoseEstimationTask.generate(
+    recording_key,
+    model_name="my_model",
+    analyze_videos_params={"video_inference": {"scale": 0.4}},
+)
+
+# 4. Run inference
+model.PoseEstimation.populate()
+```
+
+### Trained Workflow
+
+```python
+# 1. Insert trained model
+model.Model.insert_new_model(
+    model_name="my_trained",
+    dlc_config="path/to/config.yaml",
+    shuffle=1,
+    trainingsetindex=0,
+    prompt=False,
+)
+
+# 2. Create task and run
+model.PoseEstimationTask.generate(recording_key, model_name="my_trained")
+model.PoseEstimation.populate()
+```
+
+## Troubleshooting
+
+| Issue | Solution |
+|-------|----------|
+| "No module named 'element_lab'" | `pip install -e ".[elements]"` |
+| Database connection failed | Check `docker ps` and credentials |
+| "Pretrained model not found" | `model.PretrainedModel.populate_common_models()` |
+| CUDA out of memory | Use `"batchsize": 1` or `"gputouse": None` |
+| Slow inference | Use GPU, reduce `scale`, use shorter videos |

From 1812d5cdbf1486a07d72edb51d7124536a1722d8 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Wed, 26 Nov 2025 08:31:40 +0100
Subject: [PATCH 06/15] add test part

---
 test_trained_inference.py         | 1673 +++++++++++++++++++++++++++++
 test_video_inference.py           |  848 +++++++++++++++
 tests/test_pretrained_workflow.py |  200 ++++
 3 files changed, 2721 insertions(+)
 create mode 100755 test_trained_inference.py
 create mode 100755 test_video_inference.py
 create mode 100644 tests/test_pretrained_workflow.py

diff --git a/test_trained_inference.py b/test_trained_inference.py
new file mode 100755
index 0000000..1bce8d6
--- /dev/null
+++ b/test_trained_inference.py
@@ -0,0 +1,1673 @@
+#!/usr/bin/env python
+"""Simple script to test trained model workflow (training + inference) with video files.
+
+This script automatically:
+    1. Creates a new DLC project
+    2. Generates mock labeled data (no manual labeling required!)
+    3. Mocks model training (functional/integration test - no actual training occurs)
+    4. Runs inference on test videos
+
+Usage:
+    1. Configure database (see below)
+    2. Put your video file(s) in ./test_videos/ directory (or set DLC_ROOT_DATA_DIR)
+       - In Docker: videos should be in ./data/ directory (mounted to /app/data)
+    3. Run: python test_trained_inference.py
+       - In Docker: make test-trained
+
+    Examples:
+        python test_trained_inference.py  # Full workflow: create project, train, infer
+        python test_trained_inference.py --skip-training  # Use existing trained model
+        python test_trained_inference.py --skip-inference  # Only train, don't infer
+        python test_trained_inference.py --model-name my_model  # Custom model name
+
+Database Configuration:
+    The script will look for database configuration in this order:
+    1. dj_local_conf.json file in the project root
+    2. Environment variables: DJ_HOST, DJ_USER, DJ_PASS
+    3. Default DataJoint configuration
+    
+    Example dj_local_conf.json:
+    {
+        "database.host": "localhost",
+        "database.user": "root",
+        "database.password": "your_password",
+        "database.port": 3306,
+        "custom": {
+            "database.prefix": "test_"
+        }
+    }
+"""
+import os
+import sys
+import importlib.util
+import logging
+import argparse
+from pathlib import Path
+from unittest.mock import patch, MagicMock
+
+import datajoint as dj
+
+# Set up logging
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(message)s',
+    handlers=[logging.StreamHandler(sys.stdout)]
+)
+logger = logging.getLogger(__name__)
+
+# Simple status printer for user-facing messages
+class StatusPrinter:
+    """Simple status printer for step-by-step progress."""
+    def __init__(self, total_steps=10):
+        self.total_steps = total_steps
+        self.current_step = 0
+    
+    def step(self, message, status="info"):
+        """Print a step message with status indicator."""
+        self.current_step += 1
+        icons = {
+            "info": "ℹ️",
+            "success": "✅",
+            "warning": "⚠️",
+            "error": "❌",
+            "skip": "⏭️"
+        }
+        icon = icons.get(status, "•")
+        print(f"\n[{self.current_step}/{self.total_steps}] {icon} {message}")
+    
+    def sub(self, message, indent=3, icon=""):
+        """Print a sub-message with indentation."""
+        prefix = f"{icon} " if icon else ""
+        print(" " * indent + prefix + message)
+    
+    def header(self, title):
+        """Print a section header."""
+        print("\n" + "=" * 60)
+        print(title)
+        print("=" * 60)
+
+# Configure database connection
+if Path("./dj_local_conf.json").exists():
+    dj.config.load("./dj_local_conf.json")
+    logger.info("✅ Loaded database configuration from dj_local_conf.json")
+else:
+    logger.info("⚠️  No dj_local_conf.json found, using environment variables or defaults")
+    logger.info("   Set DJ_HOST, DJ_USER, DJ_PASS environment variables if needed")
+
+# Update config from environment variables
+dj.config.update({
+    "safemode": False,
+    "database.host": os.environ.get("DJ_HOST") or dj.config.get("database.host", "localhost"),
+    "database.user": os.environ.get("DJ_USER") or dj.config.get("database.user", "root"),
+    "database.password": os.environ.get("DJ_PASS") or dj.config.get("database.password", ""),
+})
+
+# Set database prefix for tests
+if "custom" not in dj.config:
+    dj.config["custom"] = {}
+dj.config["custom"]["database.prefix"] = os.environ.get(
+    "DATABASE_PREFIX", dj.config["custom"].get("database.prefix", "test_")
+)
+
+# Set DLC root data directory if not already set
+# In Docker, prefer /app/test_videos (from project mount), otherwise /app/data
+# Check for Docker: /.dockerenv exists OR we're in /app directory (Docker working dir)
+is_docker = os.path.exists("/.dockerenv") or (os.getcwd() == "/app" and os.path.exists("/app"))
+if is_docker:
+    # Prefer /app/test_videos (from project mount .:/app) since videos are in ./test_videos
+    test_videos_path = Path("/app/test_videos")
+    if test_videos_path.exists():
+        default_video_dir = "/app/test_videos"
+    else:
+        default_video_dir = "/app/data"
+else:
+    default_video_dir = "./test_videos"
+video_dir = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir))
+# CRITICAL: Set dlc_root_data_dir in DataJoint config to match where videos actually are
+# This is used by element-deeplabcut to find video files
+if "dlc_root_data_dir" not in dj.config.get("custom", {}) or not dj.config["custom"].get("dlc_root_data_dir"):
+    dj.config["custom"]["dlc_root_data_dir"] = str(video_dir.absolute())
+    logger.info(f"📁 Set DLC_ROOT_DATA_DIR to: {video_dir.absolute()}")
+    if is_docker:
+        logger.info("🐳 Running in Docker mode")
+
+# Get the root directory for making relative paths (ensure it's absolute)
+dlc_root_dir = Path(dj.config["custom"].get("dlc_root_data_dir", str(video_dir.absolute())))
+if not dlc_root_dir.is_absolute():
+    dlc_root_dir = dlc_root_dir.resolve()
+
+logger.info(f"📊 Database: {dj.config['database.host']} (prefix: {dj.config['custom']['database.prefix']})")
+logger.info(f"📁 DLC Root: {dlc_root_dir}")
+
+from element_deeplabcut import model, train
+from tests import tutorial_pipeline as pipeline
+
+def check_database_connection():
+    """Verify database connection is working."""
+    try:
+        # Try to connect by activating a schema
+        test_schema = dj.schema("test_connection_check", create_schema=True, create_tables=False)
+        test_schema.drop()
+        return True
+    except Exception as e:
+        logger.error(f"\n❌ Database connection failed: {e}")
+        logger.error("\nPlease configure your database:")
+        logger.error("  1. Create dj_local_conf.json with database credentials")
+        logger.error("  2. Or set environment variables: DJ_HOST, DJ_USER, DJ_PASS")
+        logger.error("  3. Or ensure database is running (docker compose -f docker-compose-db.yaml up -d)")
+        return False
+
+def check_dlc_installation():
+    """Check if DeepLabCut is installed and available."""
+    try:
+        import deeplabcut
+        return True, None
+    except (ImportError, Exception) as e:
+        return False, str(e)
+
+def create_dlc_project(project_name, experimenter, video_files, project_dir=None):
+    """Create a new DLC project programmatically."""
+    import deeplabcut
+    
+    if project_dir is None:
+        project_dir = dlc_root_dir / project_name
+    
+    # Create project directory if it doesn't exist
+    project_dir.mkdir(parents=True, exist_ok=True)
+    
+    # Convert video files to absolute paths
+    video_paths = [str(Path(v).resolve()) for v in video_files]
+    
+    # Create DLC project
+    config_path = deeplabcut.create_new_project(
+        project_name,
+        experimenter,
+        video_paths,
+        working_directory=str(project_dir.parent),
+        copy_videos=False,  # Don't copy videos, just reference them
+    )
+    
+    return Path(config_path).parent  # Return project directory
+
+def create_mock_labeled_data(config_path, num_frames=20, bodyparts=None, use_existing_frames=False):
+    """
+    Create mock labeled data with images and CSV files for testing.
+
+    IMPORTANT for DLC 3.x:
+    - We ONLY create the CSV here.
+    - The DataFrame index MUST be a string path like:
+      "labeled-data/<video_name>/img000.png"
+    - We do NOT create the H5 file ourselves; DLC will call convertcsv2h5
+      and build the MultiIndex / tuples internally.
+    """
+    import pandas as pd
+    import numpy as np
+    import yaml
+    from PIL import Image
+
+    # --- Read config and basic info ---
+    with open(config_path, "r") as f:
+        config = yaml.safe_load(f)
+
+    if bodyparts is None:
+        bodyparts = config.get("bodyparts", ["nose", "tailbase", "head"])
+
+    # DLC uses "scorer" (DLC 3) or "experimenter" (older)
+    scorer = config.get("scorer") or config.get("experimenter") or "experimenter"
+
+    project_path = Path(config_path).parent
+    labeled_data_dir = project_path / "labeled-data"
+    labeled_data_dir.mkdir(parents=True, exist_ok=True)
+
+    # Choose video name
+    video_sets = config.get("video_sets", {})
+    if video_sets:
+        video_name = Path(list(video_sets.keys())[0]).stem
+    else:
+        video_name = "test_video"
+
+    video_labeled_dir = labeled_data_dir / video_name
+    video_labeled_dir.mkdir(parents=True, exist_ok=True)
+
+    # Image size
+    img_width = config.get("im_width", 640)
+    img_height = config.get("im_height", 480)
+
+    # --- Create / reuse images ---
+    existing_images = sorted(
+        list(video_labeled_dir.glob("*.png")) + list(video_labeled_dir.glob("*.jpg"))
+    )
+
+    if use_existing_frames and existing_images:
+        logger.info(f"Using {len(existing_images)} existing frame(s) extracted by DLC")
+        num_frames = min(num_frames, len(existing_images))
+        img_files = existing_images[:num_frames]
+    else:
+        img_files = []
+        for frame_idx in range(num_frames):
+            img = Image.new(
+                "RGB",
+                (img_width, img_height),
+                color=(
+                    np.random.randint(0, 255),
+                    np.random.randint(0, 255),
+                    np.random.randint(0, 255),
+                ),
+            )
+            img_path = video_labeled_dir / f"img{frame_idx:03d}.png"
+            img.save(img_path)
+            img_files.append(img_path)
+
+        logger.info(f"Created {len(img_files)} mock image files in {video_labeled_dir}")
+
+    # --- Build DataFrame in DLC format ---
+
+    # MultiIndex columns: (scorer, bodypart, coord)
+    columns = []
+    for bp in bodyparts:
+        columns.append((scorer, bp, "x"))
+        columns.append((scorer, bp, "y"))
+        columns.append((scorer, bp, "likelihood"))
+
+    data = []
+    index_strings = []
+
+    for img_path in img_files:
+        row = []
+        for bp in bodyparts:
+            x = np.random.uniform(50, img_width - 50)
+            y = np.random.uniform(50, img_height - 50)
+            likelihood = np.random.uniform(0.8, 1.0)
+            row.extend([x, y, likelihood])
+        data.append(row)
+
+        # IMPORTANT:
+        # DLC 3.x will later split this string into path components and
+        # build its own MultiIndex. Here we just give it a clean relative path.
+        rel_str = f"labeled-data/{video_name}/{img_path.name}"
+        index_strings.append(rel_str)
+
+    df = pd.DataFrame(
+        data,
+        columns=pd.MultiIndex.from_tuples(columns, names=["scorer", "bodyparts", "coords"]),
+        index=index_strings,
+    )
+
+    csv_filename = f"CollectedData_{scorer}.csv"
+    csv_path = video_labeled_dir / csv_filename
+
+    # Save CSV with index: index contains the relative image path as string
+    df.to_csv(csv_path, index=True)
+    logger.info(f"Created CSV file: {csv_path}")
+
+    # DO NOT create .h5 here. Let DLC handle convertcsv2h5 internally.
+    # If an old .h5 exists from previous runs, it can confuse DLC, so we remove it:
+    h5_path = video_labeled_dir / csv_filename.replace(".csv", ".h5")
+    if h5_path.exists():
+        logger.info(f"Removing old H5 file (will be regenerated by DLC): {h5_path}")
+        h5_path.unlink()
+
+    # Sanity checks
+    if not csv_path.exists():
+        raise FileNotFoundError(f"Failed to create CSV file: {csv_path}")
+
+    final_imgs = list(video_labeled_dir.glob("img*.png"))
+    if len(final_imgs) == 0:
+        raise FileNotFoundError(
+            f"No image files found in {video_labeled_dir} after mock data creation."
+        )
+
+    logger.info(f"Created mock labeled data: {csv_path}")
+    logger.info(f"  - Directory: {video_labeled_dir}")
+    logger.info(f"  - {len(final_imgs)} frames")
+    logger.info(f"  - {len(bodyparts)} body parts: {bodyparts}")
+    logger.info(f"  - Scorer: {scorer}")
+    logger.info(f"  - Video name: {video_name}")
+
+    return csv_path
+
+def main():
+    training_was_mocked = False
+    status = StatusPrinter(total_steps=12)
+    status.header("Testing Trained Model Workflow (Training + Inference)")
+    
+    # Parse arguments
+    parser = argparse.ArgumentParser(
+        description="Test trained DeepLabCut workflow with video files",
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+    )
+    parser.add_argument(
+        "dlc_project",
+        nargs="?",
+        default=None,
+        help="Path to DLC project directory or config.yaml file"
+    )
+    parser.add_argument(
+        "--skip-training",
+        action="store_true",
+        help="Skip training step and use existing trained model"
+    )
+    parser.add_argument(
+        "--skip-inference",
+        action="store_true",
+        help="Skip inference step (only train the model)"
+    )
+    parser.add_argument(
+        "--model-name",
+        default="test_trained_model",
+        help="Name for the trained model (default: test_trained_model)"
+    )
+    
+    args = parser.parse_args()
+    
+    # 0. Check database connection
+    status.step("Checking database connection")
+    if not check_database_connection():
+        sys.exit(1)
+    status.sub("Database connection successful", indent=3)
+    
+    # 0.5. Clean up database (remove test data from previous runs)
+    status.step("Cleaning up database (removing test data from previous runs)")
+    cleanup_count = 0
+    
+    # Delete PoseEstimation entries (and their parts)
+    pose_estimation_query = pipeline.model.PoseEstimation
+    if pose_estimation_query:
+        keys = pose_estimation_query.fetch("KEY")
+        count = len(keys) if keys else 0
+        if count > 0:
+            pose_estimation_query.delete()
+            cleanup_count += count
+            status.sub(f"Deleted {count} PoseEstimation entry/entries", icon="🗑️", indent=3)
+    
+    # Delete PoseEstimationTask entries
+    task_query = pipeline.model.PoseEstimationTask
+    if task_query:
+        keys = task_query.fetch("KEY")
+        count = len(keys) if keys else 0
+        if count > 0:
+            task_query.delete()
+            cleanup_count += count
+            status.sub(f"Deleted {count} PoseEstimationTask entry/entries", icon="🗑️", indent=3)
+    
+    # Delete test models (models with names starting with "test_")
+    test_models = model.Model & "model_name LIKE 'test_%'"
+    if test_models:
+        keys = test_models.fetch("KEY")
+        count = len(keys) if keys else 0
+        if count > 0:
+            test_models.delete()
+            cleanup_count += count
+            status.sub(f"Deleted {count} test model(s)", icon="🗑️", indent=3)
+    
+    # Delete test training tasks (optional - comment out if you want to keep training history)
+    if pipeline.train.ModelTraining:
+        training_query = pipeline.train.ModelTraining
+        keys = training_query.fetch("KEY")
+        count = len(keys) if keys else 0
+        if count > 0:
+            training_query.delete()
+            cleanup_count += count
+            status.sub(f"Deleted {count} ModelTraining entry/entries", icon="🗑️", indent=3)
+    
+    if cleanup_count > 0:
+        status.sub(f"Total: {cleanup_count} entry/entries cleaned", icon="✅", indent=3)
+    else:
+        status.sub("No test data found to clean", icon="ℹ️", indent=3)
+    
+    # 1. Check DeepLabCut installation
+    status.step("Checking DeepLabCut installation")
+    dlc_available, dlc_error = check_dlc_installation()
+    if not dlc_available:
+        status.sub(f"DeepLabCut is not installed or not importable: {dlc_error}", icon="❌", indent=3)
+        status.sub("Install with: pip install 'deeplabcut[superanimal]'", indent=5)
+        sys.exit(1)
+    else:
+        import deeplabcut
+        status.sub(f"DeepLabCut is available (version {deeplabcut.__version__})", icon="✅", indent=3)
+    
+    # 2. Create or find DLC project
+    status.step("Creating DLC project")
+    
+    # Find video files for project creation (use first available video or create dummy)
+    # In Docker, check /app/test_videos (from project mount) first, then /app/data
+    is_docker = os.path.exists("/.dockerenv") or (os.getcwd() == "/app" and os.path.exists("/app"))
+    if is_docker:
+        # Prefer /app/test_videos (from project mount .:/app)
+        test_videos_path = Path("/app/test_videos")
+        if test_videos_path.exists():
+            default_video_dir = "/app/test_videos"
+        else:
+            default_video_dir = "/app/data"
+    else:
+        default_video_dir = "./test_videos"
+    video_dir = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir))
+    video_files = list(video_dir.glob("*.mp4")) + list(video_dir.glob("*.avi")) + list(video_dir.glob("*.mov"))
+    
+    if not video_files:
+        # Create a dummy video file path (DLC will handle missing videos gracefully)
+        video_files = [str(video_dir / "dummy_video.mp4")]
+        status.sub("No videos found - will create project with dummy video path", icon="⚠️", indent=3)
+        status.sub("(You can add real videos later)", icon="ℹ️", indent=5)
+    
+    # Create project name
+    project_name = f"test_training_project_{args.model_name}"
+    experimenter = "test_experimenter"
+    
+    # Check if project already exists
+    project_dir = dlc_root_dir / project_name
+    config_file = project_dir / "config.yaml"
+    
+    if config_file.exists() and not args.skip_training:
+        status.sub(f"Project already exists: {project_dir}", icon="ℹ️", indent=3)
+        status.sub("Using existing project (delete it to recreate)", icon="ℹ️", indent=5)
+        dlc_project_path = project_dir
+    else:
+        # Create new project
+        status.sub(f"Creating new DLC project: {project_name}", icon="ℹ️", indent=3)
+        try:
+            dlc_project_path = create_dlc_project(
+                project_name,
+                experimenter,
+                video_files[:1],  # Use first video for project creation
+                project_dir=project_dir
+            )
+            status.sub(f"Project created: {dlc_project_path}", icon="✅", indent=5)
+        except Exception as e:
+            status.sub(f"Error creating project: {e}", icon="❌", indent=3)
+            raise
+    
+    config_file = dlc_project_path / "config.yaml"
+    if not config_file.exists():
+        status.sub(f"Config file not found: {config_file}", icon="❌", indent=3)
+        sys.exit(1)
+    
+    # Make path relative to dlc_root_dir
+    try:
+        dlc_project_rel = Path(dlc_project_path).relative_to(dlc_root_dir)
+    except ValueError:
+        dlc_project_rel = Path(dlc_project_path)
+        status.sub("Warning: Project path not under DLC_ROOT_DATA_DIR, using absolute path", icon="⚠️", indent=3)
+    
+    config_file_rel = dlc_project_rel / "config.yaml"
+    status.sub(f"Project path: {dlc_project_path}", icon="✅", indent=3)
+    status.sub(f"Config file: {config_file_rel}", icon="ℹ️", indent=5)
+    
+    # 3. Create mock labeled data (skip manual labeling)
+    if not args.skip_training:
+        status.step("Creating mock labeled data")
+        labeled_data_dir = dlc_project_path / "labeled-data"
+        
+        # Check if labeled data already exists
+        if labeled_data_dir.exists() and any(labeled_data_dir.iterdir()):
+            status.sub("Labeled data already exists, skipping mock data creation", icon="ℹ️", indent=3)
+        else:
+            import yaml
+            with open(config_file, 'r') as f:
+                config = yaml.safe_load(f)
+            
+            bodyparts = config.get("bodyparts", ["nose", "tailbase", "head"])
+            status.sub(f"Creating mock labeled data with {len(bodyparts)} body parts", icon="ℹ️", indent=3)
+            status.sub(f"Body parts: {bodyparts}", icon="ℹ️", indent=5)
+            
+            try:
+                create_mock_labeled_data(config_file, num_frames=20, bodyparts=bodyparts)
+                status.sub("Mock labeled data created successfully", icon="✅", indent=3)
+            except Exception as e:
+                status.sub(f"Error creating mock labeled data: {e}", icon="❌", indent=3)
+                raise
+    
+    # 4. Setup test data (subject, session, recordings)
+    status.step("Setting up test data")
+    base_key = {
+        "subject": "test1",
+        "session_datetime": "2024-01-01 12:00:00",
+    }
+    
+    pipeline.subject.Subject.insert1({
+        "subject": "test1",
+        "sex": "F",
+        "subject_birth_date": "2020-01-01",
+        "subject_description": "Test subject for trained model workflow",
+    }, skip_duplicates=True)
+    
+    pipeline.session.Session.insert1({
+        "subject": "test1",
+        "session_datetime": "2024-01-01 12:00:00",
+    }, skip_duplicates=True)
+    
+    # Find video files for inference (reuse from earlier or find again)
+    if not video_files:
+        video_files = list(video_dir.glob("*.mp4")) + list(video_dir.glob("*.avi")) + list(video_dir.glob("*.mov"))
+    elif video_files and len(video_files) > 0:
+        first_video = str(video_files[0])
+        if "dummy_video.mp4" in first_video:
+            video_files = list(video_dir.glob("*.mp4")) + list(video_dir.glob("*.avi")) + list(video_dir.glob("*.mov"))
+    
+    if not video_files and not args.skip_inference:
+        status.sub(f"No video files found in {video_dir}", icon="⚠️", indent=3)
+        status.sub("Supported formats: .mp4, .avi, .mov", icon="ℹ️", indent=3)
+        status.sub("Set DLC_ROOT_DATA_DIR environment variable to point to video directory", indent=3)
+        if args.skip_training:
+            sys.exit(1)
+        else:
+            status.sub("Continuing with training only (no inference videos)", icon="ℹ️", indent=3)
+    
+    # Create recordings for inference videos
+    recording_keys = []
+    if video_files:
+        for idx, video_file in enumerate(video_files):
+            recording_key = {
+                **base_key,
+                "recording_id": idx + 1,
+            }
+            recording_keys.append(recording_key)
+            
+            pipeline.model.VideoRecording.insert1(
+                {**recording_key, "device": "Camera1"}, skip_duplicates=True
+            )
+            
+            video_file_abs = Path(video_file).resolve()
+            try:
+                relative_path = video_file_abs.relative_to(dlc_root_dir)
+            except ValueError:
+                relative_path = Path(video_file.name)
+            
+            pipeline.model.VideoRecording.File.insert1(
+                {**recording_key, "file_id": 0, "file_path": str(relative_path)},
+                skip_duplicates=True,
+            )
+            status.sub(f"Created recording {recording_key['recording_id']} for {video_file_abs.name}", icon="✅", indent=5)
+    
+    status.sub(f"Created {len(recording_keys)} recording(s) for inference", icon="✅", indent=3)
+    
+    # 5. Extract video metadata (if videos exist)
+    if recording_keys:
+        status.step("Extracting video metadata")
+        try:
+            pipeline.model.RecordingInfo.populate()
+            for rec_key in recording_keys:
+                rec_info = (pipeline.model.RecordingInfo & rec_key).fetch1()
+                status.sub(
+                    f"Recording {rec_key['recording_id']}: {rec_info['px_width']}x{rec_info['px_height']}, "
+                    f"{rec_info['nframes']} frames, {rec_info['fps']:.1f} fps",
+                    icon="✅",
+                    indent=5
+                )
+        except ModuleNotFoundError as e:
+            if "cv2" in str(e):
+                status.sub("OpenCV (cv2) is required for video metadata extraction", icon="⚠️", indent=3)
+                status.sub("Install with: pip install opencv-python", indent=5)
+            else:
+                raise
+    
+    # 6. Training workflow (if not skipped)
+    model_name = args.model_name
+    
+    if not args.skip_training:
+        status.step("Setting up training workflow")
+        
+        # Check if training has already been done
+        if model.Model & {"model_name": model_name}:
+            status.sub(f"Model '{model_name}' already exists", icon="ℹ️", indent=3)
+            status.sub("Use --skip-training to use existing model, or choose different --model-name", indent=5)
+            if not args.skip_inference:
+                status.sub("Skipping training, proceeding to inference...", icon="⏭️", indent=3)
+                args.skip_training = True
+        else:
+            import yaml
+            with open(config_file, 'r') as f:
+                dlc_config = yaml.safe_load(f)
+            
+            # CRITICAL: Truncate Task field early to fit varchar(32) constraint
+            # This must happen BEFORE creating training datasets or model folders
+            # to ensure consistency throughout the process
+            if "Task" in dlc_config and len(dlc_config["Task"]) > 32:
+                original_task = dlc_config["Task"]
+                dlc_config["Task"] = original_task[:32]
+                status.sub(f"Truncated Task field from {len(original_task)} to 32 chars: '{dlc_config['Task']}'", icon="ℹ️", indent=3)
+                # Update the config file immediately to persist the change
+                with open(config_file, 'w') as f:
+                    yaml.dump(dlc_config, f, default_flow_style=False)
+                status.sub("Config file updated with truncated Task", icon="✅", indent=5)
+            
+            # Check if project has labeled data
+            labeled_data_dir = dlc_project_path / "labeled-data"
+            
+            # CRITICAL: Remove old H5 files - they may be in wrong format
+            # DLC will regenerate them from CSV during create_training_dataset
+            old_h5_files = list(labeled_data_dir.rglob("*.h5")) if labeled_data_dir.exists() else []
+            if old_h5_files:
+                status.sub(f"Removing {len(old_h5_files)} old H5 file(s) (will be regenerated by DLC)", icon="⚠️", indent=3)
+                for h5_file in old_h5_files:
+                    h5_file.unlink()
+                status.sub("Old H5 files removed", icon="✅", indent=5)
+            
+            labeled_files = (
+                list(labeled_data_dir.rglob("*.csv"))
+                if labeled_data_dir.exists()
+                else []
+            )
+            
+            if len(labeled_files) == 0:
+                status.sub("No labeled data found - creating mock labeled data", icon="⚠️", indent=3)
+                try:
+                    csv_path = create_mock_labeled_data(config_file, num_frames=20, use_existing_frames=False)
+                    status.sub(f"Mock labeled data created: {csv_path}", icon="✅", indent=5)
+                    labeled_files = list(labeled_data_dir.rglob("*.csv"))
+                    img_files = (
+                        list(labeled_data_dir.rglob("*.png"))
+                        + list(labeled_data_dir.rglob("*.jpg"))
+                    )
+                    if len(labeled_files) == 0:
+                        raise ValueError("Failed to create labeled data files")
+                    status.sub(
+                        f"Verified {len(labeled_files)} CSV file(s) and {len(img_files)} image file(s)",
+                        icon="✅",
+                        indent=5,
+                    )
+                except Exception as e:
+                    status.sub(f"Error creating mock labeled data: {e}", icon="❌", indent=3)
+                    import traceback
+                    status.sub(traceback.format_exc(), indent=5)
+                    raise
+            else:
+                status.sub(f"Found {len(labeled_files)} existing CSV file(s) (H5 will be generated by DLC)", icon="ℹ️", indent=3)
+            
+            # Remove old training artifacts
+            training_datasets_dir = dlc_project_path / "training-datasets"
+            if training_datasets_dir.exists():
+                status.sub("Training dataset exists; deleting to regenerate with current DLC...", icon="⚠️", indent=3)
+                import shutil
+                shutil.rmtree(training_datasets_dir)
+                status.sub("Deleted old training-datasets directory", icon="✅", indent=5)
+            
+            dlc_models_dir = dlc_project_path / "dlc-models"
+            if dlc_models_dir.exists():
+                status.sub("Cleaning up old dlc-models directory...", icon="ℹ️", indent=5)
+                import shutil
+                shutil.rmtree(dlc_models_dir)
+                status.sub("Deleted old dlc-models directory", icon="✅", indent=5)
+            
+            dlc_models_pytorch_dir = dlc_project_path / "dlc-models-pytorch"
+            if dlc_models_pytorch_dir.exists():
+                status.sub("Cleaning up old dlc-models-pytorch directory...", icon="ℹ️", indent=5)
+                import shutil
+                shutil.rmtree(dlc_models_pytorch_dir)
+                status.sub("Deleted old dlc-models-pytorch directory", icon="✅", indent=5)
+            
+            # Simple training parameters
+            shuffle = 1
+            trainingsetindex = 0
+            
+            status.sub("Creating training dataset with deeplabcut.create_training_dataset", icon="ℹ️", indent=3)
+            import yaml
+            with open(config_file, 'r') as f:
+                create_config = yaml.safe_load(f)
+            
+            # Ensure engine is pytorch in config
+            old_engine = create_config.get("engine", "not set")
+            create_config["engine"] = "pytorch"
+            with open(config_file, 'w') as f:
+                yaml.dump(create_config, f, default_flow_style=False)
+            
+            status.sub(
+                f"Config updated: engine={create_config.get('engine')} (was {old_engine})",
+                icon="ℹ️",
+                indent=5,
+            )
+            
+            try:
+                import deeplabcut
+                dlc_version = deeplabcut.__version__
+                status.sub(f"Using DLC version: {dlc_version}", icon="ℹ️", indent=5)
+                
+                # CRITICAL: Convert CSV to H5 first (DLC expects H5 files)
+                status.sub("Converting CSV to H5 format...", icon="ℹ️", indent=5)
+                try:
+                    # Use convertcsv2h5 with userfeedback=False to avoid prompts
+                    deeplabcut.convertcsv2h5(str(config_file), userfeedback=False)
+                    
+                    # CRITICAL WORKAROUND for DLC 3.x bug:
+                    # format_training_data tries to reshape ALL values (including likelihood) into (x, y) pairs
+                    # This causes an error. We need to create a temporary H5 with only x, y columns
+                    # for training dataset creation, then restore the full version.
+                    import pandas as pd
+                    labeled_data_dir = Path(config_file).parent / "labeled-data"
+                    h5_files = list(labeled_data_dir.rglob("CollectedData_*.h5"))
+                    
+                    for h5_file in h5_files:
+                        df = pd.read_hdf(h5_file, key="df_with_missing")
+                        
+                        # Fix 1: If index is tuples, convert to strings
+                        if isinstance(df.index, pd.MultiIndex) or (len(df.index) > 0 and isinstance(df.index[0], tuple)):
+                            df.index = ['/'.join(str(x) for x in idx) if isinstance(idx, tuple) else str(idx) 
+                                       for idx in df.index]
+                        
+                        # WORKAROUND: Create a backup of the full file, then create x, y only version
+                        h5_file_backup = h5_file.parent / f"{h5_file.stem}_full_backup.h5"
+                        df.to_hdf(h5_file_backup, key="df_with_missing", mode="w", format="table")
+                        
+                        # Create x, y only version for format_training_data
+                        if isinstance(df.columns, pd.MultiIndex):
+                            xy_cols = [col for col in df.columns if col[2] in ['x', 'y']]
+                            if len(xy_cols) > 0:
+                                df_xy = df[xy_cols].copy()
+                                # Overwrite the main file with x, y only version
+                                df_xy.to_hdf(h5_file, key="df_with_missing", mode="w", format="table")
+                                status.sub(f"Created x, y only version for training dataset: {h5_file.name}", icon="✅", indent=7)
+                    
+                    status.sub("CSV converted to H5 successfully (x, y only for training dataset)", icon="✅", indent=7)
+                except Exception as e:
+                    # If convertcsv2h5 fails, try to manually create H5 from CSV
+                    status.sub(f"convertcsv2h5 failed: {e}", icon="⚠️", indent=7)
+                    status.sub("Attempting manual CSV to H5 conversion...", icon="ℹ️", indent=7)
+                    try:
+                        import pandas as pd
+                        import yaml
+                        
+                        # Read config
+                        with open(config_file, 'r') as f:
+                            cfg = yaml.safe_load(f)
+                        
+                        # Find CSV files
+                        labeled_data_dir = Path(config_file).parent / "labeled-data"
+                        csv_files = list(labeled_data_dir.rglob("CollectedData_*.csv"))
+                        
+                        for csv_file in csv_files:
+                            # Read CSV - DLC CSV has 3 header rows
+                            # First read to get the structure
+                            df_temp = pd.read_csv(csv_file, nrows=0)
+                            
+                            # Read full CSV with MultiIndex
+                            df = pd.read_csv(csv_file, index_col=0, header=[0, 1, 2])
+                            
+                            # CRITICAL: Fix column names - pandas may have used first values as names
+                            # We need to ensure names are ["scorer", "bodyparts", "coords"]
+                            if isinstance(df.columns, pd.MultiIndex):
+                                # Get the actual level names (may be wrong)
+                                level_names = list(df.columns.names)
+                                
+                                # If names are wrong (e.g., using first values), fix them
+                                if level_names != ["scorer", "bodyparts", "coords"]:
+                                    # Reconstruct with correct names
+                                    new_columns = []
+                                    for col_tuple in df.columns:
+                                        new_columns.append(col_tuple)
+                                    df.columns = pd.MultiIndex.from_tuples(new_columns, names=["scorer", "bodyparts", "coords"])
+                            else:
+                                raise ValueError(f"Expected MultiIndex columns, got {type(df.columns)}")
+                            
+                            # Ensure index is string paths (not numeric or tuples)
+                            if not all(isinstance(idx, str) for idx in df.index):
+                                # Convert index to strings
+                                df.index = [str(idx) for idx in df.index]
+                            
+                            # Save as H5 with proper format
+                            h5_file = csv_file.with_suffix('.h5')
+                            df.to_hdf(h5_file, key="df_with_missing", mode="w", format="table")
+                            status.sub(f"Created {h5_file.name} with correct MultiIndex structure", icon="✅", indent=9)
+                        
+                        status.sub("Manual CSV to H5 conversion completed", icon="✅", indent=7)
+                    except Exception as e2:
+                        status.sub(f"Manual conversion also failed: {e2}", icon="⚠️", indent=7)
+                        import traceback
+                        status.sub(traceback.format_exc(), indent=9)
+                        status.sub("Continuing - DLC may handle conversion internally", icon="ℹ️", indent=7)
+                
+                status.sub("Calling deeplabcut.create_training_dataset(..., num_shuffles=1)", icon="ℹ️", indent=5)
+                
+                # Let DLC 3 create .mat, metadata, and model config
+                deeplabcut.create_training_dataset(str(config_file), num_shuffles=1)
+                status.sub("Training dataset created successfully by DLC", icon="✅", indent=5)
+                
+                # Restore full H5 files (with likelihood) from backup after training dataset creation
+                import pandas as pd
+                labeled_data_dir = Path(config_file).parent / "labeled-data"
+                backup_files = list(labeled_data_dir.rglob("*_full_backup.h5"))
+                for backup_file in backup_files:
+                    original_file = backup_file.parent / backup_file.name.replace("_full_backup.h5", ".h5")
+                    if original_file.exists():
+                        df_full = pd.read_hdf(backup_file, key="df_with_missing")
+                        df_full.to_hdf(original_file, key="df_with_missing", mode="w", format="table")
+                        backup_file.unlink()  # Remove backup
+                        status.sub(f"Restored full H5 file (with likelihood): {original_file.name}", icon="✅", indent=7)
+                
+                # Quick sanity check: metadata.yaml should exist
+                metadata_files = list(training_datasets_dir.rglob("metadata.yaml"))
+                if not metadata_files:
+                    raise FileNotFoundError(
+                        "Training dataset metadata file not found after create_training_dataset"
+                    )
+                status.sub(f"Found metadata file: {metadata_files[0]}", icon="ℹ️", indent=5)
+            
+            except Exception as e:
+                error_str = str(e)
+                # Check if this is the known DLC 3.x bug with format_training_data
+                if "all the input array dimensions" in error_str and "size 4" in error_str and "size 6" in error_str:
+                    status.sub("Known DLC 3.x bug detected in format_training_data", icon="⚠️", indent=3)
+                    status.sub("This is a bug in DLC 3.x where format_training_data tries to reshape", indent=5)
+                    status.sub("all values (including likelihood) into (x, y) pairs.", indent=5)
+                    status.sub("", indent=5)
+                    status.sub("Workaround: Creating training dataset manually...", icon="ℹ️", indent=5)
+                    try:
+                        # Try to work around by using DLC's internal functions differently
+                        # or by creating a minimal training dataset structure
+                        from deeplabcut.generate_training_dataset.trainingsetmanipulation import merge_annotateddatasets
+                        import pandas as pd
+                        
+                        # Read the H5 file
+                        labeled_data_dir = Path(config_file).parent / "labeled-data"
+                        h5_files = list(labeled_data_dir.rglob("CollectedData_*.h5"))
+                        if h5_files:
+                            df = pd.read_hdf(h5_files[0], key="df_with_missing")
+                            # Select only x and y columns for training dataset
+                            xy_cols = [col for col in df.columns if col[2] in ['x', 'y']]
+                            df_xy = df[xy_cols].copy()
+                            
+                            status.sub("This workaround is not yet implemented.", icon="⚠️", indent=7)
+                            status.sub("Please report this bug to DeepLabCut:", indent=7)
+                            status.sub("https://github.com/DeepLabCut/DeepLabCut/issues", indent=7)
+                            status.sub("", indent=5)
+                            status.sub("Alternative: Use DLC 2.x (TensorFlow) for training,", indent=5)
+                            status.sub("or wait for DLC 3.x to fix this issue.", indent=5)
+                    except Exception as e2:
+                        pass
+                
+                status.sub(f"Error creating training dataset: {e}", icon="❌", indent=3)
+                import traceback
+                status.sub(traceback.format_exc(), indent=5)
+                status.sub(
+                    "This appears to be a bug in DLC 3.x's format_training_data function.",
+                    indent=5,
+                )
+                status.sub(
+                    "The function tries to reshape all values (including likelihood) into (x, y) pairs,",
+                    indent=5,
+                )
+                status.sub(
+                    "but should only reshape x and y values.",
+                    indent=5,
+                )
+                sys.exit(1)
+            
+            # Ensure VideoSet exists
+            video_set_key = {"video_set_id": 1}
+            if not (train.VideoSet & video_set_key):
+                train.VideoSet.insert1(video_set_key, skip_duplicates=True)
+            
+            # TrainingParamSet
+            paramset_key = {"paramset_idx": 0}
+            if not (train.TrainingParamSet & paramset_key):
+                default_params = {
+                    "shuffle": shuffle,
+                    "trainingsetindex": trainingsetindex,
+                    "maxiters": dlc_config.get("maxiters", 5000),
+                    "displayiters": dlc_config.get("displayiters", 100),
+                    "saveiters": dlc_config.get("saveiters", 1000),
+                }
+                train.TrainingParamSet.insert_new_params(
+                    paramset_desc="Default training parameters",
+                    params=default_params,
+                    paramset_idx=0,
+                )
+            
+            # TrainingTask
+            training_id = 1
+            training_task_key = {**video_set_key, **paramset_key, "training_id": training_id}
+            
+            # Delete old training task if it exists with wrong project path
+            if train.TrainingTask & training_task_key:
+                old_task = (train.TrainingTask & training_task_key).fetch1()
+                if old_task["project_path"] != str(dlc_project_rel):
+                    status.sub(f"Deleting old training task with wrong project path: {old_task['project_path']}", icon="⚠️", indent=3)
+                    (train.TrainingTask & training_task_key).delete()
+                    status.sub("Old training task deleted", icon="✅", indent=5)
+            
+            if not (train.TrainingTask & training_task_key):
+                train.TrainingTask.insert1(
+                    {
+                        **training_task_key,
+                        "model_prefix": "",
+                        "project_path": str(dlc_project_rel),
+                    },
+                    skip_duplicates=True,
+                )
+                status.sub("Created training task", icon="✅", indent=3)
+            else:
+                status.sub("Training task already exists with correct project path", icon="ℹ️", indent=3)
+            
+            # 7. Train the model (mocked for functional test)
+            status.step("Training the model (mocked)")
+            status.sub("Training is mocked for this functional test", icon="ℹ️", indent=3)
+            status.sub("No actual model training will occur", icon="ℹ️", indent=3)
+            
+            training_was_mocked = True
+            
+            def create_mock_pytorch_config(config_path, project_path, dlc_config):
+                """Create a mock pytorch_config.yaml file for inference."""
+                import yaml
+                
+                # Get bodyparts and other metadata from dlc_config
+                bodyparts = dlc_config.get("bodyparts", ["bodypart1", "bodypart2", "bodypart3"])
+                unique_bodyparts = dlc_config.get("uniquebodyparts", [])
+                individuals = dlc_config.get("individuals", [])
+                multianimal = dlc_config.get("multianimalproject", False)
+                
+                # Create minimal but valid pytorch_config.yaml
+                pytorch_config = {
+                    "data": {
+                        "bbox_margin": 20,
+                        "colormode": "RGB",
+                        "inference": {
+                            "normalize_images": True
+                        },
+                        "train": {
+                            "affine": {
+                                "p": 0.5,
+                                "rotation": 30,
+                                "scaling": [0.5, 1.25],
+                                "translation": 0
+                            },
+                            "crop_sampling": {
+                                "width": 448,
+                                "height": 448,
+                                "max_shift": 0.1,
+                                "method": "hybrid"
+                            },
+                            "gaussian_noise": 12.75,
+                            "motion_blur": True,
+                            "normalize_images": True
+                        }
+                    },
+                    "device": "auto",
+                    "inference": {
+                        "multithreading": {
+                            "enabled": True,
+                            "queue_length": 4,
+                            "timeout": 30.0
+                        },
+                        "compile": {
+                            "enabled": False,
+                            "backend": "inductor"
+                        },
+                        "autocast": {
+                            "enabled": False
+                        }
+                    },
+                    "metadata": {
+                        "project_path": str(project_path),
+                        "pose_config_path": str(config_path),
+                        "bodyparts": bodyparts,
+                        "unique_bodyparts": unique_bodyparts,
+                        "individuals": individuals if multianimal else [],
+                        "with_identity": multianimal
+                    },
+                    "method": "bu",
+                    "model": {
+                        "backbone": {
+                            "type": "ResNet",
+                            "model_name": "resnet50_gn",
+                            "output_stride": 16,
+                            "freeze_bn_stats": False,
+                            "freeze_bn_weights": False
+                        },
+                        "backbone_output_channels": 2048,
+                        "heads": {
+                            "bodypart": {
+                                "type": "HeatmapHead",
+                                "weight_init": "normal",
+                                "predictor": {
+                                    "type": "HeatmapPredictor",
+                                    "apply_sigmoid": False,
+                                    "clip_scores": True,
+                                    "location_refinement": True,
+                                    "locref_std": 7.2801
+                                },
+                                "target_generator": {
+                                    "type": "HeatmapGaussianGenerator",
+                                    "num_heatmaps": len(bodyparts),
+                                    "pos_dist_thresh": 17,
+                                    "heatmap_mode": "KEYPOINT",
+                                    "gradient_masking": False,
+                                    "generate_locref": True,
+                                    "locref_std": 7.2801
+                                },
+                                "criterion": {
+                                    "heatmap": {
+                                        "type": "WeightedMSECriterion",
+                                        "weight": 1.0
+                                    },
+                                    "locref": {
+                                        "type": "WeightedHuberCriterion",
+                                        "weight": 0.05
+                                    }
+                                },
+                                "heatmap_config": {
+                                    "channels": [2048, len(bodyparts)],
+                                    "kernel_size": [3],
+                                    "strides": [2]
+                                },
+                                "locref_config": {
+                                    "channels": [2048, len(bodyparts) * 2],
+                                    "kernel_size": [3],
+                                    "strides": [2]
+                                }
+                            }
+                        }
+                    },
+                    "net_type": "resnet_50",
+                    "runner": {
+                        "type": "PoseTrainingRunner",
+                        "gpus": [],
+                        "key_metric": "test.mAP",
+                        "key_metric_asc": True,
+                        "eval_interval": 10,
+                        "optimizer": {
+                            "type": "AdamW",
+                            "params": {
+                                "lr": 0.0005
+                            }
+                        },
+                        "scheduler": {
+                            "type": "LRListScheduler",
+                            "params": {
+                                "lr_list": [[0.0001], [1e-05]],
+                                "milestones": [90, 120]
+                            }
+                        },
+                        "snapshots": {
+                            "max_snapshots": 5,
+                            "save_epochs": 25,
+                            "save_optimizer_state": False
+                        }
+                    },
+                    "train_settings": {
+                        "batch_size": 8,
+                        "dataloader_workers": 0,
+                        "dataloader_pin_memory": False,
+                        "display_iters": 500,
+                        "epochs": 200,
+                        "seed": 42
+                    }
+                }
+                
+                # Write the config file
+                with open(config_path, "w") as f:
+                    yaml.dump(pytorch_config, f, default_flow_style=False, sort_keys=False)
+            
+            try:
+                # Store original make method
+                original_make = pipeline.train.ModelTraining.make
+                
+                def mocked_make(self, key):
+                    """Mocked make() that skips training but creates snapshot file."""
+                    from pathlib import Path
+                    import yaml
+                    from element_interface.utils import find_full_path
+                    from element_deeplabcut.train import get_dlc_root_data_dir, TrainingTask, TrainingParamSet
+                    from element_deeplabcut.readers import dlc_reader
+                    
+                    # Get project path and config (same as original make())
+                    project_path, model_prefix = (TrainingTask & key).fetch1(
+                        "project_path", "model_prefix"
+                    )
+                    project_path = find_full_path(get_dlc_root_data_dir(), project_path)
+                    project_path = Path(project_path)
+                    if project_path.is_file():
+                        project_path = project_path.parent
+                    
+                    # Read config
+                    _, dlc_config = dlc_reader.read_yaml(project_path)
+                    training_params = (TrainingParamSet & key).fetch1("params")
+                    shuffle = training_params.get("shuffle", dlc_config.get("shuffle", 1))
+                    trainingsetindex = training_params.get("trainingsetindex", dlc_config.get("trainingsetindex", 0))
+                    
+                    # Update config (simplified version of original make())
+                    dlc_config["shuffle"] = int(shuffle)
+                    dlc_config["trainingsetindex"] = int(trainingsetindex)
+                    train_fraction = dlc_config["TrainingFraction"][int(trainingsetindex)]
+                    dlc_config["train_fraction"] = train_fraction
+                    dlc_config["project_path"] = project_path.as_posix()
+                    dlc_config["modelprefix"] = model_prefix
+                    
+                    # Determine model folder and create snapshot
+                    try:
+                        from deeplabcut.utils.auxiliaryfunctions import get_model_folder
+                    except ImportError:
+                        from deeplabcut.utils.auxiliaryfunctions import GetModelFolder as get_model_folder
+                    
+                    model_folder = get_model_folder(
+                        trainFraction=train_fraction,
+                        shuffle=int(shuffle),
+                        cfg=dlc_config,
+                        modelprefix=model_prefix,
+                    )
+                    
+                    # For DLC 3.x PyTorch, the folder should be under dlc-models-pytorch, not dlc-models
+                    # get_model_folder might return a path with dlc-models, so we need to adjust it
+                    engine = dlc_config.get("engine", "pytorch")
+                    model_folder_str = str(model_folder)
+                    
+                    if engine == "pytorch":
+                        # For PyTorch, ensure we're using dlc-models-pytorch instead of dlc-models
+                        # Replace any occurrence of dlc-models with dlc-models-pytorch
+                        if "dlc-models-pytorch" not in model_folder_str:
+                            model_folder_str = model_folder_str.replace("dlc-models", "dlc-models-pytorch")
+                        model_folder = model_folder_str
+                    
+                    # Ensure model_folder is a Path object and construct train folder path
+                    if isinstance(model_folder, str):
+                        model_folder_path = Path(model_folder)
+                    else:
+                        model_folder_path = Path(model_folder)
+                    
+                    # Construct absolute path to train folder
+                    if model_folder_path.is_absolute():
+                        model_train_folder = model_folder_path / "train"
+                    else:
+                        model_train_folder = project_path / model_folder_path / "train"
+                    
+                    model_train_folder = model_train_folder.resolve()
+                    model_train_folder.mkdir(parents=True, exist_ok=True)
+                    
+                    # Log the absolute path for debugging
+                    logger.info(f"Model train folder (absolute): {model_train_folder}")
+                    
+                    # Log the path for debugging
+                    logger.info(f"Creating mock snapshots in: {model_train_folder}")
+                    logger.info(f"Model train folder exists: {model_train_folder.exists()}")
+                    
+                    # Create fake snapshot file (DLC looks for snapshot*.index files)
+                    # Use a snapshot number that matches saveiters (typically 1000)
+                    snapshot_num = 1000  # Common snapshot number
+                    snapshot_file = model_train_folder / f"snapshot-{snapshot_num}.index"
+                    snapshot_file.touch()
+                    logger.info(f"Created: {snapshot_file} (exists: {snapshot_file.exists()})")
+                    
+                    # Also create the corresponding .data and .meta files that DLC might expect
+                    snapshot_data = model_train_folder / f"snapshot-{snapshot_num}.data-00000-of-00001"
+                    snapshot_data.touch()
+                    logger.info(f"Created: {snapshot_data} (exists: {snapshot_data.exists()})")
+                    
+                    snapshot_meta = model_train_folder / f"snapshot-{snapshot_num}.meta"
+                    snapshot_meta.touch()
+                    logger.info(f"Created: {snapshot_meta} (exists: {snapshot_meta.exists()})")
+                    
+                    # For PyTorch, DLC's get_model_snapshots looks for .pth files
+                    # Create a minimal valid PyTorch checkpoint file
+                    if engine == "pytorch":
+                        try:
+                            import torch
+                            snapshot_pth = model_train_folder / f"snapshot-{snapshot_num}.pth"
+                            # Create a minimal PyTorch checkpoint dict
+                            # DLC expects certain keys, including "model" for loading state_dict
+                            mock_checkpoint = {
+                                "epoch": 0,
+                                "state_dict": {},  # Empty state dict is fine for mock
+                                "model": {},  # DLC expects this key for model.load_state_dict(snapshot["model"])
+                                "optimizer": None,
+                            }
+                            torch.save(mock_checkpoint, snapshot_pth)
+                            logger.info(f"Created PyTorch snapshot: {snapshot_pth}")
+                            
+                            # Also create files with underscore pattern (some DLC versions use this)
+                            snapshot_pth_alt = model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            if not snapshot_pth_alt.exists():
+                                torch.save(mock_checkpoint, snapshot_pth_alt)
+                                logger.info(f"Created alternate PyTorch snapshot: {snapshot_pth_alt}")
+                        except ImportError:
+                            # If torch is not available, create empty .pth files as fallback
+                            logger.warning("PyTorch not available, creating empty .pth files")
+                            snapshot_pth = model_train_folder / f"snapshot-{snapshot_num}.pth"
+                            snapshot_pth.write_bytes(b"")  # Create empty file
+                            snapshot_pth_alt = model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            snapshot_pth_alt.write_bytes(b"")
+                        except Exception as e:
+                            logger.error(f"Error creating PyTorch snapshots: {e}")
+                            # Fallback: create empty files
+                            snapshot_pth = model_train_folder / f"snapshot-{snapshot_num}.pth"
+                            snapshot_pth.write_bytes(b"")
+                            snapshot_pth_alt = model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            snapshot_pth_alt.write_bytes(b"")
+                        
+                        # CRITICAL: Ensure .pth files exist - DLC's get_model_snapshots looks for these
+                        # Create them even if torch.save failed
+                        snapshot_pth = model_train_folder / f"snapshot-{snapshot_num}.pth"
+                        if not snapshot_pth.exists():
+                            logger.warning(f"snapshot-{snapshot_num}.pth not found, creating empty file")
+                            snapshot_pth.write_bytes(b"PK\x03\x04")  # Minimal zip header (PyTorch uses zip format)
+                        
+                        snapshot_pth_alt = model_train_folder / f"snapshot_{snapshot_num}.pth"
+                        if not snapshot_pth_alt.exists():
+                            snapshot_pth_alt.write_bytes(b"PK\x03\x04")
+                        
+                        # Verify files were created
+                        created_files = list(model_train_folder.glob("snapshot*"))
+                        logger.info(f"All snapshot files in directory: {[f.name for f in created_files]}")
+                        
+                        # Double-check .pth files exist (DLC requires these for PyTorch)
+                        pth_files = list(model_train_folder.glob("*.pth"))
+                        logger.info(f".pth files found: {[f.name for f in pth_files]}")
+                        if not pth_files:
+                            raise FileNotFoundError(
+                                f"No .pth files found in {model_train_folder} after creation attempt. "
+                                f"Directory contents: {[f.name for f in model_train_folder.iterdir()]}"
+                            )
+                        
+                        # Create mock pytorch_config.yaml file for inference
+                        pytorch_config_path = model_train_folder / "pytorch_config.yaml"
+                        create_mock_pytorch_config(pytorch_config_path, project_path, dlc_config)
+                        logger.info(f"Created mock pytorch_config.yaml: {pytorch_config_path}")
+                    
+                    # Update snapshotindex in config (same as original make() does)
+                    # Since we have one snapshot, the index is 0
+                    dlc_config["snapshotindex"] = 0
+                    try:
+                        from deeplabcut.utils.auxiliaryfunctions import edit_config
+                    except ImportError:
+                        # If edit_config doesn't exist, we'll just update the config dict
+                        pass
+                    else:
+                        config_file_path = project_path / "config.yaml"
+                        edit_config(str(config_file_path), {"snapshotindex": 0})
+                    
+                    # Insert the record (same as original make() does at the end)
+                    self.insert1(
+                        {**key, "latest_snapshot": snapshot_num, "config_template": dlc_config}
+                    )
+                
+                # Temporarily replace make() method
+                pipeline.train.ModelTraining.make = mocked_make
+                
+                try:
+                    pipeline.train.ModelTraining.populate()
+                    status.sub("Model training completed (mocked)!", icon="✅", indent=3)
+                finally:
+                    # Restore original make() method
+                    pipeline.train.ModelTraining.make = original_make
+                        
+            except KeyboardInterrupt:
+                status.sub("Training interrupted by user", icon="⚠️", indent=3)
+                status.sub("Resume later with: pipeline.train.ModelTraining.populate()", icon="ℹ️", indent=5)
+                sys.exit(0)
+            except Exception as e:
+                status.sub(f"Error during training: {e}", icon="❌", indent=3)
+                raise
+            
+            # 8. Insert trained model into Model table
+            status.step("Inserting trained model into Model table")
+            
+            training_result = (pipeline.train.ModelTraining & training_task_key).fetch1()
+            latest_snapshot = training_result["latest_snapshot"]
+            status.sub(f"Using snapshot: {latest_snapshot}", icon="ℹ️", indent=3)
+            
+            # ------------------------------------------------------------------
+            # DLC 3.x workaround for MOCKED TRAINING:
+            # element_deeplabcut.model.insert_new_model calls get_scorer_name,
+            # which tries to find real snapshot files on disk.
+            # Since we only created fake snapshots (no real training), we patch
+            # get_scorer_name to avoid the filesystem check.
+            # ------------------------------------------------------------------
+            def _mock_get_scorer_name(*args, **kwargs):
+                # Return any valid-looking scorer string; DLC only uses this as a prefix.
+                return "mock_scorer"
+            
+            # Task field should already be truncated (done early in the workflow)
+            # Just verify it's still within limits before model insertion
+            import yaml
+            with open(config_file, 'r') as f:
+                dlc_config_for_insert = yaml.safe_load(f)
+            
+            if "Task" in dlc_config_for_insert and len(dlc_config_for_insert["Task"]) > 32:
+                # This shouldn't happen if truncation was done early, but handle it just in case
+                status.sub(f"WARNING: Task field still too long ({len(dlc_config_for_insert['Task'])} chars), truncating now", icon="⚠️", indent=3)
+                dlc_config_for_insert["Task"] = dlc_config_for_insert["Task"][:32]
+                with open(config_file, 'w') as f:
+                    yaml.dump(dlc_config_for_insert, f, default_flow_style=False)
+            
+            # Patch get_scorer_name at the module where it's imported
+            with patch('deeplabcut.pose_estimation_pytorch.apis.utils.get_scorer_name', side_effect=_mock_get_scorer_name):
+                model.Model.insert_new_model(
+                    model_name=model_name,
+                    dlc_config=str(config_file_rel),
+                    shuffle=shuffle,
+                    trainingsetindex=trainingsetindex,
+                    model_description=f"Test trained model from {dlc_project_path.name}",
+                    prompt=False,
+                )
+            status.sub(f"Inserted model: {model_name}", icon="✅", indent=3)
+    else:
+        status.step("Skipping training (using existing model)")
+        if not (model.Model & {"model_name": model_name}):
+            status.sub(f"Model '{model_name}' not found", icon="❌", indent=3)
+            status.sub("Available models:", indent=3)
+            for m in model.Model.fetch("model_name"):
+                status.sub(f"  - {m}", indent=5)
+            sys.exit(1)
+        status.sub(f"Using existing model: {model_name}", icon="✅", indent=3)
+    
+    # 9. Create pose estimation tasks (if videos exist)
+    if recording_keys and not args.skip_inference:
+        status.step("Creating pose estimation tasks")
+        for rec_key in recording_keys:
+            task_key = {**rec_key, "model_name": model_name}
+            output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
+                task_key, relative=False, mkdir=False
+            )
+            
+            results_exist = False
+            output_path = Path(output_dir)
+            if output_path.exists():
+                h5_files = list(output_path.glob("*.h5"))
+                pickle_files = list(output_path.glob("*.pickle"))
+                if h5_files or pickle_files:
+                    results_exist = True
+                    status.sub(
+                        f"Results found for recording {rec_key['recording_id']}",
+                        icon="✅",
+                        indent=5,
+                    )
+            
+            task_mode = "load" if results_exist else None
+            
+            pipeline.model.PoseEstimationTask.generate(
+                rec_key,
+                model_name=model_name,
+                task_mode=task_mode,
+                analyze_videos_params={
+                    "videotype": ".mp4",
+                    "gputouse": 0,
+                    "save_as_csv": True,
+                },
+            )
+            status.sub(f"Task created for recording {rec_key['recording_id']}", icon="✅", indent=5)
+    
+    # 10. Run inference (if not skipped)
+    if recording_keys and not args.skip_inference:
+        status.step("Running inference or loading existing results")
+        
+        if training_was_mocked:
+            status.sub("Using mock trained model files for inference", icon="ℹ️", indent=3)
+            status.sub("Note: Results will be based on mock model weights", icon="⚠️", indent=5)
+        
+        all_in_load_mode = True
+        for rec_key in recording_keys:
+            task_key = {**rec_key, "model_name": model_name}
+            try:
+                task_mode = (pipeline.model.PoseEstimationTask & task_key).fetch1("task_mode")
+                if task_mode != "load":
+                    all_in_load_mode = False
+            except:
+                all_in_load_mode = False
+        
+        if all_in_load_mode:
+            status.sub("All tasks in 'load' mode - using existing results", icon="ℹ️", indent=3)
+        else:
+            status.sub("Running inference (this may take a while)", icon="⚠️", indent=3)
+            status.sub("GPU is recommended for speed", icon="ℹ️", indent=5)
+        
+        # Patch DLC's get_model_snapshots during inference so it always
+        # "finds" at least one snapshot and (if needed) creates dummy files.
+        def _mock_get_model_snapshots(*args, **kwargs):
+            """
+            Mock replacement for deeplabcut.pose_estimation_pytorch.apis.utils.get_model_snapshots
+
+            - Accepts any arguments (flexible signature)
+            - Extracts train_dir from args or kwargs
+            - Ensures the `train_dir` exists
+            - Creates dummy snapshot-1000.* files if missing
+            - Returns a list with exactly one snapshot base path
+            """
+            from pathlib import Path
+            
+            # Extract train_dir from args or kwargs
+            # DLC typically calls: get_model_snapshots(snapshot_index, train_dir, pose_task=None)
+            train_dir = None
+            if args and len(args) >= 2:
+                train_dir = args[1]  # Second positional arg is usually train_dir
+            elif "train_dir" in kwargs:
+                train_dir = kwargs["train_dir"]
+            elif args and len(args) >= 1:
+                # Sometimes train_dir might be first arg
+                train_dir = args[0]
+            
+            if train_dir is None:
+                # Fallback: try to find it from kwargs with different names
+                for key in ["train_dir", "train_path", "model_dir", "snapshot_dir"]:
+                    if key in kwargs:
+                        train_dir = kwargs[key]
+                        break
+            
+            if train_dir is None:
+                raise ValueError(
+                    f"Could not determine train_dir from args={args}, kwargs={kwargs}. "
+                    "Mock get_model_snapshots needs train_dir to create snapshot files."
+                )
+            
+            train_dir = Path(train_dir)
+            train_dir.mkdir(parents=True, exist_ok=True)
+            
+            logger.info(f"[MOCK get_model_snapshots] train_dir={train_dir}, args={args}, kwargs={kwargs}")
+
+            base_name = "snapshot-1000"
+            # Create minimal dummy files DLC expects
+            for ext in [".index", ".meta", ".data-00000-of-00001"]:
+                f = train_dir / f"{base_name}{ext}"
+                if not f.exists():
+                    f.touch()
+                    logger.info(f"[MOCK get_model_snapshots] Created: {f}")
+            
+            # For PyTorch, create a minimal valid .pth checkpoint file
+            snapshot_pth = train_dir / f"{base_name}.pth"
+            if not snapshot_pth.exists():
+                try:
+                    import torch
+                    # Create a minimal PyTorch checkpoint dict
+                    # DLC expects "model" key for loading state_dict
+                    mock_checkpoint = {
+                        "epoch": 0,
+                        "state_dict": {},  # Empty state dict is fine for mock
+                        "model": {},  # DLC expects this key for model.load_state_dict(snapshot["model"])
+                        "optimizer": None,
+                    }
+                    torch.save(mock_checkpoint, snapshot_pth)
+                    logger.info(f"Created PyTorch snapshot: {snapshot_pth}")
+                except ImportError:
+                    logger.warning("PyTorch not available, creating minimal .pth file")
+                    # Fallback: create empty file with minimal zip header
+                    snapshot_pth.write_bytes(b"PK\x03\x04")
+                except Exception as e:
+                    logger.warning(f"Could not create PyTorch snapshot with torch.save: {e}")
+                    # Fallback: create empty file with minimal zip header
+                    snapshot_pth.write_bytes(b"PK\x03\x04")
+
+            # DLC's original function returns a list of snapshot objects with a .path attribute
+            # Create a simple object that mimics DLC's snapshot structure
+            class MockSnapshot:
+                def __init__(self, path):
+                    # Store as Path object, but ensure it can be used as string when needed
+                    self.path = Path(path) if not isinstance(path, Path) else path
+                    # Also store as string for compatibility
+                    self.path_str = str(self.path)
+                
+                def __fspath__(self):
+                    """Implement os.PathLike protocol so Path(MockSnapshot) works."""
+                    return str(self.path)
+                
+                def __str__(self):
+                    """String representation returns the path."""
+                    return str(self.path)
+                
+                def __repr__(self):
+                    """Representation for debugging."""
+                    return f"MockSnapshot({self.path!r})"
+            
+            # DLC's torch.load expects the file to exist at the exact path
+            # The error shows DLC is looking for 'snapshot-1000' (no extension)
+            # So we need to ensure the file exists at that exact path
+            snapshot_path_pth = train_dir / f"{base_name}.pth"
+            snapshot_path_no_ext = train_dir / base_name
+            
+            # Ensure the .pth file exists (it should have been created above)
+            if not snapshot_path_pth.exists():
+                logger.warning(f"snapshot-1000.pth not found at {snapshot_path_pth}, creating it now")
+                try:
+                    import torch
+                    # DLC expects "model" key for loading state_dict
+                    mock_checkpoint = {
+                        "epoch": 0,
+                        "state_dict": {},
+                        "model": {},  # DLC expects this key for model.load_state_dict(snapshot["model"])
+                        "optimizer": None,
+                    }
+                    torch.save(mock_checkpoint, snapshot_path_pth)
+                except Exception as e:
+                    logger.warning(f"Could not create {snapshot_path_pth}: {e}")
+                    # Create minimal file as fallback
+                    snapshot_path_pth.write_bytes(b"PK\x03\x04")
+            
+            # CRITICAL: DLC's torch.load is looking for 'snapshot-1000' (no extension)
+            # Create a symlink or copy so the file exists at both paths
+            if not snapshot_path_no_ext.exists():
+                try:
+                    # Try creating a symlink first (more efficient)
+                    snapshot_path_no_ext.symlink_to(snapshot_path_pth)
+                    logger.info(f"Created symlink: {snapshot_path_no_ext} -> {snapshot_path_pth}")
+                except (OSError, NotImplementedError):
+                    # If symlinks don't work (e.g., on Windows), copy the file
+                    import shutil
+                    shutil.copy2(snapshot_path_pth, snapshot_path_no_ext)
+                    logger.info(f"Copied file: {snapshot_path_pth} -> {snapshot_path_no_ext}")
+            
+            # Return the path WITHOUT extension (as DLC expects it)
+            # DLC will use this path directly in torch.load()
+            return [MockSnapshot(snapshot_path_no_ext)]
+
+        # Patch load_state_dict to use strict=False for mock checkpoints
+        # This allows loading empty state dicts without errors (smoke test)
+        # Also patch dlc_reader validation to be lenient for smoke tests
+        try:
+            import torch.nn as nn
+            original_load_state_dict = nn.Module.load_state_dict
+            
+            def mock_load_state_dict(self, state_dict, strict=True, *args, **kwargs):
+                """Mock load_state_dict that always uses strict=False for smoke test."""
+                # Always use strict=False to allow loading empty/mock state dicts
+                return original_load_state_dict(self, state_dict, strict=False, *args, **kwargs)
+            
+            # Patch dlc_reader validation to be lenient for smoke tests
+            # The assertion in dlc_reader.PoseEstimation.pkl checks metadata consistency
+            # We'll wrap the property to catch AssertionError and return minimal data
+            from element_deeplabcut.readers import dlc_reader
+            
+            # Get the underlying function from the property before we replace it
+            original_pkl_property = dlc_reader.PoseEstimation.pkl
+            original_pkl_fget = original_pkl_property.fget
+            
+            def lenient_pkl_wrapper(self):
+                """Wrapper that catches AssertionError from metadata validation."""
+                try:
+                    # Call the original property's getter function directly
+                    return original_pkl_fget(self)
+                except AssertionError as e:
+                    if "Inconsistent DLC-model-config file used" in str(e):
+                        logger.warning(
+                            f"Smoke test: Metadata validation failed (expected for mock models): {e}. "
+                            "Returning minimal pkl structure."
+                        )
+                        # Return minimal structure that won't break downstream code
+                        # Scorer must:
+                        # 1. End with a number (e.g., "_1000") because code does: int(self.pkl["Scorer"].split("_")[-1])
+                        # 2. Contain "shuffle" followed by a number (e.g., "shuffle1") because code does:
+                        #    re.search(r"shuffle(\d+)", self.pkl["Scorer"]).groups()[0]
+                        return {
+                            "nframes": 0,
+                            "Scorer": "DLC_mock_scorer_shuffle1_1000",  # Contains shuffle1 and ends with number
+                            "Task": "mock_task",
+                            "date": "2024-01-01",
+                            "iteration (active-learning)": 0,
+                            "training set fraction": 0.95,
+                        }
+                    else:
+                        raise
+            
+            # Replace the property with our wrapper
+            dlc_reader.PoseEstimation.pkl = property(lenient_pkl_wrapper)
+            
+            # Patch both get_model_snapshots and load_state_dict
+            try:
+                with patch(
+                    "deeplabcut.pose_estimation_pytorch.apis.utils.get_model_snapshots",
+                    side_effect=_mock_get_model_snapshots,
+                ), patch.object(
+                    nn.Module,
+                    "load_state_dict",
+                    mock_load_state_dict,
+                ):
+                    pipeline.model.PoseEstimation.populate()
+                    status.sub("Inference completed!", icon="✅", indent=3)
+            finally:
+                # Restore original pkl property
+                dlc_reader.PoseEstimation.pkl = original_pkl_property
+        except Exception as e:
+            status.sub(f"Error during inference: {e}", icon="❌", indent=3)
+            raise
+        
+        # 11. Show results
+        status.step("Results")
+        for rec_key in recording_keys:
+            status.sub(f"Recording {rec_key['recording_id']}:", icon="📹", indent=2)
+            try:
+                pose_estimation = (
+                    pipeline.model.PoseEstimation
+                    & rec_key
+                    & {"model_name": model_name}
+                ).fetch1()
+                
+                status.sub(f"Completed at: {pose_estimation['pose_estimation_time']}", icon="✅", indent=4)
+                
+                body_parts = (
+                    pipeline.model.PoseEstimation.BodyPartPosition
+                    & rec_key
+                    & {"model_name": model_name}
+                ).fetch("body_part")
+                
+                unique_bp = sorted(set(body_parts))
+                status.sub(
+                    f"Detected body parts ({len(unique_bp)}): {unique_bp}",
+                    icon="📊",
+                    indent=4,
+                )
+                
+                if unique_bp:
+                    bp = unique_bp[0]
+                    bp_data = (
+                        pipeline.model.PoseEstimation.BodyPartPosition
+                        & rec_key
+                        & {"model_name": model_name, "body_part": bp}
+                    ).fetch1()
+                    
+                    x_pos = bp_data["x_pos"]
+                    y_pos = bp_data["y_pos"]
+                    likelihood = bp_data["likelihood"]
+                    
+                    status.sub(
+                        f"Example ({bp}): {len(x_pos)} frames, avg likelihood: {likelihood.mean():.3f}",
+                        icon="📈",
+                        indent=4,
+                    )
+            except Exception as e:
+                status.sub(f"No results yet or error: {e}", icon="⚠️", indent=4)
+    
+    status.header("Test completed!")
+    status.sub("Next steps:", indent=2)
+    if not args.skip_training:
+        status.sub("- Check training results in DLC project directory", indent=4)
+    if not args.skip_inference:
+        status.sub("- Check output directory for DLC inference results", indent=4)
+        status.sub("- Visualize results using DLC's plotting functions", indent=4)
+        status.sub("- Query PoseEstimation.BodyPartPosition for analysis", indent=4)
+
+if __name__ == "__main__":
+    main()
diff --git a/test_video_inference.py b/test_video_inference.py
new file mode 100755
index 0000000..fa2cb55
--- /dev/null
+++ b/test_video_inference.py
@@ -0,0 +1,848 @@
+#!/usr/bin/env python
+"""Simple script to test pretrained inference with a video file.
+
+Usage:
+    1. Configure database (see below)
+    2. Put your video file(s) in ./test_videos/ directory
+       - In Docker: videos should be in ./data/ directory (mounted to /app/data)
+    3. Run: python test_video_inference.py [model_name]
+       - In Docker: make test-pretrained
+
+    Available models:
+        - superanimal_quadruped (default): For quadruped animals (mice, rats, etc.)
+        - superanimal_topviewmouse: For top-view mouse pose estimation
+
+    Examples:
+        python test_video_inference.py
+        python test_video_inference.py superanimal_quadruped
+        python test_video_inference.py superanimal_topviewmouse
+
+Or set DLC_ROOT_DATA_DIR environment variable to point to your video directory.
+
+Database Configuration:
+    The script will look for database configuration in this order:
+    1. dj_local_conf.json file in the project root
+    2. Environment variables: DJ_HOST, DJ_USER, DJ_PASS
+    3. Default DataJoint configuration
+    
+    Example dj_local_conf.json:
+    {
+        "database.host": "localhost",
+        "database.user": "root",
+        "database.password": "your_password",
+        "database.port": 3306,
+        "custom": {
+            "database.prefix": "test_"
+        }
+    }
+"""
+import os
+import sys
+import importlib.util
+import logging
+import argparse
+from pathlib import Path
+
+import datajoint as dj
+
+# Set up logging
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(message)s',
+    handlers=[logging.StreamHandler(sys.stdout)]
+)
+logger = logging.getLogger(__name__)
+
+# Simple status printer for user-facing messages
+class StatusPrinter:
+    """Simple status printer for step-by-step progress."""
+    def __init__(self, total_steps=7):
+        self.total_steps = total_steps
+        self.current_step = 0
+    
+    def step(self, message, status="info"):
+        """Print a step message with status indicator."""
+        self.current_step += 1
+        icons = {
+            "info": "ℹ️",
+            "success": "✅",
+            "warning": "⚠️",
+            "error": "❌",
+            "skip": "⏭️"
+        }
+        icon = icons.get(status, "•")
+        print(f"\n[{self.current_step}/{self.total_steps}] {icon} {message}")
+    
+    def sub(self, message, indent=3, icon=""):
+        """Print a sub-message with indentation."""
+        prefix = f"{icon} " if icon else ""
+        print(" " * indent + prefix + message)
+    
+    def header(self, title):
+        """Print a section header."""
+        print("\n" + "=" * 60)
+        print(title)
+        print("=" * 60)
+
+# Configure database connection
+if Path("./dj_local_conf.json").exists():
+    dj.config.load("./dj_local_conf.json")
+    logger.info("✅ Loaded database configuration from dj_local_conf.json")
+else:
+    logger.info("⚠️  No dj_local_conf.json found, using environment variables or defaults")
+    logger.info("   Set DJ_HOST, DJ_USER, DJ_PASS environment variables if needed")
+
+# Update config from environment variables
+dj.config.update({
+    "safemode": False,
+    "database.host": os.environ.get("DJ_HOST") or dj.config.get("database.host", "localhost"),
+    "database.user": os.environ.get("DJ_USER") or dj.config.get("database.user", "root"),
+    "database.password": os.environ.get("DJ_PASS") or dj.config.get("database.password", ""),
+})
+
+# Set database prefix for tests
+if "custom" not in dj.config:
+    dj.config["custom"] = {}
+dj.config["custom"]["database.prefix"] = os.environ.get("DATABASE_PREFIX", dj.config["custom"].get("database.prefix", "test_"))
+
+# Set DLC root data directory if not already set
+# In Docker, prefer /app/test_videos (from project mount), otherwise /app/data
+# Check for Docker: /.dockerenv exists OR we're in /app directory (Docker working dir)
+is_docker = os.path.exists("/.dockerenv") or (os.getcwd() == "/app" and os.path.exists("/app"))
+if is_docker:
+    # Prefer /app/test_videos (from project mount .:/app) since videos are in ./test_videos
+    test_videos_path = Path("/app/test_videos")
+    if test_videos_path.exists():
+        default_video_dir = "/app/test_videos"
+    else:
+        default_video_dir = "/app/data"
+else:
+    default_video_dir = "./test_videos"
+video_dir = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir))
+if "dlc_root_data_dir" not in dj.config.get("custom", {}) or not dj.config["custom"].get("dlc_root_data_dir"):
+    dj.config["custom"]["dlc_root_data_dir"] = str(video_dir.absolute())
+    logger.info(f"📁 Set DLC_ROOT_DATA_DIR to: {video_dir.absolute()}")
+    if is_docker:
+        logger.info("🐳 Running in Docker mode")
+
+# Get the root directory for making relative paths (ensure it's absolute)
+dlc_root_dir = Path(dj.config["custom"].get("dlc_root_data_dir", str(video_dir.absolute())))
+if not dlc_root_dir.is_absolute():
+    dlc_root_dir = dlc_root_dir.resolve()
+
+logger.info(f"📊 Database: {dj.config['database.host']} (prefix: {dj.config['custom']['database.prefix']})")
+logger.info(f"📁 DLC Root: {dlc_root_dir}")
+
+from element_deeplabcut import model
+from tests import tutorial_pipeline as pipeline
+
+def check_database_connection():
+    """Verify database connection is working."""
+    try:
+        # Try to connect by activating a schema
+        test_schema = dj.schema("test_connection_check", create_schema=True, create_tables=False)
+        test_schema.drop()
+        return True
+    except Exception as e:
+        logger.error(f"\n❌ Database connection failed: {e}")
+        logger.error("\nPlease configure your database:")
+        logger.error("  1. Create dj_local_conf.json with database credentials")
+        logger.error("  2. Or set environment variables: DJ_HOST, DJ_USER, DJ_PASS")
+        logger.error("  3. Or ensure database is running (docker compose -f docker-compose-db.yaml up -d)")
+        return False
+
+def main():
+    status = StatusPrinter(total_steps=8)
+    status.header("Testing Pretrained Model Inference with Video")
+    
+    # 0. Check database connection
+    status.step("Checking database connection")
+    if not check_database_connection():
+        return  # Exit gracefully
+    status.sub("Database connection successful", indent=3)
+    
+    # 0.5. Clean up database (remove test data from previous runs)
+    status.step("Cleaning up database (removing test data from previous runs)")
+    cleanup_count = 0
+    
+    # Delete PoseEstimation entries (and their parts)
+    pose_estimation_query = pipeline.model.PoseEstimation
+    if pose_estimation_query:
+        keys = pose_estimation_query.fetch("KEY")
+        count = len(keys) if keys else 0
+        if count > 0:
+            pose_estimation_query.delete()
+            cleanup_count += count
+            status.sub(f"Deleted {count} PoseEstimation entry/entries", icon="🗑️", indent=3)
+    
+    # Delete PoseEstimationTask entries
+    task_query = pipeline.model.PoseEstimationTask
+    if task_query:
+        keys = task_query.fetch("KEY")
+        count = len(keys) if keys else 0
+        if count > 0:
+            task_query.delete()
+            cleanup_count += count
+            status.sub(f"Deleted {count} PoseEstimationTask entry/entries", icon="🗑️", indent=3)
+    
+    # Delete test models (models with names starting with "test_")
+    test_models = model.Model & "model_name LIKE 'test_%'"
+    if test_models:
+        keys = test_models.fetch("KEY")
+        count = len(keys) if keys else 0
+        if count > 0:
+            test_models.delete()
+            cleanup_count += count
+            status.sub(f"Deleted {count} test model(s)", icon="🗑️", indent=3)
+    
+    # Delete test recordings (optional - comment out if you want to keep recordings)
+    # Uncomment if you want to clean recordings too:
+    # if pipeline.model.VideoRecording & {"subject": "test1"}:
+    #     count = len(pipeline.model.VideoRecording & {"subject": "test1"})
+    #     (pipeline.model.VideoRecording & {"subject": "test1"}).delete()
+    #     cleanup_count += count
+    #     if count > 0:
+    #         status.sub(f"Deleted {count} test recording(s)", icon="🗑️", indent=3)
+    
+    if cleanup_count > 0:
+        status.sub(f"Total: {cleanup_count} entry/entries cleaned", icon="✅", indent=3)
+    else:
+        status.sub("No test data found to clean", icon="ℹ️", indent=3)
+    
+    # 1. Find video files
+    status.step("Finding video files")
+    # Use same Docker detection logic as at the top
+    is_docker = os.path.exists("/.dockerenv") or (os.getcwd() == "/app" and os.path.exists("/app"))
+    
+    # In Docker, prefer /app/test_videos (from project mount .:/app) since videos are in ./test_videos
+    if is_docker:
+        # Check /app/test_videos first (from project mount)
+        test_videos_path = Path("/app/test_videos")
+        if test_videos_path.exists():
+            default_video_dir = "/app/test_videos"
+        else:
+            default_video_dir = "/app/data"
+    else:
+        default_video_dir = "./test_videos"
+    
+    video_dir = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir))
+    
+    if not video_dir.exists():
+        status.sub(f"Video directory not found: {video_dir}", indent=3)
+        if is_docker:
+            status.sub("In Docker: Videos should be in ./test_videos/ on host", indent=3)
+            status.sub("(available at /app/test_videos via project mount)", indent=5)
+        return  # Exit gracefully
+    
+    video_files = list(video_dir.glob("*.mp4")) + list(video_dir.glob("*.avi")) + list(video_dir.glob("*.mov"))
+    if not video_files:
+        status.sub(f"No video files found in {video_dir}", indent=3)
+        status.sub("Supported formats: .mp4, .avi, .mov", indent=3)
+        if is_docker:
+            status.sub("In Docker: Videos should be in ./test_videos/ on host", indent=3)
+            status.sub("(available at /app/test_videos in container)", indent=5)
+        return  # Exit gracefully
+    
+    status.sub(f"Found {len(video_files)} video file(s):", indent=3)
+    for vf in video_files:
+        status.sub(f"- {vf.name}", indent=5)
+    
+    # 2. Register pretrained model
+    # Get model name from command line or use default
+    pretrained_model_name = getattr(main, 'pretrained_model_name', 'superanimal_quadruped')
+    
+    status.step(f"Registering pretrained model: {pretrained_model_name}")
+    model.PretrainedModel.populate_common_models([pretrained_model_name])
+    status.sub(f"Registered: {pretrained_model_name}", icon="✅")
+    
+    # 3. Insert pretrained model instance
+    status.step("Inserting pretrained model instance")
+    # Use a model name that includes the pretrained model name for clarity
+    model_name = f"test_video_inference_{pretrained_model_name.replace('superanimal_', '')}"
+    
+    # Check if model already exists and verify it's a pretrained model
+    if model.Model & {"model_name": model_name}:
+        existing_model = (model.Model & {"model_name": model_name}).fetch1()
+        config_template = existing_model.get("config_template", {})
+        is_pretrained = config_template.get("_pretrained_model_name") is not None
+        
+        if is_pretrained:
+            existing_pretrained_name = config_template.get("_pretrained_model_name")
+            if existing_pretrained_name == pretrained_model_name:
+                status.sub(f"Model '{model_name}' already exists (pretrained: {pretrained_model_name}), skipping insertion", icon="✅")
+            else:
+                status.sub(f"Model '{model_name}' exists but uses different pretrained model: {existing_pretrained_name}", icon="⚠️")
+                status.sub(f"Expected: {pretrained_model_name}", indent=5)
+                status.sub("Deleting existing model and tasks, creating new one...", indent=5)
+                # Delete any existing tasks that reference this model
+                if pipeline.model.PoseEstimationTask & {"model_name": model_name}:
+                    (pipeline.model.PoseEstimationTask & {"model_name": model_name}).delete()
+                    status.sub("Deleted existing PoseEstimationTask entries", icon="✅", indent=7)
+                # Delete the model
+                (model.Model & {"model_name": model_name}).delete()
+                # Insert the correct pretrained model
+                model.Model.insert_pretrained_model(
+                    model_name=model_name,
+                    pretrained_model_name=pretrained_model_name,
+                    model_description=f"Test model using {pretrained_model_name}",
+                    prompt=False,
+                )
+                status.sub(f"Re-inserted model: {model_name}", icon="✅")
+        else:
+            status.sub(f"Model '{model_name}' exists but is a TRAINED model, not pretrained", icon="⚠️")
+            status.sub("This script requires a PRETRAINED model. Deleting existing model and tasks...", indent=5)
+            # Delete any existing tasks that reference this model
+            if pipeline.model.PoseEstimationTask & {"model_name": model_name}:
+                (pipeline.model.PoseEstimationTask & {"model_name": model_name}).delete()
+                status.sub("Deleted existing PoseEstimationTask entries", icon="✅", indent=7)
+            # Delete the model
+            (model.Model & {"model_name": model_name}).delete()
+            # Insert the correct pretrained model
+            model.Model.insert_pretrained_model(
+                model_name=model_name,
+                pretrained_model_name=pretrained_model_name,
+                model_description=f"Test model using {pretrained_model_name}",
+                prompt=False,
+            )
+            status.sub(f"Inserted pretrained model: {model_name}", icon="✅")
+    else:
+        try:
+            model.Model.insert_pretrained_model(
+                model_name=model_name,
+                pretrained_model_name=pretrained_model_name,
+                model_description=f"Test model using {pretrained_model_name}",
+                prompt=False,
+            )
+            status.sub(f"Inserted model: {model_name}", icon="✅")
+        except dj.errors.DuplicateError as e:
+            # If duplicate error occurs (e.g., same unique index), skip insertion
+            status.sub(f"Model with similar configuration already exists, skipping insertion", icon="⚠️")
+            status.sub(f"Error: {str(e)[:100]}...", indent=5)
+    
+    # 4. Setup test data (subject, session, recordings)
+    status.step("Setting up test data")
+    # Use shorter subject name (element-animal Subject table has limited varchar length)
+    base_key = {
+        "subject": "test1",
+        "session_datetime": "2024-01-01 12:00:00",
+    }
+    
+    pipeline.subject.Subject.insert1({
+        "subject": "test1",  # Short name to fit database column
+        "sex": "F",
+        "subject_birth_date": "2020-01-01",
+        "subject_description": "Test subject for video inference",
+    }, skip_duplicates=True)
+    
+    pipeline.session.Session.insert1({
+        "subject": "test1",
+        "session_datetime": "2024-01-01 12:00:00",
+    }, skip_duplicates=True)
+    
+    # Create a separate recording for each video file
+    recording_keys = []
+    for idx, video_file in enumerate(video_files):
+        recording_key = {
+            **base_key,
+            "recording_id": idx + 1,  # Start from 1
+        }
+        recording_keys.append(recording_key)
+        
+        # Insert recording
+        pipeline.model.VideoRecording.insert1(
+            {**recording_key, "device": "Camera1"}, skip_duplicates=True
+        )
+        
+        # Insert single video file for this recording
+        # Store file path relative to root directory
+        video_file_abs = Path(video_file).resolve()
+        dlc_root_dir_abs = Path(dj.config["custom"].get("dlc_root_data_dir", str(video_dir.absolute()))).resolve()
+        
+        try:
+            relative_path = video_file_abs.relative_to(dlc_root_dir_abs)
+        except ValueError:
+            # If video_file is not under dlc_root_dir, use just the filename
+            # This handles the case where videos are in the root directory itself
+            relative_path = Path(video_file.name)
+        
+        pipeline.model.VideoRecording.File.insert1(
+            {**recording_key, "file_id": 0, "file_path": str(relative_path)},
+            skip_duplicates=True,
+        )
+        status.sub(f"Created recording {recording_key['recording_id']} for {video_file.name}", icon="✅", indent=5)
+    
+    status.sub(f"Created {len(recording_keys)} separate recording(s)", icon="✅", indent=3)
+    
+    # 5. Extract video metadata
+    status.step("Extracting video metadata")
+    try:
+        pipeline.model.RecordingInfo.populate()
+        # Show info for all recordings
+        for rec_key in recording_keys:
+            rec_info = (pipeline.model.RecordingInfo & rec_key).fetch1()
+            status.sub(
+                f"Recording {rec_key['recording_id']}: {rec_info['px_width']}x{rec_info['px_height']}, "
+                f"{rec_info['nframes']} frames, {rec_info['fps']:.1f} fps",
+                icon="✅",
+                indent=5
+            )
+    except ModuleNotFoundError as e:
+        if "cv2" in str(e):
+            status.sub(f"Error: {e}", icon="❌", indent=3)
+            status.sub("OpenCV (cv2) is required for video metadata extraction.", indent=3)
+            status.sub("Install it with: pip install opencv-python", indent=5)
+            status.sub("Or: conda install -c conda-forge opencv", indent=5)
+            return  # Exit gracefully
+        raise
+    
+    # 6. Clean up any tasks that might be using wrong models (from other test scripts)
+    status.step("Cleaning up any conflicting tasks")
+    for rec_key in recording_keys:
+        # Find all tasks for this recording, regardless of model_name
+        all_tasks = (pipeline.model.PoseEstimationTask & rec_key).fetch("model_name")
+        for task_model_name in set(all_tasks):
+            if task_model_name != model_name:
+                status.sub(f"Found task with different model '{task_model_name}' for recording {rec_key['recording_id']}", icon="⚠️", indent=3)
+                status.sub(f"Deleting task (expected model: '{model_name}')...", indent=5)
+                (pipeline.model.PoseEstimationTask & {**rec_key, "model_name": task_model_name}).delete()
+                status.sub("Task deleted", icon="✅", indent=7)
+    
+    # 6. Create pose estimation tasks for each recording
+    status.step("Creating pose estimation tasks")
+    for rec_key in recording_keys:
+        # Check if results already exist
+        task_key = {**rec_key, "model_name": model_name}
+        output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
+            task_key, relative=False, mkdir=False
+        )
+        
+        # Check if results exist - look for H5 files directly
+        results_exist = False
+        output_path = Path(output_dir)
+        if output_path.exists():
+            # Check for result files (H5, pickle, or JSON)
+            h5_files = list(output_path.glob("*.h5"))
+            pickle_files = list(output_path.glob("*.pickle"))
+            json_files = list(output_path.glob("*.json"))
+            
+            if h5_files or pickle_files or json_files:
+                results_exist = True
+                status.sub(
+                    f"Results found for recording {rec_key['recording_id']} in: {output_dir.name} "
+                    f"({len(h5_files)} H5, {len(pickle_files)} pickle, {len(json_files)} JSON)",
+                    icon="✅",
+                    indent=5
+                )
+            else:
+                status.sub(f"No result files found for recording {rec_key['recording_id']} in: {output_dir.name}", icon="⚠️", indent=5)
+        else:
+            status.sub(f"Output directory doesn't exist for recording {rec_key['recording_id']}: {output_dir.name}", icon="⚠️", indent=5)
+        
+        # Generate task - it will auto-detect and set task_mode appropriately
+        # Always use "load" mode if results exist - never re-run inference
+        # This prevents expensive re-computation when results already exist
+        if results_exist:
+            task_mode = "load"  # Use existing results - do NOT trigger inference
+            status.sub(f"Results exist for recording {rec_key['recording_id']} - setting task_mode='load'", icon="✅", indent=5)
+        else:
+            task_mode = None  # Auto-detect (will be "trigger" if no results)
+            status.sub(f"No results found for recording {rec_key['recording_id']} - will auto-detect task_mode", icon="ℹ️", indent=5)
+        
+        pipeline.model.PoseEstimationTask.generate(
+            rec_key,
+            model_name=model_name,
+            task_mode=task_mode,
+            analyze_videos_params={
+                "video_inference": {
+                    "scale": 0.4,  # Adjust if needed (0.3-0.5 recommended)
+                    "batchsize": 8,  # Adjust based on GPU memory
+                }
+            },
+        )
+        status.sub(f"Task created for recording {rec_key['recording_id']}", icon="✅", indent=5)
+    
+    # 6.5. Update task modes if needed (in case results were created after task creation)
+    status.step("Checking and updating task modes")
+    for rec_key in recording_keys:
+        task_key = {**rec_key, "model_name": model_name}
+        output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
+            task_key, relative=False, mkdir=False
+        )
+        
+        # Check if results exist
+        output_path = Path(output_dir)
+        results_exist = False
+        if output_path.exists():
+            h5_files = list(output_path.glob("*.h5"))
+            pickle_files = list(output_path.glob("*.pickle"))
+            json_files = list(output_path.glob("*.json"))
+            if h5_files or pickle_files or json_files:
+                results_exist = True
+        
+        # Check current task mode
+        try:
+            current_task = (pipeline.model.PoseEstimationTask & task_key).fetch1()
+            current_mode = current_task.get("task_mode", "trigger")
+            
+            # Update to "load" if results exist but task is in "trigger" mode
+            if results_exist and current_mode == "trigger":
+                pipeline.model.PoseEstimationTask.update1(
+                    {**task_key, "task_mode": "load"}
+                )
+                status.sub(f"Updated recording {rec_key['recording_id']} task_mode to 'load' (results exist)", icon="✅", indent=5)
+            elif not results_exist and current_mode == "load":
+                pipeline.model.PoseEstimationTask.update1(
+                    {**task_key, "task_mode": "trigger"}
+                )
+                status.sub(f"Updated recording {rec_key['recording_id']} task_mode to 'trigger' (no results)", icon="⚠️", indent=5)
+            else:
+                status.sub(f"Recording {rec_key['recording_id']} task_mode is '{current_mode}' (correct)", icon="ℹ️", indent=5)
+        except Exception as e:
+            status.sub(f"Could not check/update task for recording {rec_key['recording_id']}: {e}", icon="⚠️", indent=5)
+    
+    # 7. Run inference or load existing results
+    status.step("Running inference or loading existing results")
+    
+    # Check if DeepLabCut is available FIRST (before checking task modes)
+    # This import might print "Loading DLC..." so we do it early
+    deeplabcut_available = False
+    error_msg = None
+    
+    # First check if PyTorch is available (needed for SuperAnimal)
+    try:
+        import torch
+        pytorch_available = True
+        pytorch_version = torch.__version__
+    except ImportError:
+        pytorch_available = False
+        pytorch_version = None
+    
+    try:
+        import deeplabcut
+        deeplabcut_available = True
+        logger.info("DeepLabCut imported successfully")
+        # Verify it's actually usable by checking for a key function
+        if hasattr(deeplabcut, "video_inference_superanimal"):
+            logger.info("DeepLabCut has video_inference_superanimal function")
+        else:
+            logger.warning("DeepLabCut imported but video_inference_superanimal not found")
+    except (ImportError, TypeError, Exception) as e:
+        error_msg = str(e)
+        deeplabcut_available = False
+        logger.warning(f"DeepLabCut import failed: {e}")
+        import traceback
+        logger.debug(f"Traceback: {traceback.format_exc()}")
+    
+    # Double-check task modes and results before proceeding
+    # This ensures we never trigger inference if results exist
+    all_in_load_mode = True
+    any_results_exist = False
+    for rec_key in recording_keys:
+        task_key = {**rec_key, "model_name": model_name}
+        try:
+            task_mode = (pipeline.model.PoseEstimationTask & task_key).fetch1("task_mode")
+            
+            # Check if results actually exist for this task
+            output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
+                task_key, relative=False, mkdir=False
+            )
+            output_path = Path(output_dir)
+            results_exist = False
+            if output_path.exists():
+                h5_files = list(output_path.glob("*.h5"))
+                pickle_files = list(output_path.glob("*.pickle"))
+                json_files = list(output_path.glob("*.json"))
+                if h5_files or pickle_files or json_files:
+                    results_exist = True
+                    any_results_exist = True
+            
+            # If results exist but task is in trigger mode, update it
+            if results_exist and task_mode == "trigger":
+                pipeline.model.PoseEstimationTask.update1(
+                    {**task_key, "task_mode": "load"}
+                )
+                status.sub(f"Updated recording {rec_key['recording_id']} to 'load' mode (results exist)", icon="✅", indent=3)
+                task_mode = "load"
+            
+            if task_mode != "load":
+                all_in_load_mode = False
+                status.sub(f"Recording {rec_key['recording_id']} is in '{task_mode}' mode", icon="ℹ️", indent=3)
+        except Exception as e:
+            # Task doesn't exist yet, so not in load mode
+            all_in_load_mode = False
+            status.sub(f"Task for recording {rec_key['recording_id']} doesn't exist: {e}", icon="⚠️", indent=3)
+            break
+    
+    # NEVER run inference if results exist - always use load mode
+    if any_results_exist:
+        status.sub("Results exist - will use 'load' mode (skipping inference)", icon="ℹ️", indent=3)
+        # Ensure all tasks with results are in load mode
+        for rec_key in recording_keys:
+            task_key = {**rec_key, "model_name": model_name}
+            try:
+                output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
+                    task_key, relative=False, mkdir=False
+                )
+                output_path = Path(output_dir)
+                if output_path.exists():
+                    h5_files = list(output_path.glob("*.h5"))
+                    pickle_files = list(output_path.glob("*.pickle"))
+                    json_files = list(output_path.glob("*.json"))
+                    if h5_files or pickle_files or json_files:
+                        # Force load mode if results exist
+                        current_task = (pipeline.model.PoseEstimationTask & task_key).fetch1()
+                        if current_task.get("task_mode") != "load":
+                            pipeline.model.PoseEstimationTask.update1(
+                                {**task_key, "task_mode": "load"}
+                            )
+            except Exception:
+                pass
+    
+    # Verify all tasks use the correct pretrained model before inference
+    status.step("Verifying model configuration")
+    for rec_key in recording_keys:
+        task_key = {**rec_key, "model_name": model_name}
+        if pipeline.model.PoseEstimationTask & task_key:
+            task = (pipeline.model.PoseEstimationTask & task_key).fetch1()
+            # Verify the model is actually a pretrained model
+            model_record = (model.Model & {"model_name": model_name}).fetch1()
+            config_template = model_record.get("config_template", {})
+            if config_template.get("_pretrained_model_name") is None:
+                status.sub(f"ERROR: Task for recording {rec_key['recording_id']} references a TRAINED model, not pretrained!", icon="❌", indent=3)
+                status.sub("Deleting incorrect task...", indent=5)
+                (pipeline.model.PoseEstimationTask & task_key).delete()
+                status.sub("Task deleted. Please re-run the script to create correct tasks.", icon="✅", indent=5)
+                return  # Exit gracefully
+    status.sub("All tasks verified to use pretrained model", icon="✅", indent=3)
+    
+    if all_in_load_mode and deeplabcut_available:
+        status.step("Loading existing results")
+        status.sub("All tasks are in 'load' mode - will use existing results", icon="ℹ️", indent=3)
+        status.sub("Skipping inference step (results already exist)", icon="⚠️", indent=3)
+        try:
+            pipeline.model.PoseEstimation.populate()
+            # Check if there are any IndividualMapping entries (for multi-animal data)
+            individual_mappings = (
+                pipeline.model.PoseEstimation.IndividualMapping 
+                & rec_key 
+                & {"model_name": model_name}
+            )
+            num_mappings = len(individual_mappings)
+            
+            if num_mappings > 0:
+                status.sub(f"Results loaded successfully! ({num_mappings} individual mappings created)", icon="✅", indent=3)
+            else:
+                # Check if this is multi-animal data that should have mappings
+                individuals = (
+                    pipeline.model.PoseEstimation.Individual 
+                    & rec_key 
+                    & {"model_name": model_name}
+                )
+                if len(individuals) > 0:
+                    status.sub("Results loaded with warnings: Individual mappings could not be created", icon="⚠️", indent=3)
+                    status.sub(f"Found {len(individuals)} individual(s) but 0 mappings", icon="ℹ️", indent=4)
+                else:
+                    status.sub("Results loaded successfully! (single-animal data)", icon="✅", indent=3)
+        except Exception as e:
+            status.sub(f"Error loading results: {e}", icon="❌", indent=3)
+            raise
+        return  # Exit early if we're just loading
+    
+    # Debug: print what we detected
+    status.sub(f"DLC availability check: deeplabcut_available={deeplabcut_available}, error_msg={error_msg}", indent=3)
+    
+    # If DLC is not available, show error and exit
+    if not deeplabcut_available:
+        status.sub("DeepLabCut is not available - cannot run inference", icon="⚠️", indent=3)
+        
+        # Check if deeplabcut package exists but has missing dependencies
+        if error_msg:
+            spec = importlib.util.find_spec("deeplabcut")
+            if spec is not None:
+                # Package exists but import failed - likely missing dependency
+                if "tensorflow" in error_msg.lower():
+                    if pytorch_available:
+                        status.sub("DeepLabCut is installed but TensorFlow is missing.", icon="⚠️", indent=3)
+                        status.sub(f"PyTorch is available (version {pytorch_version})", icon="✅", indent=5)
+                    status.sub("DeepLabCut's __init__.py tries to import TensorFlow by default,", indent=3)
+                    status.sub("but SuperAnimal models only need PyTorch.", indent=3)
+                    status.sub("Workaround options:", indent=3)
+                    status.sub("1. Install TensorFlow (even if unused): pip install tensorflow", indent=5)
+                    status.sub("2. Or try setting environment variable: export DLC_BACKEND='pytorch'", indent=5)
+                    status.sub("3. Or use DeepLabCut's PyTorch-only installation:", indent=5)
+                    status.sub("   pip install --upgrade 'deeplabcut[superanimal]'", indent=7)
+                else:
+                    status.sub("DeepLabCut is installed but TensorFlow is missing.", icon="⚠️", indent=3)
+                    status.sub("For SuperAnimal pretrained models, you need PyTorch.", indent=3)
+                    status.sub("To fix, install PyTorch: pip install torch", indent=5)
+            if "torch" in error_msg.lower() or "pytorch" in error_msg.lower():
+                status.sub("DeepLabCut is installed but PyTorch is missing.", icon="⚠️", indent=3)
+                status.sub("For SuperAnimal pretrained models, PyTorch is required.", indent=3)
+                status.sub("To fix, install PyTorch: pip install torch", indent=5)
+            elif "tensorpack" in error_msg.lower():
+                status.sub("DeepLabCut is installed but tensorpack is missing.", icon="⚠️", indent=3)
+                if pytorch_available:
+                    status.sub(f"PyTorch is available (version {pytorch_version})", icon="✅", indent=5)
+                status.sub("This is a dependency issue. To fix, reinstall DeepLabCut:", indent=3)
+                status.sub("pip uninstall deeplabcut", indent=5)
+                status.sub("pip install 'deeplabcut[superanimal]==3.0.0rc13'", indent=5)
+            elif "unsupported operand type(s) for |" in error_msg or "|:" in error_msg:
+                import sys
+                python_version = sys.version_info
+                status.sub("Python version incompatibility detected.", icon="⚠️", indent=3)
+                status.sub(f"Current Python version: {python_version.major}.{python_version.minor}.{python_version.micro}", indent=5)
+                status.sub("DeepLabCut 3.0.0rc13 requires Python 3.10 or higher", indent=3)
+                status.sub("(it uses modern type hints like 'int | None' which require Python 3.10+)", indent=5)
+                status.sub("To fix:", indent=3)
+                status.sub("1. Create a new conda environment with Python 3.10+:", indent=5)
+                status.sub("   conda create -n element-dlc python=3.10", indent=7)
+                status.sub("   conda activate element-dlc", indent=7)
+                status.sub("   conda env update -f environment.yml", indent=7)
+                status.sub("2. Or upgrade your current environment:", indent=5)
+                status.sub("   conda install python=3.10", indent=7)
+                status.sub("   pip install --upgrade 'deeplabcut[superanimal]==3.0.0rc13'", indent=7)
+            else:
+                status.sub(f"DeepLabCut is installed but has missing dependencies: {error_msg}", icon="⚠️", indent=3)
+                if pytorch_available:
+                    status.sub(f"PyTorch is available (version {pytorch_version})", icon="✅", indent=5)
+                status.sub("For SuperAnimal pretrained models, you typically need PyTorch.", indent=3)
+                status.sub("To fix, reinstall DeepLabCut:", indent=3)
+                status.sub("pip uninstall deeplabcut", indent=5)
+                status.sub("pip install 'deeplabcut[superanimal]'", indent=5)
+        else:
+            # Package doesn't exist
+            status.sub("DeepLabCut is not installed. Skipping inference step.", icon="⚠️", indent=3)
+            status.sub("To run inference with SuperAnimal models, install:", indent=3)
+            status.sub("pip install 'deeplabcut[superanimal]'", indent=5)
+            status.sub("This will install DeepLabCut with PyTorch support for pretrained models.", indent=5)
+        
+        status.sub("The workflow has been set up successfully up to this point:", indent=3)
+        status.sub("Pretrained model registered", icon="✅", indent=5)
+        status.sub("Model inserted", icon="✅", indent=5)
+        status.sub("Test data created", icon="✅", indent=5)
+        status.sub("Pose estimation tasks created", icon="✅", indent=5)
+        status.sub("After fixing the issue, you can run:", indent=3)
+        status.sub("pipeline.model.PoseEstimation.populate()", indent=5)
+        return
+    
+    # Final check: NEVER run inference if results exist
+    # Check one more time before proceeding
+    has_any_results = False
+    for rec_key in recording_keys:
+        task_key = {**rec_key, "model_name": model_name}
+        try:
+            output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
+                task_key, relative=False, mkdir=False
+            )
+            output_path = Path(output_dir)
+            if output_path.exists():
+                h5_files = list(output_path.glob("*.h5"))
+                pickle_files = list(output_path.glob("*.pickle"))
+                json_files = list(output_path.glob("*.json"))
+                if h5_files or pickle_files or json_files:
+                    has_any_results = True
+                    # Force load mode - CRITICAL: prevent inference
+                    pipeline.model.PoseEstimationTask.update1(
+                        {**task_key, "task_mode": "load"}
+                    )
+                    status.sub(f"⚠️ Found results for recording {rec_key['recording_id']} - forcing 'load' mode (will NOT trigger inference)", icon="⚠️", indent=3)
+        except Exception as e:
+            logger.debug(f"Error checking results for {rec_key}: {e}")
+    
+    if has_any_results:
+        status.sub("Results exist - using 'load' mode instead of triggering inference", icon="ℹ️", indent=3)
+        try:
+            pipeline.model.PoseEstimation.populate()
+            status.sub("Results loaded successfully!", icon="✅", indent=3)
+        except Exception as e:
+            status.sub(f"Error loading results: {e}", icon="❌", indent=3)
+            raise
+        return  # Exit - do NOT run inference
+    
+    # Only run inference if NO results exist anywhere
+    status.sub("DeepLabCut is available - proceeding with inference", icon="✅", indent=3)
+    status.sub("This may take a while (requires GPU for reasonable speed)", icon="⚠️", indent=3)
+    status.sub(f"Processing {len(recording_keys)} video(s)...", icon="⚠️", indent=3)
+    try:
+        pipeline.model.PoseEstimation.populate()
+        status.sub("Inference completed!", icon="✅", indent=3)
+    except Exception as e:
+        status.sub(f"Error during inference: {e}", icon="❌", indent=3)
+        status.sub("Troubleshooting:", indent=3)
+        status.sub("- Ensure DeepLabCut is installed: pip install 'deeplabcut[superanimal]'", indent=5)
+        status.sub("- Check GPU availability (or use CPU - will be slow)", indent=5)
+        status.sub("- Try reducing batchsize or scale in analyze_videos_params", indent=5)
+        raise
+    
+    # 8. Show results for each recording
+    status.header("Results")
+    
+    for rec_key in recording_keys:
+        status.sub(f"Recording {rec_key['recording_id']}:", icon="📹", indent=2)
+        try:
+            pose_estimation = (
+                pipeline.model.PoseEstimation 
+                & rec_key 
+                & {"model_name": model_name}
+            ).fetch1()
+            
+            status.sub(f"Completed at: {pose_estimation['pose_estimation_time']}", icon="✅", indent=4)
+            
+            body_parts = (
+                pipeline.model.PoseEstimation.BodyPartPosition 
+                & rec_key 
+                & {"model_name": model_name}
+            ).fetch("body_part")
+            
+            status.sub(f"Detected body parts ({len(set(body_parts))}): {sorted(set(body_parts))}", icon="📊", indent=4)
+            
+            # Show stats for first body part as example
+            if len(set(body_parts)) > 0:
+                bp = sorted(set(body_parts))[0]
+                bp_data = (
+                    pipeline.model.PoseEstimation.BodyPartPosition 
+                    & rec_key 
+                    & {"model_name": model_name, "body_part": bp}
+                ).fetch1()
+                
+                x_pos = bp_data["x_pos"]
+                y_pos = bp_data["y_pos"]
+                likelihood = bp_data["likelihood"]
+                
+                status.sub(f"Example ({bp}): {len(x_pos)} frames, avg likelihood: {likelihood.mean():.3f}", icon="📈", indent=4)
+        except Exception as e:
+            status.sub(f"No results yet or error: {e}", icon="⚠️", indent=4)
+    
+    status.header("Test completed successfully!")
+    status.sub("Next steps:", indent=2)
+    status.sub("- Check output directory for DLC results", indent=4)
+    status.sub("- Visualize results using DLC's plotting functions", indent=4)
+    status.sub("- Query PoseEstimation.BodyPartPosition for analysis", indent=4)
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(
+        description="Test pretrained DeepLabCut inference with video files",
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+        epilog="""
+Examples:
+  python test_video_inference.py
+  python test_video_inference.py superanimal_quadruped
+  python test_video_inference.py superanimal_topviewmouse
+        """
+    )
+    parser.add_argument(
+        "model",
+        nargs="?",
+        default="superanimal_quadruped",
+        choices=["superanimal_quadruped", "superanimal_topviewmouse"],
+        help="Pretrained model to use (default: superanimal_quadruped)"
+    )
+    
+    args = parser.parse_args()
+    
+    # Store model name as attribute so main() can access it
+    main.pretrained_model_name = args.model
+    
+    main()
+
+
diff --git a/tests/test_pretrained_workflow.py b/tests/test_pretrained_workflow.py
new file mode 100644
index 0000000..09a7a93
--- /dev/null
+++ b/tests/test_pretrained_workflow.py
@@ -0,0 +1,200 @@
+"""
+Tests for pretrained model workflow.
+
+This module tests the pretrained model workflow alongside the existing trained model workflow.
+"""
+
+import pytest
+from pathlib import Path
+
+
+def test_pretrained_model_registration(pipeline):
+    """Test registering pretrained models in the lookup table."""
+    model = pipeline["model"]
+    
+    # Test populate_common_models
+    results = model.PretrainedModel.populate_common_models()
+    assert len(results["inserted"]) > 0 or len(results["skipped"]) > 0
+    
+    # Verify models were registered
+    assert model.PretrainedModel.is_pretrained("superanimal_quadruped")
+    assert model.PretrainedModel.is_pretrained("superanimal_topviewmouse")
+    
+    # Test adding a custom model
+    model.PretrainedModel.add(
+        pretrained_model_name="test_custom_model",
+        source="Test",
+        default_params={"scale": 0.5},
+        description="Test model"
+    )
+    assert model.PretrainedModel.is_pretrained("test_custom_model")
+
+
+def test_insert_pretrained_model(pipeline):
+    """Test inserting a pretrained model into the Model table."""
+    model = pipeline["model"]
+    
+    # First, register a pretrained model
+    if not model.PretrainedModel.is_pretrained("superanimal_quadruped"):
+        model.PretrainedModel.populate_common_models(["superanimal_quadruped"])
+    
+    # Insert pretrained model instance
+    model.Model.insert_pretrained_model(
+        model_name="test_pretrained_model",
+        pretrained_model_name="superanimal_quadruped",
+        model_description="Test pretrained model",
+        prompt=False,
+    )
+    
+    # Verify it was inserted
+    model_record = (model.Model & {"model_name": "test_pretrained_model"}).fetch1()
+    assert model_record["model_name"] == "test_pretrained_model"
+    assert model_record["project_path"] == ""  # Empty for pretrained
+    assert model_record["paramset_idx"] is None  # No training param set
+    
+    # Verify pretrained detection flags
+    config_template = model_record["config_template"]
+    assert config_template.get("_is_pretrained") is True
+    assert config_template.get("_pretrained_model_name") == "superanimal_quadruped"
+
+
+def test_pretrained_vs_trained_detection(pipeline):
+    """Test that pretrained and trained models are correctly detected."""
+    model = pipeline["model"]
+    
+    # Get a trained model (from existing fixture)
+    trained_model = (model.Model & {"model_name": "from_top_tracking_model_test"}).fetch1()
+    trained_config = trained_model["config_template"]
+    
+    # Trained models should not have pretrained flags
+    assert trained_config.get("_is_pretrained") is not True
+    assert trained_config.get("_pretrained_model_name") is None
+    assert trained_model["project_path"] != ""  # Should have project path
+    
+    # Get a pretrained model
+    if not model.PretrainedModel.is_pretrained("superanimal_quadruped"):
+        model.PretrainedModel.populate_common_models(["superanimal_quadruped"])
+    
+    model.Model.insert_pretrained_model(
+        model_name="test_pretrained_detection",
+        pretrained_model_name="superanimal_quadruped",
+        prompt=False,
+    )
+    
+    pretrained_model = (model.Model & {"model_name": "test_pretrained_detection"}).fetch1()
+    pretrained_config = pretrained_model["config_template"]
+    
+    # Pretrained models should have pretrained flags
+    assert pretrained_config.get("_is_pretrained") is True
+    assert pretrained_config.get("_pretrained_model_name") == "superanimal_quadruped"
+    assert pretrained_model["project_path"] == ""  # Empty for pretrained
+
+
+@pytest.mark.skip(
+    reason="Requires actual DLC installation with SuperAnimal support and GPU resources. "
+           "Run manually with: pytest tests/test_pretrained_workflow.py::test_pretrained_inference_workflow -s"
+)
+def test_pretrained_inference_workflow(pipeline, insert_upstreams):
+    """Test the full pretrained inference workflow.
+    
+    This test requires:
+    - DeepLabCut installed with SuperAnimal support
+    - Actual video files
+    - GPU resources (or very long runtime)
+    
+    Run with: pytest tests/test_pretrained_workflow.py::test_pretrained_inference_workflow --run-inference
+    """
+    model = pipeline["model"]
+    
+    # Register pretrained model
+    if not model.PretrainedModel.is_pretrained("superanimal_quadruped"):
+        model.PretrainedModel.populate_common_models(["superanimal_quadruped"])
+    
+    # Insert pretrained model
+    model.Model.insert_pretrained_model(
+        model_name="test_pretrained_inference",
+        pretrained_model_name="superanimal_quadruped",
+        prompt=False,
+    )
+    
+    # Create pose estimation task
+    recording_key = {
+        "subject": "subject6",
+        "session_datetime": "2021-06-02 14:04:22",
+        "recording_id": "1",
+    }
+    
+    model.PoseEstimationTask.generate(
+        recording_key,
+        model_name="test_pretrained_inference",
+        analyze_videos_params={
+            "video_inference": {"scale": 0.4}  # Override default params
+        }
+    )
+    
+    # Run inference (this will actually call DLC)
+    model.PoseEstimation.populate()
+    
+    # Verify results were created
+    pose_estimation = (model.PoseEstimation & recording_key & {"model_name": "test_pretrained_inference"}).fetch1()
+    assert pose_estimation is not None
+    
+    # Verify body part positions exist
+    body_parts = model.PoseEstimation.BodyPartPosition.fetch("body_part")
+    assert len(body_parts) > 0
+
+
+def test_trained_workflow_still_works(pipeline, insert_dlc_model, insert_pose_estimation_task, pose_estimation):
+    """Verify that the existing trained model workflow still works unchanged."""
+    model = pipeline["model"]
+    
+    # Verify trained model exists and has correct structure
+    trained_model = (model.Model & {"model_name": "from_top_tracking_model_test"}).fetch1()
+    assert trained_model["project_path"] != ""  # Should have project path
+    assert trained_model["paramset_idx"] is not None  # Should have paramset
+    
+    # Verify it's detected as trained (not pretrained)
+    config_template = trained_model["config_template"]
+    assert config_template.get("_is_pretrained") is not True
+    
+    # Verify pose estimation results exist
+    body_parts = model.PoseEstimation.BodyPartPosition.fetch("body_part")
+    assert len(body_parts) > 0
+    assert "head" in body_parts or "tailbase" in body_parts
+
+
+def test_pretrained_model_validation(pipeline):
+    """Test validation when using pretrained models."""
+    model = pipeline["model"]
+    
+    # Try to insert pretrained model without registering it first
+    # This should fail gracefully
+    if model.PretrainedModel.is_pretrained("nonexistent_model"):
+        model.PretrainedModel.delete({"pretrained_model_name": "nonexistent_model"})
+    
+    # Should warn but not raise
+    model.Model.insert_pretrained_model(
+        model_name="test_nonexistent",
+        pretrained_model_name="nonexistent_model",
+        prompt=False,
+    )
+    
+    # Verify it wasn't inserted
+    assert not (model.Model & {"model_name": "test_nonexistent"})
+
+
+def test_parameter_merging(pipeline):
+    """Test that default params and user params are merged correctly."""
+    model = pipeline["model"]
+    
+    # Register model with default params
+    if not model.PretrainedModel.is_pretrained("superanimal_quadruped"):
+        model.PretrainedModel.populate_common_models(["superanimal_quadruped"])
+    
+    # Get default params
+    pm = (model.PretrainedModel & {"pretrained_model_name": "superanimal_quadruped"}).fetch1()
+    default_params = pm.get("default_params") or {}
+    
+    # Verify default params exist
+    assert "scale" in default_params or "video_adapt" in default_params or len(default_params) > 0
+

From def9a47aa41b09307b86ffceab6c712589d7bc55 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Wed, 26 Nov 2025 08:34:06 +0100
Subject: [PATCH 07/15] add docker

---
 Dockerfile           | 30 +++++++++++++++++++++
 docker-compose.yaml  | 64 ++++++++++++++++++++++++++++++++++++++++++++
 docker-entrypoint.sh | 10 +++++++
 3 files changed, 104 insertions(+)
 create mode 100644 Dockerfile
 create mode 100644 docker-compose.yaml
 create mode 100644 docker-entrypoint.sh

diff --git a/Dockerfile b/Dockerfile
new file mode 100644
index 0000000..04d5440
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,30 @@
+# Dockerfile for element-deeplabcut client environment
+# Uses DeepLabCut's official Docker image as base
+FROM deeplabcut/deeplabcut:latest-jupyter
+
+# Set working directory
+WORKDIR /app
+
+# Install additional system dependencies if needed
+RUN apt-get update && apt-get install -y \
+    git \
+    graphviz \
+    && rm -rf /var/lib/apt/lists/*
+
+# Copy the entire project
+COPY . .
+
+# Install element-deeplabcut and its dependencies
+# The DLC image already has DeepLabCut installed, so we just need element-deeplabcut
+RUN pip install -e .[dlc_default,elements,tests]
+
+# Set environment variables
+ENV PYTHONUNBUFFERED=1
+
+# Set entrypoint to bash
+ENTRYPOINT ["/bin/bash"]
+
+# Default command - interactive bash shell
+# Users can override with: docker compose run client -c "python your_script.py"
+CMD ["-i"]
+
diff --git a/docker-compose.yaml b/docker-compose.yaml
new file mode 100644
index 0000000..74840e7
--- /dev/null
+++ b/docker-compose.yaml
@@ -0,0 +1,64 @@
+# Docker Compose configuration for element-deeplabcut client environment
+# Usage: docker compose up --build
+#        docker compose run client python your_script.py
+
+version: "3.8"
+
+services:
+  # MySQL database service
+  db:
+    restart: always
+    image: datajoint/mysql:${MYSQL_VER:-8.0}
+    environment:
+      - MYSQL_ROOT_PASSWORD=${DJ_PASS:-datajoint}
+    ports:
+      - "${DB_PORT:-3306}:3306"
+    volumes:
+      - db_data:/var/lib/mysql
+    healthcheck:
+      test: ["CMD", "mysqladmin", "ping", "-h", "localhost", "-u", "root", "-p${DJ_PASS:-datajoint}"]
+      timeout: 15s
+      retries: 10
+      interval: 15s
+    networks:
+      - element_network
+
+  # Client container
+  client:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    depends_on:
+      db:
+        condition: service_healthy
+    environment:
+      - DJ_HOST=db
+      - DJ_USER=root
+      - DJ_PASS=${DJ_PASS:-datajoint}
+      - DJ_PORT=3306
+      - DATABASE_PREFIX=${DATABASE_PREFIX:-}
+      - DLC_ROOT_DATA_DIR=${DLC_ROOT_DATA_DIR:-/app/test_videos}
+      - PYTHONUNBUFFERED=1
+    volumes:
+      # Mount data directory (can be customized via DLC_DATA_DIR env var)
+      # Default: ./test_videos (for tests) or ./data (for general use)
+      - ${DLC_DATA_DIR:-./test_videos}:/app/data
+      # Mount config file if it exists
+      - ./dj_local_conf.json:/app/dj_local_conf.json:ro
+      # Mount the project directory for development
+      - .:/app
+    networks:
+      - element_network
+    # Default command - interactive bash (entrypoint is /bin/bash)
+    # Example: docker compose run client -c "python test_trained_inference.py"
+    command: ["-i"]
+    stdin_open: true
+    tty: true
+
+volumes:
+  db_data:
+
+networks:
+  element_network:
+    driver: bridge
+
diff --git a/docker-entrypoint.sh b/docker-entrypoint.sh
new file mode 100644
index 0000000..e1162b6
--- /dev/null
+++ b/docker-entrypoint.sh
@@ -0,0 +1,10 @@
+#!/bin/bash
+# Docker entrypoint script for element-deeplabcut client
+# Works with DeepLabCut Docker image which already has DLC installed
+
+set -e
+
+# Execute the command
+exec "$@"
+
+

From d1adaf264210c7934dee8e052e2108921d392feb Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Wed, 26 Nov 2025 08:34:29 +0100
Subject: [PATCH 08/15] docker part docs

---
 DOCKER_TEST_README.md | 49 +++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 49 insertions(+)
 create mode 100644 DOCKER_TEST_README.md

diff --git a/DOCKER_TEST_README.md b/DOCKER_TEST_README.md
new file mode 100644
index 0000000..3ea1d97
--- /dev/null
+++ b/DOCKER_TEST_README.md
@@ -0,0 +1,49 @@
+# Docker Testing
+
+## Quick Start
+
+```bash
+# Start database and container
+docker compose up -d
+
+# Run tests
+docker compose run --rm client python test_trained_inference.py
+docker compose run --rm client python test_video_inference.py superanimal_quadruped
+
+# Or use Makefile
+make test-trained
+make test-pretrained
+```
+
+## Configuration
+
+Create `.env` file (optional):
+
+```env
+DJ_PASS=simple
+DB_PORT=3306
+DATABASE_PREFIX=test_
+```
+
+## Volumes
+
+| Mount | Container Path | Description |
+|-------|----------------|-------------|
+| `./test_videos` | `/app/data` | Test videos |
+| `.` | `/app` | Project directory |
+| `./dj_local_conf.json` | `/app/dj_local_conf.json` | Database config |
+
+## Troubleshooting
+
+| Issue | Solution |
+|-------|----------|
+| Database connection | `docker compose ps` to check health |
+| Permission issues | `sudo chown -R $USER:$USER test_videos/` |
+| Code changes | `docker compose build` |
+| Clean up | `docker compose down -v` |
+
+## Development
+
+```bash
+make shell  # Interactive shell
+```

From b559659b9362fe7b3f0009ccefbabdf626fc6dcc Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Wed, 26 Nov 2025 08:34:38 +0100
Subject: [PATCH 09/15] Makefile

---
 Makefile | 31 +++++++++++++++++++++++++++++++
 1 file changed, 31 insertions(+)
 create mode 100644 Makefile

diff --git a/Makefile b/Makefile
new file mode 100644
index 0000000..0be87f2
--- /dev/null
+++ b/Makefile
@@ -0,0 +1,31 @@
+.PHONY: help build up down shell test-trained test-pretrained clean
+
+help:
+	@echo "make build          - Build Docker image"
+	@echo "make up             - Start services"
+	@echo "make down           - Stop services"
+	@echo "make shell          - Interactive shell"
+	@echo "make test-trained   - Run trained model test"
+	@echo "make test-pretrained - Run pretrained model test"
+	@echo "make clean          - Remove volumes"
+
+build:
+	docker compose build
+
+up:
+	docker compose up -d
+
+down:
+	docker compose down
+
+shell:
+	docker compose run --rm client -i
+
+test-trained:
+	docker compose run --rm client -c "python test_trained_inference.py"
+
+test-pretrained:
+	docker compose run --rm client -c "python test_video_inference.py superanimal_quadruped"
+
+clean:
+	docker compose down -v

From 78c2006c7e8c62f690dc371b330a2fde05e9f032 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Thu, 4 Dec 2025 13:01:41 +0100
Subject: [PATCH 10/15] refresh requirements

---
 Dockerfile          |   8 +-
 Makefile            | 242 +++++++++++++++++++++++++++++++++++++++++++-
 docker-compose.yaml |  12 +++
 requirements.txt    |  30 ++++++
 setup.py            |  21 ++--
 5 files changed, 299 insertions(+), 14 deletions(-)
 create mode 100644 requirements.txt

diff --git a/Dockerfile b/Dockerfile
index 04d5440..891ec6e 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -1,6 +1,7 @@
 # Dockerfile for element-deeplabcut client environment
 # Uses DeepLabCut's official Docker image as base
-FROM deeplabcut/deeplabcut:latest-jupyter
+# Pinned to specific version for reproducibility
+FROM deeplabcut/deeplabcut:3.0.0rc13-jupyter
 
 # Set working directory
 WORKDIR /app
@@ -16,7 +17,10 @@ COPY . .
 
 # Install element-deeplabcut and its dependencies
 # The DLC image already has DeepLabCut installed, so we just need element-deeplabcut
-RUN pip install -e .[dlc_default,elements,tests]
+# Note: We explicitly constrain dlclibrary version to avoid ModelZoo download bug
+# (rename_mapping being a string instead of dict - fixed with runtime monkey patch)
+RUN pip install -e .[dlc_default,elements,tests] && \
+    pip install "dlclibrary>=0.1.0,<0.2.0" || true
 
 # Set environment variables
 ENV PYTHONUNBUFFERED=1
diff --git a/Makefile b/Makefile
index 0be87f2..9441591 100644
--- a/Makefile
+++ b/Makefile
@@ -1,16 +1,33 @@
-.PHONY: help build up down shell test-trained test-pretrained clean
+.PHONY: help build up down shell test-trained test-pretrained clean \
+	quad-superanimal quad-superanimal-auto-refine quad-superanimal-no-adapt quad-superanimal-predict quad-superanimal-refine \
+	quad-superanimal-dataset quad-superanimal-train-fast quad-superanimal-train-slow install-dlc-gui
 
 help:
 	@echo "make build          - Build Docker image"
 	@echo "make up             - Start services"
 	@echo "make down           - Stop services"
 	@echo "make shell          - Interactive shell"
-	@echo "make test-trained   - Run trained model test"
-	@echo "make test-pretrained - Run pretrained model test"
+	@echo "make test-trained   - Run trained model test (CPU, or GPU if available)"
+	@echo "make test-pretrained - Run pretrained model test (CPU, or GPU if available)"
+	@echo "make test-trained-gpu   - Run trained model test with GPU (requires nvidia-container-toolkit)"
+	@echo "make test-pretrained-gpu - Run pretrained model test with GPU (requires nvidia-container-toolkit)"
+	@echo "Workflow (EXACT ORDER) - PyTorch engine (default):"
+	@echo "  1. make quad-superanimal           - Create project + SuperAnimal predictions + extract frames"
+	@echo "     OR make quad-superanimal-auto-refine - Same as above (no auto-refine, use step 2)"
+	@echo "     OR make quad-superanimal-no-adapt - Same but without video adaptation (if OOM errors)"
+	@echo "  2. make quad-superanimal-refine    - Open DLC refine GUI → correct + SAVE (creates CollectedData_*.csv/.h5)"
+	@echo "  3. make quad-superanimal-dataset   - Create training dataset (.mat files) from labels"
+	@echo "  4. make quad-superanimal-train-fast - Fast training (10 epochs) - combines dataset + train"
+	@echo "     OR make quad-superanimal-train-slow - Slow training (50 epochs)"
+	@echo ""
+	@echo "Note: Step 2 is REQUIRED - SuperAnimal predictions ≠ training labels until you save in GUI"
+	@echo "Note: All targets use --engine pytorch (PyTorch ModelZoo with HRNet-W32 + Faster R-CNN)"
+	@echo "make install-dlc-gui - pip install 'deeplabcut[gui]' in current environment"
 	@echo "make clean          - Remove volumes"
 
 build:
 	docker compose build
+	@echo "Built image: element-deeplabcut-client"
 
 up:
 	docker compose up -d
@@ -21,11 +38,226 @@ down:
 shell:
 	docker compose run --rm client -i
 
+# Helper to get the compose project network name
+COMPOSE_PROJECT_NAME := $(shell basename $$(pwd) | tr '[:upper:]' '[:lower:]' | sed 's/[^a-z0-9]//g')
+NETWORK_NAME := $(COMPOSE_PROJECT_NAME)_element_network
+
 test-trained:
-	docker compose run --rm client -c "python test_trained_inference.py"
+	@echo "⚠️  Note: docker compose run doesn't support --gpus flag"
+	@echo "   GPU access requires using docker run directly or nvidia-container-toolkit"
+	@echo "   Tests will run on CPU if GPU is not available"
+	@docker compose ps db > /dev/null 2>&1 || docker compose up -d db
+	@echo "Waiting for database..."
+	@sleep 3
+	docker compose run --rm client -c "python test_trained_inference.py --gpu 0 --batch-size 4"
 
 test-pretrained:
-	docker compose run --rm client -c "python test_video_inference.py superanimal_quadruped"
+	@echo "⚠️  Note: docker compose run doesn't support --gpus flag"
+	@echo "   GPU access requires using docker run directly or nvidia-container-toolkit"
+	@echo "   Tests will run on CPU if GPU is not available"
+	@docker compose ps db > /dev/null 2>&1 || docker compose up -d db
+	@echo "Waiting for database..."
+	@sleep 3
+	docker compose run --rm client -c "python test_video_inference.py superanimal_quadruped --gpu 0 --detector-batch-size 4"
+
+# GPU-enabled test targets (requires nvidia-container-toolkit)
+test-trained-gpu:
+	@echo "🚀 Running with GPU support (requires nvidia-container-toolkit)"
+	@docker compose ps db > /dev/null 2>&1 || docker compose up -d db
+	@echo "Waiting for database..."
+	@sleep 3
+	@IMAGE=$$(docker compose config 2>/dev/null | grep -A 5 '^  client:' | grep 'image:' | awk '{print $$2}' 2>/dev/null || docker images --format '{{.Repository}}:{{.Tag}}' | grep element-deeplabcut-client | head -1); \
+	if [ -z "$$IMAGE" ]; then \
+		echo "Building image..."; \
+		docker compose build client; \
+		IMAGE=element-deeplabcut-client; \
+	fi; \
+	docker run --rm --gpus all \
+		--network $(NETWORK_NAME) \
+		-e DJ_HOST=db -e DJ_USER=root -e DJ_PASS=$${DJ_PASS:-datajoint} -e DJ_PORT=3306 \
+		-e DATABASE_PREFIX=$${DATABASE_PREFIX:-} -e DLC_ROOT_DATA_DIR=$${DLC_ROOT_DATA_DIR:-/app/test_videos} \
+		-e PYTHONUNBUFFERED=1 -e NVIDIA_VISIBLE_DEVICES=all \
+		-v $${DLC_DATA_DIR:-./test_videos}:/app/data \
+		$$([ -f dj_local_conf.json ] && echo "-v $$(pwd)/dj_local_conf.json:/app/dj_local_conf.json:ro") \
+		-v $$(pwd):/app \
+		$$IMAGE \
+		-c "python test_trained_inference.py --gpu 0 --batch-size 4"
+
+test-pretrained-gpu:
+	@echo "🚀 Running with GPU support (requires nvidia-container-toolkit)"
+	@docker compose ps db > /dev/null 2>&1 || docker compose up -d db
+	@echo "Waiting for database..."
+	@sleep 3
+	@IMAGE=$$(docker compose config 2>/dev/null | grep -A 5 '^  client:' | grep 'image:' | awk '{print $$2}' 2>/dev/null || docker images --format '{{.Repository}}:{{.Tag}}' | grep element-deeplabcut-client | head -1); \
+	if [ -z "$$IMAGE" ]; then \
+		echo "Building image..."; \
+		docker compose build client; \
+		IMAGE=element-deeplabcut-client; \
+	fi; \
+	docker run --rm --gpus all \
+		--network $(NETWORK_NAME) \
+		-e DJ_HOST=db -e DJ_USER=root -e DJ_PASS=$${DJ_PASS:-datajoint} -e DJ_PORT=3306 \
+		-e DATABASE_PREFIX=$${DATABASE_PREFIX:-} -e DLC_ROOT_DATA_DIR=$${DLC_ROOT_DATA_DIR:-/app/test_videos} \
+		-e PYTHONUNBUFFERED=1 -e NVIDIA_VISIBLE_DEVICES=all \
+		-v $${DLC_DATA_DIR:-./test_videos}:/app/data \
+		$$([ -f dj_local_conf.json ] && echo "-v $$(pwd)/dj_local_conf.json:/app/dj_local_conf.json:ro") \
+		-v $$(pwd):/app \
+		$$IMAGE \
+		-c "python test_video_inference.py superanimal_quadruped --gpu 0 --detector-batch-size 4"
+
+quad-superanimal:
+	# Step 1: Create project + SuperAnimal predictions + extract frames (PyTorch engine)
+	# After completion, you can run 'make quad-superanimal-refine' to open the GUI
+	# Uses optimized parameters for tiny animals in 4K video
+	# NOTE: If you get CUDA OOM errors, try 'make quad-superanimal-no-adapt' instead
+	python real_quadruped_training_example.py \
+		--engine pytorch \
+		--create-project \
+		--project-name quad_superanimal \
+		--experimenter mariia \
+		--videos "/home/mariiapopova/element-deeplabcut/test_videos/IMG_7654.mp4" \
+		--run-superanimal \
+		--batch-size 1 \
+		--detector-batch-size 1 \
+		--bbox-threshold 0.1 \
+		--pcutoff 0.05 \
+		--pseudo-threshold 0.05 \
+		--scale-list 300 400 500 600 700 800 \
+		--video-adapt \
+		--adapt-iterations 500 \
+		--detector-epochs-inference 3 \
+		--pose-epochs-inference 5 \
+		--gpu 0 \
+		--extract-frames
+
+quad-superanimal-auto-refine:
+	# Step 1: Create project + SuperAnimal predictions + extract frames (PyTorch engine)
+	# NOTE: This is the same as 'quad-superanimal' - no auto-refine GUI
+	# After this, run 'make quad-superanimal-refine' to open the refine GUI
+	# Uses optimized parameters for tiny animals in 4K video
+	python real_quadruped_training_example.py \
+		--engine pytorch \
+		--create-project \
+		--project-name quad_superanimal \
+		--experimenter mariia \
+		--videos "/home/mariiapopova/element-deeplabcut/test_videos/IMG_7654.mp4" \
+		--run-superanimal \
+		--batch-size 2 \
+		--detector-batch-size 1 \
+		--bbox-threshold 0.1 \
+		--pcutoff 0.05 \
+		--pseudo-threshold 0.05 \
+		--scale-list 300 400 500 600 700 800 \
+		--video-adapt \
+		--adapt-iterations 500 \
+		--detector-epochs-inference 3 \
+		--pose-epochs-inference 5 \
+		--gpu 0 \
+		--extract-frames
+
+quad-superanimal-predict:
+	# Run SuperAnimal inference on existing project (PyTorch engine)
+	# Project directory is auto-detected as the latest quad_superanimal-mariia-* under the repo root.
+	# NOTE: Usually not needed - 'make quad-superanimal' already runs SuperAnimal inference.
+	# Uses optimized parameters for tiny animals in 4K video
+	python real_quadruped_training_example.py \
+		--engine pytorch \
+		--project-name quad_superanimal \
+		--experimenter mariia \
+		--run-superanimal \
+		--batch-size 2 \
+		--detector-batch-size 1 \
+		--bbox-threshold 0.1 \
+		--pcutoff 0.05 \
+		--pseudo-threshold 0.05 \
+		--scale-list 300 400 500 600 700 800 \
+		--video-adapt \
+		--adapt-iterations 500 \
+		--detector-epochs-inference 3 \
+		--pose-epochs-inference 5 \
+		--gpu 0 \
+		--extract-frames
+
+quad-superanimal-no-adapt:
+	# Step 1 (NO VIDEO ADAPTATION): Create project + SuperAnimal predictions + extract frames
+	# Use this if 'make quad-superanimal' fails with CUDA OOM errors
+	# Disables video adaptation to reduce GPU memory usage
+	python real_quadruped_training_example.py \
+		--engine pytorch \
+		--create-project \
+		--project-name quad_superanimal \
+		--experimenter mariia \
+		--videos "/home/mariiapopova/element-deeplabcut/test_videos/IMG_7654.mp4" \
+		--run-superanimal \
+		--batch-size 1 \
+		--detector-batch-size 1 \
+		--bbox-threshold 0.1 \
+		--pcutoff 0.05 \
+		--pseudo-threshold 0.05 \
+		--scale-list 300 400 500 600 700 800 \
+		--no-video-adapt \
+		--gpu 0 \
+		--extract-frames
+
+quad-superanimal-refine:
+	# Step 2 (REQUIRED): Open DLC refine GUI to convert SuperAnimal predictions into training labels
+	# This is an interactive step: you'll correct keypoints in the GUI and save them.
+	# After saving, predictions become CollectedData_*.csv/.h5 files (real labels for training).
+	# PREREQUISITE: Run 'make quad-superanimal' first to get predictions + frames
+	python real_quadruped_training_example.py \
+		--engine pytorch \
+		--project-name quad_superanimal \
+		--experimenter mariia \
+		--refine-labels
+
+quad-superanimal-dataset:
+	# Step 3: Create training dataset (.mat files) from labels
+	# REQUIRES: CollectedData_*.csv/.h5 files exist (created in step 2 when you save in refine GUI)
+	# This generates training-datasets/.../*.mat files needed for training
+	# PREREQUISITE: Run 'make quad-superanimal-refine' and SAVE your labels in the GUI first
+	python real_quadruped_training_example.py \
+		--engine pytorch \
+		--project-name quad_superanimal \
+		--experimenter mariia \
+		--create-dataset
+
+quad-superanimal-train-fast:
+	# Step 4: One-shot dataset creation + fast training (10 epochs, save every 5)
+	# PREREQUISITES:
+	#   1. make quad-superanimal (creates project + predictions + frames)
+	#   2. make quad-superanimal-refine (converts predictions → labels via GUI)
+	#   3. Then run this command
+	python real_quadruped_training_example.py \
+		--engine pytorch \
+		--project-name quad_superanimal \
+		--experimenter mariia \
+		--create-dataset \
+		--train \
+		--epochs 10 \
+		--save-epochs 5 \
+		--train-batch-size 16 \
+		--gpu 0
+
+quad-superanimal-train-slow:
+	# Step 4: One-shot dataset creation + slow training (50 epochs, save every 10)
+	# PREREQUISITES:
+	#   1. make quad-superanimal (creates project + predictions + frames)
+	#   2. make quad-superanimal-refine (converts predictions → labels via GUI)
+	#   3. Then run this command
+	python real_quadruped_training_example.py \
+		--engine pytorch \
+		--project-name quad_superanimal \
+		--experimenter mariia \
+		--create-dataset \
+		--train \
+		--epochs 50 \
+		--save-epochs 10 \
+		--train-batch-size 16 \
+		--gpu 0
+	
+
+install-dlc-gui:
+	pip install 'deeplabcut[gui]'
 
 clean:
 	docker compose down -v
diff --git a/docker-compose.yaml b/docker-compose.yaml
index 74840e7..85fb2a4 100644
--- a/docker-compose.yaml
+++ b/docker-compose.yaml
@@ -39,6 +39,9 @@ services:
       - DATABASE_PREFIX=${DATABASE_PREFIX:-}
       - DLC_ROOT_DATA_DIR=${DLC_ROOT_DATA_DIR:-/app/test_videos}
       - PYTHONUNBUFFERED=1
+      # GPU support - set NVIDIA_VISIBLE_DEVICES to enable GPU access
+      # Can be overridden via -e flag in docker compose run
+      - NVIDIA_VISIBLE_DEVICES=${NVIDIA_VISIBLE_DEVICES:-all}
     volumes:
       # Mount data directory (can be customized via DLC_DATA_DIR env var)
       # Default: ./test_videos (for tests) or ./data (for general use)
@@ -49,6 +52,15 @@ services:
       - .:/app
     networks:
       - element_network
+    # GPU support for docker compose v2
+    # This requires nvidia-container-toolkit to be installed on the host
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: all
+              capabilities: [gpu]
     # Default command - interactive bash (entrypoint is /bin/bash)
     # Example: docker compose run client -c "python test_trained_inference.py"
     command: ["-i"]
diff --git a/requirements.txt b/requirements.txt
new file mode 100644
index 0000000..2bae6d1
--- /dev/null
+++ b/requirements.txt
@@ -0,0 +1,30 @@
+# Pinned requirements for element-deeplabcut
+# Generated for reproducibility - use with: pip install -r requirements.txt
+
+# Core dependencies
+datajoint==0.14.0
+pydot==1.4.2
+ipykernel==6.29.0
+ipywidgets==8.1.1
+opencv-python==4.8.1.78
+
+# Testing
+pytest==7.4.4
+pytest-cov==4.1.0
+
+# DeepLabCut - pinned version
+deeplabcut[superanimal]==3.0.0rc13
+deeplabcut[gui]==3.0.0rc13
+
+# dlclibrary - constrained to avoid ModelZoo download bug
+# The bug: rename_mapping is sometimes a string instead of dict
+# Constraining version helps, but we also have a runtime monkey patch
+dlclibrary>=0.1.0,<0.2.0
+
+# Element dependencies (from git)
+# Note: These are installed via setup.py extras, but listed here for reference
+# element-lab @ git+https://github.com/datajoint/element-lab.git
+# element-animal @ git+https://github.com/datajoint/element-animal.git
+# element-session @ git+https://github.com/datajoint/element-session.git
+# element-interface @ git+https://github.com/datajoint/element-interface.git
+
diff --git a/setup.py b/setup.py
index cee590d..fd61139 100644
--- a/setup.py
+++ b/setup.py
@@ -25,24 +25,27 @@
     packages=find_packages(exclude=["contrib", "docs", "tests*"]),
     scripts=[],
     install_requires=[
-        "datajoint>=0.14.0",
+        "datajoint==0.14.0",
         "graphviz",
-        "pydot",
-        "ipykernel",
-        "ipywidgets",
+        "pydot==1.4.2",
+        "ipykernel==6.29.0",
+        "ipywidgets==8.1.1",
     ],
     extras_require={
         "dlc_default": [
-            "deeplabcut[superanimal]==3.0.0rc13"
+            "deeplabcut[superanimal]==3.0.0rc13",
+            "dlclibrary>=0.1.0,<0.2.0",  # Pin to avoid ModelZoo download bug
         ],
         "dlc_apple_mchips": [
             "tensorflow-macos==2.12.0",
             "tensorflow-metal",
             "tables==3.7.0",
             "deeplabcut[superanimal]==3.0.0rc13",
+            "dlclibrary>=0.1.0,<0.2.0",  # Pin to avoid ModelZoo download bug
         ],
         "dlc_gui": [
-            "deeplabcut[gui]==3.0.0rc13"
+            "deeplabcut[gui]==3.0.0rc13",
+            "dlclibrary>=0.1.0,<0.2.0",  # Pin to avoid ModelZoo download bug
         ],
         "elements": [
             "element-lab @ git+https://github.com/datajoint/element-lab.git",
@@ -50,6 +53,10 @@
             "element-session @ git+https://github.com/datajoint/element-session.git",
             "element-interface @ git+https://github.com/datajoint/element-interface.git",
         ],
-        "tests": ["pytest", "pytest-cov", "shutils"],
+        "tests": [
+            "pytest==7.4.4",
+            "pytest-cov==4.1.0",
+            "shutils",
+        ],
     },
 )

From d4bb362aa1e85042ec41655c5b36e3a1a85f3404 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Thu, 4 Dec 2025 13:02:26 +0100
Subject: [PATCH 11/15] improve test populates

---
 element_deeplabcut/model.py              |  793 +++++++++-
 element_deeplabcut/readers/dlc_reader.py |   40 +-
 test_trained_inference.py                | 1775 ++++++++++++++--------
 test_video_inference.py                  | 1052 +++++++++----
 4 files changed, 2682 insertions(+), 978 deletions(-)

diff --git a/element_deeplabcut/model.py b/element_deeplabcut/model.py
index 843cdf5..cb9def4 100644
--- a/element_deeplabcut/model.py
+++ b/element_deeplabcut/model.py
@@ -23,6 +23,39 @@
 
 _linking_module = None
 
+# Apply dlclibrary bug patch early at module import
+def _apply_dlclibrary_patch_early():
+    """Apply dlclibrary ModelZoo bug patch at module import time."""
+    try:
+        import dlclibrary.dlcmodelzoo.modelzoo_download as modelzoo_download
+        if hasattr(modelzoo_download, '_handle_downloaded_file'):
+            original_handle = modelzoo_download._handle_downloaded_file
+            
+            def patched_handle_downloaded_file(file_name, target_dir, rename_mapping):
+                """Patched version that handles rename_mapping being a string."""
+                # Fix: If rename_mapping is a string, convert to dict or use empty dict
+                if isinstance(rename_mapping, str):
+                    rename_mapping = {}
+                elif rename_mapping is None:
+                    rename_mapping = {}
+                
+                # Call original function with fixed rename_mapping
+                return original_handle(file_name, target_dir, rename_mapping)
+            
+            # Apply the patch
+            modelzoo_download._handle_downloaded_file = patched_handle_downloaded_file
+            logger.debug("Applied dlclibrary ModelZoo bug patch at module import")
+    except (ImportError, AttributeError):
+        # dlclibrary not available yet, will be patched later if needed
+        pass
+
+# Try to apply patch early (will be applied again in _do_pretrained_inference if needed)
+try:
+    _apply_dlclibrary_patch_early()
+except Exception:
+    # Silently fail - patch will be applied later when needed
+    pass
+
 
 def activate(
     model_schema_name: str,
@@ -958,27 +991,94 @@ def infer_output_dir(cls, key: dict, relative: bool = False, mkdir: bool = False
                 "Please set DLC_ROOT_DATA_DIR environment variable or configure it in dj_local_conf.json"
             )
         
-        video_filepath = find_full_path(
-            root_dirs,
-            (VideoRecording.File & key).fetch("file_path", limit=1)[0],
-        )
+        # Get the stored file path from the database
+        stored_file_path = (VideoRecording.File & key).fetch("file_path", limit=1)[0]
+        
+        try:
+            video_filepath = find_full_path(root_dirs, stored_file_path)
+        except FileNotFoundError as e:
+            # Provide more helpful error message with diagnostic information
+            error_msg = (
+                f"Could not find video file: {stored_file_path}\n"
+                f"Searched in root directories: {root_dirs}\n"
+            )
+            # Check if any files exist in the root directories
+            for root in root_dirs:
+                root_path = Path(root)
+                if root_path.exists():
+                    video_files = list(root_path.glob("*.mp4")) + list(root_path.glob("*.avi")) + list(root_path.glob("*.mov"))
+                    if video_files:
+                        error_msg += f"\nFound {len(video_files)} video file(s) in {root}:\n"
+                        for vf in video_files[:5]:  # Show first 5
+                            error_msg += f"  - {vf.name}\n"
+                        if len(video_files) > 5:
+                            error_msg += f"  ... and {len(video_files) - 5} more\n"
+                    else:
+                        error_msg += f"\nNo video files found in {root}\n"
+                else:
+                    error_msg += f"\nRoot directory does not exist: {root}\n"
+            
+            # Check if the stored path is absolute and exists
+            stored_path = Path(stored_file_path)
+            if stored_path.is_absolute() and stored_path.exists():
+                # File exists at absolute path but not under any root directory
+                # Use it directly as a fallback
+                logger.warning(
+                    f"Video file {stored_file_path} exists at absolute path but is not under any configured root directory. "
+                    f"Using absolute path directly."
+                )
+                video_filepath = stored_path
+            else:
+                # Check if the stored path is absolute
+                if stored_path.is_absolute():
+                    error_msg += (
+                        f"\nNote: Stored path is absolute: {stored_file_path}\n"
+                        "If the file exists at this absolute path, it may not be under any configured root directory.\n"
+                    )
+                    if stored_path.exists():
+                        error_msg += f"The file exists at this absolute path, but it's not under any root directory.\n"
+                
+                raise FileNotFoundError(error_msg) from e
         
         # Ensure video_filepath is an absolute Path
         video_filepath = Path(video_filepath).resolve()
         
-        # Handle case where video is directly in root directory
-        video_parent = video_filepath.parent
+        # Find the root directory that contains this video file
         root_dir = None
-        # Check if parent is one of the root directories
+        video_parent = video_filepath.parent
+        
+        # First, check if the video file itself is directly in a root directory
         for root in root_dirs:
             root_path = Path(root).resolve()
-            if video_parent == root_path:
+            if video_filepath.parent == root_path:
                 root_dir = root_path
                 break
         
-        # If not found, use find_root_directory (for nested paths)
+        # If not found, check if video file is in a subdirectory of a root directory
+        if root_dir is None:
+            for root in root_dirs:
+                root_path = Path(root).resolve()
+                try:
+                    # Check if video_filepath is under this root
+                    video_filepath.relative_to(root_path)
+                    root_dir = root_path
+                    break
+                except ValueError:
+                    # video_filepath is not under this root, continue
+                    continue
+        
+        # If still not found, try find_root_directory on the parent directory
         if root_dir is None:
-            root_dir = Path(find_root_directory(root_dirs, video_filepath.parent)).resolve()
+            try:
+                root_dir = Path(find_root_directory(root_dirs, video_filepath.parent)).resolve()
+            except FileNotFoundError:
+                # Last resort: if video is not under any root, use the first root directory
+                # This handles edge cases where the video path might be absolute but outside roots
+                logger.warning(
+                    f"Video file {video_filepath} is not under any configured root directory. "
+                    f"Using first root directory as fallback: {root_dirs[0]}"
+                )
+                root_dir = Path(root_dirs[0]).resolve()
         recording_key = VideoRecording & key
         device = "-".join(
             str(v)
@@ -989,9 +1089,21 @@ def infer_output_dir(cls, key: dict, relative: bool = False, mkdir: bool = False
         else:  # if processed not provided, default to where video is
             processed_dir = root_dir
 
+        # Calculate relative path from root_dir to video's parent directory
+        try:
+            video_relative_path = video_filepath.parent.relative_to(root_dir)
+        except ValueError:
+            # Video is not under root_dir (edge case - should be rare)
+            # Use video's parent directory name as the relative path
+            logger.warning(
+                f"Video {video_filepath} is not under root directory {root_dir}. "
+                f"Using parent directory name as relative path."
+            )
+            video_relative_path = Path(video_filepath.parent.name)
+
         output_dir = (
             processed_dir
-            / video_filepath.parent.relative_to(root_dir)
+            / video_relative_path
             / (
                 f'device_{device}_recording_{key["recording_id"]}_model_'
                 + key["model_name"].replace(" ", "-")
@@ -1187,6 +1299,42 @@ class IndividualMapping(dj.Part):
         individual_id: varchar(32)  # Individual identifier (must match Individual.individual_id)
         """
 
+    @staticmethod
+    def _patch_dlclibrary_modelzoo_bug():
+        """Monkey patch to fix dlclibrary ModelZoo download bug.
+        
+        The bug: In dlclibrary.dlcmodelzoo.modelzoo_download._handle_downloaded_file,
+        rename_mapping is sometimes a string instead of a dict, causing AttributeError.
+        
+        This patch ensures rename_mapping is always treated as a dict.
+        """
+        try:
+            import dlclibrary.dlcmodelzoo.modelzoo_download as modelzoo_download
+            original_handle = modelzoo_download._handle_downloaded_file
+            
+            def patched_handle_downloaded_file(file_name, target_dir, rename_mapping):
+                """Patched version that handles rename_mapping being a string."""
+                # Fix: If rename_mapping is a string, convert to dict or use empty dict
+                if isinstance(rename_mapping, str):
+                    logger.warning(
+                        f"dlclibrary bug: rename_mapping is a string '{rename_mapping}' instead of dict. "
+                        "Using empty dict as fallback."
+                    )
+                    rename_mapping = {}
+                elif rename_mapping is None:
+                    rename_mapping = {}
+                
+                # Call original function with fixed rename_mapping
+                return original_handle(file_name, target_dir, rename_mapping)
+            
+            # Apply the patch
+            modelzoo_download._handle_downloaded_file = patched_handle_downloaded_file
+            logger.debug("Applied dlclibrary ModelZoo bug patch")
+            return True
+        except (ImportError, AttributeError) as e:
+            logger.debug(f"Could not patch dlclibrary (may not be needed): {e}")
+            return False
+
     @classmethod
     def _do_pretrained_inference(
         cls,
@@ -1213,6 +1361,9 @@ def _do_pretrained_inference(
         """
         import inspect
         import deeplabcut
+        
+        # Apply monkey patch to fix dlclibrary bug before inference
+        cls._patch_dlclibrary_modelzoo_bug()
 
         # --- Fetch pretrained model metadata from lookup ---
         try:
@@ -1281,12 +1432,36 @@ def _do_pretrained_inference(
             logger.info(f"Output will be saved to: {destfolder_str}")
 
             # Call with correct signature: videos, superanimal_name, model_name, **kwargs
-            result = inference_func(
-                video_filepaths,
-                pretrained_model_name,  # superanimal_name (positional, required)
-                backbone_model_name,    # model_name (positional, required)
-                **kwargs,
-            )
+            try:
+                result = inference_func(
+                    video_filepaths,
+                    pretrained_model_name,  # superanimal_name (positional, required)
+                    backbone_model_name,    # model_name (positional, required)
+                    **kwargs,
+                )
+            except ValueError as e:
+                error_msg = str(e)
+                if "need at least one array to stack" in error_msg or "at least one array" in error_msg.lower():
+                    # No animals detected in the video
+                    logger.warning(
+                        f"No animals detected in video(s): {video_filepaths}. "
+                        "This can happen if: "
+                        "1) The detector threshold is too high (try lowering bbox_threshold), "
+                        "2) The animals are too small or not visible, "
+                        "3) The video quality is poor, or "
+                        "4) The model is not suitable for this video type."
+                    )
+                    logger.info(
+                        "No animals detected. The pipeline will skip this recording gracefully. "
+                        "No pose estimation data will be inserted for this video."
+                    )
+                    
+                    # Return None to indicate no detections
+                    # Downstream code will check for result files and skip if none exist
+                    return None
+                else:
+                    # Different ValueError, re-raise it
+                    raise
 
             # Verify files were saved to the correct location
             output_path = Path(destfolder_str)
@@ -1331,6 +1506,202 @@ def _do_pretrained_inference(
             "Expected `video_inference_superanimal` or a compatible `video_inference` wrapper."
         )
 
+    @staticmethod
+    def _sanitize_pytorch_config_yaml(project_path: Path, dlc_config: dict, dlc_model_: dict):
+        """Sanitize pytorch_config.yaml files by removing ruamel.yaml-specific tags.
+        
+        DeepLabCut's training process creates pytorch_config.yaml files with ruamel.yaml
+        round-trip mode tags that can't be read by the safe YAML loader. This function
+        finds and sanitizes these files by reading with ruamel.yaml and rewriting with
+        a safe YAML writer.
+        
+        Args:
+            project_path: Full path to the directory containing the trained model.
+            dlc_config: DeepLabCut config dictionary.
+            dlc_model_: Model record dictionary.
+        """
+        def _convert_to_plain_python(obj):
+            """Recursively convert ruamel.yaml objects to plain Python types."""
+            from ruamel.yaml.comments import CommentedMap, CommentedSeq
+            if isinstance(obj, CommentedMap):
+                return {k: _convert_to_plain_python(v) for k, v in obj.items()}
+            elif isinstance(obj, CommentedSeq):
+                return [_convert_to_plain_python(item) for item in obj]
+            elif isinstance(obj, dict):
+                return {k: _convert_to_plain_python(v) for k, v in obj.items()}
+            elif isinstance(obj, list):
+                return [_convert_to_plain_python(item) for item in obj]
+            else:
+                return obj
+        
+        try:
+            from deeplabcut.utils.auxiliaryfunctions import get_model_folder
+        except ImportError:
+            try:
+                from deeplabcut.utils.auxiliaryfunctions import GetModelFolder as get_model_folder
+            except ImportError:
+                logger.warning("Could not import get_model_folder, skipping pytorch_config.yaml sanitization")
+                return
+        
+        # Find the model training folder
+        try:
+            model_folder = get_model_folder(
+                trainFraction=dlc_config.get("TrainingFraction", [0.95])[dlc_model_.get("trainingsetindex", 0)],
+                shuffle=dlc_model_.get("shuffle", 1),
+                cfg=dlc_config,
+                modelprefix=dlc_model_.get("model_prefix", ""),
+            )
+            model_train_folder = project_path / model_folder / "train"
+        except Exception as e:
+            logger.warning(f"Could not determine model folder: {e}. Searching for pytorch_config.yaml files...")
+            model_train_folder = None
+        
+        # Search for pytorch_config.yaml files in common locations
+        search_paths = []
+        if model_train_folder and model_train_folder.exists():
+            search_paths.append(model_train_folder / "pytorch_config.yaml")
+        
+        # Also search in dlc-models-pytorch directories
+        dlc_models_pytorch = project_path / "dlc-models-pytorch"
+        if dlc_models_pytorch.exists():
+            for iteration_dir in dlc_models_pytorch.glob("iteration-*"):
+                for model_dir in iteration_dir.glob("*"):
+                    train_dir = model_dir / "train"
+                    if train_dir.exists():
+                        search_paths.append(train_dir / "pytorch_config.yaml")
+        
+        # Sanitize each found pytorch_config.yaml file
+        for config_path in search_paths:
+            if not config_path.exists():
+                continue
+            
+            try:
+                # First, check if file can be read by DLC's read_config_as_dict
+                # If it can, and doesn't have ruamel tags, skip sanitization
+                try:
+                    from deeplabcut.core import config as config_utils
+                    test_read = config_utils.read_config_as_dict(str(config_path))
+                    if test_read is not None and "method" in test_read:
+                        # File is already readable by DLC, check if it has ruamel tags
+                        with open(config_path, "r") as f:
+                            content = f.read()
+                        if "!!python/object/new:ruamel.yaml" not in content:
+                            logger.debug(f"pytorch_config.yaml is already valid, skipping sanitization: {config_path}")
+                            continue
+                except (ImportError, Exception):
+                    # Can't verify with DLC, proceed with sanitization
+                    pass
+                
+                # Read with ruamel.yaml round-trip mode (can handle the tags)
+                yaml_rt = YAML(typ="rt")  # round-trip mode
+                with open(config_path, "r") as f:
+                    config_data = yaml_rt.load(f)
+                
+                if config_data is None:
+                    logger.warning(f"pytorch_config.yaml is empty or invalid: {config_path}")
+                    continue
+                
+                # Convert ruamel.yaml objects to plain Python types
+                config_dict = _convert_to_plain_python(config_data)
+                
+                # Validate required keys are present and add defaults if missing
+                if not isinstance(config_dict, dict):
+                    logger.error(f"pytorch_config.yaml is not a dict after conversion: {type(config_dict)}")
+                    continue
+                
+                # Ensure required keys are present
+                if "method" not in config_dict:
+                    config_dict["method"] = "bu"  # bottom-up (default)
+                    logger.info(f"Added default method='bu' to {config_path}")
+                
+                # Ensure metadata section exists (required by DLC)
+                if "metadata" not in config_dict:
+                    config_dict["metadata"] = {}
+                    logger.info(f"Added default metadata section to {config_path}")
+                
+                # Ensure metadata has required fields
+                if "bodyparts" not in config_dict.get("metadata", {}):
+                    # Try to get from dlc_config if available
+                    bodyparts = dlc_config.get("bodyparts", ["bodypart1", "bodypart2", "bodypart3"])
+                    config_dict.setdefault("metadata", {})["bodyparts"] = bodyparts
+                    logger.info(f"Added bodyparts to metadata in {config_path}")
+                
+                # Write back with safe YAML writer
+                # Create backup before overwriting
+                backup_path = config_path.with_suffix('.yaml.backup')
+                try:
+                    import shutil
+                    shutil.copy2(config_path, backup_path)
+                except Exception:
+                    pass  # Backup is optional
+                
+                # Use DLC's own write_config if available, otherwise use ruamel.yaml safe mode
+                yaml_safe = None
+                try:
+                    from deeplabcut.utils.auxiliaryfunctions import write_config
+                    # DLC's write_config handles the format correctly
+                    write_config(str(config_path), config_dict)
+                    logger.debug(f"Used DLC's write_config to sanitize: {config_path}")
+                except (ImportError, Exception) as write_err:
+                    # Fallback to ruamel.yaml safe mode
+                    logger.debug(f"DLC's write_config not available, using ruamel.yaml safe mode: {write_err}")
+                    yaml_safe = YAML(typ="safe", pure=True)
+                    yaml_safe.default_flow_style = False
+                    
+                    with open(config_path, "w") as f:
+                        yaml_safe.dump(config_dict, f)
+                
+                # Verify the sanitized file can be read back by both our YAML loader and DLC's
+                try:
+                    # Test with our YAML loader (if we used ruamel.yaml, otherwise just test with DLC)
+                    if yaml_safe is not None:
+                        with open(config_path, "r") as f:
+                            test_load = yaml_safe.load(f)
+                        if test_load is None or "method" not in test_load:
+                            logger.error(f"Sanitized file is invalid (missing method), restoring backup: {config_path}")
+                            if backup_path.exists():
+                                shutil.copy2(backup_path, config_path)
+                            continue
+                    
+                    # Test with DLC's read_config_as_dict (the one that will actually be used)
+                    try:
+                        from deeplabcut.core import config as config_utils
+                        dlc_test = config_utils.read_config_as_dict(str(config_path))
+                        if dlc_test is None:
+                            logger.error(
+                                f"DLC's read_config_as_dict returned None for sanitized file: {config_path}. "
+                                "Restoring backup."
+                            )
+                            if backup_path.exists():
+                                shutil.copy2(backup_path, config_path)
+                            continue
+                        if "method" not in dlc_test:
+                            logger.error(
+                                f"DLC's read_config_as_dict missing 'method' key: {config_path}. "
+                                "Restoring backup."
+                            )
+                            if backup_path.exists():
+                                shutil.copy2(backup_path, config_path)
+                            continue
+                        logger.debug(f"Verified sanitized file can be read by DLC: {config_path}")
+                    except ImportError:
+                        # DLC's config_utils not available, skip DLC verification
+                        pass
+                    except Exception as e:
+                        logger.warning(f"DLC verification failed (but file structure looks OK): {e}")
+                        # Don't restore backup if our YAML loader can read it
+                        # The DLC error might be for other reasons
+                except Exception as e:
+                    logger.error(f"Sanitized file verification failed: {e}. Restoring backup.")
+                    if backup_path.exists():
+                        shutil.copy2(backup_path, config_path)
+                    continue
+                
+                logger.info(f"Sanitized pytorch_config.yaml: {config_path}")
+            except Exception as e:
+                logger.warning(f"Failed to sanitize {config_path}: {e}")
+                # Continue with other files even if one fails
+
     @classmethod
     def do_trained(
         cls,
@@ -1371,11 +1742,97 @@ def do_trained(
             engine = "tensorflow"
         if engine == "pytorch":
             from deeplabcut.pose_estimation_pytorch import analyze_videos
+            # Sanitize pytorch_config.yaml files before inference
+            cls._sanitize_pytorch_config_yaml(project_path, dlc_config, dlc_model_)
+            
+            # Verify pytorch_config.yaml files are readable after sanitization
+            try:
+                from deeplabcut.utils.auxiliaryfunctions import get_model_folder
+                from deeplabcut.core import config as config_utils
+            except ImportError:
+                try:
+                    from deeplabcut.utils.auxiliaryfunctions import GetModelFolder as get_model_folder
+                except ImportError:
+                    get_model_folder = None
+            
+            if get_model_folder:
+                try:
+                    model_folder = get_model_folder(
+                        trainFraction=dlc_config.get("TrainingFraction", [0.95])[dlc_model_.get("trainingsetindex", 0)],
+                        shuffle=dlc_model_.get("shuffle", 1),
+                        cfg=dlc_config,
+                        modelprefix=dlc_model_.get("model_prefix", ""),
+                    )
+                    model_train_folder = project_path / model_folder / "train"
+                    pytorch_config_path = model_train_folder / "pytorch_config.yaml"
+                    
+                    if pytorch_config_path.exists():
+                        # Test if DLC can read it
+                        try:
+                            test_cfg = config_utils.read_config_as_dict(str(pytorch_config_path))
+                            if test_cfg is None:
+                                logger.error(
+                                    f"pytorch_config.yaml exists but read_config_as_dict returned None: {pytorch_config_path}. "
+                                    "File may be corrupted. Check the file manually."
+                                )
+                            elif "method" not in test_cfg:
+                                logger.error(
+                                    f"pytorch_config.yaml missing 'method' key: {pytorch_config_path}. "
+                                    "This will cause inference to fail."
+                                )
+                        except Exception as e:
+                            logger.error(
+                                f"Failed to read pytorch_config.yaml with DLC's read_config_as_dict: {e}. "
+                                f"File: {pytorch_config_path}"
+                            )
+                except Exception as e:
+                    logger.debug(f"Could not verify pytorch_config.yaml: {e}")
         elif engine == "tensorflow":
             from deeplabcut.pose_estimation_tensorflow import analyze_videos
         else:
             raise ValueError(f"Unknown engine type {engine}")
 
+        # ---- Update pytorch_config.yaml batch_size if provided (for PyTorch) ----
+        # This must happen BEFORE we write the main config file
+        if engine == "pytorch" and analyze_video_params:
+            batch_size_override = analyze_video_params.get("batch_size") or analyze_video_params.get("batchsize")
+            
+            if batch_size_override is not None:
+                try:
+                    from deeplabcut.utils.auxiliaryfunctions import get_model_folder
+                    from deeplabcut.core import config as config_utils
+                    from deeplabcut.utils.auxiliaryfunctions import write_config
+                except ImportError:
+                    try:
+                        from deeplabcut.utils.auxiliaryfunctions import GetModelFolder as get_model_folder
+                    except ImportError:
+                        get_model_folder = None
+                        config_utils = None
+                        write_config = None
+                
+                if get_model_folder and config_utils and write_config:
+                    try:
+                        model_folder = get_model_folder(
+                            trainFraction=dlc_config.get("TrainingFraction", [0.95])[dlc_model_.get("trainingsetindex", 0)],
+                            shuffle=dlc_model_.get("shuffle", 1),
+                            cfg=dlc_config,
+                            modelprefix=dlc_model_.get("model_prefix", ""),
+                        )
+                        model_train_folder = project_path / model_folder / "train"
+                        pytorch_config_path = model_train_folder / "pytorch_config.yaml"
+                        
+                        if pytorch_config_path.exists():
+                            # Read current config
+                            pytorch_cfg = config_utils.read_config_as_dict(str(pytorch_config_path))
+                            if pytorch_cfg and pytorch_cfg.get("batch_size") != batch_size_override:
+                                # Update batch_size in config
+                                pytorch_cfg["batch_size"] = batch_size_override
+                                # Write back using DLC's write_config
+                                write_config(str(pytorch_config_path), pytorch_cfg)
+                                logger.info(f"Updated batch_size to {batch_size_override} in {pytorch_config_path}")
+                    except Exception as e:
+                        logger.debug(f"Could not update pytorch_config.yaml batch_size: {e}")
+
         # ---- Build and save DLC configuration (yaml) file ----
         dlc_project_path = Path(project_path)
         dlc_config["project_path"] = dlc_project_path.as_posix()
@@ -1412,23 +1869,245 @@ def do_trained(
         else:
             config_filepath = output_dir / config_filename
 
+        # ---- Final verification of pytorch_config.yaml (for PyTorch) ----
+        # This is a final check before calling analyze_videos to ensure the file is valid
+        if engine == "pytorch":
+            try:
+                from deeplabcut.utils.auxiliaryfunctions import get_model_folder
+                from deeplabcut.core import config as config_utils
+            except ImportError:
+                try:
+                    from deeplabcut.utils.auxiliaryfunctions import GetModelFolder as get_model_folder
+                except ImportError:
+                    get_model_folder = None
+                    config_utils = None
+            
+            if get_model_folder and config_utils:
+                try:
+                    model_folder = get_model_folder(
+                        trainFraction=dlc_config.get("TrainingFraction", [0.95])[dlc_model_.get("trainingsetindex", 0)],
+                        shuffle=dlc_model_.get("shuffle", 1),
+                        cfg=dlc_config,
+                        modelprefix=dlc_model_.get("model_prefix", ""),
+                    )
+                    model_train_folder = project_path / model_folder / "train"
+                    pytorch_config_path = model_train_folder / "pytorch_config.yaml"
+                    
+                    if not pytorch_config_path.exists():
+                        # Search for pytorch_config.yaml in alternative locations
+                        search_paths = []
+                        
+                        # Check if model_train_folder exists
+                        if model_train_folder.exists():
+                            search_paths.append(model_train_folder)
+                        
+                        # Search in dlc-models-pytorch directories
+                        dlc_models_pytorch = project_path / "dlc-models-pytorch"
+                        if dlc_models_pytorch.exists():
+                            for iteration_dir in dlc_models_pytorch.glob("iteration-*"):
+                                for model_dir in iteration_dir.glob("*"):
+                                    train_dir = model_dir / "train"
+                                    if train_dir.exists():
+                                        search_paths.append(train_dir)
+                        
+                        # Also search in dlc-models directories (TensorFlow-style path)
+                        dlc_models = project_path / "dlc-models"
+                        if dlc_models.exists():
+                            for iteration_dir in dlc_models.glob("iteration-*"):
+                                for model_dir in iteration_dir.glob("*"):
+                                    train_dir = model_dir / "train"
+                                    if train_dir.exists():
+                                        search_paths.append(train_dir)
+                        
+                        # Search for the file in all candidate directories
+                        found_path = None
+                        for search_dir in search_paths:
+                            candidate = search_dir / "pytorch_config.yaml"
+                            if candidate.exists():
+                                found_path = candidate
+                                logger.info(f"Found pytorch_config.yaml at alternative location: {found_path}")
+                                pytorch_config_path = found_path
+                                break
+                        
+                        if found_path is None:
+                            # Check if this might be a TensorFlow model instead
+                            tensorflow_indicators = []
+                            if (model_train_folder / "snapshot").exists():
+                                tensorflow_indicators.append("Found 'snapshot' directory (TensorFlow indicator)")
+                            if (model_train_folder / "train").exists():
+                                # Check for TensorFlow checkpoint files
+                                train_dir = model_train_folder / "train"
+                                if any(train_dir.glob("*.ckpt*")) or any(train_dir.glob("*.index")):
+                                    tensorflow_indicators.append("Found TensorFlow checkpoint files")
+                            
+                            # Provide helpful error message with search locations
+                            error_msg = (
+                                f"pytorch_config.yaml not found at expected location: {pytorch_config_path}\n"
+                                "This file is required for PyTorch inference. It should be created during training.\n"
+                            )
+                            if tensorflow_indicators:
+                                error_msg += (
+                                    "⚠️  WARNING: This appears to be a TensorFlow model, not PyTorch!\n"
+                                    "Indicators found:\n"
+                                )
+                                for indicator in tensorflow_indicators:
+                                    error_msg += f"  - {indicator}\n"
+                                error_msg += (
+                                    "If this model was trained with TensorFlow, set engine='tensorflow' instead of 'pytorch'.\n"
+                                )
+                            if search_paths:
+                                error_msg += f"\nSearched in {len(search_paths)} alternative locations:\n"
+                                for sp in search_paths[:5]:  # Show first 5
+                                    error_msg += f"  - {sp}\n"
+                                if len(search_paths) > 5:
+                                    error_msg += f"  ... and {len(search_paths) - 5} more\n"
+                            else:
+                                error_msg += (
+                                    f"\nModel training directory not found: {model_train_folder}\n"
+                                    "This suggests the model may not have been trained yet, or training failed.\n"
+                                )
+                            error_msg += (
+                                "\nPossible solutions:\n"
+                                "1. Ensure the model was trained with PyTorch (engine='pytorch')\n"
+                                "2. Check that training completed successfully\n"
+                                "3. Verify the model path and training parameters are correct\n"
+                            )
+                            raise FileNotFoundError(error_msg)
+                    
+                    # Verify it can be read by DLC (this is the critical check)
+                    test_cfg = config_utils.read_config_as_dict(str(pytorch_config_path))
+                    if test_cfg is None:
+                        # Try to read the file directly to see what's wrong
+                        try:
+                            with open(pytorch_config_path, "r") as f:
+                                file_content = f.read()
+                            logger.error(f"pytorch_config.yaml content (first 500 chars):\n{file_content[:500]}")
+                        except Exception as read_err:
+                            logger.error(f"Could not even read file: {read_err}")
+                        
+                        # Try one more sanitization attempt
+                        logger.warning("pytorch_config.yaml cannot be read by DLC, attempting emergency sanitization...")
+                        try:
+                            cls._sanitize_pytorch_config_yaml(project_path, dlc_config, dlc_model_)
+                            test_cfg = config_utils.read_config_as_dict(str(pytorch_config_path))
+                            if test_cfg is None:
+                                raise ValueError(
+                                    f"pytorch_config.yaml still cannot be read after sanitization: {pytorch_config_path}. "
+                                    "File may be fundamentally corrupted. Check the file manually."
+                                )
+                        except Exception as sanitize_err:
+                            logger.error(f"Emergency sanitization failed: {sanitize_err}")
+                            raise ValueError(
+                                f"pytorch_config.yaml exists but cannot be read by DLC: {pytorch_config_path}. "
+                                "File may be corrupted or invalid. Check the file manually. "
+                                "This usually happens when the file has ruamel.yaml tags that DLC can't parse. "
+                                "Sanitization attempts have failed."
+                            )
+                    
+                    if "method" not in test_cfg:
+                        raise ValueError(
+                            f"pytorch_config.yaml missing required 'method' key: {pytorch_config_path}. "
+                            f"Available keys: {list(test_cfg.keys())}. "
+                            "File may be corrupted."
+                        )
+                    logger.debug(f"Verified pytorch_config.yaml is valid: {pytorch_config_path}")
+                except Exception as e:
+                    logger.error(f"pytorch_config.yaml validation failed: {e}")
+                    raise  # Always raise - don't continue with invalid config
+
         # ---- Take valid parameters for analyze_videos ----
+        # Get function signature to check what parameters it accepts
+        sig = inspect.signature(analyze_videos)
+        param_names = list(sig.parameters.keys())
+        
         kwargs = {
             k: v
             for k, v in analyze_video_params.items()
-            if k in inspect.signature(analyze_videos).parameters
+            if k in param_names
         }
+        
+        # For PyTorch, ensure batch_size is passed if available (overrides config file default)
+        # Try both 'batch_size' and 'batchsize' parameter names
+        if "batch_size" in param_names and "batch_size" in analyze_video_params:
+            kwargs["batch_size"] = analyze_video_params["batch_size"]
+        elif "batchsize" in param_names and "batchsize" in analyze_video_params:
+            kwargs["batchsize"] = analyze_video_params["batchsize"]
+        elif "batch_size" in param_names and "batchsize" in analyze_video_params:
+            # If function accepts batch_size but we have batchsize, convert it
+            kwargs["batch_size"] = analyze_video_params["batchsize"]
+        elif "batchsize" in param_names and "batch_size" in analyze_video_params:
+            # If function accepts batchsize but we have batch_size, convert it
+            kwargs["batchsize"] = analyze_video_params["batch_size"]
 
         # ---- Trigger DLC prediction job ----
-        analyze_videos(
-            config=config_filepath,
-            videos=video_filepaths,
-            shuffle=dlc_model_["shuffle"],
-            trainingsetindex=dlc_model_["trainingsetindex"],
-            destfolder=output_dir,
-            modelprefix=dlc_model_.get("model_prefix", ""),
-            **kwargs,
-        )
+        try:
+            analyze_videos(
+                config=config_filepath,
+                videos=video_filepaths,
+                shuffle=dlc_model_["shuffle"],
+                trainingsetindex=dlc_model_["trainingsetindex"],
+                destfolder=output_dir,
+                modelprefix=dlc_model_.get("model_prefix", ""),
+                **kwargs,
+            )
+        except ValueError as e:
+            error_msg = str(e)
+            # Handle case where no predictions were found (empty predictions)
+            if "Shape of passed values is" in error_msg and "indices imply" in error_msg:
+                # This happens when DLC tries to create a DataFrame but has no predictions
+                logger.warning(
+                    f"No predictions found for video(s): {video_filepaths}. "
+                    "This can happen if: "
+                    "1) No animals were detected in the video, "
+                    "2) The model confidence threshold is too high, "
+                    "3) The video quality is poor, or "
+                    "4) The model is not suitable for this video type."
+                )
+                logger.info(
+                    "No pose estimation data will be available for this video. "
+                    "The pipeline will skip this recording gracefully."
+                )
+                # Return early - no result files will be created
+                return
+            else:
+                # Different ValueError, re-raise it
+                raise
+        except TypeError as e:
+            if "'NoneType' object is not subscriptable" in str(e):
+                # This is the specific error we're trying to fix
+                logger.error(
+                    "DLC's read_config_as_dict returned None for pytorch_config.yaml. "
+                    "This usually means the file is corrupted or missing required keys."
+                )
+                if engine == "pytorch":
+                    logger.error(
+                        "For PyTorch models, ensure pytorch_config.yaml exists and contains "
+                        "at minimum: 'method' key (e.g., 'bu' or 'td')."
+                    )
+                    # Try to find and list all pytorch_config.yaml files for debugging
+                    try:
+                        from deeplabcut.utils.auxiliaryfunctions import get_model_folder
+                        model_folder = get_model_folder(
+                            trainFraction=dlc_config.get("TrainingFraction", [0.95])[dlc_model_.get("trainingsetindex", 0)],
+                            shuffle=dlc_model_.get("shuffle", 1),
+                            cfg=dlc_config,
+                            modelprefix=dlc_model_.get("model_prefix", ""),
+                        )
+                        model_train_folder = project_path / model_folder / "train"
+                        pytorch_config_path = model_train_folder / "pytorch_config.yaml"
+                        logger.error(f"Expected pytorch_config.yaml at: {pytorch_config_path}")
+                        logger.error(f"File exists: {pytorch_config_path.exists()}")
+                        if pytorch_config_path.exists():
+                            try:
+                                with open(pytorch_config_path, "r") as f:
+                                    content = f.read()
+                                logger.error(f"File size: {len(content)} bytes")
+                                logger.error(f"First 200 chars: {content[:200]}")
+                            except Exception as read_err:
+                                logger.error(f"Could not read file: {read_err}")
+                    except Exception as debug_err:
+                        logger.error(f"Could not determine expected path: {debug_err}")
+            raise
 
     def make(self, key):
         """.populate() method will launch pose estimation inference for each PoseEstimationTask"""
@@ -1506,14 +2185,43 @@ def make(self, key):
                     output_directory=output_dir,
                 )
                 def _do_pretrained_inference():
-                    PoseEstimation._do_pretrained_inference(
+                    result = PoseEstimation._do_pretrained_inference(
                         pretrained_model_name=pretrained_model_name,
                         video_filepaths=video_filepaths,
                         output_dir=output_dir,
                         inference_params=pose_inference_params,
                     )
+                    # If result is None, it means no animals were detected
+                    # Check if result files exist, and if not, skip this recording
+                    if result is None:
+                        # Check if empty result files were created
+                        output_path = Path(output_dir)
+                        result_files = list(output_path.glob("*.h5")) + list(output_path.glob("*.pickle"))
+                        if not result_files:
+                            logger.warning(
+                                f"No animals detected and no result files created for {key}. "
+                                "Skipping this recording - no pose data will be inserted."
+                            )
+                            # Return early to skip inserting pose estimation data
+                            return None
                 
-                _do_pretrained_inference()
+                inference_result = _do_pretrained_inference()
+                # If inference returned None, check if result files were created
+                # (empty result files may have been created to indicate no detections)
+                if inference_result is None:
+                    output_path = Path(output_dir)
+                    result_files = list(output_path.glob("*.h5")) + list(output_path.glob("*.pickle"))
+                    if not result_files:
+                        logger.info(
+                            f"No animals detected in video(s) for key {key} and no result files created. "
+                            "Skipping pose estimation data insertion."
+                        )
+                        return  # Skip the rest of make() - no data to insert
+                    else:
+                        logger.info(
+                            f"No animals detected but empty result files exist. "
+                            "Will attempt to read them (may contain NaN values)."
+                        )
             else:
                 # Original trained model path
                 # Triggering dlc for pose estimation required:
@@ -1553,7 +2261,32 @@ def _do_trained_inference():
 
                 _do_trained_inference()
 
-        dlc_result = dlc_reader.PoseEstimation(output_dir)
+        # Check if result files exist before trying to read them (use rglob to match dlc_reader behavior)
+        output_path = Path(output_dir)
+        result_files = list(output_path.rglob("*.h5")) + list(output_path.rglob("*.pickle"))
+        if not result_files:
+            logger.warning(
+                f"No result files found in {output_dir} for key {key}. "
+                "This may indicate that no animals were detected or inference failed. "
+                "Skipping pose estimation data insertion."
+            )
+            return  # Skip the rest of make() - no data to insert
+        
+        # Try to initialize DLC result reader, handle FileNotFoundError gracefully
+        try:
+            dlc_result = dlc_reader.PoseEstimation(output_dir)
+        except FileNotFoundError as e:
+            error_msg = str(e)
+            if "No DLC output file (.h5) found" in error_msg or ".h5" in error_msg or "No meta file" in error_msg:
+                logger.warning(
+                    f"No DLC result files found in {output_dir} for key {key}. "
+                    "This likely means no animals were detected during inference. "
+                    "Skipping pose estimation data insertion."
+                )
+                return  # Skip the rest of make() - no data to insert
+            else:
+                # Different FileNotFoundError, re-raise it
+                raise
         creation_time = datetime.fromtimestamp(dlc_result.creation_time).strftime(
             "%Y-%m-%d %H:%M:%S"
         )
diff --git a/element_deeplabcut/readers/dlc_reader.py b/element_deeplabcut/readers/dlc_reader.py
index f50c01e..8693b23 100644
--- a/element_deeplabcut/readers/dlc_reader.py
+++ b/element_deeplabcut/readers/dlc_reader.py
@@ -572,11 +572,43 @@ def read_yaml(fullpath: str, filename: str = "*") -> tuple:
         list(fullpath.glob(f"{filename}.y*ml"))
     )
 
-    assert (  # If more than 1 and not DJ-saved,
-        len(yml_paths) == 1
-    ), f"Found more yaml files than expected: {len(yml_paths)}\n{fullpath}"
+    if not yml_paths:
+        raise FileNotFoundError(f"No YAML files found in: {fullpath}")
+
+    # If multiple YAML files are present, choose the most appropriate one:
+    # 1. Prefer explicit config.yaml/config.yml
+    # 2. Then prefer dj_dlc_config*.yaml (most recent by modification time)
+    # 3. Otherwise fall back to the first in the sorted list with a warning
+    chosen_path = None
+
+    # Prefer standard DLC config filenames
+    for name in ("config.yaml", "config.yml"):
+        for p in yml_paths:
+            if p.name == name:
+                chosen_path = p
+                break
+        if chosen_path:
+            break
+
+    # Prefer dj_dlc_config* if no explicit config.* was found
+    if chosen_path is None:
+        dj_configs = [p for p in yml_paths if p.name.startswith("dj_dlc_config")]
+        if dj_configs:
+            # Choose the most recently modified dj_dlc_config*
+            chosen_path = max(dj_configs, key=lambda p: p.stat().st_mtime)
+
+    # Fallback: first match, but emit a warning for debugging
+    if chosen_path is None:
+        chosen_path = yml_paths[0]
+        if len(yml_paths) > 1:
+            logger.warning(
+                "Multiple YAML files found in %s, using %s. Candidates: %s",
+                fullpath,
+                chosen_path,
+                [p.name for p in yml_paths],
+            )
 
-    return yml_paths[0], read_config(yml_paths[0])
+    return chosen_path, read_config(chosen_path)
 
 
 def save_yaml(
diff --git a/test_trained_inference.py b/test_trained_inference.py
index 1bce8d6..217434b 100755
--- a/test_trained_inference.py
+++ b/test_trained_inference.py
@@ -43,25 +43,27 @@
 import logging
 import argparse
 from pathlib import Path
-from unittest.mock import patch, MagicMock
+from unittest.mock import patch
 
 import datajoint as dj
 
 # Set up logging
 logging.basicConfig(
     level=logging.INFO,
-    format='%(message)s',
-    handlers=[logging.StreamHandler(sys.stdout)]
+    format="%(message)s",
+    handlers=[logging.StreamHandler(sys.stdout)],
 )
 logger = logging.getLogger(__name__)
 
+
 # Simple status printer for user-facing messages
 class StatusPrinter:
     """Simple status printer for step-by-step progress."""
+
     def __init__(self, total_steps=10):
         self.total_steps = total_steps
         self.current_step = 0
-    
+
     def step(self, message, status="info"):
         """Print a step message with status indicator."""
         self.current_step += 1
@@ -70,22 +72,23 @@ def step(self, message, status="info"):
             "success": "✅",
             "warning": "⚠️",
             "error": "❌",
-            "skip": "⏭️"
+            "skip": "⏭️",
         }
         icon = icons.get(status, "•")
         print(f"\n[{self.current_step}/{self.total_steps}] {icon} {message}")
-    
+
     def sub(self, message, indent=3, icon=""):
         """Print a sub-message with indentation."""
         prefix = f"{icon} " if icon else ""
         print(" " * indent + prefix + message)
-    
+
     def header(self, title):
         """Print a section header."""
         print("\n" + "=" * 60)
         print(title)
         print("=" * 60)
 
+
 # Configure database connection
 if Path("./dj_local_conf.json").exists():
     dj.config.load("./dj_local_conf.json")
@@ -95,12 +98,17 @@ def header(self, title):
     logger.info("   Set DJ_HOST, DJ_USER, DJ_PASS environment variables if needed")
 
 # Update config from environment variables
-dj.config.update({
-    "safemode": False,
-    "database.host": os.environ.get("DJ_HOST") or dj.config.get("database.host", "localhost"),
-    "database.user": os.environ.get("DJ_USER") or dj.config.get("database.user", "root"),
-    "database.password": os.environ.get("DJ_PASS") or dj.config.get("database.password", ""),
-})
+dj.config.update(
+    {
+        "safemode": False,
+        "database.host": os.environ.get("DJ_HOST")
+        or dj.config.get("database.host", "localhost"),
+        "database.user": os.environ.get("DJ_USER")
+        or dj.config.get("database.user", "root"),
+        "database.password": os.environ.get("DJ_PASS")
+        or dj.config.get("database.password", ""),
+    }
+)
 
 # Set database prefix for tests
 if "custom" not in dj.config:
@@ -112,7 +120,9 @@ def header(self, title):
 # Set DLC root data directory if not already set
 # In Docker, prefer /app/test_videos (from project mount), otherwise /app/data
 # Check for Docker: /.dockerenv exists OR we're in /app directory (Docker working dir)
-is_docker = os.path.exists("/.dockerenv") or (os.getcwd() == "/app" and os.path.exists("/app"))
+is_docker = os.path.exists("/.dockerenv") or (
+    os.getcwd() == "/app" and os.path.exists("/app")
+)
 if is_docker:
     # Prefer /app/test_videos (from project mount .:/app) since videos are in ./test_videos
     test_videos_path = Path("/app/test_videos")
@@ -122,10 +132,13 @@ def header(self, title):
         default_video_dir = "/app/data"
 else:
     default_video_dir = "./test_videos"
+
 video_dir = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir))
 # CRITICAL: Set dlc_root_data_dir in DataJoint config to match where videos actually are
 # This is used by element-deeplabcut to find video files
-if "dlc_root_data_dir" not in dj.config.get("custom", {}) or not dj.config["custom"].get("dlc_root_data_dir"):
+if "dlc_root_data_dir" not in dj.config.get("custom", {}) or not dj.config[
+    "custom"
+].get("dlc_root_data_dir"):
     dj.config["custom"]["dlc_root_data_dir"] = str(video_dir.absolute())
     logger.info(f"📁 Set DLC_ROOT_DATA_DIR to: {video_dir.absolute()}")
     if is_docker:
@@ -136,48 +149,54 @@ def header(self, title):
 if not dlc_root_dir.is_absolute():
     dlc_root_dir = dlc_root_dir.resolve()
 
-logger.info(f"📊 Database: {dj.config['database.host']} (prefix: {dj.config['custom']['database.prefix']})")
+logger.info(
+    f"📊 Database: {dj.config['database.host']} (prefix: {dj.config['custom']['database.prefix']})"
+)
 logger.info(f"📁 DLC Root: {dlc_root_dir}")
 
 from element_deeplabcut import model, train
 from tests import tutorial_pipeline as pipeline
 
+
 def check_database_connection():
     """Verify database connection is working."""
     try:
-        # Try to connect by activating a schema
-        test_schema = dj.schema("test_connection_check", create_schema=True, create_tables=False)
-        test_schema.drop()
+        dj.conn()
         return True
     except Exception as e:
         logger.error(f"\n❌ Database connection failed: {e}")
         logger.error("\nPlease configure your database:")
         logger.error("  1. Create dj_local_conf.json with database credentials")
         logger.error("  2. Or set environment variables: DJ_HOST, DJ_USER, DJ_PASS")
-        logger.error("  3. Or ensure database is running (docker compose -f docker-compose-db.yaml up -d)")
+        logger.error(
+            "  3. Or ensure database is running (docker compose -f docker-compose-db.yaml up -d)"
+        )
         return False
 
+
 def check_dlc_installation():
     """Check if DeepLabCut is installed and available."""
     try:
-        import deeplabcut
+        import deeplabcut  # noqa: F401
+
         return True, None
     except (ImportError, Exception) as e:
         return False, str(e)
 
+
 def create_dlc_project(project_name, experimenter, video_files, project_dir=None):
     """Create a new DLC project programmatically."""
     import deeplabcut
-    
+
     if project_dir is None:
         project_dir = dlc_root_dir / project_name
-    
+
     # Create project directory if it doesn't exist
     project_dir.mkdir(parents=True, exist_ok=True)
-    
+
     # Convert video files to absolute paths
     video_paths = [str(Path(v).resolve()) for v in video_files]
-    
+
     # Create DLC project
     config_path = deeplabcut.create_new_project(
         project_name,
@@ -186,10 +205,13 @@ def create_dlc_project(project_name, experimenter, video_files, project_dir=None
         working_directory=str(project_dir.parent),
         copy_videos=False,  # Don't copy videos, just reference them
     )
-    
+
     return Path(config_path).parent  # Return project directory
 
-def create_mock_labeled_data(config_path, num_frames=20, bodyparts=None, use_existing_frames=False):
+
+def create_mock_labeled_data(
+    config_path, num_frames=20, bodyparts=None, use_existing_frames=False
+):
     """
     Create mock labeled data with images and CSV files for testing.
 
@@ -289,7 +311,9 @@ def create_mock_labeled_data(config_path, num_frames=20, bodyparts=None, use_exi
 
     df = pd.DataFrame(
         data,
-        columns=pd.MultiIndex.from_tuples(columns, names=["scorer", "bodyparts", "coords"]),
+        columns=pd.MultiIndex.from_tuples(
+            columns, names=["scorer", "bodyparts", "coords"]
+        ),
         index=index_strings,
     )
 
@@ -326,11 +350,12 @@ def create_mock_labeled_data(config_path, num_frames=20, bodyparts=None, use_exi
 
     return csv_path
 
+
 def main():
     training_was_mocked = False
     status = StatusPrinter(total_steps=12)
     status.header("Testing Trained Model Workflow (Training + Inference)")
-    
+
     # Parse arguments
     parser = argparse.ArgumentParser(
         description="Test trained DeepLabCut workflow with video files",
@@ -340,124 +365,186 @@ def main():
         "dlc_project",
         nargs="?",
         default=None,
-        help="Path to DLC project directory or config.yaml file"
+        help="Path to DLC project directory or config.yaml file",
     )
     parser.add_argument(
         "--skip-training",
         action="store_true",
-        help="Skip training step and use existing trained model"
+        help="Skip training step and use existing trained model",
     )
     parser.add_argument(
         "--skip-inference",
         action="store_true",
-        help="Skip inference step (only train the model)"
+        help="Skip inference step (only train the model)",
+    )
+    parser.add_argument(
+        "--mock-results-on-failure",
+        action="store_true",
+        help="If inference fails or no animals detected, insert mock pose estimation results instead of failing. Useful for testing when videos don't contain detectable animals.",
     )
     parser.add_argument(
         "--model-name",
         default="test_trained_model",
-        help="Name for the trained model (default: test_trained_model)"
+        help="Name for the trained model (default: test_trained_model)",
     )
-    
+    parser.add_argument(
+        "--gpu",
+        type=int,
+        default=0,
+        help="GPU index to use (default: 0). Use -1 for CPU.",
+    )
+    parser.add_argument(
+        "--batch-size",
+        type=int,
+        default=4,
+        help=(
+            "Batch size for pose estimation inference (default: 4). Reduce if you get CUDA OOM errors. "
+            "Increase if you have more GPU memory."
+        ),
+    )
+
     args = parser.parse_args()
-    
+
+    # Set CUDA_VISIBLE_DEVICES for PyTorch/TensorFlow
+    if args.gpu >= 0:
+        os.environ["CUDA_VISIBLE_DEVICES"] = str(args.gpu)
+        print(f"🔧 Set CUDA_VISIBLE_DEVICES={args.gpu}")
+
+        # Configure PyTorch device if available
+        try:
+            import torch
+
+            if torch.cuda.is_available():
+                torch.cuda.set_device(args.gpu)
+                print(f"🔧 Set PyTorch default device to GPU {args.gpu}")
+                print(f"🔧 GPU available: {torch.cuda.get_device_name(args.gpu)}")
+            else:
+                print("⚠️  CUDA not available in PyTorch")
+        except ImportError:
+            pass  # PyTorch not available, that's OK
+
     # 0. Check database connection
     status.step("Checking database connection")
     if not check_database_connection():
         sys.exit(1)
     status.sub("Database connection successful", indent=3)
-    
+
     # 0.5. Clean up database (remove test data from previous runs)
     status.step("Cleaning up database (removing test data from previous runs)")
     cleanup_count = 0
-    
+
     # Delete PoseEstimation entries (and their parts)
-    pose_estimation_query = pipeline.model.PoseEstimation
-    if pose_estimation_query:
-        keys = pose_estimation_query.fetch("KEY")
-        count = len(keys) if keys else 0
-        if count > 0:
-            pose_estimation_query.delete()
-            cleanup_count += count
-            status.sub(f"Deleted {count} PoseEstimation entry/entries", icon="🗑️", indent=3)
-    
+    pose_estimation_rel = pipeline.model.PoseEstimation
+    pose_keys = pose_estimation_rel.fetch("KEY")
+    pose_count = len(pose_keys)
+    if pose_count > 0:
+        pose_estimation_rel.delete()
+        cleanup_count += pose_count
+        status.sub(
+            f"Deleted {pose_count} PoseEstimation entry/entries",
+            icon="🗑️",
+            indent=3,
+        )
+
     # Delete PoseEstimationTask entries
-    task_query = pipeline.model.PoseEstimationTask
-    if task_query:
-        keys = task_query.fetch("KEY")
-        count = len(keys) if keys else 0
-        if count > 0:
-            task_query.delete()
-            cleanup_count += count
-            status.sub(f"Deleted {count} PoseEstimationTask entry/entries", icon="🗑️", indent=3)
-    
+    task_rel = pipeline.model.PoseEstimationTask
+    task_keys = task_rel.fetch("KEY")
+    task_count = len(task_keys)
+    if task_count > 0:
+        task_rel.delete()
+        cleanup_count += task_count
+        status.sub(
+            f"Deleted {task_count} PoseEstimationTask entry/entries",
+            icon="🗑️",
+            indent=3,
+        )
+
     # Delete test models (models with names starting with "test_")
-    test_models = model.Model & "model_name LIKE 'test_%'"
-    if test_models:
-        keys = test_models.fetch("KEY")
-        count = len(keys) if keys else 0
-        if count > 0:
-            test_models.delete()
-            cleanup_count += count
-            status.sub(f"Deleted {count} test model(s)", icon="🗑️", indent=3)
-    
+    test_models_rel = model.Model & "model_name LIKE 'test_%'"
+    test_model_keys = test_models_rel.fetch("KEY")
+    test_model_count = len(test_model_keys)
+    if test_model_count > 0:
+        test_models_rel.delete()
+        cleanup_count += test_model_count
+        status.sub(f"Deleted {test_model_count} test model(s)", icon="🗑️", indent=3)
+
     # Delete test training tasks (optional - comment out if you want to keep training history)
-    if pipeline.train.ModelTraining:
-        training_query = pipeline.train.ModelTraining
-        keys = training_query.fetch("KEY")
-        count = len(keys) if keys else 0
-        if count > 0:
-            training_query.delete()
-            cleanup_count += count
-            status.sub(f"Deleted {count} ModelTraining entry/entries", icon="🗑️", indent=3)
-    
+    training_rel = pipeline.train.ModelTraining
+    training_keys = training_rel.fetch("KEY")
+    training_count = len(training_keys)
+    if training_count > 0:
+        training_rel.delete()
+        cleanup_count += training_count
+        status.sub(
+            f"Deleted {training_count} ModelTraining entry/entries",
+            icon="🗑️",
+            indent=3,
+        )
+
     if cleanup_count > 0:
         status.sub(f"Total: {cleanup_count} entry/entries cleaned", icon="✅", indent=3)
     else:
         status.sub("No test data found to clean", icon="ℹ️", indent=3)
-    
+
     # 1. Check DeepLabCut installation
     status.step("Checking DeepLabCut installation")
     dlc_available, dlc_error = check_dlc_installation()
     if not dlc_available:
-        status.sub(f"DeepLabCut is not installed or not importable: {dlc_error}", icon="❌", indent=3)
+        status.sub(
+            f"DeepLabCut is not installed or not importable: {dlc_error}",
+            icon="❌",
+            indent=3,
+        )
         status.sub("Install with: pip install 'deeplabcut[superanimal]'", indent=5)
         sys.exit(1)
     else:
         import deeplabcut
-        status.sub(f"DeepLabCut is available (version {deeplabcut.__version__})", icon="✅", indent=3)
-    
+
+        status.sub(
+            f"DeepLabCut is available (version {deeplabcut.__version__})",
+            icon="✅",
+            indent=3,
+        )
+
     # 2. Create or find DLC project
     status.step("Creating DLC project")
-    
+
     # Find video files for project creation (use first available video or create dummy)
-    # In Docker, check /app/test_videos (from project mount) first, then /app/data
-    is_docker = os.path.exists("/.dockerenv") or (os.getcwd() == "/app" and os.path.exists("/app"))
-    if is_docker:
-        # Prefer /app/test_videos (from project mount .:/app)
+    is_docker_local = os.path.exists("/.dockerenv") or (
+        os.getcwd() == "/app" and os.path.exists("/app")
+    )
+    if is_docker_local:
         test_videos_path = Path("/app/test_videos")
         if test_videos_path.exists():
-            default_video_dir = "/app/test_videos"
+            default_video_dir_local = "/app/test_videos"
         else:
-            default_video_dir = "/app/data"
+            default_video_dir_local = "/app/data"
     else:
-        default_video_dir = "./test_videos"
-    video_dir = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir))
-    video_files = list(video_dir.glob("*.mp4")) + list(video_dir.glob("*.avi")) + list(video_dir.glob("*.mov"))
-    
+        default_video_dir_local = "./test_videos"
+
+    video_dir_local = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir_local))
+    video_files = list(video_dir_local.glob("*.mp4")) + list(
+        video_dir_local.glob("*.avi")
+    ) + list(video_dir_local.glob("*.mov"))
+
     if not video_files:
         # Create a dummy video file path (DLC will handle missing videos gracefully)
-        video_files = [str(video_dir / "dummy_video.mp4")]
-        status.sub("No videos found - will create project with dummy video path", icon="⚠️", indent=3)
+        video_files = [str(video_dir_local / "dummy_video.mp4")]
+        status.sub(
+            "No videos found - will create project with dummy video path",
+            icon="⚠️",
+            indent=3,
+        )
         status.sub("(You can add real videos later)", icon="ℹ️", indent=5)
-    
+
     # Create project name
     project_name = f"test_training_project_{args.model_name}"
     experimenter = "test_experimenter"
-    
+
     # Check if project already exists
     project_dir = dlc_root_dir / project_name
     config_file = project_dir / "config.yaml"
-    
+
     if config_file.exists() and not args.skip_training:
         status.sub(f"Project already exists: {project_dir}", icon="ℹ️", indent=3)
         status.sub("Using existing project (delete it to recreate)", icon="ℹ️", indent=5)
@@ -470,89 +557,119 @@ def main():
                 project_name,
                 experimenter,
                 video_files[:1],  # Use first video for project creation
-                project_dir=project_dir
+                project_dir=project_dir,
             )
             status.sub(f"Project created: {dlc_project_path}", icon="✅", indent=5)
         except Exception as e:
             status.sub(f"Error creating project: {e}", icon="❌", indent=3)
             raise
-    
+
     config_file = dlc_project_path / "config.yaml"
     if not config_file.exists():
         status.sub(f"Config file not found: {config_file}", icon="❌", indent=3)
         sys.exit(1)
-    
+
     # Make path relative to dlc_root_dir
     try:
         dlc_project_rel = Path(dlc_project_path).relative_to(dlc_root_dir)
     except ValueError:
         dlc_project_rel = Path(dlc_project_path)
-        status.sub("Warning: Project path not under DLC_ROOT_DATA_DIR, using absolute path", icon="⚠️", indent=3)
-    
+        status.sub(
+            "Warning: Project path not under DLC_ROOT_DATA_DIR, using absolute path",
+            icon="⚠️",
+            indent=3,
+        )
+
     config_file_rel = dlc_project_rel / "config.yaml"
     status.sub(f"Project path: {dlc_project_path}", icon="✅", indent=3)
     status.sub(f"Config file: {config_file_rel}", icon="ℹ️", indent=5)
-    
+
     # 3. Create mock labeled data (skip manual labeling)
     if not args.skip_training:
         status.step("Creating mock labeled data")
         labeled_data_dir = dlc_project_path / "labeled-data"
-        
+
         # Check if labeled data already exists
         if labeled_data_dir.exists() and any(labeled_data_dir.iterdir()):
-            status.sub("Labeled data already exists, skipping mock data creation", icon="ℹ️", indent=3)
+            status.sub(
+                "Labeled data already exists, skipping mock data creation",
+                icon="ℹ️",
+                indent=3,
+            )
         else:
             import yaml
-            with open(config_file, 'r') as f:
+
+            with open(config_file, "r") as f:
                 config = yaml.safe_load(f)
-            
+
             bodyparts = config.get("bodyparts", ["nose", "tailbase", "head"])
-            status.sub(f"Creating mock labeled data with {len(bodyparts)} body parts", icon="ℹ️", indent=3)
+            status.sub(
+                f"Creating mock labeled data with {len(bodyparts)} body parts",
+                icon="ℹ️",
+                indent=3,
+            )
             status.sub(f"Body parts: {bodyparts}", icon="ℹ️", indent=5)
-            
+
             try:
-                create_mock_labeled_data(config_file, num_frames=20, bodyparts=bodyparts)
+                create_mock_labeled_data(
+                    config_file, num_frames=20, bodyparts=bodyparts
+                )
                 status.sub("Mock labeled data created successfully", icon="✅", indent=3)
             except Exception as e:
                 status.sub(f"Error creating mock labeled data: {e}", icon="❌", indent=3)
                 raise
-    
+
     # 4. Setup test data (subject, session, recordings)
     status.step("Setting up test data")
     base_key = {
         "subject": "test1",
         "session_datetime": "2024-01-01 12:00:00",
     }
-    
-    pipeline.subject.Subject.insert1({
-        "subject": "test1",
-        "sex": "F",
-        "subject_birth_date": "2020-01-01",
-        "subject_description": "Test subject for trained model workflow",
-    }, skip_duplicates=True)
-    
-    pipeline.session.Session.insert1({
-        "subject": "test1",
-        "session_datetime": "2024-01-01 12:00:00",
-    }, skip_duplicates=True)
-    
+
+    pipeline.subject.Subject.insert1(
+        {
+            "subject": "test1",
+            "sex": "F",
+            "subject_birth_date": "2020-01-01",
+            "subject_description": "Test subject for trained model workflow",
+        },
+        skip_duplicates=True,
+    )
+
+    pipeline.session.Session.insert1(
+        {
+            "subject": "test1",
+            "session_datetime": "2024-01-01 12:00:00",
+        },
+        skip_duplicates=True,
+    )
+
     # Find video files for inference (reuse from earlier or find again)
     if not video_files:
-        video_files = list(video_dir.glob("*.mp4")) + list(video_dir.glob("*.avi")) + list(video_dir.glob("*.mov"))
+        video_files = list(video_dir_local.glob("*.mp4")) + list(
+            video_dir_local.glob("*.avi")
+        ) + list(video_dir_local.glob("*.mov"))
     elif video_files and len(video_files) > 0:
         first_video = str(video_files[0])
         if "dummy_video.mp4" in first_video:
-            video_files = list(video_dir.glob("*.mp4")) + list(video_dir.glob("*.avi")) + list(video_dir.glob("*.mov"))
-    
+            video_files = list(video_dir_local.glob("*.mp4")) + list(
+                video_dir_local.glob("*.avi")
+            ) + list(video_dir_local.glob("*.mov"))
+
     if not video_files and not args.skip_inference:
-        status.sub(f"No video files found in {video_dir}", icon="⚠️", indent=3)
+        status.sub(f"No video files found in {video_dir_local}", icon="⚠️", indent=3)
         status.sub("Supported formats: .mp4, .avi, .mov", icon="ℹ️", indent=3)
-        status.sub("Set DLC_ROOT_DATA_DIR environment variable to point to video directory", indent=3)
+        status.sub(
+            "Set DLC_ROOT_DATA_DIR environment variable to point to video directory",
+            indent=3,
+        )
         if args.skip_training:
             sys.exit(1)
         else:
-            status.sub("Continuing with training only (no inference videos)", icon="ℹ️", indent=3)
-    
+            status.sub(
+                "Continuing with training only (no inference videos)", icon="ℹ️", indent=3
+            )
+
     # Create recordings for inference videos
     recording_keys = []
     if video_files:
@@ -562,25 +679,98 @@ def main():
                 "recording_id": idx + 1,
             }
             recording_keys.append(recording_key)
-            
-            pipeline.model.VideoRecording.insert1(
-                {**recording_key, "device": "Camera1"}, skip_duplicates=True
-            )
-            
+
+            # Insert or update recording
+            existing_rec = pipeline.model.VideoRecording & recording_key
+            if len(existing_rec):
+                existing_device = existing_rec.fetch1("device")
+                if existing_device != "Camera1":
+                    existing_rec.delete()
+                    pipeline.model.VideoRecording.insert1(
+                        {**recording_key, "device": "Camera1"}
+                    )
+                    status.sub(
+                        f"Updated existing recording {recording_key['recording_id']} (device changed)",
+                        icon="🔄",
+                        indent=5,
+                    )
+                else:
+                    status.sub(
+                        f"Recording {recording_key['recording_id']} already exists with correct device",
+                        icon="✅",
+                        indent=5,
+                    )
+            else:
+                pipeline.model.VideoRecording.insert1(
+                    {**recording_key, "device": "Camera1"}
+                )
+                status.sub(
+                    f"Created new recording {recording_key['recording_id']}",
+                    icon="✅",
+                    indent=5,
+                )
+
             video_file_abs = Path(video_file).resolve()
             try:
                 relative_path = video_file_abs.relative_to(dlc_root_dir)
             except ValueError:
                 relative_path = Path(video_file.name)
-            
-            pipeline.model.VideoRecording.File.insert1(
-                {**recording_key, "file_id": 0, "file_path": str(relative_path)},
-                skip_duplicates=True,
-            )
-            status.sub(f"Created recording {recording_key['recording_id']} for {video_file_abs.name}", icon="✅", indent=5)
-    
-    status.sub(f"Created {len(recording_keys)} recording(s) for inference", icon="✅", indent=3)
-    
+
+            # Insert or update file entry
+            file_key = {**recording_key, "file_id": 0}
+            existing_file = pipeline.model.VideoRecording.File & file_key
+            if len(existing_file):
+                existing_path = existing_file.fetch1("file_path")
+                if existing_path != str(relative_path):
+                    file_keys = (
+                        pipeline.model.VideoRecording.File & recording_key
+                    ).fetch("KEY", as_dict=True)
+                    all_files = []
+                    for fk in file_keys:
+                        file_data = (
+                            pipeline.model.VideoRecording.File & fk
+                        ).fetch1()
+                        all_files.append(file_data)
+                    (pipeline.model.VideoRecording & recording_key).delete()
+                    pipeline.model.VideoRecording.insert1(
+                        {**recording_key, "device": "Camera1"}
+                    )
+                    for file_entry in all_files:
+                        if file_entry["file_id"] == 0:
+                            pipeline.model.VideoRecording.File.insert1(
+                                {
+                                    **recording_key,
+                                    "file_id": 0,
+                                    "file_path": str(relative_path),
+                                }
+                            )
+                        else:
+                            pipeline.model.VideoRecording.File.insert1(file_entry)
+                    status.sub(
+                        f"Updated file path for recording {recording_key['recording_id']}: {existing_path} -> {video_file_abs.name}",
+                        icon="🔄",
+                        indent=5,
+                    )
+                else:
+                    status.sub(
+                        f"File path for recording {recording_key['recording_id']} is already correct: {video_file_abs.name}",
+                        icon="✅",
+                        indent=5,
+                    )
+            else:
+                pipeline.model.VideoRecording.File.insert1(
+                    {**file_key, "file_path": str(relative_path)}
+                )
+                status.sub(
+                    f"Created file entry for recording {recording_key['recording_id']}: {video_file_abs.name}",
+                    icon="✅",
+                    indent=5,
+                )
+
+    status.sub(
+        f"Created {len(recording_keys)} recording(s) for inference", icon="✅", indent=3
+    )
+
     # 5. Extract video metadata (if videos exist)
     if recording_keys:
         status.step("Extracting video metadata")
@@ -592,72 +782,99 @@ def main():
                     f"Recording {rec_key['recording_id']}: {rec_info['px_width']}x{rec_info['px_height']}, "
                     f"{rec_info['nframes']} frames, {rec_info['fps']:.1f} fps",
                     icon="✅",
-                    indent=5
+                    indent=5,
                 )
         except ModuleNotFoundError as e:
             if "cv2" in str(e):
-                status.sub("OpenCV (cv2) is required for video metadata extraction", icon="⚠️", indent=3)
+                status.sub(
+                    "OpenCV (cv2) is required for video metadata extraction",
+                    icon="⚠️",
+                    indent=3,
+                )
                 status.sub("Install with: pip install opencv-python", indent=5)
             else:
                 raise
-    
+
     # 6. Training workflow (if not skipped)
     model_name = args.model_name
-    
+
     if not args.skip_training:
         status.step("Setting up training workflow")
-        
+
         # Check if training has already been done
-        if model.Model & {"model_name": model_name}:
+        if len(model.Model & {"model_name": model_name}):
             status.sub(f"Model '{model_name}' already exists", icon="ℹ️", indent=3)
-            status.sub("Use --skip-training to use existing model, or choose different --model-name", indent=5)
+            status.sub(
+                "Use --skip-training to use existing model, or choose different --model-name",
+                indent=5,
+            )
             if not args.skip_inference:
-                status.sub("Skipping training, proceeding to inference...", icon="⏭️", indent=3)
+                status.sub(
+                    "Skipping training, proceeding to inference...",
+                    icon="⏭️",
+                    indent=3,
+                )
                 args.skip_training = True
         else:
             import yaml
-            with open(config_file, 'r') as f:
+
+            with open(config_file, "r") as f:
                 dlc_config = yaml.safe_load(f)
-            
-            # CRITICAL: Truncate Task field early to fit varchar(32) constraint
-            # This must happen BEFORE creating training datasets or model folders
-            # to ensure consistency throughout the process
+
+            # Truncate Task field early to fit varchar(32) constraint
             if "Task" in dlc_config and len(dlc_config["Task"]) > 32:
                 original_task = dlc_config["Task"]
                 dlc_config["Task"] = original_task[:32]
-                status.sub(f"Truncated Task field from {len(original_task)} to 32 chars: '{dlc_config['Task']}'", icon="ℹ️", indent=3)
-                # Update the config file immediately to persist the change
-                with open(config_file, 'w') as f:
+                status.sub(
+                    f"Truncated Task field from {len(original_task)} to 32 chars: '{dlc_config['Task']}'",
+                    icon="ℹ️",
+                    indent=3,
+                )
+                with open(config_file, "w") as f:
                     yaml.dump(dlc_config, f, default_flow_style=False)
                 status.sub("Config file updated with truncated Task", icon="✅", indent=5)
-            
+
             # Check if project has labeled data
             labeled_data_dir = dlc_project_path / "labeled-data"
-            
-            # CRITICAL: Remove old H5 files - they may be in wrong format
-            # DLC will regenerate them from CSV during create_training_dataset
-            old_h5_files = list(labeled_data_dir.rglob("*.h5")) if labeled_data_dir.exists() else []
+
+            # Remove old H5 files - will be regenerated by DLC
+            old_h5_files = (
+                list(labeled_data_dir.rglob("*.h5"))
+                if labeled_data_dir.exists()
+                else []
+            )
             if old_h5_files:
-                status.sub(f"Removing {len(old_h5_files)} old H5 file(s) (will be regenerated by DLC)", icon="⚠️", indent=3)
+                status.sub(
+                    f"Removing {len(old_h5_files)} old H5 file(s) (will be regenerated by DLC)",
+                    icon="⚠️",
+                    indent=3,
+                )
                 for h5_file in old_h5_files:
                     h5_file.unlink()
                 status.sub("Old H5 files removed", icon="✅", indent=5)
-            
+
             labeled_files = (
                 list(labeled_data_dir.rglob("*.csv"))
                 if labeled_data_dir.exists()
                 else []
             )
-            
+
             if len(labeled_files) == 0:
-                status.sub("No labeled data found - creating mock labeled data", icon="⚠️", indent=3)
+                status.sub(
+                    "No labeled data found - creating mock labeled data",
+                    icon="⚠️",
+                    indent=3,
+                )
                 try:
-                    csv_path = create_mock_labeled_data(config_file, num_frames=20, use_existing_frames=False)
-                    status.sub(f"Mock labeled data created: {csv_path}", icon="✅", indent=5)
+                    csv_path = create_mock_labeled_data(
+                        config_file, num_frames=20, use_existing_frames=False
+                    )
+                    status.sub(
+                        f"Mock labeled data created: {csv_path}", icon="✅", indent=5
+                    )
                     labeled_files = list(labeled_data_dir.rglob("*.csv"))
-                    img_files = (
-                        list(labeled_data_dir.rglob("*.png"))
-                        + list(labeled_data_dir.rglob("*.jpg"))
+                    img_files = list(labeled_data_dir.rglob("*.png")) + list(
+                        labeled_data_dir.rglob("*.jpg")
                     )
                     if len(labeled_files) == 0:
                         raise ValueError("Failed to create labeled data files")
@@ -667,238 +884,285 @@ def main():
                         indent=5,
                     )
                 except Exception as e:
-                    status.sub(f"Error creating mock labeled data: {e}", icon="❌", indent=3)
+                    status.sub(
+                        f"Error creating mock labeled data: {e}", icon="❌", indent=3
+                    )
                     import traceback
+
                     status.sub(traceback.format_exc(), indent=5)
                     raise
             else:
-                status.sub(f"Found {len(labeled_files)} existing CSV file(s) (H5 will be generated by DLC)", icon="ℹ️", indent=3)
-            
+                status.sub(
+                    f"Found {len(labeled_files)} existing CSV file(s) (H5 will be generated by DLC)",
+                    icon="ℹ️",
+                    indent=3,
+                )
+
             # Remove old training artifacts
             training_datasets_dir = dlc_project_path / "training-datasets"
             if training_datasets_dir.exists():
-                status.sub("Training dataset exists; deleting to regenerate with current DLC...", icon="⚠️", indent=3)
+                status.sub(
+                    "Training dataset exists; deleting to regenerate with current DLC...",
+                    icon="⚠️",
+                    indent=3,
+                )
                 import shutil
+
                 shutil.rmtree(training_datasets_dir)
-                status.sub("Deleted old training-datasets directory", icon="✅", indent=5)
-            
+                status.sub(
+                    "Deleted old training-datasets directory", icon="✅", indent=5
+                )
+
             dlc_models_dir = dlc_project_path / "dlc-models"
             if dlc_models_dir.exists():
-                status.sub("Cleaning up old dlc-models directory...", icon="ℹ️", indent=5)
+                status.sub(
+                    "Cleaning up old dlc-models directory...", icon="ℹ️", indent=5
+                )
                 import shutil
+
                 shutil.rmtree(dlc_models_dir)
                 status.sub("Deleted old dlc-models directory", icon="✅", indent=5)
-            
+
             dlc_models_pytorch_dir = dlc_project_path / "dlc-models-pytorch"
             if dlc_models_pytorch_dir.exists():
-                status.sub("Cleaning up old dlc-models-pytorch directory...", icon="ℹ️", indent=5)
+                status.sub(
+                    "Cleaning up old dlc-models-pytorch directory...",
+                    icon="ℹ️",
+                    indent=5,
+                )
                 import shutil
+
                 shutil.rmtree(dlc_models_pytorch_dir)
-                status.sub("Deleted old dlc-models-pytorch directory", icon="✅", indent=5)
-            
+                status.sub(
+                    "Deleted old dlc-models-pytorch directory", icon="✅", indent=5
+                )
+
             # Simple training parameters
             shuffle = 1
             trainingsetindex = 0
-            
-            status.sub("Creating training dataset with deeplabcut.create_training_dataset", icon="ℹ️", indent=3)
-            import yaml
-            with open(config_file, 'r') as f:
+
+            status.sub(
+                "Creating training dataset with deeplabcut.create_training_dataset",
+                icon="ℹ️",
+                indent=3,
+            )
+            with open(config_file, "r") as f:
                 create_config = yaml.safe_load(f)
-            
+
             # Ensure engine is pytorch in config
             old_engine = create_config.get("engine", "not set")
             create_config["engine"] = "pytorch"
-            with open(config_file, 'w') as f:
+            with open(config_file, "w") as f:
                 yaml.dump(create_config, f, default_flow_style=False)
-            
+
             status.sub(
                 f"Config updated: engine={create_config.get('engine')} (was {old_engine})",
                 icon="ℹ️",
                 indent=5,
             )
-            
+
             try:
                 import deeplabcut
+                import pandas as pd
+
                 dlc_version = deeplabcut.__version__
                 status.sub(f"Using DLC version: {dlc_version}", icon="ℹ️", indent=5)
-                
-                # CRITICAL: Convert CSV to H5 first (DLC expects H5 files)
+
                 status.sub("Converting CSV to H5 format...", icon="ℹ️", indent=5)
                 try:
-                    # Use convertcsv2h5 with userfeedback=False to avoid prompts
                     deeplabcut.convertcsv2h5(str(config_file), userfeedback=False)
-                    
-                    # CRITICAL WORKAROUND for DLC 3.x bug:
-                    # format_training_data tries to reshape ALL values (including likelihood) into (x, y) pairs
-                    # This causes an error. We need to create a temporary H5 with only x, y columns
-                    # for training dataset creation, then restore the full version.
-                    import pandas as pd
+
                     labeled_data_dir = Path(config_file).parent / "labeled-data"
                     h5_files = list(labeled_data_dir.rglob("CollectedData_*.h5"))
-                    
+
                     for h5_file in h5_files:
                         df = pd.read_hdf(h5_file, key="df_with_missing")
-                        
-                        # Fix 1: If index is tuples, convert to strings
-                        if isinstance(df.index, pd.MultiIndex) or (len(df.index) > 0 and isinstance(df.index[0], tuple)):
-                            df.index = ['/'.join(str(x) for x in idx) if isinstance(idx, tuple) else str(idx) 
-                                       for idx in df.index]
-                        
-                        # WORKAROUND: Create a backup of the full file, then create x, y only version
-                        h5_file_backup = h5_file.parent / f"{h5_file.stem}_full_backup.h5"
-                        df.to_hdf(h5_file_backup, key="df_with_missing", mode="w", format="table")
-                        
-                        # Create x, y only version for format_training_data
+
+                        # Fix index to be strings if needed
+                        if isinstance(df.index, pd.MultiIndex) or (
+                            len(df.index) > 0 and isinstance(df.index[0], tuple)
+                        ):
+                            df.index = [
+                                "/".join(str(x) for x in idx)
+                                if isinstance(idx, tuple)
+                                else str(idx)
+                                for idx in df.index
+                            ]
+
+                        # Backup full file then create x,y-only version
+                        h5_file_backup = (
+                            h5_file.parent / f"{h5_file.stem}_full_backup.h5"
+                        )
+                        df.to_hdf(
+                            h5_file_backup,
+                            key="df_with_missing",
+                            mode="w",
+                            format="table",
+                        )
+
                         if isinstance(df.columns, pd.MultiIndex):
-                            xy_cols = [col for col in df.columns if col[2] in ['x', 'y']]
-                            if len(xy_cols) > 0:
+                            xy_cols = [
+                                col for col in df.columns if col[2] in ["x", "y"]
+                            ]
+                            if xy_cols:
                                 df_xy = df[xy_cols].copy()
-                                # Overwrite the main file with x, y only version
-                                df_xy.to_hdf(h5_file, key="df_with_missing", mode="w", format="table")
-                                status.sub(f"Created x, y only version for training dataset: {h5_file.name}", icon="✅", indent=7)
-                    
-                    status.sub("CSV converted to H5 successfully (x, y only for training dataset)", icon="✅", indent=7)
+                                df_xy.to_hdf(
+                                    h5_file,
+                                    key="df_with_missing",
+                                    mode="w",
+                                    format="table",
+                                )
+                                status.sub(
+                                    f"Created x, y only version for training dataset: {h5_file.name}",
+                                    icon="✅",
+                                    indent=7,
+                                )
+
+                    status.sub(
+                        "CSV converted to H5 successfully (x, y only for training dataset)",
+                        icon="✅",
+                        indent=7,
+                    )
                 except Exception as e:
-                    # If convertcsv2h5 fails, try to manually create H5 from CSV
                     status.sub(f"convertcsv2h5 failed: {e}", icon="⚠️", indent=7)
-                    status.sub("Attempting manual CSV to H5 conversion...", icon="ℹ️", indent=7)
+                    status.sub(
+                        "Attempting manual CSV to H5 conversion...", icon="ℹ️", indent=7
+                    )
                     try:
-                        import pandas as pd
                         import yaml
-                        
-                        # Read config
-                        with open(config_file, 'r') as f:
+
+                        with open(config_file, "r") as f:
                             cfg = yaml.safe_load(f)
-                        
-                        # Find CSV files
+
                         labeled_data_dir = Path(config_file).parent / "labeled-data"
                         csv_files = list(labeled_data_dir.rglob("CollectedData_*.csv"))
-                        
+
                         for csv_file in csv_files:
-                            # Read CSV - DLC CSV has 3 header rows
-                            # First read to get the structure
-                            df_temp = pd.read_csv(csv_file, nrows=0)
-                            
-                            # Read full CSV with MultiIndex
-                            df = pd.read_csv(csv_file, index_col=0, header=[0, 1, 2])
-                            
-                            # CRITICAL: Fix column names - pandas may have used first values as names
-                            # We need to ensure names are ["scorer", "bodyparts", "coords"]
+                            df = pd.read_csv(
+                                csv_file, index_col=0, header=[0, 1, 2]
+                            )
+
                             if isinstance(df.columns, pd.MultiIndex):
-                                # Get the actual level names (may be wrong)
-                                level_names = list(df.columns.names)
-                                
-                                # If names are wrong (e.g., using first values), fix them
-                                if level_names != ["scorer", "bodyparts", "coords"]:
-                                    # Reconstruct with correct names
-                                    new_columns = []
-                                    for col_tuple in df.columns:
-                                        new_columns.append(col_tuple)
-                                    df.columns = pd.MultiIndex.from_tuples(new_columns, names=["scorer", "bodyparts", "coords"])
+                                new_columns = [col for col in df.columns]
+                                df.columns = pd.MultiIndex.from_tuples(
+                                    new_columns,
+                                    names=["scorer", "bodyparts", "coords"],
+                                )
                             else:
-                                raise ValueError(f"Expected MultiIndex columns, got {type(df.columns)}")
-                            
-                            # Ensure index is string paths (not numeric or tuples)
+                                raise ValueError(
+                                    f"Expected MultiIndex columns, got {type(df.columns)}"
+                                )
+
                             if not all(isinstance(idx, str) for idx in df.index):
-                                # Convert index to strings
                                 df.index = [str(idx) for idx in df.index]
-                            
-                            # Save as H5 with proper format
-                            h5_file = csv_file.with_suffix('.h5')
-                            df.to_hdf(h5_file, key="df_with_missing", mode="w", format="table")
-                            status.sub(f"Created {h5_file.name} with correct MultiIndex structure", icon="✅", indent=9)
-                        
-                        status.sub("Manual CSV to H5 conversion completed", icon="✅", indent=7)
+
+                            h5_file = csv_file.with_suffix(".h5")
+                            df.to_hdf(
+                                h5_file,
+                                key="df_with_missing",
+                                mode="w",
+                                format="table",
+                            )
+                            status.sub(
+                                f"Created {h5_file.name} with correct MultiIndex structure",
+                                icon="✅",
+                                indent=9,
+                            )
+
+                        status.sub(
+                            "Manual CSV to H5 conversion completed", icon="✅", indent=7
+                        )
                     except Exception as e2:
-                        status.sub(f"Manual conversion also failed: {e2}", icon="⚠️", indent=7)
+                        status.sub(
+                            f"Manual conversion also failed: {e2}",
+                            icon="⚠️",
+                            indent=7,
+                        )
                         import traceback
+
                         status.sub(traceback.format_exc(), indent=9)
-                        status.sub("Continuing - DLC may handle conversion internally", icon="ℹ️", indent=7)
-                
-                status.sub("Calling deeplabcut.create_training_dataset(..., num_shuffles=1)", icon="ℹ️", indent=5)
-                
-                # Let DLC 3 create .mat, metadata, and model config
+                        status.sub(
+                            "Continuing - DLC may handle conversion internally",
+                            icon="ℹ️",
+                            indent=7,
+                        )
+
+                status.sub(
+                    "Calling deeplabcut.create_training_dataset(..., num_shuffles=1)",
+                    icon="ℹ️",
+                    indent=5,
+                )
+
                 deeplabcut.create_training_dataset(str(config_file), num_shuffles=1)
-                status.sub("Training dataset created successfully by DLC", icon="✅", indent=5)
-                
-                # Restore full H5 files (with likelihood) from backup after training dataset creation
-                import pandas as pd
+                status.sub(
+                    "Training dataset created successfully by DLC", icon="✅", indent=5
+                )
+
+                # Restore full H5 files (with likelihood) from backup
                 labeled_data_dir = Path(config_file).parent / "labeled-data"
                 backup_files = list(labeled_data_dir.rglob("*_full_backup.h5"))
                 for backup_file in backup_files:
-                    original_file = backup_file.parent / backup_file.name.replace("_full_backup.h5", ".h5")
+                    original_file = backup_file.parent / backup_file.name.replace(
+                        "_full_backup.h5", ".h5"
+                    )
                     if original_file.exists():
-                        df_full = pd.read_hdf(backup_file, key="df_with_missing")
-                        df_full.to_hdf(original_file, key="df_with_missing", mode="w", format="table")
-                        backup_file.unlink()  # Remove backup
-                        status.sub(f"Restored full H5 file (with likelihood): {original_file.name}", icon="✅", indent=7)
-                
-                # Quick sanity check: metadata.yaml should exist
+                        df_full = pd.read_hdf(
+                            backup_file, key="df_with_missing"
+                        )
+                        df_full.to_hdf(
+                            original_file,
+                            key="df_with_missing",
+                            mode="w",
+                            format="table",
+                        )
+                        backup_file.unlink()
+                        status.sub(
+                            f"Restored full H5 file (with likelihood): {original_file.name}",
+                            icon="✅",
+                            indent=7,
+                        )
+
                 metadata_files = list(training_datasets_dir.rglob("metadata.yaml"))
                 if not metadata_files:
                     raise FileNotFoundError(
                         "Training dataset metadata file not found after create_training_dataset"
                     )
-                status.sub(f"Found metadata file: {metadata_files[0]}", icon="ℹ️", indent=5)
-            
+                status.sub(
+                    f"Found metadata file: {metadata_files[0]}",
+                    icon="ℹ️",
+                    indent=5,
+                )
+
             except Exception as e:
                 error_str = str(e)
-                # Check if this is the known DLC 3.x bug with format_training_data
-                if "all the input array dimensions" in error_str and "size 4" in error_str and "size 6" in error_str:
-                    status.sub("Known DLC 3.x bug detected in format_training_data", icon="⚠️", indent=3)
-                    status.sub("This is a bug in DLC 3.x where format_training_data tries to reshape", indent=5)
-                    status.sub("all values (including likelihood) into (x, y) pairs.", indent=5)
-                    status.sub("", indent=5)
-                    status.sub("Workaround: Creating training dataset manually...", icon="ℹ️", indent=5)
-                    try:
-                        # Try to work around by using DLC's internal functions differently
-                        # or by creating a minimal training dataset structure
-                        from deeplabcut.generate_training_dataset.trainingsetmanipulation import merge_annotateddatasets
-                        import pandas as pd
-                        
-                        # Read the H5 file
-                        labeled_data_dir = Path(config_file).parent / "labeled-data"
-                        h5_files = list(labeled_data_dir.rglob("CollectedData_*.h5"))
-                        if h5_files:
-                            df = pd.read_hdf(h5_files[0], key="df_with_missing")
-                            # Select only x and y columns for training dataset
-                            xy_cols = [col for col in df.columns if col[2] in ['x', 'y']]
-                            df_xy = df[xy_cols].copy()
-                            
-                            status.sub("This workaround is not yet implemented.", icon="⚠️", indent=7)
-                            status.sub("Please report this bug to DeepLabCut:", indent=7)
-                            status.sub("https://github.com/DeepLabCut/DeepLabCut/issues", indent=7)
-                            status.sub("", indent=5)
-                            status.sub("Alternative: Use DLC 2.x (TensorFlow) for training,", indent=5)
-                            status.sub("or wait for DLC 3.x to fix this issue.", indent=5)
-                    except Exception as e2:
-                        pass
-                
+                if (
+                    "all the input array dimensions" in error_str
+                    and "size 4" in error_str
+                    and "size 6" in error_str
+                ):
+                    status.sub(
+                        "Known DLC 3.x bug detected in format_training_data",
+                        icon="⚠️",
+                        indent=3,
+                    )
                 status.sub(f"Error creating training dataset: {e}", icon="❌", indent=3)
                 import traceback
+
                 status.sub(traceback.format_exc(), indent=5)
                 status.sub(
                     "This appears to be a bug in DLC 3.x's format_training_data function.",
                     indent=5,
                 )
-                status.sub(
-                    "The function tries to reshape all values (including likelihood) into (x, y) pairs,",
-                    indent=5,
-                )
-                status.sub(
-                    "but should only reshape x and y values.",
-                    indent=5,
-                )
                 sys.exit(1)
-            
+
             # Ensure VideoSet exists
             video_set_key = {"video_set_id": 1}
-            if not (train.VideoSet & video_set_key):
+            if not len(train.VideoSet & video_set_key):
                 train.VideoSet.insert1(video_set_key, skip_duplicates=True)
-            
+
             # TrainingParamSet
             paramset_key = {"paramset_idx": 0}
-            if not (train.TrainingParamSet & paramset_key):
+            if not len(train.TrainingParamSet & paramset_key):
                 default_params = {
                     "shuffle": shuffle,
                     "trainingsetindex": trainingsetindex,
@@ -911,20 +1175,27 @@ def main():
                     params=default_params,
                     paramset_idx=0,
                 )
-            
+
             # TrainingTask
             training_id = 1
-            training_task_key = {**video_set_key, **paramset_key, "training_id": training_id}
-            
-            # Delete old training task if it exists with wrong project path
-            if train.TrainingTask & training_task_key:
+            training_task_key = {
+                **video_set_key,
+                **paramset_key,
+                "training_id": training_id,
+            }
+
+            if len(train.TrainingTask & training_task_key):
                 old_task = (train.TrainingTask & training_task_key).fetch1()
                 if old_task["project_path"] != str(dlc_project_rel):
-                    status.sub(f"Deleting old training task with wrong project path: {old_task['project_path']}", icon="⚠️", indent=3)
+                    status.sub(
+                        f"Deleting old training task with wrong project path: {old_task['project_path']}",
+                        icon="⚠️",
+                        indent=3,
+                    )
                     (train.TrainingTask & training_task_key).delete()
                     status.sub("Old training task deleted", icon="✅", indent=5)
-            
-            if not (train.TrainingTask & training_task_key):
+
+            if not len(train.TrainingTask & training_task_key):
                 train.TrainingTask.insert1(
                     {
                         **training_task_key,
@@ -935,65 +1206,62 @@ def main():
                 )
                 status.sub("Created training task", icon="✅", indent=3)
             else:
-                status.sub("Training task already exists with correct project path", icon="ℹ️", indent=3)
-            
+                status.sub(
+                    "Training task already exists with correct project path",
+                    icon="ℹ️",
+                    indent=3,
+                )
+
             # 7. Train the model (mocked for functional test)
             status.step("Training the model (mocked)")
             status.sub("Training is mocked for this functional test", icon="ℹ️", indent=3)
             status.sub("No actual model training will occur", icon="ℹ️", indent=3)
-            
+
             training_was_mocked = True
-            
+
             def create_mock_pytorch_config(config_path, project_path, dlc_config):
                 """Create a mock pytorch_config.yaml file for inference."""
                 import yaml
-                
-                # Get bodyparts and other metadata from dlc_config
-                bodyparts = dlc_config.get("bodyparts", ["bodypart1", "bodypart2", "bodypart3"])
+
+                bodyparts = dlc_config.get(
+                    "bodyparts", ["bodypart1", "bodypart2", "bodypart3"]
+                )
                 unique_bodyparts = dlc_config.get("uniquebodyparts", [])
                 individuals = dlc_config.get("individuals", [])
                 multianimal = dlc_config.get("multianimalproject", False)
-                
-                # Create minimal but valid pytorch_config.yaml
+
                 pytorch_config = {
                     "data": {
                         "bbox_margin": 20,
                         "colormode": "RGB",
-                        "inference": {
-                            "normalize_images": True
-                        },
+                        "inference": {"normalize_images": True},
                         "train": {
                             "affine": {
                                 "p": 0.5,
                                 "rotation": 30,
                                 "scaling": [0.5, 1.25],
-                                "translation": 0
+                                "translation": 0,
                             },
                             "crop_sampling": {
                                 "width": 448,
                                 "height": 448,
                                 "max_shift": 0.1,
-                                "method": "hybrid"
+                                "method": "hybrid",
                             },
                             "gaussian_noise": 12.75,
                             "motion_blur": True,
-                            "normalize_images": True
-                        }
+                            "normalize_images": True,
+                        },
                     },
                     "device": "auto",
                     "inference": {
                         "multithreading": {
                             "enabled": True,
                             "queue_length": 4,
-                            "timeout": 30.0
-                        },
-                        "compile": {
-                            "enabled": False,
-                            "backend": "inductor"
+                            "timeout": 30.0,
                         },
-                        "autocast": {
-                            "enabled": False
-                        }
+                        "compile": {"enabled": False, "backend": "inductor"},
+                        "autocast": {"enabled": False},
                     },
                     "metadata": {
                         "project_path": str(project_path),
@@ -1001,7 +1269,7 @@ def create_mock_pytorch_config(config_path, project_path, dlc_config):
                         "bodyparts": bodyparts,
                         "unique_bodyparts": unique_bodyparts,
                         "individuals": individuals if multianimal else [],
-                        "with_identity": multianimal
+                        "with_identity": multianimal,
                     },
                     "method": "bu",
                     "model": {
@@ -1010,7 +1278,7 @@ def create_mock_pytorch_config(config_path, project_path, dlc_config):
                             "model_name": "resnet50_gn",
                             "output_stride": 16,
                             "freeze_bn_stats": False,
-                            "freeze_bn_weights": False
+                            "freeze_bn_weights": False,
                         },
                         "backbone_output_channels": 2048,
                         "heads": {
@@ -1022,7 +1290,7 @@ def create_mock_pytorch_config(config_path, project_path, dlc_config):
                                     "apply_sigmoid": False,
                                     "clip_scores": True,
                                     "location_refinement": True,
-                                    "locref_std": 7.2801
+                                    "locref_std": 7.2801,
                                 },
                                 "target_generator": {
                                     "type": "HeatmapGaussianGenerator",
@@ -1031,30 +1299,30 @@ def create_mock_pytorch_config(config_path, project_path, dlc_config):
                                     "heatmap_mode": "KEYPOINT",
                                     "gradient_masking": False,
                                     "generate_locref": True,
-                                    "locref_std": 7.2801
+                                    "locref_std": 7.2801,
                                 },
                                 "criterion": {
                                     "heatmap": {
                                         "type": "WeightedMSECriterion",
-                                        "weight": 1.0
+                                        "weight": 1.0,
                                     },
                                     "locref": {
                                         "type": "WeightedHuberCriterion",
-                                        "weight": 0.05
-                                    }
+                                        "weight": 0.05,
+                                    },
                                 },
                                 "heatmap_config": {
                                     "channels": [2048, len(bodyparts)],
                                     "kernel_size": [3],
-                                    "strides": [2]
+                                    "strides": [2],
                                 },
                                 "locref_config": {
                                     "channels": [2048, len(bodyparts) * 2],
                                     "kernel_size": [3],
-                                    "strides": [2]
-                                }
+                                    "strides": [2],
+                                },
                             }
-                        }
+                        },
                     },
                     "net_type": "resnet_50",
                     "runner": {
@@ -1065,22 +1333,20 @@ def create_mock_pytorch_config(config_path, project_path, dlc_config):
                         "eval_interval": 10,
                         "optimizer": {
                             "type": "AdamW",
-                            "params": {
-                                "lr": 0.0005
-                            }
+                            "params": {"lr": 0.0005},
                         },
                         "scheduler": {
                             "type": "LRListScheduler",
                             "params": {
                                 "lr_list": [[0.0001], [1e-05]],
-                                "milestones": [90, 120]
-                            }
+                                "milestones": [90, 120],
+                            },
                         },
                         "snapshots": {
                             "max_snapshots": 5,
                             "save_epochs": 25,
-                            "save_optimizer_state": False
-                        }
+                            "save_optimizer_state": False,
+                        },
                     },
                     "train_settings": {
                         "batch_size": 8,
@@ -1088,246 +1354,275 @@ def create_mock_pytorch_config(config_path, project_path, dlc_config):
                         "dataloader_pin_memory": False,
                         "display_iters": 500,
                         "epochs": 200,
-                        "seed": 42
-                    }
+                        "seed": 42,
+                    },
                 }
-                
-                # Write the config file
+
                 with open(config_path, "w") as f:
                     yaml.dump(pytorch_config, f, default_flow_style=False, sort_keys=False)
-            
+
             try:
                 # Store original make method
                 original_make = pipeline.train.ModelTraining.make
-                
+
                 def mocked_make(self, key):
                     """Mocked make() that skips training but creates snapshot file."""
                     from pathlib import Path
-                    import yaml
+                    import yaml as _yaml
                     from element_interface.utils import find_full_path
-                    from element_deeplabcut.train import get_dlc_root_data_dir, TrainingTask, TrainingParamSet
-                    from element_deeplabcut.readers import dlc_reader
-                    
-                    # Get project path and config (same as original make())
+                    from element_deeplabcut.train import (
+                        get_dlc_root_data_dir,
+                        TrainingTask,
+                        TrainingParamSet,
+                    )
+                    from element_deeplabcut.readers import dlc_reader as _dlc_reader
+
                     project_path, model_prefix = (TrainingTask & key).fetch1(
                         "project_path", "model_prefix"
                     )
-                    project_path = find_full_path(get_dlc_root_data_dir(), project_path)
+                    project_path = find_full_path(
+                        get_dlc_root_data_dir(), project_path
+                    )
                     project_path = Path(project_path)
                     if project_path.is_file():
                         project_path = project_path.parent
-                    
-                    # Read config
-                    _, dlc_config = dlc_reader.read_yaml(project_path)
+
+                    _, dlc_config_local = _dlc_reader.read_yaml(project_path)
                     training_params = (TrainingParamSet & key).fetch1("params")
-                    shuffle = training_params.get("shuffle", dlc_config.get("shuffle", 1))
-                    trainingsetindex = training_params.get("trainingsetindex", dlc_config.get("trainingsetindex", 0))
-                    
-                    # Update config (simplified version of original make())
-                    dlc_config["shuffle"] = int(shuffle)
-                    dlc_config["trainingsetindex"] = int(trainingsetindex)
-                    train_fraction = dlc_config["TrainingFraction"][int(trainingsetindex)]
-                    dlc_config["train_fraction"] = train_fraction
-                    dlc_config["project_path"] = project_path.as_posix()
-                    dlc_config["modelprefix"] = model_prefix
-                    
-                    # Determine model folder and create snapshot
+                    shuffle_local = training_params.get(
+                        "shuffle", dlc_config_local.get("shuffle", 1)
+                    )
+                    trainingsetindex_local = training_params.get(
+                        "trainingsetindex", dlc_config_local.get("trainingsetindex", 0)
+                    )
+
+                    dlc_config_local["shuffle"] = int(shuffle_local)
+                    dlc_config_local["trainingsetindex"] = int(trainingsetindex_local)
+                    train_fraction = dlc_config_local["TrainingFraction"][
+                        int(trainingsetindex_local)
+                    ]
+                    dlc_config_local["train_fraction"] = train_fraction
+                    dlc_config_local["project_path"] = project_path.as_posix()
+                    dlc_config_local["modelprefix"] = model_prefix
+
                     try:
-                        from deeplabcut.utils.auxiliaryfunctions import get_model_folder
+                        from deeplabcut.utils.auxiliaryfunctions import (
+                            get_model_folder,
+                        )
                     except ImportError:
-                        from deeplabcut.utils.auxiliaryfunctions import GetModelFolder as get_model_folder
-                    
+                        from deeplabcut.utils.auxiliaryfunctions import (
+                            GetModelFolder as get_model_folder,
+                        )
+
                     model_folder = get_model_folder(
                         trainFraction=train_fraction,
-                        shuffle=int(shuffle),
-                        cfg=dlc_config,
+                        shuffle=int(shuffle_local),
+                        cfg=dlc_config_local,
                         modelprefix=model_prefix,
                     )
-                    
-                    # For DLC 3.x PyTorch, the folder should be under dlc-models-pytorch, not dlc-models
-                    # get_model_folder might return a path with dlc-models, so we need to adjust it
-                    engine = dlc_config.get("engine", "pytorch")
+
+                    engine = dlc_config_local.get("engine", "pytorch")
                     model_folder_str = str(model_folder)
-                    
-                    if engine == "pytorch":
-                        # For PyTorch, ensure we're using dlc-models-pytorch instead of dlc-models
-                        # Replace any occurrence of dlc-models with dlc-models-pytorch
-                        if "dlc-models-pytorch" not in model_folder_str:
-                            model_folder_str = model_folder_str.replace("dlc-models", "dlc-models-pytorch")
-                        model_folder = model_folder_str
-                    
-                    # Ensure model_folder is a Path object and construct train folder path
+
+                    if engine == "pytorch" and "dlc-models-pytorch" not in model_folder_str:
+                        model_folder_str = model_folder_str.replace(
+                            "dlc-models", "dlc-models-pytorch"
+                        )
+                    model_folder = model_folder_str
+
                     if isinstance(model_folder, str):
                         model_folder_path = Path(model_folder)
                     else:
                         model_folder_path = Path(model_folder)
-                    
-                    # Construct absolute path to train folder
+
                     if model_folder_path.is_absolute():
                         model_train_folder = model_folder_path / "train"
                     else:
                         model_train_folder = project_path / model_folder_path / "train"
-                    
+
                     model_train_folder = model_train_folder.resolve()
                     model_train_folder.mkdir(parents=True, exist_ok=True)
-                    
-                    # Log the absolute path for debugging
+
                     logger.info(f"Model train folder (absolute): {model_train_folder}")
-                    
-                    # Log the path for debugging
-                    logger.info(f"Creating mock snapshots in: {model_train_folder}")
-                    logger.info(f"Model train folder exists: {model_train_folder.exists()}")
-                    
-                    # Create fake snapshot file (DLC looks for snapshot*.index files)
-                    # Use a snapshot number that matches saveiters (typically 1000)
-                    snapshot_num = 1000  # Common snapshot number
+
+                    snapshot_num = 1000
                     snapshot_file = model_train_folder / f"snapshot-{snapshot_num}.index"
                     snapshot_file.touch()
-                    logger.info(f"Created: {snapshot_file} (exists: {snapshot_file.exists()})")
-                    
-                    # Also create the corresponding .data and .meta files that DLC might expect
-                    snapshot_data = model_train_folder / f"snapshot-{snapshot_num}.data-00000-of-00001"
+                    logger.info(
+                        f"Created: {snapshot_file} (exists: {snapshot_file.exists()})"
+                    )
+
+                    snapshot_data = (
+                        model_train_folder
+                        / f"snapshot-{snapshot_num}.data-00000-of-00001"
+                    )
                     snapshot_data.touch()
-                    logger.info(f"Created: {snapshot_data} (exists: {snapshot_data.exists()})")
-                    
+                    logger.info(
+                        f"Created: {snapshot_data} (exists: {snapshot_data.exists()})"
+                    )
+
                     snapshot_meta = model_train_folder / f"snapshot-{snapshot_num}.meta"
                     snapshot_meta.touch()
-                    logger.info(f"Created: {snapshot_meta} (exists: {snapshot_meta.exists()})")
-                    
-                    # For PyTorch, DLC's get_model_snapshots looks for .pth files
-                    # Create a minimal valid PyTorch checkpoint file
+                    logger.info(
+                        f"Created: {snapshot_meta} (exists: {snapshot_meta.exists()})"
+                    )
+
                     if engine == "pytorch":
                         try:
                             import torch
-                            snapshot_pth = model_train_folder / f"snapshot-{snapshot_num}.pth"
-                            # Create a minimal PyTorch checkpoint dict
-                            # DLC expects certain keys, including "model" for loading state_dict
+
+                            snapshot_pth = (
+                                model_train_folder / f"snapshot-{snapshot_num}.pth"
+                            )
                             mock_checkpoint = {
                                 "epoch": 0,
-                                "state_dict": {},  # Empty state dict is fine for mock
-                                "model": {},  # DLC expects this key for model.load_state_dict(snapshot["model"])
+                                "state_dict": {},
+                                "model": {},
                                 "optimizer": None,
                             }
                             torch.save(mock_checkpoint, snapshot_pth)
                             logger.info(f"Created PyTorch snapshot: {snapshot_pth}")
-                            
-                            # Also create files with underscore pattern (some DLC versions use this)
-                            snapshot_pth_alt = model_train_folder / f"snapshot_{snapshot_num}.pth"
+
+                            snapshot_pth_alt = (
+                                model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            )
                             if not snapshot_pth_alt.exists():
                                 torch.save(mock_checkpoint, snapshot_pth_alt)
-                                logger.info(f"Created alternate PyTorch snapshot: {snapshot_pth_alt}")
+                                logger.info(
+                                    f"Created alternate PyTorch snapshot: {snapshot_pth_alt}"
+                                )
                         except ImportError:
-                            # If torch is not available, create empty .pth files as fallback
-                            logger.warning("PyTorch not available, creating empty .pth files")
-                            snapshot_pth = model_train_folder / f"snapshot-{snapshot_num}.pth"
-                            snapshot_pth.write_bytes(b"")  # Create empty file
-                            snapshot_pth_alt = model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            logger.warning(
+                                "PyTorch not available, creating empty .pth files"
+                            )
+                            snapshot_pth = (
+                                model_train_folder / f"snapshot-{snapshot_num}.pth"
+                            )
+                            snapshot_pth.write_bytes(b"")
+                            snapshot_pth_alt = (
+                                model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            )
                             snapshot_pth_alt.write_bytes(b"")
                         except Exception as e:
-                            logger.error(f"Error creating PyTorch snapshots: {e}")
-                            # Fallback: create empty files
-                            snapshot_pth = model_train_folder / f"snapshot-{snapshot_num}.pth"
+                            logger.error(
+                                f"Error creating PyTorch snapshots: {e}"
+                            )
+                            snapshot_pth = (
+                                model_train_folder / f"snapshot-{snapshot_num}.pth"
+                            )
                             snapshot_pth.write_bytes(b"")
-                            snapshot_pth_alt = model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            snapshot_pth_alt = (
+                                model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            )
                             snapshot_pth_alt.write_bytes(b"")
-                        
-                        # CRITICAL: Ensure .pth files exist - DLC's get_model_snapshots looks for these
-                        # Create them even if torch.save failed
-                        snapshot_pth = model_train_folder / f"snapshot-{snapshot_num}.pth"
+
+                        snapshot_pth = (
+                            model_train_folder / f"snapshot-{snapshot_num}.pth"
+                        )
                         if not snapshot_pth.exists():
-                            logger.warning(f"snapshot-{snapshot_num}.pth not found, creating empty file")
-                            snapshot_pth.write_bytes(b"PK\x03\x04")  # Minimal zip header (PyTorch uses zip format)
-                        
-                        snapshot_pth_alt = model_train_folder / f"snapshot_{snapshot_num}.pth"
+                            logger.warning(
+                                f"snapshot-{snapshot_num}.pth not found, creating empty file"
+                            )
+                            snapshot_pth.write_bytes(b"PK\x03\x04")
+
+                        snapshot_pth_alt = (
+                            model_train_folder / f"snapshot_{snapshot_num}.pth"
+                        )
                         if not snapshot_pth_alt.exists():
                             snapshot_pth_alt.write_bytes(b"PK\x03\x04")
-                        
-                        # Verify files were created
+
                         created_files = list(model_train_folder.glob("snapshot*"))
-                        logger.info(f"All snapshot files in directory: {[f.name for f in created_files]}")
-                        
-                        # Double-check .pth files exist (DLC requires these for PyTorch)
+                        logger.info(
+                            f"All snapshot files in directory: {[f.name for f in created_files]}"
+                        )
+
                         pth_files = list(model_train_folder.glob("*.pth"))
                         logger.info(f".pth files found: {[f.name for f in pth_files]}")
                         if not pth_files:
                             raise FileNotFoundError(
-                                f"No .pth files found in {model_train_folder} after creation attempt. "
-                                f"Directory contents: {[f.name for f in model_train_folder.iterdir()]}"
+                                f"No .pth files found in {model_train_folder} after creation attempt."
                             )
-                        
-                        # Create mock pytorch_config.yaml file for inference
+
                         pytorch_config_path = model_train_folder / "pytorch_config.yaml"
-                        create_mock_pytorch_config(pytorch_config_path, project_path, dlc_config)
-                        logger.info(f"Created mock pytorch_config.yaml: {pytorch_config_path}")
-                    
-                    # Update snapshotindex in config (same as original make() does)
-                    # Since we have one snapshot, the index is 0
-                    dlc_config["snapshotindex"] = 0
+                        create_mock_pytorch_config(
+                            pytorch_config_path, project_path, dlc_config_local
+                        )
+                        logger.info(
+                            f"Created mock pytorch_config.yaml: {pytorch_config_path}"
+                        )
+
+                    dlc_config_local["snapshotindex"] = 0
                     try:
                         from deeplabcut.utils.auxiliaryfunctions import edit_config
-                    except ImportError:
-                        # If edit_config doesn't exist, we'll just update the config dict
-                        pass
-                    else:
+
                         config_file_path = project_path / "config.yaml"
                         edit_config(str(config_file_path), {"snapshotindex": 0})
-                    
-                    # Insert the record (same as original make() does at the end)
+                    except ImportError:
+                        pass
+
                     self.insert1(
-                        {**key, "latest_snapshot": snapshot_num, "config_template": dlc_config}
+                        {
+                            **key,
+                            "latest_snapshot": snapshot_num,
+                            "config_template": dlc_config_local,
+                        }
                     )
-                
-                # Temporarily replace make() method
+
                 pipeline.train.ModelTraining.make = mocked_make
-                
+
                 try:
                     pipeline.train.ModelTraining.populate()
-                    status.sub("Model training completed (mocked)!", icon="✅", indent=3)
+                    status.sub(
+                        "Model training completed (mocked)!", icon="✅", indent=3
+                    )
                 finally:
-                    # Restore original make() method
                     pipeline.train.ModelTraining.make = original_make
-                        
+
             except KeyboardInterrupt:
                 status.sub("Training interrupted by user", icon="⚠️", indent=3)
-                status.sub("Resume later with: pipeline.train.ModelTraining.populate()", icon="ℹ️", indent=5)
+                status.sub(
+                    "Resume later with: pipeline.train.ModelTraining.populate()",
+                    icon="ℹ️",
+                    indent=5,
+                )
                 sys.exit(0)
             except Exception as e:
                 status.sub(f"Error during training: {e}", icon="❌", indent=3)
                 raise
-            
+
             # 8. Insert trained model into Model table
             status.step("Inserting trained model into Model table")
-            
-            training_result = (pipeline.train.ModelTraining & training_task_key).fetch1()
+
+            training_result = (
+                pipeline.train.ModelTraining & training_task_key
+            ).fetch1()
             latest_snapshot = training_result["latest_snapshot"]
             status.sub(f"Using snapshot: {latest_snapshot}", icon="ℹ️", indent=3)
-            
-            # ------------------------------------------------------------------
-            # DLC 3.x workaround for MOCKED TRAINING:
-            # element_deeplabcut.model.insert_new_model calls get_scorer_name,
-            # which tries to find real snapshot files on disk.
-            # Since we only created fake snapshots (no real training), we patch
-            # get_scorer_name to avoid the filesystem check.
-            # ------------------------------------------------------------------
+
             def _mock_get_scorer_name(*args, **kwargs):
-                # Return any valid-looking scorer string; DLC only uses this as a prefix.
                 return "mock_scorer"
-            
-            # Task field should already be truncated (done early in the workflow)
-            # Just verify it's still within limits before model insertion
+
             import yaml
-            with open(config_file, 'r') as f:
+
+            with open(config_file, "r") as f:
                 dlc_config_for_insert = yaml.safe_load(f)
-            
-            if "Task" in dlc_config_for_insert and len(dlc_config_for_insert["Task"]) > 32:
-                # This shouldn't happen if truncation was done early, but handle it just in case
-                status.sub(f"WARNING: Task field still too long ({len(dlc_config_for_insert['Task'])} chars), truncating now", icon="⚠️", indent=3)
+
+            if "Task" in dlc_config_for_insert and len(
+                dlc_config_for_insert["Task"]
+            ) > 32:
+                status.sub(
+                    f"WARNING: Task field still too long ({len(dlc_config_for_insert['Task'])} chars), truncating now",
+                    icon="⚠️",
+                    indent=3,
+                )
                 dlc_config_for_insert["Task"] = dlc_config_for_insert["Task"][:32]
-                with open(config_file, 'w') as f:
+                with open(config_file, "w") as f:
                     yaml.dump(dlc_config_for_insert, f, default_flow_style=False)
-            
-            # Patch get_scorer_name at the module where it's imported
-            with patch('deeplabcut.pose_estimation_pytorch.apis.utils.get_scorer_name', side_effect=_mock_get_scorer_name):
+
+            with patch(
+                "deeplabcut.pose_estimation_pytorch.apis.utils.get_scorer_name",
+                side_effect=_mock_get_scorer_name,
+            ):
                 model.Model.insert_new_model(
                     model_name=model_name,
                     dlc_config=str(config_file_rel),
@@ -1339,14 +1634,14 @@ def _mock_get_scorer_name(*args, **kwargs):
             status.sub(f"Inserted model: {model_name}", icon="✅", indent=3)
     else:
         status.step("Skipping training (using existing model)")
-        if not (model.Model & {"model_name": model_name}):
+        if not len(model.Model & {"model_name": model_name}):
             status.sub(f"Model '{model_name}' not found", icon="❌", indent=3)
             status.sub("Available models:", indent=3)
             for m in model.Model.fetch("model_name"):
                 status.sub(f"  - {m}", indent=5)
             sys.exit(1)
         status.sub(f"Using existing model: {model_name}", icon="✅", indent=3)
-    
+
     # 9. Create pose estimation tasks (if videos exist)
     if recording_keys and not args.skip_inference:
         status.step("Creating pose estimation tasks")
@@ -1355,7 +1650,7 @@ def _mock_get_scorer_name(*args, **kwargs):
             output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
                 task_key, relative=False, mkdir=False
             )
-            
+
             results_exist = False
             output_path = Path(output_dir)
             if output_path.exists():
@@ -1368,222 +1663,183 @@ def _mock_get_scorer_name(*args, **kwargs):
                         icon="✅",
                         indent=5,
                     )
-            
+
             task_mode = "load" if results_exist else None
-            
+
             pipeline.model.PoseEstimationTask.generate(
                 rec_key,
                 model_name=model_name,
                 task_mode=task_mode,
                 analyze_videos_params={
                     "videotype": ".mp4",
-                    "gputouse": 0,
+                    "gputouse": args.gpu if args.gpu >= 0 else None,
+                    "device": f"cuda:{args.gpu}" if args.gpu >= 0 else "cpu",
+                    "batch_size": args.batch_size,
+                    "batchsize": args.batch_size,
                     "save_as_csv": True,
                 },
             )
-            status.sub(f"Task created for recording {rec_key['recording_id']}", icon="✅", indent=5)
-    
+            status.sub(
+                f"Task created for recording {rec_key['recording_id']}",
+                icon="✅",
+                indent=5,
+            )
+
     # 10. Run inference (if not skipped)
     if recording_keys and not args.skip_inference:
         status.step("Running inference or loading existing results")
-        
+
         if training_was_mocked:
-            status.sub("Using mock trained model files for inference", icon="ℹ️", indent=3)
-            status.sub("Note: Results will be based on mock model weights", icon="⚠️", indent=5)
-        
+            status.sub(
+                "Using mock trained model files for inference",
+                icon="ℹ️",
+                indent=3,
+            )
+            status.sub(
+                "Note: Results will be based on mock model weights",
+                icon="⚠️",
+                indent=5,
+            )
+
         all_in_load_mode = True
         for rec_key in recording_keys:
             task_key = {**rec_key, "model_name": model_name}
             try:
-                task_mode = (pipeline.model.PoseEstimationTask & task_key).fetch1("task_mode")
+                task_mode = (
+                    pipeline.model.PoseEstimationTask & task_key
+                ).fetch1("task_mode")
                 if task_mode != "load":
                     all_in_load_mode = False
-            except:
+            except Exception:
                 all_in_load_mode = False
-        
+
         if all_in_load_mode:
-            status.sub("All tasks in 'load' mode - using existing results", icon="ℹ️", indent=3)
+            status.sub(
+                "All tasks in 'load' mode - using existing results",
+                icon="ℹ️",
+                indent=3,
+            )
         else:
             status.sub("Running inference (this may take a while)", icon="⚠️", indent=3)
             status.sub("GPU is recommended for speed", icon="ℹ️", indent=5)
-        
-        # Patch DLC's get_model_snapshots during inference so it always
-        # "finds" at least one snapshot and (if needed) creates dummy files.
+
         def _mock_get_model_snapshots(*args, **kwargs):
-            """
-            Mock replacement for deeplabcut.pose_estimation_pytorch.apis.utils.get_model_snapshots
-
-            - Accepts any arguments (flexible signature)
-            - Extracts train_dir from args or kwargs
-            - Ensures the `train_dir` exists
-            - Creates dummy snapshot-1000.* files if missing
-            - Returns a list with exactly one snapshot base path
-            """
             from pathlib import Path
-            
-            # Extract train_dir from args or kwargs
-            # DLC typically calls: get_model_snapshots(snapshot_index, train_dir, pose_task=None)
+
             train_dir = None
             if args and len(args) >= 2:
-                train_dir = args[1]  # Second positional arg is usually train_dir
+                train_dir = args[1]
             elif "train_dir" in kwargs:
                 train_dir = kwargs["train_dir"]
             elif args and len(args) >= 1:
-                # Sometimes train_dir might be first arg
                 train_dir = args[0]
-            
+
             if train_dir is None:
-                # Fallback: try to find it from kwargs with different names
                 for key in ["train_dir", "train_path", "model_dir", "snapshot_dir"]:
                     if key in kwargs:
                         train_dir = kwargs[key]
                         break
-            
+
             if train_dir is None:
                 raise ValueError(
-                    f"Could not determine train_dir from args={args}, kwargs={kwargs}. "
-                    "Mock get_model_snapshots needs train_dir to create snapshot files."
+                    f"Could not determine train_dir from args={args}, kwargs={kwargs}."
                 )
-            
+
             train_dir = Path(train_dir)
             train_dir.mkdir(parents=True, exist_ok=True)
-            
-            logger.info(f"[MOCK get_model_snapshots] train_dir={train_dir}, args={args}, kwargs={kwargs}")
+
+            logger.info(
+                f"[MOCK get_model_snapshots] train_dir={train_dir}, args={args}, kwargs={kwargs}"
+            )
 
             base_name = "snapshot-1000"
-            # Create minimal dummy files DLC expects
             for ext in [".index", ".meta", ".data-00000-of-00001"]:
                 f = train_dir / f"{base_name}{ext}"
                 if not f.exists():
                     f.touch()
                     logger.info(f"[MOCK get_model_snapshots] Created: {f}")
-            
-            # For PyTorch, create a minimal valid .pth checkpoint file
+
             snapshot_pth = train_dir / f"{base_name}.pth"
             if not snapshot_pth.exists():
                 try:
                     import torch
-                    # Create a minimal PyTorch checkpoint dict
-                    # DLC expects "model" key for loading state_dict
+
                     mock_checkpoint = {
                         "epoch": 0,
-                        "state_dict": {},  # Empty state dict is fine for mock
-                        "model": {},  # DLC expects this key for model.load_state_dict(snapshot["model"])
+                        "state_dict": {},
+                        "model": {},
                         "optimizer": None,
                     }
                     torch.save(mock_checkpoint, snapshot_pth)
                     logger.info(f"Created PyTorch snapshot: {snapshot_pth}")
                 except ImportError:
-                    logger.warning("PyTorch not available, creating minimal .pth file")
-                    # Fallback: create empty file with minimal zip header
+                    logger.warning(
+                        "PyTorch not available, creating minimal .pth file"
+                    )
                     snapshot_pth.write_bytes(b"PK\x03\x04")
                 except Exception as e:
-                    logger.warning(f"Could not create PyTorch snapshot with torch.save: {e}")
-                    # Fallback: create empty file with minimal zip header
+                    logger.warning(
+                        f"Could not create PyTorch snapshot with torch.save: {e}"
+                    )
                     snapshot_pth.write_bytes(b"PK\x03\x04")
 
-            # DLC's original function returns a list of snapshot objects with a .path attribute
-            # Create a simple object that mimics DLC's snapshot structure
             class MockSnapshot:
                 def __init__(self, path):
-                    # Store as Path object, but ensure it can be used as string when needed
-                    self.path = Path(path) if not isinstance(path, Path) else path
-                    # Also store as string for compatibility
+                    self.path = Path(path)
                     self.path_str = str(self.path)
-                
+
                 def __fspath__(self):
-                    """Implement os.PathLike protocol so Path(MockSnapshot) works."""
                     return str(self.path)
-                
+
                 def __str__(self):
-                    """String representation returns the path."""
                     return str(self.path)
-                
+
                 def __repr__(self):
-                    """Representation for debugging."""
                     return f"MockSnapshot({self.path!r})"
-            
-            # DLC's torch.load expects the file to exist at the exact path
-            # The error shows DLC is looking for 'snapshot-1000' (no extension)
-            # So we need to ensure the file exists at that exact path
-            snapshot_path_pth = train_dir / f"{base_name}.pth"
+
             snapshot_path_no_ext = train_dir / base_name
-            
-            # Ensure the .pth file exists (it should have been created above)
-            if not snapshot_path_pth.exists():
-                logger.warning(f"snapshot-1000.pth not found at {snapshot_path_pth}, creating it now")
-                try:
-                    import torch
-                    # DLC expects "model" key for loading state_dict
-                    mock_checkpoint = {
-                        "epoch": 0,
-                        "state_dict": {},
-                        "model": {},  # DLC expects this key for model.load_state_dict(snapshot["model"])
-                        "optimizer": None,
-                    }
-                    torch.save(mock_checkpoint, snapshot_path_pth)
-                except Exception as e:
-                    logger.warning(f"Could not create {snapshot_path_pth}: {e}")
-                    # Create minimal file as fallback
-                    snapshot_path_pth.write_bytes(b"PK\x03\x04")
-            
-            # CRITICAL: DLC's torch.load is looking for 'snapshot-1000' (no extension)
-            # Create a symlink or copy so the file exists at both paths
+
             if not snapshot_path_no_ext.exists():
+                import shutil
+
                 try:
-                    # Try creating a symlink first (more efficient)
-                    snapshot_path_no_ext.symlink_to(snapshot_path_pth)
-                    logger.info(f"Created symlink: {snapshot_path_no_ext} -> {snapshot_path_pth}")
+                    snapshot_path_no_ext.symlink_to(snapshot_pth)
+                    logger.info(
+                        f"Created symlink: {snapshot_path_no_ext} -> {snapshot_pth}"
+                    )
                 except (OSError, NotImplementedError):
-                    # If symlinks don't work (e.g., on Windows), copy the file
-                    import shutil
-                    shutil.copy2(snapshot_path_pth, snapshot_path_no_ext)
-                    logger.info(f"Copied file: {snapshot_path_pth} -> {snapshot_path_no_ext}")
-            
-            # Return the path WITHOUT extension (as DLC expects it)
-            # DLC will use this path directly in torch.load()
+                    shutil.copy2(snapshot_pth, snapshot_path_no_ext)
+                    logger.info(
+                        f"Copied file: {snapshot_pth} -> {snapshot_path_no_ext}"
+                    )
+
             return [MockSnapshot(snapshot_path_no_ext)]
 
-        # Patch load_state_dict to use strict=False for mock checkpoints
-        # This allows loading empty state dicts without errors (smoke test)
-        # Also patch dlc_reader validation to be lenient for smoke tests
         try:
             import torch.nn as nn
-            original_load_state_dict = nn.Module.load_state_dict
-            
-            def mock_load_state_dict(self, state_dict, strict=True, *args, **kwargs):
-                """Mock load_state_dict that always uses strict=False for smoke test."""
-                # Always use strict=False to allow loading empty/mock state dicts
-                return original_load_state_dict(self, state_dict, strict=False, *args, **kwargs)
-            
-            # Patch dlc_reader validation to be lenient for smoke tests
-            # The assertion in dlc_reader.PoseEstimation.pkl checks metadata consistency
-            # We'll wrap the property to catch AssertionError and return minimal data
             from element_deeplabcut.readers import dlc_reader
-            
-            # Get the underlying function from the property before we replace it
+
+            original_load_state_dict = nn.Module.load_state_dict
             original_pkl_property = dlc_reader.PoseEstimation.pkl
             original_pkl_fget = original_pkl_property.fget
-            
+
+            def mock_load_state_dict(self, state_dict, strict=True, *args, **kwargs):
+                return original_load_state_dict(
+                    self, state_dict, strict=False, *args, **kwargs
+                )
+
             def lenient_pkl_wrapper(self):
-                """Wrapper that catches AssertionError from metadata validation."""
                 try:
-                    # Call the original property's getter function directly
                     return original_pkl_fget(self)
                 except AssertionError as e:
                     if "Inconsistent DLC-model-config file used" in str(e):
                         logger.warning(
-                            f"Smoke test: Metadata validation failed (expected for mock models): {e}. "
+                            "Smoke test: Metadata validation failed (expected for mock models). "
                             "Returning minimal pkl structure."
                         )
-                        # Return minimal structure that won't break downstream code
-                        # Scorer must:
-                        # 1. End with a number (e.g., "_1000") because code does: int(self.pkl["Scorer"].split("_")[-1])
-                        # 2. Contain "shuffle" followed by a number (e.g., "shuffle1") because code does:
-                        #    re.search(r"shuffle(\d+)", self.pkl["Scorer"]).groups()[0]
                         return {
                             "nframes": 0,
-                            "Scorer": "DLC_mock_scorer_shuffle1_1000",  # Contains shuffle1 and ends with number
+                            "Scorer": "DLC_mock_scorer_shuffle1_1000",
                             "Task": "mock_task",
                             "date": "2024-01-01",
                             "iteration (active-learning)": 0,
@@ -1591,55 +1847,216 @@ def lenient_pkl_wrapper(self):
                         }
                     else:
                         raise
-            
-            # Replace the property with our wrapper
+
             dlc_reader.PoseEstimation.pkl = property(lenient_pkl_wrapper)
-            
-            # Patch both get_model_snapshots and load_state_dict
-            try:
-                with patch(
-                    "deeplabcut.pose_estimation_pytorch.apis.utils.get_model_snapshots",
-                    side_effect=_mock_get_model_snapshots,
-                ), patch.object(
-                    nn.Module,
-                    "load_state_dict",
-                    mock_load_state_dict,
-                ):
+
+            with patch(
+                "deeplabcut.pose_estimation_pytorch.apis.utils.get_model_snapshots",
+                side_effect=_mock_get_model_snapshots,
+            ), patch.object(nn.Module, "load_state_dict", mock_load_state_dict):
+                # Store original make method for potential restoration
+                PoseEst = pipeline.model.PoseEstimation
+                original_pe_make = PoseEst.make
+                
+                # Define mock pose estimation make function
+                def mock_pose_make(self, key):
+                    """Mock PoseEstimation.make: skip DLC, directly insert fake results."""
+                    import numpy as np
+                    import datajoint as dj
+                    
+                    # Get body parts from model config if available
+                    try:
+                        model_key = {**key, "model_name": key.get("model_name", model_name)}
+                        model_data = (pipeline.model.Model & model_key).fetch1()
+                        config_template = model_data.get("config_template", {})
+                        body_parts = config_template.get("bodyparts", ["nose", "tailbase", "head"])
+                    except Exception:
+                        # Fallback to default body parts
+                        body_parts = ["nose", "tailbase", "head"]
+                    
+                    # Get video info to determine frame count
+                    try:
+                        from element_interface.utils import find_full_path
+                        from element_deeplabcut.model import get_dlc_root_data_dir
+                        
+                        rec_key = {k: v for k, v in key.items() if k in ["device", "recording_id"]}
+                        video_files = (pipeline.model.VideoRecording.File & rec_key).fetch("file_path")
+                        if video_files:
+                            # Try to get frame count from first video
+                            try:
+                                import cv2
+                                video_path = find_full_path(get_dlc_root_data_dir(), video_files[0])
+                                cap = cv2.VideoCapture(str(video_path))
+                                n_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+                                cap.release()
+                                if n_frames == 0:
+                                    n_frames = 100  # Fallback
+                            except Exception:
+                                n_frames = 100  # Fallback
+                        else:
+                            n_frames = 100  # Fallback
+                    except Exception:
+                        n_frames = 100  # Fallback
+                    
+                    logger.info(
+                        f"Mock PoseEstimation.make: inserting fake results for {len(body_parts)} body parts, "
+                        f"{n_frames} frames"
+                    )
+                    
+                    # Insert master row
+                    self.insert1({**key, "pose_estimation_time": dj.now()})
+                    
+                    # Insert fake body part positions
+                    for bp in body_parts:
+                        x = np.random.uniform(0, 640, size=n_frames)
+                        y = np.random.uniform(0, 480, size=n_frames)
+                        likelihood = np.random.uniform(0.8, 1.0, size=n_frames)
+                        
+                        pipeline.model.PoseEstimation.BodyPartPosition.insert1(
+                            {
+                                **key,
+                                "body_part": bp,
+                                "x_pos": x,
+                                "y_pos": y,
+                                "likelihood": likelihood,
+                            }
+                        )
+                
+                # Try normal populate first
+                try:
                     pipeline.model.PoseEstimation.populate()
                     status.sub("Inference completed!", icon="✅", indent=3)
-            finally:
-                # Restore original pkl property
-                dlc_reader.PoseEstimation.pkl = original_pkl_property
+                except Exception as populate_err:
+                    # If populate fails and mock-results-on-failure is enabled, use mock
+                    if args.mock_results_on_failure:
+                        error_msg = str(populate_err)
+                        if (
+                            "need at least one array to stack" in error_msg
+                            or "Shape of passed values is" in error_msg
+                            or "No DLC output file" in error_msg
+                            or "No animals detected" in error_msg.lower()
+                        ):
+                            status.sub(
+                                "Inference failed (no animals detected or empty results). "
+                                "Inserting mock results instead.",
+                                icon="⚠️",
+                                indent=3,
+                            )
+                            # Temporarily replace make method with mock
+                            PoseEst.make = mock_pose_make
+                            try:
+                                # Populate with mock results for each recording
+                                for rec_key in recording_keys:
+                                    task_key = {**rec_key, "model_name": model_name}
+                                    # Check if results already exist
+                                    if len(PoseEst & task_key) == 0:
+                                        try:
+                                            mock_pose_make(PoseEst, task_key)
+                                        except Exception as mock_err:
+                                            logger.warning(
+                                                f"Failed to insert mock results for {task_key}: {mock_err}"
+                                            )
+                                status.sub("Mock results inserted!", icon="✅", indent=3)
+                            finally:
+                                # Restore original make method
+                                PoseEst.make = original_pe_make
+                        else:
+                            # Different error, re-raise
+                            raise
+                    else:
+                        # Mock not enabled, re-raise original error
+                        raise
+
+            dlc_reader.PoseEstimation.pkl = original_pkl_property
+
         except Exception as e:
             status.sub(f"Error during inference: {e}", icon="❌", indent=3)
             raise
-        
+
         # 11. Show results
         status.step("Results")
         for rec_key in recording_keys:
             status.sub(f"Recording {rec_key['recording_id']}:", icon="📹", indent=2)
             try:
-                pose_estimation = (
+                # Check if pose estimation results exist
+                pose_estimation_query = (
                     pipeline.model.PoseEstimation
                     & rec_key
                     & {"model_name": model_name}
-                ).fetch1()
+                )
                 
-                status.sub(f"Completed at: {pose_estimation['pose_estimation_time']}", icon="✅", indent=4)
+                if len(pose_estimation_query) == 0:
+                    status.sub(
+                        "No pose estimation results found.",
+                        icon="⚠️",
+                        indent=4,
+                    )
+                    status.sub(
+                        "This may indicate that:",
+                        indent=5,
+                    )
+                    status.sub(
+                        "1) No animals were detected in the video",
+                        indent=6,
+                    )
+                    status.sub(
+                        "2) Inference failed or was skipped",
+                        indent=6,
+                    )
+                    status.sub(
+                        "3) Results are still being processed",
+                        indent=6,
+                    )
+                    # Check if output directory exists and has files
+                    try:
+                        task_key = {**rec_key, "model_name": model_name}
+                        output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
+                            task_key, relative=False, mkdir=False
+                        )
+                        output_path = Path(output_dir)
+                        if output_path.exists():
+                            result_files = list(output_path.rglob("*.h5")) + list(output_path.rglob("*.pickle"))
+                            if result_files:
+                                status.sub(
+                                    f"Found {len(result_files)} result file(s) in {output_dir}",
+                                    icon="ℹ️",
+                                    indent=5,
+                                )
+                                status.sub(
+                                    "Results may not have been inserted into database yet.",
+                                    indent=5,
+                                )
+                            else:
+                                status.sub(
+                                    f"No result files found in {output_dir}",
+                                    icon="ℹ️",
+                                    indent=5,
+                                )
+                    except Exception as check_err:
+                        logger.debug(f"Could not check output directory: {check_err}")
+                    continue
                 
+                pose_estimation = pose_estimation_query.fetch1()
+
+                status.sub(
+                    f"Completed at: {pose_estimation['pose_estimation_time']}",
+                    icon="✅",
+                    indent=4,
+                )
+
                 body_parts = (
                     pipeline.model.PoseEstimation.BodyPartPosition
                     & rec_key
                     & {"model_name": model_name}
                 ).fetch("body_part")
-                
+
                 unique_bp = sorted(set(body_parts))
                 status.sub(
                     f"Detected body parts ({len(unique_bp)}): {unique_bp}",
                     icon="📊",
                     indent=4,
                 )
-                
+
                 if unique_bp:
                     bp = unique_bp[0]
                     bp_data = (
@@ -1647,27 +2064,47 @@ def lenient_pkl_wrapper(self):
                         & rec_key
                         & {"model_name": model_name, "body_part": bp}
                     ).fetch1()
-                    
+
                     x_pos = bp_data["x_pos"]
                     y_pos = bp_data["y_pos"]
                     likelihood = bp_data["likelihood"]
-                    
+
                     status.sub(
                         f"Example ({bp}): {len(x_pos)} frames, avg likelihood: {likelihood.mean():.3f}",
                         icon="📈",
                         indent=4,
                     )
             except Exception as e:
-                status.sub(f"No results yet or error: {e}", icon="⚠️", indent=4)
-    
+                error_msg = str(e)
+                if "fetch1 requires exactly one tuple" in error_msg:
+                    status.sub(
+                        "No pose estimation results found in database.",
+                        icon="⚠️",
+                        indent=4,
+                    )
+                    status.sub(
+                        "This likely means no animals were detected or inference was skipped.",
+                        icon="ℹ️",
+                        indent=5,
+                    )
+                else:
+                    status.sub(f"Error fetching results: {e}", icon="❌", indent=4)
+
     status.header("Test completed!")
     status.sub("Next steps:", indent=2)
     if not args.skip_training:
         status.sub("- Check training results in DLC project directory", indent=4)
     if not args.skip_inference:
-        status.sub("- Check output directory for DLC inference results", indent=4)
-        status.sub("- Visualize results using DLC's plotting functions", indent=4)
-        status.sub("- Query PoseEstimation.BodyPartPosition for analysis", indent=4)
+        status.sub(
+            "- Check output directory for DLC inference results", indent=4
+        )
+        status.sub(
+            "- Visualize results using DLC's plotting functions", indent=4
+        )
+        status.sub(
+            "- Query PoseEstimation.BodyPartPosition for analysis", indent=4
+        )
+
 
 if __name__ == "__main__":
     main()
diff --git a/test_video_inference.py b/test_video_inference.py
index fa2cb55..7d673d5 100755
--- a/test_video_inference.py
+++ b/test_video_inference.py
@@ -48,18 +48,20 @@
 # Set up logging
 logging.basicConfig(
     level=logging.INFO,
-    format='%(message)s',
-    handlers=[logging.StreamHandler(sys.stdout)]
+    format="%(message)s",
+    handlers=[logging.StreamHandler(sys.stdout)],
 )
 logger = logging.getLogger(__name__)
 
+
 # Simple status printer for user-facing messages
 class StatusPrinter:
     """Simple status printer for step-by-step progress."""
-    def __init__(self, total_steps=7):
+
+    def __init__(self, total_steps=8):
         self.total_steps = total_steps
         self.current_step = 0
-    
+
     def step(self, message, status="info"):
         """Print a step message with status indicator."""
         self.current_step += 1
@@ -68,22 +70,23 @@ def step(self, message, status="info"):
             "success": "✅",
             "warning": "⚠️",
             "error": "❌",
-            "skip": "⏭️"
+            "skip": "⏭️",
         }
         icon = icons.get(status, "•")
         print(f"\n[{self.current_step}/{self.total_steps}] {icon} {message}")
-    
+
     def sub(self, message, indent=3, icon=""):
         """Print a sub-message with indentation."""
         prefix = f"{icon} " if icon else ""
         print(" " * indent + prefix + message)
-    
+
     def header(self, title):
         """Print a section header."""
         print("\n" + "=" * 60)
         print(title)
         print("=" * 60)
 
+
 # Configure database connection
 if Path("./dj_local_conf.json").exists():
     dj.config.load("./dj_local_conf.json")
@@ -93,22 +96,29 @@ def header(self, title):
     logger.info("   Set DJ_HOST, DJ_USER, DJ_PASS environment variables if needed")
 
 # Update config from environment variables
-dj.config.update({
-    "safemode": False,
-    "database.host": os.environ.get("DJ_HOST") or dj.config.get("database.host", "localhost"),
-    "database.user": os.environ.get("DJ_USER") or dj.config.get("database.user", "root"),
-    "database.password": os.environ.get("DJ_PASS") or dj.config.get("database.password", ""),
-})
+dj.config.update(
+    {
+        "safemode": False,
+        "database.host": os.environ.get("DJ_HOST")
+        or dj.config.get("database.host", "localhost"),
+        "database.user": os.environ.get("DJ_USER")
+        or dj.config.get("database.user", "root"),
+        "database.password": os.environ.get("DJ_PASS")
+        or dj.config.get("database.password", ""),
+    }
+)
 
 # Set database prefix for tests
 if "custom" not in dj.config:
     dj.config["custom"] = {}
-dj.config["custom"]["database.prefix"] = os.environ.get("DATABASE_PREFIX", dj.config["custom"].get("database.prefix", "test_"))
+dj.config["custom"]["database.prefix"] = os.environ.get(
+    "DATABASE_PREFIX", dj.config["custom"].get("database.prefix", "test_")
+)
 
-# Set DLC root data directory if not already set
-# In Docker, prefer /app/test_videos (from project mount), otherwise /app/data
-# Check for Docker: /.dockerenv exists OR we're in /app directory (Docker working dir)
-is_docker = os.path.exists("/.dockerenv") or (os.getcwd() == "/app" and os.path.exists("/app"))
+# Detect docker & set DLC root data directory
+is_docker = os.path.exists("/.dockerenv") or (
+    os.getcwd() == "/app" and os.path.exists("/app")
+)
 if is_docker:
     # Prefer /app/test_videos (from project mount .:/app) since videos are in ./test_videos
     test_videos_path = Path("/app/test_videos")
@@ -118,8 +128,11 @@ def header(self, title):
         default_video_dir = "/app/data"
 else:
     default_video_dir = "./test_videos"
+
 video_dir = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir))
-if "dlc_root_data_dir" not in dj.config.get("custom", {}) or not dj.config["custom"].get("dlc_root_data_dir"):
+if "dlc_root_data_dir" not in dj.config.get("custom", {}) or not dj.config[
+    "custom"
+].get("dlc_root_data_dir"):
     dj.config["custom"]["dlc_root_data_dir"] = str(video_dir.absolute())
     logger.info(f"📁 Set DLC_ROOT_DATA_DIR to: {video_dir.absolute()}")
     if is_docker:
@@ -136,148 +149,169 @@ def header(self, title):
 from element_deeplabcut import model
 from tests import tutorial_pipeline as pipeline
 
+
 def check_database_connection():
     """Verify database connection is working."""
     try:
-        # Try to connect by activating a schema
-        test_schema = dj.schema("test_connection_check", create_schema=True, create_tables=False)
-        test_schema.drop()
+        # Just ensure we can connect; no schema creation.
+        dj.conn()
         return True
     except Exception as e:
         logger.error(f"\n❌ Database connection failed: {e}")
         logger.error("\nPlease configure your database:")
         logger.error("  1. Create dj_local_conf.json with database credentials")
         logger.error("  2. Or set environment variables: DJ_HOST, DJ_USER, DJ_PASS")
-        logger.error("  3. Or ensure database is running (docker compose -f docker-compose-db.yaml up -d)")
+        logger.error(
+            "  3. Or ensure database is running (docker compose -f docker-compose-db.yaml up -d)"
+        )
         return False
 
+
 def main():
     status = StatusPrinter(total_steps=8)
     status.header("Testing Pretrained Model Inference with Video")
-    
+
     # 0. Check database connection
     status.step("Checking database connection")
     if not check_database_connection():
         return  # Exit gracefully
     status.sub("Database connection successful", indent=3)
-    
+
     # 0.5. Clean up database (remove test data from previous runs)
     status.step("Cleaning up database (removing test data from previous runs)")
     cleanup_count = 0
-    
+
     # Delete PoseEstimation entries (and their parts)
-    pose_estimation_query = pipeline.model.PoseEstimation
-    if pose_estimation_query:
-        keys = pose_estimation_query.fetch("KEY")
-        count = len(keys) if keys else 0
-        if count > 0:
-            pose_estimation_query.delete()
-            cleanup_count += count
-            status.sub(f"Deleted {count} PoseEstimation entry/entries", icon="🗑️", indent=3)
-    
+    pose_estimation_rel = pipeline.model.PoseEstimation
+    pose_keys = pose_estimation_rel.fetch("KEY")
+    pose_count = len(pose_keys)
+    if pose_count > 0:
+        pose_estimation_rel.delete()
+        cleanup_count += pose_count
+        status.sub(
+            f"Deleted {pose_count} PoseEstimation entry/entries", icon="🗑️", indent=3
+        )
+
     # Delete PoseEstimationTask entries
-    task_query = pipeline.model.PoseEstimationTask
-    if task_query:
-        keys = task_query.fetch("KEY")
-        count = len(keys) if keys else 0
-        if count > 0:
-            task_query.delete()
-            cleanup_count += count
-            status.sub(f"Deleted {count} PoseEstimationTask entry/entries", icon="🗑️", indent=3)
-    
+    task_rel = pipeline.model.PoseEstimationTask
+    task_keys = task_rel.fetch("KEY")
+    task_count = len(task_keys)
+    if task_count > 0:
+        task_rel.delete()
+        cleanup_count += task_count
+        status.sub(
+            f"Deleted {task_count} PoseEstimationTask entry/entries",
+            icon="🗑️",
+            indent=3,
+        )
+
     # Delete test models (models with names starting with "test_")
-    test_models = model.Model & "model_name LIKE 'test_%'"
-    if test_models:
-        keys = test_models.fetch("KEY")
-        count = len(keys) if keys else 0
-        if count > 0:
-            test_models.delete()
-            cleanup_count += count
-            status.sub(f"Deleted {count} test model(s)", icon="🗑️", indent=3)
-    
+    test_models_rel = model.Model & "model_name LIKE 'test_%'"
+    test_model_keys = test_models_rel.fetch("KEY")
+    test_model_count = len(test_model_keys)
+    if test_model_count > 0:
+        test_models_rel.delete()
+        cleanup_count += test_model_count
+        status.sub(f"Deleted {test_model_count} test model(s)", icon="🗑️", indent=3)
+
     # Delete test recordings (optional - comment out if you want to keep recordings)
-    # Uncomment if you want to clean recordings too:
-    # if pipeline.model.VideoRecording & {"subject": "test1"}:
-    #     count = len(pipeline.model.VideoRecording & {"subject": "test1"})
+    # Example (fixed pattern):
+    # n_test_recordings = len(pipeline.model.VideoRecording & {"subject": "test1"})
+    # if n_test_recordings:
     #     (pipeline.model.VideoRecording & {"subject": "test1"}).delete()
-    #     cleanup_count += count
-    #     if count > 0:
-    #         status.sub(f"Deleted {count} test recording(s)", icon="🗑️", indent=3)
-    
+    #     cleanup_count += n_test_recordings
+    #     status.sub(f"Deleted {n_test_recordings} test recording(s)", icon="🗑️", indent=3)
+
     if cleanup_count > 0:
         status.sub(f"Total: {cleanup_count} entry/entries cleaned", icon="✅", indent=3)
     else:
         status.sub("No test data found to clean", icon="ℹ️", indent=3)
-    
+
     # 1. Find video files
     status.step("Finding video files")
     # Use same Docker detection logic as at the top
-    is_docker = os.path.exists("/.dockerenv") or (os.getcwd() == "/app" and os.path.exists("/app"))
-    
+    is_docker_local = os.path.exists("/.dockerenv") or (
+        os.getcwd() == "/app" and os.path.exists("/app")
+    )
+
     # In Docker, prefer /app/test_videos (from project mount .:/app) since videos are in ./test_videos
-    if is_docker:
-        # Check /app/test_videos first (from project mount)
+    if is_docker_local:
         test_videos_path = Path("/app/test_videos")
         if test_videos_path.exists():
-            default_video_dir = "/app/test_videos"
+            default_video_dir_local = "/app/test_videos"
         else:
-            default_video_dir = "/app/data"
+            default_video_dir_local = "/app/data"
     else:
-        default_video_dir = "./test_videos"
-    
-    video_dir = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir))
-    
-    if not video_dir.exists():
-        status.sub(f"Video directory not found: {video_dir}", indent=3)
-        if is_docker:
+        default_video_dir_local = "./test_videos"
+
+    video_dir_local = Path(os.getenv("DLC_ROOT_DATA_DIR", default_video_dir_local))
+
+    if not video_dir_local.exists():
+        status.sub(f"Video directory not found: {video_dir_local}", indent=3)
+        if is_docker_local:
             status.sub("In Docker: Videos should be in ./test_videos/ on host", indent=3)
             status.sub("(available at /app/test_videos via project mount)", indent=5)
         return  # Exit gracefully
-    
-    video_files = list(video_dir.glob("*.mp4")) + list(video_dir.glob("*.avi")) + list(video_dir.glob("*.mov"))
+
+    video_files = list(video_dir_local.glob("*.mp4")) + list(
+        video_dir_local.glob("*.avi")
+    ) + list(video_dir_local.glob("*.mov"))
+
     if not video_files:
-        status.sub(f"No video files found in {video_dir}", indent=3)
+        status.sub(f"No video files found in {video_dir_local}", indent=3)
         status.sub("Supported formats: .mp4, .avi, .mov", indent=3)
-        if is_docker:
+        if is_docker_local:
             status.sub("In Docker: Videos should be in ./test_videos/ on host", indent=3)
             status.sub("(available at /app/test_videos in container)", indent=5)
         return  # Exit gracefully
-    
+
     status.sub(f"Found {len(video_files)} video file(s):", indent=3)
     for vf in video_files:
         status.sub(f"- {vf.name}", indent=5)
-    
+
     # 2. Register pretrained model
     # Get model name from command line or use default
-    pretrained_model_name = getattr(main, 'pretrained_model_name', 'superanimal_quadruped')
-    
+    pretrained_model_name = getattr(main, "pretrained_model_name", "superanimal_quadruped")
+
     status.step(f"Registering pretrained model: {pretrained_model_name}")
     model.PretrainedModel.populate_common_models([pretrained_model_name])
     status.sub(f"Registered: {pretrained_model_name}", icon="✅")
-    
+
     # 3. Insert pretrained model instance
     status.step("Inserting pretrained model instance")
     # Use a model name that includes the pretrained model name for clarity
     model_name = f"test_video_inference_{pretrained_model_name.replace('superanimal_', '')}"
-    
+
     # Check if model already exists and verify it's a pretrained model
-    if model.Model & {"model_name": model_name}:
+    if len(model.Model & {"model_name": model_name}):
         existing_model = (model.Model & {"model_name": model_name}).fetch1()
         config_template = existing_model.get("config_template", {})
         is_pretrained = config_template.get("_pretrained_model_name") is not None
-        
+
         if is_pretrained:
             existing_pretrained_name = config_template.get("_pretrained_model_name")
             if existing_pretrained_name == pretrained_model_name:
-                status.sub(f"Model '{model_name}' already exists (pretrained: {pretrained_model_name}), skipping insertion", icon="✅")
+                status.sub(
+                    f"Model '{model_name}' already exists (pretrained: {pretrained_model_name}), skipping insertion",
+                    icon="✅",
+                )
             else:
-                status.sub(f"Model '{model_name}' exists but uses different pretrained model: {existing_pretrained_name}", icon="⚠️")
+                status.sub(
+                    f"Model '{model_name}' exists but uses different pretrained model: {existing_pretrained_name}",
+                    icon="⚠️",
+                )
                 status.sub(f"Expected: {pretrained_model_name}", indent=5)
-                status.sub("Deleting existing model and tasks, creating new one...", indent=5)
+                status.sub(
+                    "Deleting existing model and tasks, creating new one...", indent=5
+                )
                 # Delete any existing tasks that reference this model
-                if pipeline.model.PoseEstimationTask & {"model_name": model_name}:
+                if len(pipeline.model.PoseEstimationTask & {"model_name": model_name}):
                     (pipeline.model.PoseEstimationTask & {"model_name": model_name}).delete()
-                    status.sub("Deleted existing PoseEstimationTask entries", icon="✅", indent=7)
+                    status.sub(
+                        "Deleted existing PoseEstimationTask entries",
+                        icon="✅",
+                        indent=7,
+                    )
                 # Delete the model
                 (model.Model & {"model_name": model_name}).delete()
                 # Insert the correct pretrained model
@@ -289,12 +323,22 @@ def main():
                 )
                 status.sub(f"Re-inserted model: {model_name}", icon="✅")
         else:
-            status.sub(f"Model '{model_name}' exists but is a TRAINED model, not pretrained", icon="⚠️")
-            status.sub("This script requires a PRETRAINED model. Deleting existing model and tasks...", indent=5)
+            status.sub(
+                f"Model '{model_name}' exists but is a TRAINED model, not pretrained",
+                icon="⚠️",
+            )
+            status.sub(
+                "This script requires a PRETRAINED model. Deleting existing model and tasks...",
+                indent=5,
+            )
             # Delete any existing tasks that reference this model
-            if pipeline.model.PoseEstimationTask & {"model_name": model_name}:
+            if len(pipeline.model.PoseEstimationTask & {"model_name": model_name}):
                 (pipeline.model.PoseEstimationTask & {"model_name": model_name}).delete()
-                status.sub("Deleted existing PoseEstimationTask entries", icon="✅", indent=7)
+                status.sub(
+                    "Deleted existing PoseEstimationTask entries",
+                    icon="✅",
+                    indent=7,
+                )
             # Delete the model
             (model.Model & {"model_name": model_name}).delete()
             # Insert the correct pretrained model
@@ -316,9 +360,12 @@ def main():
             status.sub(f"Inserted model: {model_name}", icon="✅")
         except dj.errors.DuplicateError as e:
             # If duplicate error occurs (e.g., same unique index), skip insertion
-            status.sub(f"Model with similar configuration already exists, skipping insertion", icon="⚠️")
+            status.sub(
+                "Model with similar configuration already exists, skipping insertion",
+                icon="⚠️",
+            )
             status.sub(f"Error: {str(e)[:100]}...", indent=5)
-    
+
     # 4. Setup test data (subject, session, recordings)
     status.step("Setting up test data")
     # Use shorter subject name (element-animal Subject table has limited varchar length)
@@ -326,19 +373,25 @@ def main():
         "subject": "test1",
         "session_datetime": "2024-01-01 12:00:00",
     }
-    
-    pipeline.subject.Subject.insert1({
-        "subject": "test1",  # Short name to fit database column
-        "sex": "F",
-        "subject_birth_date": "2020-01-01",
-        "subject_description": "Test subject for video inference",
-    }, skip_duplicates=True)
-    
-    pipeline.session.Session.insert1({
-        "subject": "test1",
-        "session_datetime": "2024-01-01 12:00:00",
-    }, skip_duplicates=True)
-    
+
+    pipeline.subject.Subject.insert1(
+        {
+            "subject": "test1",  # Short name to fit database column
+            "sex": "F",
+            "subject_birth_date": "2020-01-01",
+            "subject_description": "Test subject for video inference",
+        },
+        skip_duplicates=True,
+    )
+
+    pipeline.session.Session.insert1(
+        {
+            "subject": "test1",
+            "session_datetime": "2024-01-01 12:00:00",
+        },
+        skip_duplicates=True,
+    )
+
     # Create a separate recording for each video file
     recording_keys = []
     for idx, video_file in enumerate(video_files):
@@ -347,32 +400,108 @@ def main():
             "recording_id": idx + 1,  # Start from 1
         }
         recording_keys.append(recording_key)
-        
-        # Insert recording
-        pipeline.model.VideoRecording.insert1(
-            {**recording_key, "device": "Camera1"}, skip_duplicates=True
-        )
-        
-        # Insert single video file for this recording
+
+        # Insert or update recording and file entry
         # Store file path relative to root directory
         video_file_abs = Path(video_file).resolve()
-        dlc_root_dir_abs = Path(dj.config["custom"].get("dlc_root_data_dir", str(video_dir.absolute()))).resolve()
-        
+        dlc_root_dir_abs = Path(
+            dj.config["custom"].get("dlc_root_data_dir", str(video_dir_local.absolute()))
+        ).resolve()
+
         try:
             relative_path = video_file_abs.relative_to(dlc_root_dir_abs)
         except ValueError:
             # If video_file is not under dlc_root_dir, use just the filename
             # This handles the case where videos are in the root directory itself
             relative_path = Path(video_file.name)
-        
-        pipeline.model.VideoRecording.File.insert1(
-            {**recording_key, "file_id": 0, "file_path": str(relative_path)},
-            skip_duplicates=True,
-        )
-        status.sub(f"Created recording {recording_key['recording_id']} for {video_file.name}", icon="✅", indent=5)
-    
-    status.sub(f"Created {len(recording_keys)} separate recording(s)", icon="✅", indent=3)
-    
+
+        # Check if we need to update anything
+        existing_rec = pipeline.model.VideoRecording & recording_key
+        file_key = {**recording_key, "file_id": 0}
+        existing_file = pipeline.model.VideoRecording.File & file_key
+
+        needs_update = False
+        update_reason = []
+
+        if len(existing_rec):
+            existing_device = existing_rec.fetch1("device")
+            if existing_device != "Camera1":
+                needs_update = True
+                update_reason.append("device changed")
+        else:
+            needs_update = True
+            update_reason.append("recording doesn't exist")
+
+        if len(existing_file):
+            existing_path = existing_file.fetch1("file_path")
+            if existing_path != str(relative_path):
+                needs_update = True
+                update_reason.append("file path changed")
+        else:
+            needs_update = True
+            update_reason.append("file entry doesn't exist")
+
+        if needs_update:
+            # Get all file entries first (if they exist) to preserve them
+            all_files = []
+            if len(existing_rec):
+                # Fetch all file entries for this recording
+                file_keys = (
+                    pipeline.model.VideoRecording.File & recording_key
+                ).fetch("KEY", as_dict=True)
+                for fk in file_keys:
+                    file_data = (
+                        pipeline.model.VideoRecording.File & fk
+                    ).fetch1()
+                    all_files.append(file_data)
+                # Delete the master record (which cascades to all Part entries)
+                (pipeline.model.VideoRecording & recording_key).delete()
+
+            # Re-insert the master record
+            pipeline.model.VideoRecording.insert1({**recording_key, "device": "Camera1"})
+
+            # Re-insert all file entries with updated path
+            file_updated = False
+            for file_entry in all_files:
+                if file_entry["file_id"] == 0:
+                    # Update this file entry with new path
+                    pipeline.model.VideoRecording.File.insert1(
+                        {**recording_key, "file_id": 0, "file_path": str(relative_path)}
+                    )
+                    file_updated = True
+                else:
+                    # Re-insert other file entries as-is
+                    pipeline.model.VideoRecording.File.insert1(file_entry)
+
+            # If no file entry existed, insert it
+            if not file_updated:
+                pipeline.model.VideoRecording.File.insert1(
+                    {**file_key, "file_path": str(relative_path)}
+                )
+
+            if len(update_reason) > 0:
+                status.sub(
+                    f"Updated recording {recording_key['recording_id']} ({', '.join(update_reason)}): {video_file.name}",
+                    icon="🔄",
+                    indent=5,
+                )
+            else:
+                status.sub(
+                    f"Created recording {recording_key['recording_id']} for {video_file.name}",
+                    icon="✅",
+                    indent=5,
+                )
+        else:
+            status.sub(
+                f"Recording {recording_key['recording_id']} already exists with correct data: {video_file.name}",
+                icon="✅",
+                indent=5,
+            )
+
+    status.sub(
+        f"Created {len(recording_keys)} separate recording(s)", icon="✅", indent=3
+    )
+
     # 5. Extract video metadata
     status.step("Extracting video metadata")
     try:
@@ -384,17 +513,19 @@ def main():
                 f"Recording {rec_key['recording_id']}: {rec_info['px_width']}x{rec_info['px_height']}, "
                 f"{rec_info['nframes']} frames, {rec_info['fps']:.1f} fps",
                 icon="✅",
-                indent=5
+                indent=5,
             )
     except ModuleNotFoundError as e:
         if "cv2" in str(e):
             status.sub(f"Error: {e}", icon="❌", indent=3)
-            status.sub("OpenCV (cv2) is required for video metadata extraction.", indent=3)
+            status.sub(
+                "OpenCV (cv2) is required for video metadata extraction.", indent=3
+            )
             status.sub("Install it with: pip install opencv-python", indent=5)
             status.sub("Or: conda install -c conda-forge opencv", indent=5)
             return  # Exit gracefully
         raise
-    
+
     # 6. Clean up any tasks that might be using wrong models (from other test scripts)
     status.step("Cleaning up any conflicting tasks")
     for rec_key in recording_keys:
@@ -402,11 +533,17 @@ def main():
         all_tasks = (pipeline.model.PoseEstimationTask & rec_key).fetch("model_name")
         for task_model_name in set(all_tasks):
             if task_model_name != model_name:
-                status.sub(f"Found task with different model '{task_model_name}' for recording {rec_key['recording_id']}", icon="⚠️", indent=3)
-                status.sub(f"Deleting task (expected model: '{model_name}')...", indent=5)
+                status.sub(
+                    f"Found task with different model '{task_model_name}' for recording {rec_key['recording_id']}",
+                    icon="⚠️",
+                    indent=3,
+                )
+                status.sub(
+                    f"Deleting task (expected model: '{model_name}')...", indent=5
+                )
                 (pipeline.model.PoseEstimationTask & {**rec_key, "model_name": task_model_name}).delete()
                 status.sub("Task deleted", icon="✅", indent=7)
-    
+
     # 6. Create pose estimation tasks for each recording
     status.step("Creating pose estimation tasks")
     for rec_key in recording_keys:
@@ -415,7 +552,7 @@ def main():
         output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
             task_key, relative=False, mkdir=False
         )
-        
+
         # Check if results exist - look for H5 files directly
         results_exist = False
         output_path = Path(output_dir)
@@ -424,30 +561,45 @@ def main():
             h5_files = list(output_path.glob("*.h5"))
             pickle_files = list(output_path.glob("*.pickle"))
             json_files = list(output_path.glob("*.json"))
-            
+
             if h5_files or pickle_files or json_files:
                 results_exist = True
                 status.sub(
                     f"Results found for recording {rec_key['recording_id']} in: {output_dir.name} "
                     f"({len(h5_files)} H5, {len(pickle_files)} pickle, {len(json_files)} JSON)",
                     icon="✅",
-                    indent=5
+                    indent=5,
                 )
             else:
-                status.sub(f"No result files found for recording {rec_key['recording_id']} in: {output_dir.name}", icon="⚠️", indent=5)
+                status.sub(
+                    f"No result files found for recording {rec_key['recording_id']} in: {output_dir.name}",
+                    icon="⚠️",
+                    indent=5,
+                )
         else:
-            status.sub(f"Output directory doesn't exist for recording {rec_key['recording_id']}: {output_dir.name}", icon="⚠️", indent=5)
-        
+            status.sub(
+                f"Output directory doesn't exist for recording {rec_key['recording_id']}: {output_dir.name}",
+                icon="⚠️",
+                indent=5,
+            )
+
         # Generate task - it will auto-detect and set task_mode appropriately
         # Always use "load" mode if results exist - never re-run inference
-        # This prevents expensive re-computation when results already exist
         if results_exist:
             task_mode = "load"  # Use existing results - do NOT trigger inference
-            status.sub(f"Results exist for recording {rec_key['recording_id']} - setting task_mode='load'", icon="✅", indent=5)
+            status.sub(
+                f"Results exist for recording {rec_key['recording_id']} - setting task_mode='load'",
+                icon="✅",
+                indent=5,
+            )
         else:
             task_mode = None  # Auto-detect (will be "trigger" if no results)
-            status.sub(f"No results found for recording {rec_key['recording_id']} - will auto-detect task_mode", icon="ℹ️", indent=5)
-        
+            status.sub(
+                f"No results found for recording {rec_key['recording_id']} - will auto-detect task_mode",
+                icon="ℹ️",
+                indent=5,
+            )
+
         pipeline.model.PoseEstimationTask.generate(
             rec_key,
             model_name=model_name,
@@ -455,12 +607,22 @@ def main():
             analyze_videos_params={
                 "video_inference": {
                     "scale": 0.4,  # Adjust if needed (0.3-0.5 recommended)
-                    "batchsize": 8,  # Adjust based on GPU memory
+                    "batchsize": 8,  # Pose estimation batch size (adjust based on GPU memory)
+                    "detector_batch_size": getattr(main, "detector_batch_size", 4),
+                    "device": (
+                        f"cuda:{getattr(main, 'gpu', 0)}"
+                        if getattr(main, "gpu", 0) >= 0
+                        else "cpu"
+                    ),
                 }
             },
         )
-        status.sub(f"Task created for recording {rec_key['recording_id']}", icon="✅", indent=5)
-    
+        status.sub(
+            f"Task created for recording {rec_key['recording_id']}",
+            icon="✅",
+            indent=5,
+        )
+
     # 6.5. Update task modes if needed (in case results were created after task creation)
     status.step("Checking and updating task modes")
     for rec_key in recording_keys:
@@ -468,7 +630,7 @@ def main():
         output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
             task_key, relative=False, mkdir=False
         )
-        
+
         # Check if results exist
         output_path = Path(output_dir)
         results_exist = False
@@ -478,61 +640,82 @@ def main():
             json_files = list(output_path.glob("*.json"))
             if h5_files or pickle_files or json_files:
                 results_exist = True
-        
+
         # Check current task mode
         try:
             current_task = (pipeline.model.PoseEstimationTask & task_key).fetch1()
             current_mode = current_task.get("task_mode", "trigger")
-            
+
             # Update to "load" if results exist but task is in "trigger" mode
             if results_exist and current_mode == "trigger":
                 pipeline.model.PoseEstimationTask.update1(
                     {**task_key, "task_mode": "load"}
                 )
-                status.sub(f"Updated recording {rec_key['recording_id']} task_mode to 'load' (results exist)", icon="✅", indent=5)
+                status.sub(
+                    f"Updated recording {rec_key['recording_id']} task_mode to 'load' (results exist)",
+                    icon="✅",
+                    indent=5,
+                )
             elif not results_exist and current_mode == "load":
                 pipeline.model.PoseEstimationTask.update1(
                     {**task_key, "task_mode": "trigger"}
                 )
-                status.sub(f"Updated recording {rec_key['recording_id']} task_mode to 'trigger' (no results)", icon="⚠️", indent=5)
+                status.sub(
+                    f"Updated recording {rec_key['recording_id']} task_mode to 'trigger' (no results)",
+                    icon="⚠️",
+                    indent=5,
+                )
             else:
-                status.sub(f"Recording {rec_key['recording_id']} task_mode is '{current_mode}' (correct)", icon="ℹ️", indent=5)
+                status.sub(
+                    f"Recording {rec_key['recording_id']} task_mode is '{current_mode}' (correct)",
+                    icon="ℹ️",
+                    indent=5,
+                )
         except Exception as e:
-            status.sub(f"Could not check/update task for recording {rec_key['recording_id']}: {e}", icon="⚠️", indent=5)
-    
+            status.sub(
+                f"Could not check/update task for recording {rec_key['recording_id']}: {e}",
+                icon="⚠️",
+                indent=5,
+            )
+
     # 7. Run inference or load existing results
     status.step("Running inference or loading existing results")
-    
+
     # Check if DeepLabCut is available FIRST (before checking task modes)
     # This import might print "Loading DLC..." so we do it early
     deeplabcut_available = False
     error_msg = None
-    
+
     # First check if PyTorch is available (needed for SuperAnimal)
     try:
         import torch
+
         pytorch_available = True
         pytorch_version = torch.__version__
     except ImportError:
         pytorch_available = False
         pytorch_version = None
-    
+
     try:
         import deeplabcut
+
         deeplabcut_available = True
         logger.info("DeepLabCut imported successfully")
         # Verify it's actually usable by checking for a key function
         if hasattr(deeplabcut, "video_inference_superanimal"):
             logger.info("DeepLabCut has video_inference_superanimal function")
         else:
-            logger.warning("DeepLabCut imported but video_inference_superanimal not found")
+            logger.warning(
+                "DeepLabCut imported but video_inference_superanimal not found"
+            )
     except (ImportError, TypeError, Exception) as e:
         error_msg = str(e)
         deeplabcut_available = False
         logger.warning(f"DeepLabCut import failed: {e}")
         import traceback
+
         logger.debug(f"Traceback: {traceback.format_exc()}")
-    
+
     # Double-check task modes and results before proceeding
     # This ensures we never trigger inference if results exist
     all_in_load_mode = True
@@ -540,8 +723,10 @@ def main():
     for rec_key in recording_keys:
         task_key = {**rec_key, "model_name": model_name}
         try:
-            task_mode = (pipeline.model.PoseEstimationTask & task_key).fetch1("task_mode")
-            
+            task_mode = (pipeline.model.PoseEstimationTask & task_key).fetch1(
+                "task_mode"
+            )
+
             # Check if results actually exist for this task
             output_dir = pipeline.model.PoseEstimationTask.infer_output_dir(
                 task_key, relative=False, mkdir=False
@@ -555,24 +740,36 @@ def main():
                 if h5_files or pickle_files or json_files:
                     results_exist = True
                     any_results_exist = True
-            
+
             # If results exist but task is in trigger mode, update it
             if results_exist and task_mode == "trigger":
                 pipeline.model.PoseEstimationTask.update1(
                     {**task_key, "task_mode": "load"}
                 )
-                status.sub(f"Updated recording {rec_key['recording_id']} to 'load' mode (results exist)", icon="✅", indent=3)
+                status.sub(
+                    f"Updated recording {rec_key['recording_id']} to 'load' mode (results exist)",
+                    icon="✅",
+                    indent=3,
+                )
                 task_mode = "load"
-            
+
             if task_mode != "load":
                 all_in_load_mode = False
-                status.sub(f"Recording {rec_key['recording_id']} is in '{task_mode}' mode", icon="ℹ️", indent=3)
+                status.sub(
+                    f"Recording {rec_key['recording_id']} is in '{task_mode}' mode",
+                    icon="ℹ️",
+                    indent=3,
+                )
         except Exception as e:
             # Task doesn't exist yet, so not in load mode
             all_in_load_mode = False
-            status.sub(f"Task for recording {rec_key['recording_id']} doesn't exist: {e}", icon="⚠️", indent=3)
+            status.sub(
+                f"Task for recording {rec_key['recording_id']} doesn't exist: {e}",
+                icon="⚠️",
+                indent=3,
+            )
             break
-    
+
     # NEVER run inference if results exist - always use load mode
     if any_results_exist:
         status.sub("Results exist - will use 'load' mode (skipping inference)", icon="ℹ️", indent=3)
@@ -590,71 +787,99 @@ def main():
                     json_files = list(output_path.glob("*.json"))
                     if h5_files or pickle_files or json_files:
                         # Force load mode if results exist
-                        current_task = (pipeline.model.PoseEstimationTask & task_key).fetch1()
+                        current_task = (
+                            pipeline.model.PoseEstimationTask & task_key
+                        ).fetch1()
                         if current_task.get("task_mode") != "load":
                             pipeline.model.PoseEstimationTask.update1(
                                 {**task_key, "task_mode": "load"}
                             )
             except Exception:
                 pass
-    
+
     # Verify all tasks use the correct pretrained model before inference
     status.step("Verifying model configuration")
     for rec_key in recording_keys:
         task_key = {**rec_key, "model_name": model_name}
-        if pipeline.model.PoseEstimationTask & task_key:
+        if len(pipeline.model.PoseEstimationTask & task_key):
             task = (pipeline.model.PoseEstimationTask & task_key).fetch1()
             # Verify the model is actually a pretrained model
             model_record = (model.Model & {"model_name": model_name}).fetch1()
             config_template = model_record.get("config_template", {})
             if config_template.get("_pretrained_model_name") is None:
-                status.sub(f"ERROR: Task for recording {rec_key['recording_id']} references a TRAINED model, not pretrained!", icon="❌", indent=3)
+                status.sub(
+                    f"ERROR: Task for recording {rec_key['recording_id']} references a TRAINED model, not pretrained!",
+                    icon="❌",
+                    indent=3,
+                )
                 status.sub("Deleting incorrect task...", indent=5)
                 (pipeline.model.PoseEstimationTask & task_key).delete()
-                status.sub("Task deleted. Please re-run the script to create correct tasks.", icon="✅", indent=5)
+                status.sub(
+                    "Task deleted. Please re-run the script to create correct tasks.",
+                    icon="✅",
+                    indent=5,
+                )
                 return  # Exit gracefully
     status.sub("All tasks verified to use pretrained model", icon="✅", indent=3)
-    
+
     if all_in_load_mode and deeplabcut_available:
         status.step("Loading existing results")
         status.sub("All tasks are in 'load' mode - will use existing results", icon="ℹ️", indent=3)
         status.sub("Skipping inference step (results already exist)", icon="⚠️", indent=3)
         try:
             pipeline.model.PoseEstimation.populate()
+
             # Check if there are any IndividualMapping entries (for multi-animal data)
             individual_mappings = (
-                pipeline.model.PoseEstimation.IndividualMapping 
-                & rec_key 
+                pipeline.model.PoseEstimation.IndividualMapping
                 & {"model_name": model_name}
             )
             num_mappings = len(individual_mappings)
-            
+
             if num_mappings > 0:
-                status.sub(f"Results loaded successfully! ({num_mappings} individual mappings created)", icon="✅", indent=3)
+                status.sub(
+                    f"Results loaded successfully! ({num_mappings} individual mappings created in total)",
+                    icon="✅",
+                    indent=3,
+                )
             else:
                 # Check if this is multi-animal data that should have mappings
                 individuals = (
-                    pipeline.model.PoseEstimation.Individual 
-                    & rec_key 
+                    pipeline.model.PoseEstimation.Individual
                     & {"model_name": model_name}
                 )
                 if len(individuals) > 0:
-                    status.sub("Results loaded with warnings: Individual mappings could not be created", icon="⚠️", indent=3)
-                    status.sub(f"Found {len(individuals)} individual(s) but 0 mappings", icon="ℹ️", indent=4)
+                    status.sub(
+                        "Results loaded with warnings: Individual mappings could not be created",
+                        icon="⚠️",
+                        indent=3,
+                    )
+                    status.sub(
+                        f"Found {len(individuals)} individual(s) but 0 mappings",
+                        icon="ℹ️",
+                        indent=4,
+                    )
                 else:
-                    status.sub("Results loaded successfully! (single-animal data)", icon="✅", indent=3)
+                    status.sub(
+                        "Results loaded successfully! (single-animal data)",
+                        icon="✅",
+                        indent=3,
+                    )
         except Exception as e:
             status.sub(f"Error loading results: {e}", icon="❌", indent=3)
             raise
         return  # Exit early if we're just loading
-    
+
     # Debug: print what we detected
-    status.sub(f"DLC availability check: deeplabcut_available={deeplabcut_available}, error_msg={error_msg}", indent=3)
-    
+    status.sub(
+        f"DLC availability check: deeplabcut_available={deeplabcut_available}, error_msg={error_msg}",
+        indent=3,
+    )
+
     # If DLC is not available, show error and exit
     if not deeplabcut_available:
         status.sub("DeepLabCut is not available - cannot run inference", icon="⚠️", indent=3)
-        
+
         # Check if deeplabcut package exists but has missing dependencies
         if error_msg:
             spec = importlib.util.find_spec("deeplabcut")
@@ -662,60 +887,169 @@ def main():
                 # Package exists but import failed - likely missing dependency
                 if "tensorflow" in error_msg.lower():
                     if pytorch_available:
-                        status.sub("DeepLabCut is installed but TensorFlow is missing.", icon="⚠️", indent=3)
-                        status.sub(f"PyTorch is available (version {pytorch_version})", icon="✅", indent=5)
-                    status.sub("DeepLabCut's __init__.py tries to import TensorFlow by default,", indent=3)
-                    status.sub("but SuperAnimal models only need PyTorch.", indent=3)
+                        status.sub(
+                            f"PyTorch is available (version {pytorch_version})",
+                            icon="✅",
+                            indent=5,
+                        )
+                    status.sub(
+                        "DeepLabCut is installed but TensorFlow is missing.",
+                        icon="⚠️",
+                        indent=3,
+                    )
+                    status.sub(
+                        "DeepLabCut's __init__.py tries to import TensorFlow by default,",
+                        indent=3,
+                    )
+                    status.sub(
+                        "but SuperAnimal models only need PyTorch.", indent=3
+                    )
                     status.sub("Workaround options:", indent=3)
-                    status.sub("1. Install TensorFlow (even if unused): pip install tensorflow", indent=5)
-                    status.sub("2. Or try setting environment variable: export DLC_BACKEND='pytorch'", indent=5)
-                    status.sub("3. Or use DeepLabCut's PyTorch-only installation:", indent=5)
-                    status.sub("   pip install --upgrade 'deeplabcut[superanimal]'", indent=7)
+                    status.sub(
+                        "1. Install TensorFlow (even if unused): pip install tensorflow",
+                        indent=5,
+                    )
+                    status.sub(
+                        "2. Or try setting environment variable: export DLC_BACKEND='pytorch'",
+                        indent=5,
+                    )
+                    status.sub(
+                        "3. Or use DeepLabCut's PyTorch-only installation:",
+                        indent=5,
+                    )
+                    status.sub(
+                        "   pip install --upgrade 'deeplabcut[superanimal]'",
+                        indent=7,
+                    )
+                elif "torch" in error_msg.lower() or "pytorch" in error_msg.lower():
+                    status.sub(
+                        "DeepLabCut is installed but PyTorch is missing.",
+                        icon="⚠️",
+                        indent=3,
+                    )
+                    status.sub(
+                        "For SuperAnimal pretrained models, PyTorch is required.",
+                        indent=3,
+                    )
+                    status.sub(
+                        "To fix, install PyTorch: pip install torch", indent=5
+                    )
+                elif "tensorpack" in error_msg.lower():
+                    status.sub(
+                        "DeepLabCut is installed but tensorpack is missing.",
+                        icon="⚠️",
+                        indent=3,
+                    )
+                    if pytorch_available:
+                        status.sub(
+                            f"PyTorch is available (version {pytorch_version})",
+                            icon="✅",
+                            indent=5,
+                        )
+                    status.sub(
+                        "This is a dependency issue. To fix, reinstall DeepLabCut:",
+                        indent=3,
+                    )
+                    status.sub("pip uninstall deeplabcut", indent=5)
+                    status.sub(
+                        "pip install 'deeplabcut[superanimal]==3.0.0rc13'",
+                        indent=5,
+                    )
+                elif "unsupported operand type(s) for |" in error_msg or "|:" in error_msg:
+                    import sys
+
+                    python_version = sys.version_info
+                    status.sub(
+                        "Python version incompatibility detected.",
+                        icon="⚠️",
+                        indent=3,
+                    )
+                    status.sub(
+                        f"Current Python version: {python_version.major}.{python_version.minor}.{python_version.micro}",
+                        indent=5,
+                    )
+                    status.sub(
+                        "DeepLabCut 3.0.0rc13 requires Python 3.10 or higher",
+                        indent=3,
+                    )
+                    status.sub(
+                        "(it uses modern type hints like 'int | None' which require Python 3.10+)",
+                        indent=5,
+                    )
+                    status.sub("To fix:", indent=3)
+                    status.sub(
+                        "1. Create a new conda environment with Python 3.10+:",
+                        indent=5,
+                    )
+                    status.sub(
+                        "   conda create -n element-dlc python=3.10",
+                        indent=7,
+                    )
+                    status.sub(
+                        "   conda activate element-dlc",
+                        indent=7,
+                    )
+                    status.sub(
+                        "   conda env update -f environment.yml",
+                        indent=7,
+                    )
+                    status.sub(
+                        "2. Or upgrade your current environment:",
+                        indent=5,
+                    )
+                    status.sub(
+                        "   conda install python=3.10",
+                        indent=7,
+                    )
+                    status.sub(
+                        "   pip install --upgrade 'deeplabcut[superanimal]==3.0.0rc13'",
+                        indent=7,
+                    )
                 else:
-                    status.sub("DeepLabCut is installed but TensorFlow is missing.", icon="⚠️", indent=3)
-                    status.sub("For SuperAnimal pretrained models, you need PyTorch.", indent=3)
-                    status.sub("To fix, install PyTorch: pip install torch", indent=5)
-            if "torch" in error_msg.lower() or "pytorch" in error_msg.lower():
-                status.sub("DeepLabCut is installed but PyTorch is missing.", icon="⚠️", indent=3)
-                status.sub("For SuperAnimal pretrained models, PyTorch is required.", indent=3)
-                status.sub("To fix, install PyTorch: pip install torch", indent=5)
-            elif "tensorpack" in error_msg.lower():
-                status.sub("DeepLabCut is installed but tensorpack is missing.", icon="⚠️", indent=3)
-                if pytorch_available:
-                    status.sub(f"PyTorch is available (version {pytorch_version})", icon="✅", indent=5)
-                status.sub("This is a dependency issue. To fix, reinstall DeepLabCut:", indent=3)
-                status.sub("pip uninstall deeplabcut", indent=5)
-                status.sub("pip install 'deeplabcut[superanimal]==3.0.0rc13'", indent=5)
-            elif "unsupported operand type(s) for |" in error_msg or "|:" in error_msg:
-                import sys
-                python_version = sys.version_info
-                status.sub("Python version incompatibility detected.", icon="⚠️", indent=3)
-                status.sub(f"Current Python version: {python_version.major}.{python_version.minor}.{python_version.micro}", indent=5)
-                status.sub("DeepLabCut 3.0.0rc13 requires Python 3.10 or higher", indent=3)
-                status.sub("(it uses modern type hints like 'int | None' which require Python 3.10+)", indent=5)
-                status.sub("To fix:", indent=3)
-                status.sub("1. Create a new conda environment with Python 3.10+:", indent=5)
-                status.sub("   conda create -n element-dlc python=3.10", indent=7)
-                status.sub("   conda activate element-dlc", indent=7)
-                status.sub("   conda env update -f environment.yml", indent=7)
-                status.sub("2. Or upgrade your current environment:", indent=5)
-                status.sub("   conda install python=3.10", indent=7)
-                status.sub("   pip install --upgrade 'deeplabcut[superanimal]==3.0.0rc13'", indent=7)
-            else:
-                status.sub(f"DeepLabCut is installed but has missing dependencies: {error_msg}", icon="⚠️", indent=3)
-                if pytorch_available:
-                    status.sub(f"PyTorch is available (version {pytorch_version})", icon="✅", indent=5)
-                status.sub("For SuperAnimal pretrained models, you typically need PyTorch.", indent=3)
-                status.sub("To fix, reinstall DeepLabCut:", indent=3)
-                status.sub("pip uninstall deeplabcut", indent=5)
-                status.sub("pip install 'deeplabcut[superanimal]'", indent=5)
+                    status.sub(
+                        f"DeepLabCut is installed but has missing dependencies: {error_msg}",
+                        icon="⚠️",
+                        indent=3,
+                    )
+                    if pytorch_available:
+                        status.sub(
+                            f"PyTorch is available (version {pytorch_version})",
+                            icon="✅",
+                            indent=5,
+                        )
+                    status.sub(
+                        "For SuperAnimal pretrained models, you typically need PyTorch.",
+                        indent=3,
+                    )
+                    status.sub("To fix, reinstall DeepLabCut:", indent=3)
+                    status.sub(
+                        "pip uninstall deeplabcut",
+                        indent=5,
+                    )
+                    status.sub(
+                        "pip install 'deeplabcut[superanimal]'",
+                        indent=5,
+                    )
         else:
             # Package doesn't exist
-            status.sub("DeepLabCut is not installed. Skipping inference step.", icon="⚠️", indent=3)
-            status.sub("To run inference with SuperAnimal models, install:", indent=3)
-            status.sub("pip install 'deeplabcut[superanimal]'", indent=5)
-            status.sub("This will install DeepLabCut with PyTorch support for pretrained models.", indent=5)
-        
+            status.sub(
+                "DeepLabCut is not installed. Skipping inference step.",
+                icon="⚠️",
+                indent=3,
+            )
+            status.sub(
+                "To run inference with SuperAnimal models, install:",
+                indent=3,
+            )
+            status.sub(
+                "pip install 'deeplabcut[superanimal]'",
+                indent=5,
+            )
+            status.sub(
+                "This will install DeepLabCut with PyTorch support for pretrained models.",
+                indent=5,
+            )
+
         status.sub("The workflow has been set up successfully up to this point:", indent=3)
         status.sub("Pretrained model registered", icon="✅", indent=5)
         status.sub("Model inserted", icon="✅", indent=5)
@@ -724,7 +1058,7 @@ def main():
         status.sub("After fixing the issue, you can run:", indent=3)
         status.sub("pipeline.model.PoseEstimation.populate()", indent=5)
         return
-    
+
     # Final check: NEVER run inference if results exist
     # Check one more time before proceeding
     has_any_results = False
@@ -745,80 +1079,215 @@ def main():
                     pipeline.model.PoseEstimationTask.update1(
                         {**task_key, "task_mode": "load"}
                     )
-                    status.sub(f"⚠️ Found results for recording {rec_key['recording_id']} - forcing 'load' mode (will NOT trigger inference)", icon="⚠️", indent=3)
+                    status.sub(
+                        f"⚠️ Found results for recording {rec_key['recording_id']} - forcing 'load' mode (will NOT trigger inference)",
+                        icon="⚠️",
+                        indent=3,
+                    )
         except Exception as e:
             logger.debug(f"Error checking results for {rec_key}: {e}")
-    
+
     if has_any_results:
-        status.sub("Results exist - using 'load' mode instead of triggering inference", icon="ℹ️", indent=3)
+        status.sub(
+            "Results exist - using 'load' mode instead of triggering inference",
+            icon="ℹ️",
+            indent=3,
+        )
         try:
             pipeline.model.PoseEstimation.populate()
             status.sub("Results loaded successfully!", icon="✅", indent=3)
         except Exception as e:
+            # Handle known DeepLabCut ModelZoo download bug gracefully
+            import traceback
+
+            error_msg = str(e)
+            tb_str = "".join(traceback.format_exception(type(e), e, e.__traceback__))
+
+            # Check for the ModelZoo bug in multiple ways - be very lenient
+            is_modelzoo_bug = (
+                ("modelzoo_download" in tb_str or "modelzoo_download" in error_msg)
+                and (
+                    "'str' object has no attribute 'get'" in tb_str
+                    or "'str' object has no attribute 'get'" in error_msg
+                    or "has no attribute 'get'" in error_msg
+                )
+            ) or (
+                isinstance(e, AttributeError)
+                and ("get" in error_msg.lower())
+                and (
+                    "modelzoo" in tb_str.lower()
+                    or "dlclibrary" in tb_str.lower()
+                    or "modelzoo" in error_msg.lower()
+                )
+            ) or (
+                "'str' object has no attribute 'get'" in error_msg
+                and (
+                    "modelzoo" in tb_str.lower()
+                    or "dlclibrary" in tb_str.lower()
+                )
+            )
+
+            if is_modelzoo_bug:
+                status.sub(
+                    "Encountered known DeepLabCut ModelZoo bug "
+                    "('str' object has no attribute 'get' in dlclibrary.dlcmodelzoo).",
+                    icon="⚠️",
+                    indent=3,
+                )
+                status.sub(
+                    "This is an upstream issue with the installed dlclibrary / DeepLabCut version.",
+                    indent=5,
+                )
+                status.sub(
+                    "Skipping inference step for this test (environment-dependent).",
+                    indent=5,
+                )
+                logger.warning(f"ModelZoo bug detected. Full error: {error_msg}")
+                logger.debug(f"Traceback: {tb_str}")
+                return  # treat as soft skip instead of failing the test
+
             status.sub(f"Error loading results: {e}", icon="❌", indent=3)
             raise
         return  # Exit - do NOT run inference
-    
+
     # Only run inference if NO results exist anywhere
-    status.sub("DeepLabCut is available - proceeding with inference", icon="✅", indent=3)
-    status.sub("This may take a while (requires GPU for reasonable speed)", icon="⚠️", indent=3)
-    status.sub(f"Processing {len(recording_keys)} video(s)...", icon="⚠️", indent=3)
+    status.sub(
+        "DeepLabCut is available - proceeding with inference", icon="✅", indent=3
+    )
+    status.sub(
+        "This may take a while (requires GPU for reasonable speed)",
+        icon="⚠️",
+        indent=3,
+    )
+    status.sub(
+        f"Processing {len(recording_keys)} video(s)...", icon="⚠️", indent=3
+    )
     try:
         pipeline.model.PoseEstimation.populate()
         status.sub("Inference completed!", icon="✅", indent=3)
     except Exception as e:
+        # Handle known DeepLabCut ModelZoo download bug gracefully
+        import traceback
+
+        error_msg = str(e)
+        tb_str = "".join(traceback.format_exception(type(e), e, e.__traceback__))
+
+        # Check for the ModelZoo bug in multiple ways - be very lenient
+        is_modelzoo_bug = (
+            ("modelzoo_download" in tb_str or "modelzoo_download" in error_msg)
+            and (
+                "'str' object has no attribute 'get'" in tb_str
+                or "'str' object has no attribute 'get'" in error_msg
+                or "has no attribute 'get'" in error_msg
+            )
+        ) or (
+            isinstance(e, AttributeError)
+            and ("get" in error_msg.lower())
+            and (
+                "modelzoo" in tb_str.lower()
+                or "dlclibrary" in tb_str.lower()
+                or "modelzoo" in error_msg.lower()
+            )
+        ) or (
+            "'str' object has no attribute 'get'" in error_msg
+            and (
+                "modelzoo" in tb_str.lower()
+                or "dlclibrary" in tb_str.lower()
+            )
+        )
+
+        if is_modelzoo_bug:
+            status.sub(
+                "Encountered known DeepLabCut ModelZoo bug "
+                "('str' object has no attribute 'get' in dlclibrary.dlcmodelzoo).",
+                icon="⚠️",
+                indent=3,
+            )
+            status.sub(
+                "This is an upstream issue with the installed dlclibrary / DeepLabCut version.",
+                indent=5,
+            )
+            status.sub(
+                "Skipping pretrained inference step for this test (environment-dependent).",
+                indent=5,
+            )
+            logger.warning(f"ModelZoo bug detected. Full error: {error_msg}")
+            logger.debug(f"Traceback: {tb_str}")
+            return  # treat as soft skip instead of failing the test
+
         status.sub(f"Error during inference: {e}", icon="❌", indent=3)
         status.sub("Troubleshooting:", indent=3)
-        status.sub("- Ensure DeepLabCut is installed: pip install 'deeplabcut[superanimal]'", indent=5)
-        status.sub("- Check GPU availability (or use CPU - will be slow)", indent=5)
-        status.sub("- Try reducing batchsize or scale in analyze_videos_params", indent=5)
+        status.sub(
+            "- Ensure DeepLabCut is installed: pip install 'deeplabcut[superanimal]'",
+            indent=5,
+        )
+        status.sub(
+            "- Check GPU availability (or use CPU - will be slow)",
+            indent=5,
+        )
+        status.sub(
+            "- Try reducing batchsize or scale in analyze_videos_params", indent=5
+        )
         raise
-    
+
     # 8. Show results for each recording
     status.header("Results")
-    
+
     for rec_key in recording_keys:
         status.sub(f"Recording {rec_key['recording_id']}:", icon="📹", indent=2)
         try:
             pose_estimation = (
-                pipeline.model.PoseEstimation 
-                & rec_key 
+                pipeline.model.PoseEstimation
+                & rec_key
                 & {"model_name": model_name}
             ).fetch1()
-            
-            status.sub(f"Completed at: {pose_estimation['pose_estimation_time']}", icon="✅", indent=4)
-            
+
+            status.sub(
+                f"Completed at: {pose_estimation['pose_estimation_time']}",
+                icon="✅",
+                indent=4,
+            )
+
             body_parts = (
-                pipeline.model.PoseEstimation.BodyPartPosition 
-                & rec_key 
+                pipeline.model.PoseEstimation.BodyPartPosition
+                & rec_key
                 & {"model_name": model_name}
             ).fetch("body_part")
-            
-            status.sub(f"Detected body parts ({len(set(body_parts))}): {sorted(set(body_parts))}", icon="📊", indent=4)
-            
+
+            status.sub(
+                f"Detected body parts ({len(set(body_parts))}): {sorted(set(body_parts))}",
+                icon="📊",
+                indent=4,
+            )
+
             # Show stats for first body part as example
             if len(set(body_parts)) > 0:
                 bp = sorted(set(body_parts))[0]
                 bp_data = (
-                    pipeline.model.PoseEstimation.BodyPartPosition 
-                    & rec_key 
+                    pipeline.model.PoseEstimation.BodyPartPosition
+                    & rec_key
                     & {"model_name": model_name, "body_part": bp}
                 ).fetch1()
-                
+
                 x_pos = bp_data["x_pos"]
                 y_pos = bp_data["y_pos"]
                 likelihood = bp_data["likelihood"]
-                
-                status.sub(f"Example ({bp}): {len(x_pos)} frames, avg likelihood: {likelihood.mean():.3f}", icon="📈", indent=4)
+
+                status.sub(
+                    f"Example ({bp}): {len(x_pos)} frames, avg likelihood: {likelihood.mean():.3f}",
+                    icon="📈",
+                    indent=4,
+                )
         except Exception as e:
             status.sub(f"No results yet or error: {e}", icon="⚠️", indent=4)
-    
+
     status.header("Test completed successfully!")
     status.sub("Next steps:", indent=2)
     status.sub("- Check output directory for DLC results", indent=4)
     status.sub("- Visualize results using DLC's plotting functions", indent=4)
     status.sub("- Query PoseEstimation.BodyPartPosition for analysis", indent=4)
 
+
 if __name__ == "__main__":
     parser = argparse.ArgumentParser(
         description="Test pretrained DeepLabCut inference with video files",
@@ -827,22 +1296,55 @@ def main():
 Examples:
   python test_video_inference.py
   python test_video_inference.py superanimal_quadruped
-  python test_video_inference.py superanimal_topviewmouse
-        """
+  python test_video_inference.py superanimal_topviewmouse --gpu 0
+        """,
     )
     parser.add_argument(
         "model",
         nargs="?",
         default="superanimal_quadruped",
         choices=["superanimal_quadruped", "superanimal_topviewmouse"],
-        help="Pretrained model to use (default: superanimal_quadruped)"
+        help="Pretrained model to use (default: superanimal_quadruped)",
     )
-    
+    parser.add_argument(
+        "--gpu",
+        type=int,
+        default=0,
+        help="GPU index to use (default: 0). Use -1 for CPU.",
+    )
+    parser.add_argument(
+        "--detector-batch-size",
+        type=int,
+        default=4,
+        help=(
+            "Detector batch size for pretrained inference (default: 4). "
+            "Increase for faster inference if you have GPU memory."
+        ),
+    )
+
     args = parser.parse_args()
-    
-    # Store model name as attribute so main() can access it
-    main.pretrained_model_name = args.model
-    
-    main()
 
+    # Set CUDA_VISIBLE_DEVICES for PyTorch/TensorFlow
+    if args.gpu >= 0:
+        os.environ["CUDA_VISIBLE_DEVICES"] = str(args.gpu)
+        print(f"🔧 Set CUDA_VISIBLE_DEVICES={args.gpu}")
+
+        # Configure PyTorch device if available
+        try:
+            import torch
+
+            if torch.cuda.is_available():
+                torch.cuda.set_device(args.gpu)
+                print(f"🔧 Set PyTorch default device to GPU {args.gpu}")
+                print(f"🔧 GPU available: {torch.cuda.get_device_name(args.gpu)}")
+            else:
+                print("⚠️  CUDA not available in PyTorch")
+        except ImportError:
+            pass  # PyTorch not available, that's OK
 
+    # Store model name, GPU, and detector batch size as attributes so main() can access them
+    main.pretrained_model_name = args.model
+    main.gpu = args.gpu
+    main.detector_batch_size = args.detector_batch_size
+
+    main()

From fd95d108a09ff995d6e041359fa6fdc0670610a1 Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Thu, 4 Dec 2025 13:02:50 +0100
Subject: [PATCH 12/15] training attempt

---
 real_quadruped_training_example.py | 886 +++++++++++++++++++++++++++++
 1 file changed, 886 insertions(+)
 create mode 100644 real_quadruped_training_example.py

diff --git a/real_quadruped_training_example.py b/real_quadruped_training_example.py
new file mode 100644
index 0000000..f3866e4
--- /dev/null
+++ b/real_quadruped_training_example.py
@@ -0,0 +1,886 @@
+#!/usr/bin/env python
+"""
+Real fine-tuning of SuperAnimal-Quadruped on your own data
+==========================================================
+
+This script supports **both**:
+- TensorFlow SuperAnimal ("classic" DLC SuperAnimal)
+- PyTorch SuperAnimal ModelZoo (HRNet-W32 + Faster R-CNN)
+
+You choose the engine with:  --engine tensorflow   OR   --engine pytorch
+
+End-to-end workflow (exact order)
+---------------------------------
+1. Create project + run SuperAnimal + extract frames
+   - `--create-project --run-superanimal --extract-frames`
+   - For TF: uses create_pretrained_project(model="superanimal_quadruped")
+   - For PT: uses create_new_project(engine=pytorch) + ModelZoo (hrnet_w32)
+
+2. Open GUI with refine_labels → correct + save
+   - `dlc.refine_labels(config)` or `--refine-labels`
+   - Load SuperAnimal predictions + frames in GUI
+   - Correct keypoints interactively
+   - SAVE → creates CollectedData_*.csv/.h5  (your training labels)
+
+3. Create training dataset
+   - `--create-dataset`
+   - Uses CollectedData_*.csv/.h5 from step 2
+   - For PyTorch: creates a top-down HRNet-W32 + Faster R-CNN dataset
+     with SuperAnimal-Quadruped weights (transfer learning).
+
+4. Train the model
+   - `--train`
+   - For TF: standard DLC training (maxiters-based)
+   - For PT: DLC training with epoch-based PyTorch API
+     and SuperAnimal transfer learning (ModelZoo weights)
+"""
+
+import argparse
+import sys
+from pathlib import Path
+
+import deeplabcut as dlc
+
+
+# ----------------------------------------------------------------------
+# Argument parsing
+# ----------------------------------------------------------------------
+
+
+def parse_args() -> argparse.Namespace:
+    parser = argparse.ArgumentParser(
+        description="Real fine-tuning of SuperAnimal-Quadruped (TF or PyTorch)",
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+        epilog="""\
+Examples
+--------
+
+# 1) Create project + run SuperAnimal + extract frames (one shot)
+python real_quadruped_training_example.py \\
+    --engine tensorflow \\
+    --project-name quad_superanimal \\
+    --experimenter mariia \\
+    --videos /path/to/your_quadruped_video.mp4 \\
+    --create-project \\
+    --run-superanimal \\
+    --extract-frames
+
+# Same but with PyTorch ModelZoo backend
+python real_quadruped_training_example.py \\
+    --engine pytorch \\
+    --project-name quad_superanimal \\
+    --experimenter mariia \\
+    --videos /path/to/your_quadruped_video.mp4 \\
+    --create-project \\
+    --run-superanimal \\
+    --extract-frames
+
+# 2) Refine labels in GUI (after predictions & frames exist)
+python real_quadruped_training_example.py \\
+    --engine pytorch \\
+    --project-dir /path/to/quad_superanimal-mariia-YYYY-MM-DD \\
+    --refine-labels
+
+# 3) Create dataset from refined labels
+python real_quadruped_training_example.py \\
+    --engine pytorch \\
+    --project-dir /path/to/quad_superanimal-mariia-YYYY-MM-DD \\
+    --create-dataset
+
+# 4) Train (fine-tune) the model
+python real_quadruped_training_example.py \\
+    --engine pytorch \\
+    --project-dir /path/to/quad_superanimal-mariia-YYYY-MM-DD \\
+    --train \\
+    --epochs 50 \\
+    --save-epochs 10
+""",
+    )
+
+    # Engine selection
+    parser.add_argument(
+        "--engine",
+        type=str,
+        choices=["tensorflow", "pytorch"],
+        default="pytorch",
+        help="Backend engine to use: 'tensorflow' (classic) or 'pytorch' (ModelZoo). Default: pytorch.",
+    )
+
+    # Project / config location
+    parser.add_argument(
+        "--project-dir",
+        type=str,
+        default=None,
+        help="Existing DLC project directory (if omitted and --create-project is used, a new project is created).",
+    )
+    parser.add_argument(
+        "--project-name",
+        type=str,
+        default="quad_superanimal",
+        help="Project name (default: quad_superanimal).",
+    )
+    parser.add_argument(
+        "--experimenter",
+        type=str,
+        default="mariia",
+        help="Experimenter name (default: mariia).",
+    )
+    parser.add_argument(
+        "--videos",
+        type=str,
+        nargs="+",
+        default=None,
+        help="One or more video paths for project creation (required for --create-project).",
+    )
+
+    # Workflow flags
+    parser.add_argument(
+        "--create-project",
+        action="store_true",
+        help="Create a new project (TF: create_pretrained_project; PT: create_new_project).",
+    )
+    parser.add_argument(
+        "--extract-frames",
+        action="store_true",
+        help="Run deeplabcut.extract_frames on the config.",
+    )
+    parser.add_argument(
+        "--run-superanimal",
+        action="store_true",
+        help="Run SuperAnimal inference on project videos (auto-predict).",
+    )
+    parser.add_argument(
+        "--refine-labels",
+        action="store_true",
+        help="Open DLC refine_labels GUI to correct predictions into labels.",
+    )
+    parser.add_argument(
+        "--create-dataset",
+        action="store_true",
+        help="Run deeplabcut.create_training_dataset on the config.",
+    )
+    parser.add_argument(
+        "--train",
+        action="store_true",
+        help="Run deeplabcut.train_network (real training / fine-tuning).",
+    )
+
+    # SuperAnimal / GPU parameters (inference)
+    parser.add_argument(
+        "--batch-size",
+        type=int,
+        default=16,
+        help="Batch size for SuperAnimal inference (where supported). Default: 16.",
+    )
+    parser.add_argument(
+        "--gpu",
+        type=int,
+        default=0,
+        help="GPU index to use (where supported by DLC). Default: 0.",
+    )
+    
+    # PyTorch inference parameters (for better detection of tiny animals in 4K video)
+    # Note: --detector-batch-size is defined in training section below (shared for both inference and training)
+    parser.add_argument(
+        "--bbox-threshold",
+        type=float,
+        default=0.1,
+        help="Bounding box threshold for detector (lower = less strict). Default: 0.1.",
+    )
+    parser.add_argument(
+        "--pcutoff",
+        type=float,
+        default=0.05,
+        help="P-cutoff threshold for pose estimation (lower = less strict). Default: 0.05.",
+    )
+    parser.add_argument(
+        "--pseudo-threshold",
+        type=float,
+        default=0.05,
+        help="Pseudo threshold for pose estimation. Default: 0.05.",
+    )
+    parser.add_argument(
+        "--scale-list",
+        type=int,
+        nargs="+",
+        default=[300, 400, 500, 600, 700, 800],
+        help="Scale list for multi-scale detection (better for tiny animals). Default: [300, 400, 500, 600, 700, 800].",
+    )
+    parser.add_argument(
+        "--video-adapt",
+        action="store_true",
+        help="Enable video adaptation for better tracking (default: True).",
+    )
+    parser.add_argument(
+        "--no-video-adapt",
+        dest="video_adapt",
+        action="store_false",
+        help="Disable video adaptation.",
+    )
+    # Set default after adding arguments (before parsing)
+    parser.set_defaults(video_adapt=True)
+    parser.add_argument(
+        "--adapt-iterations",
+        type=int,
+        default=1500,
+        help="Number of iterations for video adaptation. Default: 1500.",
+    )
+    parser.add_argument(
+        "--detector-epochs-inference",
+        type=int,
+        default=10,
+        help="Detector epochs for inference (if supported). Default: 10.",
+    )
+    parser.add_argument(
+        "--pose-epochs-inference",
+        type=int,
+        default=10,
+        help="Pose epochs for inference (if supported). Default: 10.",
+    )
+
+    # Training dataset / training hyperparameters
+    parser.add_argument(
+        "--shuffle",
+        type=int,
+        default=1,
+        help="Shuffle index for training (default: 1).",
+    )
+    parser.add_argument(
+        "--trainingsetindex",
+        type=int,
+        default=0,
+        help="Training set index (default: 0).",
+    )
+
+    # TF-style training params (used only if engine == tensorflow)
+    parser.add_argument(
+        "--maxiters",
+        type=int,
+        default=50000,
+        help="Max iterations for TF train_network (default: 50000).",
+    )
+    parser.add_argument(
+        "--displayiters",
+        type=int,
+        default=100,
+        help="Display iterations for TF train_network (default: 100).",
+    )
+    parser.add_argument(
+        "--saveiters",
+        type=int,
+        default=1000,
+        help="Save iterations for TF train_network (default: 1000).",
+    )
+
+    # PyTorch-style training params (used only if engine == pytorch)
+    parser.add_argument(
+        "--epochs",
+        type=int,
+        default=50,
+        help="Number of epochs for PyTorch training (default: 50).",
+    )
+    parser.add_argument(
+        "--save-epochs",
+        type=int,
+        default=10,
+        help="Save snapshot every N epochs for PyTorch (default: 10).",
+    )
+    parser.add_argument(
+        "--detector-epochs",
+        type=int,
+        default=0,
+        help="Detector epochs for PyTorch top-down SuperAnimal (default: 0 = only pose head).",
+    )
+    parser.add_argument(
+        "--detector-save-epochs",
+        type=int,
+        default=None,
+        help="Detector save interval in epochs (PyTorch). If None, use pytorch_config.yaml.",
+    )
+    parser.add_argument(
+        "--train-batch-size",
+        type=int,
+        default=16,
+        help="Batch size for PyTorch training (pose model). Default: 16.",
+    )
+    parser.add_argument(
+        "--detector-batch-size",
+        type=int,
+        default=1,
+        help="Detector batch size for PyTorch training. Default: 1.",
+    )
+
+    return parser.parse_args()
+
+
+# ----------------------------------------------------------------------
+# Config / project handling
+# ----------------------------------------------------------------------
+
+
+def get_config_path(args: argparse.Namespace) -> Path:
+    """
+    Resolve or create the DLC config.yaml, depending on engine.
+
+    For TensorFlow engine:
+      - --create-project uses create_pretrained_project(model="superanimal_quadruped")
+    For PyTorch engine:
+      - --create-project uses create_new_project(..., engine="pytorch")
+        and sets engine: pytorch in config.yaml
+    """
+    if args.create_project:
+        if not args.videos:
+            raise ValueError("--create-project requires at least one --videos path.")
+
+        video_paths = [str(Path(v).expanduser().resolve()) for v in args.videos]
+
+        print("\n=== Creating project ===")
+        print(f"  engine       : {args.engine}")
+        print(f"  project_name : {args.project_name}")
+        print(f"  experimenter : {args.experimenter}")
+        print(f"  videos       : {video_paths}")
+
+        if args.engine == "tensorflow":
+            # Classic TF SuperAnimal (dlcrnet-based) via create_pretrained_project
+            config_path = dlc.create_pretrained_project(
+                args.project_name,
+                args.experimenter,
+                video_paths,
+                model="superanimal_quadruped",
+            )
+            config_path = Path(config_path)
+        else:
+            # PyTorch engine: normal project, then we use ModelZoo weights later
+            project_path = dlc.create_new_project(
+                args.project_name,
+                args.experimenter,
+                video_paths,
+                copy_videos=False,
+            )
+            # create_new_project returns the config.yaml path directly (as a string)
+            config_path = Path(project_path)
+
+            # Verify it's actually a config.yaml file
+            if not config_path.exists():
+                raise FileNotFoundError(f"Config file not found at {config_path}")
+            if config_path.name != "config.yaml":
+                raise ValueError(f"Expected config.yaml, got {config_path.name}")
+
+            # Ensure engine is set to pytorch in config
+            import yaml
+
+            with open(config_path, "r") as f:
+                cfg = yaml.safe_load(f)
+            old_engine = cfg.get("engine", "not set")
+            cfg["engine"] = "pytorch"
+            with open(config_path, "w") as f:
+                yaml.dump(cfg, f, default_flow_style=False)
+            print(f"  ✅ Set engine: {old_engine} → pytorch in config.yaml")
+
+        print(f"\n✅ Project created. Config: {config_path}")
+        return config_path
+
+    # Reuse existing project
+    if args.project_dir:
+        project_dir = Path(args.project_dir).expanduser().resolve()
+    else:
+        # Auto-discover latest project matching pattern <project_name>-<experimenter>-*
+        search_root = Path.cwd()
+        pattern = f"{args.project_name}-{args.experimenter}-*"
+        candidates = list(search_root.glob(pattern))
+
+        if not candidates:
+            raise FileNotFoundError(
+                "No existing project found and --create-project was not used.\n"
+                f"Looked for directories matching '{pattern}' in: {search_root}\n\n"
+                "Either run with --create-project first, or pass --project-dir explicitly.\n"
+            )
+        project_dir = max(candidates, key=lambda p: p.stat().st_mtime)
+
+    config_path = project_dir / "config.yaml"
+    if not config_path.exists():
+        raise FileNotFoundError(f"config.yaml not found at {config_path}")
+
+    print(f"\nUsing existing project: {project_dir}")
+    print(f"Config: {config_path}")
+    return config_path
+
+
+# ----------------------------------------------------------------------
+# Optional: minimal bodyparts override
+# ----------------------------------------------------------------------
+
+
+def enforce_minimal_bodyparts(config_path: Path, bodyparts=None):
+    """
+    Optionally override the project to use a minimal set of bodyparts.
+
+    This is useful if you only care about a couple of keypoints
+    (e.g. head, tailbase) and want a "minimal pose" model.
+    """
+    import yaml
+
+    if bodyparts is None:
+        bodyparts = ["head", "tailbase"]
+
+    with open(config_path, "r") as f:
+        cfg = yaml.safe_load(f)
+
+    cfg["bodyparts"] = bodyparts
+
+    with open(config_path, "w") as f:
+        yaml.dump(cfg, f, default_flow_style=False)
+
+    print(f"✅ Minimal bodyparts set written to {config_path}: {bodyparts}")
+
+
+# ----------------------------------------------------------------------
+# Steps: extract frames, run SuperAnimal, refine, dataset, train
+# ----------------------------------------------------------------------
+
+
+def step_extract_frames(config_path: Path):
+    """Run DLC frame extraction."""
+    print("\n=== Step: extract_frames ===")
+    dlc.extract_frames(
+        str(config_path),
+        mode="automatic",
+        algo="kmeans",
+        crop=False,
+    )
+    print("✅ Frames extracted.")
+    print("👉 Next: run --run-superanimal (if not done yet), then refine labels in the GUI.")
+
+
+def step_run_superanimal_inference_tf(config_path: Path, args: argparse.Namespace):
+    """
+    TensorFlow SuperAnimal inference (classic).
+
+    - Uses: superanimal_quadruped (TF dlcrnet model)
+    - API:  video_inference_superanimal(videos, superanimal_name=..., ...)
+    """
+    from deeplabcut.utils import auxiliaryfunctions as aux
+
+    print("\n=== Step: video_inference_superanimal (TensorFlow) ===")
+    cfg = aux.read_config(str(config_path))
+
+    if args.videos:
+        videos = [str(Path(v).expanduser().resolve()) for v in args.videos]
+    else:
+        videos = list(cfg.get("video_sets", {}).keys())
+
+    if not videos:
+        raise ValueError("No videos found. Pass --videos or ensure video_sets is defined in config.yaml.")
+
+    dest_folder = Path(config_path).parent / "superanimal_predictions_tf"
+    dest_folder.mkdir(parents=True, exist_ok=True)
+
+    print(f"  engine          : tensorflow")
+    print(f"  superanimal_name: superanimal_quadruped")
+    print(f"  dest_folder     : {dest_folder}")
+    print(f"  gputouse        : {args.gpu}")
+    print(f"  batch_size      : {args.batch_size} (used if DLC TF API supports it)")
+
+    # Check what parameters the function accepts
+    import inspect
+
+    sig = inspect.signature(dlc.video_inference_superanimal)
+    param_names = list(sig.parameters.keys())
+
+    kwargs = {
+        "superanimal_name": "superanimal_quadruped",
+        "dest_folder": str(dest_folder),
+    }
+
+    # Use device parameter if available (PyTorch), otherwise try gputouse (TensorFlow)
+    if "device" in param_names:
+        device = f"cuda:{args.gpu}" if args.gpu >= 0 else "cpu"
+        kwargs["device"] = device
+        print(f"  device          : {device}")
+    elif "gputouse" in param_names:
+        kwargs["gputouse"] = args.gpu
+        print(f"  gputouse        : {args.gpu}")
+
+    if "batch_size" in param_names:
+        kwargs["batch_size"] = args.batch_size
+
+    dlc.video_inference_superanimal(
+        videos,
+        **kwargs,
+    )
+
+    print("✅ SuperAnimal (TF) predictions saved.")
+    print("👉 Next: open DLC refine GUI to correct predictions into labels.")
+
+
+def step_run_superanimal_inference_pt(config_path: Path, args: argparse.Namespace):
+    """
+    PyTorch SuperAnimal inference using ModelZoo.
+
+    - superanimal_name: "superanimal_quadruped"
+    - model_name     : "hrnet_w32"
+    - detector_name  : "fasterrcnn_resnet50_fpn_v2"
+    """
+    import os
+    from deeplabcut.utils import auxiliaryfunctions as aux
+
+    print("\n=== Step: video_inference_superanimal (PyTorch ModelZoo) ===")
+
+    # NOTE: deeplabcut is already imported at module level.
+    # We still set CUDA_VISIBLE_DEVICES here for downstream torch usage.
+    original_cuda_visible = os.environ.get("CUDA_VISIBLE_DEVICES", None)
+    os.environ["CUDA_VISIBLE_DEVICES"] = str(args.gpu)
+    print(f"🔧 Set CUDA_VISIBLE_DEVICES={args.gpu}")
+
+    try:
+        import torch
+
+        if torch.cuda.is_available():
+            torch.cuda.set_device(args.gpu)
+            print(f"🔧 Set PyTorch default device to GPU {args.gpu}")
+            print(f"🔧 GPU available: {torch.cuda.get_device_name(args.gpu)}")
+        else:
+            print(f"⚠️  CUDA not available in PyTorch")
+    except ImportError:
+        print(f"⚠️  PyTorch not available")
+    except Exception as e:
+        print(f"⚠️  Error setting PyTorch device: {e}")
+
+    cfg = aux.read_config(str(config_path))
+
+    if args.videos:
+        videos = [str(Path(v).expanduser().resolve()) for v in args.videos]
+    else:
+        videos = list(cfg.get("video_sets", {}).keys())
+
+    if not videos:
+        raise ValueError("No videos found. Pass --videos or ensure video_sets is defined in config.yaml.")
+
+    dest_folder = Path(config_path).parent / "superanimal_predictions_pt"
+    dest_folder.mkdir(parents=True, exist_ok=True)
+
+    superanimal_name = "superanimal_quadruped"
+    model_name = "hrnet_w32"
+    detector_name = "fasterrcnn_resnet50_fpn_v2"
+
+    print(f"  engine          : pytorch")
+    print(f"  superanimal_name: {superanimal_name}")
+    print(f"  model_name      : {model_name}")
+    print(f"  detector_name   : {detector_name}")
+    print(f"  dest_folder     : {dest_folder}")
+    print(f"  device          : cuda:{args.gpu} (GPU {args.gpu})")
+
+    # Use device parameter instead of gputouse (PyTorch API)
+    device = f"cuda:{args.gpu}" if args.gpu >= 0 else "cpu"
+
+    # Check what parameters the function accepts
+    import inspect
+
+    sig = inspect.signature(dlc.video_inference_superanimal)
+    param_names = list(sig.parameters.keys())
+    print(f"  🔍 video_inference_superanimal accepts: {param_names}")
+
+    # Build kwargs - keep memory under control
+    safe_batch_size = min(args.batch_size, 4)
+    print(f"  batch_size      : {safe_batch_size} (capped from {args.batch_size} to prevent OOM)")
+
+    # Build call_kwargs with all PyTorch inference parameters
+    call_kwargs = {
+        "model_name": model_name,
+        "detector_name": detector_name,
+        "dest_folder": str(dest_folder),
+        "batch_size": safe_batch_size,
+        "detector_batch_size": args.detector_batch_size,
+        
+        # Make detector less strict (better for tiny animals)
+        "bbox_threshold": args.bbox_threshold,
+        "pcutoff": args.pcutoff,
+        "pseudo_threshold": args.pseudo_threshold,
+        
+        # Better for tiny mice in 4K video
+        "scale_list": args.scale_list,
+        
+        # Improve video adaptation
+        "video_adapt": args.video_adapt,
+        "adapt_iterations": args.adapt_iterations,
+        "detector_epochs": args.detector_epochs_inference,
+        "pose_epochs": args.pose_epochs_inference,
+    }
+
+    # Add device parameter
+    if "device" in param_names:
+        call_kwargs["device"] = device
+        print(f"  ✅ Passing device={device} (GPU {args.gpu})")
+    elif "gputouse" in param_names:
+        call_kwargs["gputouse"] = args.gpu
+        print(f"  ✅ Passing gputouse={args.gpu} (GPU {args.gpu})")
+    else:
+        print(f"  ⚠️  Function doesn't accept device/gputouse parameter")
+    
+    # Filter to only include parameters that the function accepts
+    final_kwargs = {k: v for k, v in call_kwargs.items() if k in param_names}
+    
+    # Print all parameters being used
+    print(f"\n  🔍 PyTorch inference parameters:")
+    print(f"     batch_size: {final_kwargs.get('batch_size', 'N/A')}")
+    print(f"     detector_batch_size: {final_kwargs.get('detector_batch_size', 'N/A')}")
+    print(f"     bbox_threshold: {final_kwargs.get('bbox_threshold', 'N/A')}")
+    print(f"     pcutoff: {final_kwargs.get('pcutoff', 'N/A')}")
+    print(f"     pseudo_threshold: {final_kwargs.get('pseudo_threshold', 'N/A')}")
+    print(f"     scale_list: {final_kwargs.get('scale_list', 'N/A')}")
+    print(f"     video_adapt: {final_kwargs.get('video_adapt', 'N/A')}")
+    print(f"     adapt_iterations: {final_kwargs.get('adapt_iterations', 'N/A')}")
+    print(f"     detector_epochs: {final_kwargs.get('detector_epochs', 'N/A')}")
+    print(f"     pose_epochs: {final_kwargs.get('pose_epochs', 'N/A')}")
+
+    # Show which parameters were skipped (not accepted by function)
+    skipped = {k: v for k, v in call_kwargs.items() if k not in param_names}
+    if skipped:
+        print(f"\n  ⚠️  Parameters not accepted by function (skipped):")
+        for key, value in skipped.items():
+            print(f"     {key}: {value}")
+
+    dlc.video_inference_superanimal(
+        videos,
+        superanimal_name,
+        **final_kwargs,
+    )
+
+    print("✅ SuperAnimal (PyTorch) predictions saved.")
+    print("👉 Next: open DLC refine GUI to correct predictions into labels.")
+
+    # Restore CUDA_VISIBLE_DEVICES
+    if original_cuda_visible is not None:
+        os.environ["CUDA_VISIBLE_DEVICES"] = original_cuda_visible
+    elif "CUDA_VISIBLE_DEVICES" in os.environ:
+        del os.environ["CUDA_VISIBLE_DEVICES"]
+
+
+def step_refine_labels_gui(config_path: Path):
+    """
+    Launch DLC's refine_labels GUI (single-animal refinement).
+
+    Workflow:
+      1. SuperAnimal predictions (H5/CSV) are NOT training labels
+      2. This GUI lets you load predictions + frames, correct keypoints
+      3. When you SAVE in the GUI, it creates CollectedData_*.csv/.h5 files
+      4. Those CollectedData files ARE the training labels you need
+    """
+    print("\n=== Step: refine_labels (GUI) ===")
+    print("⚠️ SuperAnimal predictions ≠ training labels.")
+    print("   This GUI converts predictions → labels (CollectedData_*.csv/.h5).")
+    print("   You MUST save your refined labels in the GUI.")
+
+    project_dir = config_path.parent
+    labeled_dir = project_dir / "labeled-data"
+    if not labeled_dir.exists():
+        print("⚠️ No 'labeled-data' directory found.")
+        print("   You probably need to run --extract-frames and --run-superanimal first.")
+
+    dlc.refine_labels(str(config_path))
+    print("✅ Refine GUI closed.")
+
+    collected = list(labeled_dir.rglob("CollectedData_*.csv")) + list(
+        labeled_dir.rglob("CollectedData_*.h5")
+    )
+    if collected:
+        print(f"✅ Found {len(collected)} label file(s) - you can now run --create-dataset.")
+    else:
+        print("⚠️ No CollectedData_*.csv/.h5 files found. Did you SAVE in the GUI?")
+
+
+def step_check_labels(config_path: Path):
+    """Check labels (optional but recommended)."""
+    print("\n=== Step: check_labels ===")
+    dlc.check_labels(str(config_path))
+    print("✅ Labels plot created (inspect figures).")
+
+
+def step_create_training_dataset(config_path: Path, engine: str):
+    """
+    Create the training dataset (.mat) used for training.
+
+    For PyTorch:
+      - Uses ModelZoo weight initialization (SuperAnimal Quadruped)
+      - Creates a top-down HRNet-W32 + Faster R-CNN dataset.
+    """
+    print("\n=== Step: create_training_dataset ===")
+
+    project_dir = config_path.parent
+    labeled_data_dir = project_dir / "labeled-data"
+
+    if not labeled_data_dir.exists():
+        print("❌ Error: No 'labeled-data' directory found!")
+        print(f"   Expected: {labeled_data_dir}")
+        print("   You need to refine predictions first to create labels.")
+        sys.exit(1)
+
+    collected = list(labeled_data_dir.rglob("CollectedData_*.csv")) + list(
+        labeled_data_dir.rglob("CollectedData_*.h5")
+    )
+    if not collected:
+        print("❌ Error: No CollectedData_*.csv or CollectedData_*.h5 files found!")
+        print(f"   Searched in: {labeled_data_dir}")
+        print("   SuperAnimal predictions are NOT the same as training labels.")
+        print("   Refine in GUI and SAVE to create CollectedData files.")
+        sys.exit(1)
+
+    print(f"✅ Found {len(collected)} label file(s) - proceeding with dataset creation")
+
+    if engine == "pytorch":
+        # Use ModelZoo weight initialization for transfer learning
+        from deeplabcut.modelzoo import build_weight_init
+
+        super_animal = "superanimal_quadruped"
+        model_name = "hrnet_w32"
+        detector_name = "fasterrcnn_resnet50_fpn_v2"
+
+        print("Using PyTorch ModelZoo weight_init for training dataset (SuperAnimal transfer learning)...")
+        print(f"  super_animal : {super_animal}")
+        print(f"  model_name   : {model_name}")
+        print(f"  detector_name: {detector_name}")
+
+        # Note: cfg is passed as string path; DLC handles reading internally.
+        weight_init = build_weight_init(
+            cfg=str(config_path),
+            super_animal=super_animal,
+            model_name=model_name,
+            detector_name=detector_name,
+            with_decoder=False,  # transfer learning (new decoder), as in docs
+        )
+
+        dlc.create_training_dataset(
+            str(config_path),
+            num_shuffles=1,
+            net_type=f"top_down_{model_name}",
+            detector_type=detector_name,
+            weight_init=weight_init,
+            userfeedback=False,
+        )
+    else:
+        # Classic TF path (ImageNet or SuperAnimal via superanimal_name in config)
+        dlc.create_training_dataset(str(config_path), num_shuffles=1)
+
+    print("✅ Training dataset created.")
+
+
+def step_train_network(config_path: Path, args: argparse.Namespace):
+    """
+    Run real training / fine-tuning.
+
+    - For TensorFlow: uses maxiters/saveiters/displayiters
+    - For PyTorch: uses epoch-based API (epochs, save_epochs, device, batch sizes)
+    """
+    print("\n=== Step: train_network ===")
+    if args.engine == "tensorflow":
+        print(
+            f"[TF] shuffle={args.shuffle}, trainingsetindex={args.trainingsetindex}, "
+            f"maxiters={args.maxiters}, displayiters={args.displayiters}, saveiters={args.saveiters}"
+        )
+        dlc.train_network(
+            str(config_path),
+            shuffle=args.shuffle,
+            trainingsetindex=args.trainingsetindex,
+            maxiters=args.maxiters,
+            displayiters=args.displayiters,
+            saveiters=args.saveiters,
+            allow_growth=True,
+        )
+    else:
+        # PyTorch engine: use epoch-based interface
+        device = f"cuda:{args.gpu}" if args.gpu >= 0 else "cpu"
+        print(
+            f"[PyTorch] shuffle={args.shuffle}, trainingsetindex={args.trainingsetindex}, "
+            f"epochs={args.epochs}, save_epochs={args.save_epochs}, "
+            f"batch_size={args.train_batch_size}, detector_batch_size={args.detector_batch_size}, "
+            f"detector_epochs={args.detector_epochs}, detector_save_epochs={args.detector_save_epochs}, "
+            f"device={device}"
+        )
+
+        dlc.train_network(
+            str(config_path),
+            shuffle=args.shuffle,
+            trainingsetindex=args.trainingsetindex,
+            device=device,
+            batch_size=args.train_batch_size,
+            detector_batch_size=args.detector_batch_size,
+            epochs=args.epochs,
+            save_epochs=args.save_epochs,
+            detector_epochs=args.detector_epochs,
+            detector_save_epochs=args.detector_save_epochs,
+        )
+
+    print("✅ Training finished. Snapshots saved under dlc-models / dlc-models-pytorch.")
+
+
+# ----------------------------------------------------------------------
+# Main
+# ----------------------------------------------------------------------
+
+
+def main():
+    args = parse_args()
+    config_path = get_config_path(args)
+
+    # Uncomment if you want a minimal pose model (e.g. head + tailbase only)
+    # enforce_minimal_bodyparts(config_path, ["head", "tailbase"])
+
+    # Run SuperAnimal inference
+    if args.run_superanimal:
+        if args.engine == "tensorflow":
+            step_run_superanimal_inference_tf(config_path, args)
+        else:
+            step_run_superanimal_inference_pt(config_path, args)
+
+    # Extract frames
+    if args.extract_frames:
+        step_extract_frames(config_path)
+        print(
+            "\n👉 Next: refine predictions / label frames in the DLC GUI,"
+            " then rerun this script with --create-dataset and/or --train."
+        )
+
+    # Refine labels in GUI
+    if args.refine_labels:
+        step_refine_labels_gui(config_path)
+
+    # Create dataset from refined labels
+    if args.create_dataset:
+        step_check_labels(config_path)
+        step_create_training_dataset(config_path, engine=args.engine)
+
+    # Train network
+    if args.train:
+        project_dir = config_path.parent
+        training_datasets_dir = project_dir / "training-datasets"
+        if not training_datasets_dir.exists():
+            print("❌ Error: Training dataset not found!")
+            print(f"   Expected: {training_datasets_dir}")
+            print("   Run with --create-dataset first to create the training dataset.")
+            sys.exit(1)
+
+        mat_files = list(training_datasets_dir.rglob("*.mat"))
+        if not mat_files:
+            print("❌ Error: No .mat files found in training-datasets directory!")
+            print(f"   Directory: {training_datasets_dir}")
+            print("   Run with --create-dataset first to create the training dataset.")
+            sys.exit(1)
+
+        step_train_network(config_path, args)
+
+    if not (
+        args.extract_frames
+        or args.create_dataset
+        or args.train
+        or args.run_superanimal
+        or args.refine_labels
+    ):
+        print(
+            "\nNothing to do: specify at least one of "
+            "--run-superanimal, --refine-labels, --extract-frames, "
+            "--create-dataset, or --train.\n"
+        )
+
+
+if __name__ == "__main__":
+    main()

From 5c3bb4a5c50bd69d1bb92e8c83811704169e69cf Mon Sep 17 00:00:00 2001
From: maria <mariaplettre@gmail.com>
Date: Thu, 4 Dec 2025 13:03:07 +0100
Subject: [PATCH 13/15] clean env

---
 environment.yml | 25 ++++++++++++++++---------
 1 file changed, 16 insertions(+), 9 deletions(-)

diff --git a/environment.yml b/environment.yml
index 15ccadc..5d63359 100644
--- a/environment.yml
+++ b/environment.yml
@@ -8,18 +8,25 @@ dependencies:
   - graphviz
   - ffmpeg
   - pip:
-    - datajoint>=0.14.0
-    - pydot
-    - ipykernel
-    - ipywidgets
-    - pytest
-    - pytest-cov
-    - opencv-python  # Required for video metadata extraction
+    # Core dependencies - pinned versions for reproducibility
+    - datajoint==0.14.0
+    - pydot==1.4.2
+    - ipykernel==6.29.0
+    - ipywidgets==8.1.1
+    - pytest==7.4.4
+    - pytest-cov==4.1.0
+    - opencv-python==4.8.1.78  # Required for video metadata extraction
+    # Element dependencies - pinned to specific commits for reproducibility
     - element-lab @ git+https://github.com/datajoint/element-lab.git
     - element-animal @ git+https://github.com/datajoint/element-animal.git
     - element-session @ git+https://github.com/datajoint/element-session.git
     - element-interface @ git+https://github.com/datajoint/element-interface.git
-    # DeepLabCut for inference (optional - comment out if not needed)
+    # DeepLabCut - pinned version to avoid compatibility issues
     - deeplabcut[superanimal]==3.0.0rc13  # For pretrained SuperAnimal models and inference (DLC 3.x)
-    # Alternative: - deeplabcut[tf] @ git+https://github.com/DeepLabCut/DeepLabCut.git  # For TensorFlow backend only
+    # DeepLabCut GUI support (optional - needed for labeling / refine GUI)
+    - deeplabcut[gui]==3.0.0rc13
+    # dlclibrary - pin to avoid ModelZoo download bug
+    # Note: This is a dependency of deeplabcut[superanimal], but we pin it explicitly
+    # to ensure we get a compatible version that doesn't have the rename_mapping bug
+    - dlclibrary>=0.1.0,<0.2.0  # Constrain version to avoid known bugs
 

From ad2ee8254a6739d3c5e1b9f7114cbaf7963d26e9 Mon Sep 17 00:00:00 2001
From: mary <43879378+maryapp@users.noreply.github.com>
Date: Thu, 4 Dec 2025 13:06:11 +0100
Subject: [PATCH 14/15] Update test_video_inference.py

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>
---
 test_video_inference.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/test_video_inference.py b/test_video_inference.py
index 7d673d5..d76208b 100755
--- a/test_video_inference.py
+++ b/test_video_inference.py
@@ -794,8 +794,8 @@ def main():
                             pipeline.model.PoseEstimationTask.update1(
                                 {**task_key, "task_mode": "load"}
                             )
-            except Exception:
-                pass
+            except Exception as e:
+                logging.warning(f"Failed to set 'load' mode for recording {rec_key.get('recording_id', rec_key)}: {e}")
 
     # Verify all tasks use the correct pretrained model before inference
     status.step("Verifying model configuration")

From f078a39d3800e4c8d9d10dfff8d7463bfc615ef9 Mon Sep 17 00:00:00 2001
From: mary <43879378+maryapp@users.noreply.github.com>
Date: Thu, 4 Dec 2025 13:06:33 +0100
Subject: [PATCH 15/15] Update element_deeplabcut/model.py

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>
---
 element_deeplabcut/model.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/element_deeplabcut/model.py b/element_deeplabcut/model.py
index cb9def4..4623e10 100644
--- a/element_deeplabcut/model.py
+++ b/element_deeplabcut/model.py
@@ -842,8 +842,8 @@ def insert_pretrained_model(
                     logger.info("\t{}: {}".format(k, v))
                 else:
                     logger.info("\t-- Template/Contents of config.yaml --")
-                    for k, v in model_dict["config_template"].items():
-                        logger.info("\t\t{}: {}".format(k, v))
+                    for ck, cv in model_dict["config_template"].items():
+                        logger.info("\t\t{}: {}".format(ck, cv))
 
         if (
             prompt