Skip to content

Commit b498a02

Browse files
authoredFeb 24, 2022
Merge pull request #3 from CBroz1/dev
Add functions to link tables
2 parents 738999d + 046064d commit b498a02

File tree

11 files changed

+969
-530
lines changed

11 files changed

+969
-530
lines changed
 

‎.gitignore

+1
Original file line numberDiff line numberDiff line change
@@ -25,6 +25,7 @@ wheels/
2525
*.spec
2626
pip-log.txt
2727
pip-delete*.txt
28+
.idea/
2829

2930
# Unit test / coverage reports
3031
htmlcov/

‎README.md

+11-6
Original file line numberDiff line numberDiff line change
@@ -9,20 +9,25 @@ modular pipeline element can be flexibly attached downstream to any particular d
99
experiment session, thus assembling a fully functional behavior pipeline (see the
1010
example [workflow-deeplabcut](https://github.com/datajoint/workflow-deeplabcut)).
1111

12-
This Element currently supports single-animal, single-camera 2D models, and does not yet support multi-animal, multi-camera, or 3D models.
12+
This Element currently supports single-animal, single-camera 2D models, and does not yet support multi-animal or multi-camera models.
1313

1414
## The Pipeline Architecture
1515

1616
![element-deeplabcut diagram](images/diagram_dlc.svg)
1717

1818
As the diagram depicts, the DeepLabCut element starts immediately downstream from ***Session***, with the following tables.
1919

20-
+ ***Recording***: All recordings from a given session.
20+
+ ***VideoRecording***: All recordings from a given session.
2121
+ ***ConfigParamSet***: A collection of model parameters, represented by an index.
22-
+ ***Config***: A pairing of model parameters and a recording, with a `config.yaml` file.
23-
+ ***Model***: A DLC model, as described by a `config.yaml` file.
24-
+ ***Model.Data***: A part table storing model data, with one table for each body part represented in the model.
25-
22+
+ ***TrainingTask***: A set of tasks specifying models to train
23+
+ ***ModelTraining***: A record of training iterations for a given model.
24+
+ ***Model***: A central table for storing unique models
25+
+ ***ModelEval***: Evaluation parameters for each model
26+
+ ***BodyPart***: Unique body parts and descriptions thereof (a.k.a. joints) in a given model.
27+
+ ***PoseEstimationTask***: A series of pose estimation tasks to be completed. This is where one would list videos of experimental sessions.
28+
+ ***PoseEstimation***: Results of pose estimation using a given model. The part table here has a method for directly fetching the results as a pandas dataframe.
29+
30+
A ***Device*** table must be declared elsewhere to uniquely identify cameras.
2631

2732
## Installation
2833

‎element_behavior/dlc.py

-444
This file was deleted.
File renamed without changes.

‎element_deeplabcut/dlc.py

+575
Large diffs are not rendered by default.
File renamed without changes.

‎element_deeplabcut/readers/__init__.py

Whitespace-only changes.
+171
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,171 @@
1+
import re
2+
import numpy as np
3+
import pandas as pd
4+
from pathlib import Path
5+
import pickle
6+
import ruamel.yaml as yaml
7+
8+
9+
class PoseEstimation:
    """Reader for the output of one DeepLabCut pose-estimation run.

    Locates and lazily loads the trio of files DLC's ``analyze_videos``
    writes for a single video:

    - ``*meta.pickle``: run metadata (scorer, fps, nframes, training info)
    - ``*.h5``: per-frame body-part coordinates
    - ``*.yaml``: the project configuration used for the run

    Either ``dlc_dir`` (searched for exactly one file of each kind) or all
    three explicit paths must be provided. File contents are read on first
    access of the corresponding property and cached thereafter.
    """

    def __init__(self, dlc_dir=None, pkl_path=None, h5_path=None, yml_path=None,
                 filename_prefix=''):
        """
        :param dlc_dir: directory holding DLC output; a ``videos`` subdirectory
            is appended if the path does not already end in one.
        :param pkl_path: explicit path to the ``*meta.pickle`` file.
        :param h5_path: explicit path to the ``.h5`` results file.
        :param yml_path: explicit path to the config ``.yaml`` file.
        :param filename_prefix: optional prefix used when globbing for files.
        :raises AssertionError: if files cannot be uniquely located, or if the
            pickle and h5 filenames do not describe the same run.
        """
        if dlc_dir is None:
            assert pkl_path and h5_path and yml_path, \
                ('If "dlc_dir" is not provided, then pkl_path, h5_path, and yml_path '
                 'must be provided')
        else:
            self.dlc_dir = Path(dlc_dir)
            if self.dlc_dir.stem != 'videos':
                # BUGFIX: previously appended to the raw `dlc_dir` argument,
                # which raises TypeError when a plain string is passed.
                self.dlc_dir = self.dlc_dir / 'videos'
            assert self.dlc_dir.exists(), f'Unable to find {dlc_dir}'

        # meta file: pkl - info about this DLC run (input video, configuration, etc.)
        if pkl_path is None:
            pkl_paths = list(self.dlc_dir.rglob(f'{filename_prefix}*meta.pickle'))
            assert len(pkl_paths) == 1, ('Unable to find one unique .pickle file in: '
                                         + f'{dlc_dir} - Found: {len(pkl_paths)}')
            self.pkl_path = pkl_paths[0]
        else:
            self.pkl_path = Path(pkl_path)
            assert self.pkl_path.exists()

        # data file: h5 - body part outputs from the DLC post estimation step
        if h5_path is None:
            h5_paths = list(self.dlc_dir.rglob(f'{filename_prefix}*.h5'))
            assert len(h5_paths) == 1, ('Unable to find one unique .h5 file in: '
                                        + f'{dlc_dir} - Found: {len(h5_paths)}')
            self.h5_path = h5_paths[0]
        else:
            self.h5_path = Path(h5_path)
            assert self.h5_path.exists()

        # The pickle is named "<h5 stem>_meta.pickle"; enforce that pairing.
        assert self.pkl_path.stem == self.h5_path.stem + '_meta', \
            (f'Mismatching h5 ({self.h5_path.stem}) and pickle {self.pkl_path.stem}')

        # config file: yaml - configuration for invoking the DLC post estimation step
        if yml_path is None:
            yml_paths = list(self.dlc_dir.parent.glob(f'{filename_prefix}*.yaml'))
            # remove the one we save (written by do_pose_estimation)
            yml_paths = [val for val in yml_paths if not val.stem == "dlc_config_file"]
            assert len(yml_paths) == 1, ('Unable to find one unique .yaml file in: '
                                         + f'{dlc_dir} - Found: {len(yml_paths)}')
            self.yml_path = yml_paths[0]
        else:
            self.yml_path = Path(yml_path)
            assert self.yml_path.exists()

        # Lazy-loading caches, populated on first property access.
        self._pkl = None
        self._rawdata = None
        self._yml = None
        self._data = None

        # Recover the TrainingFraction index by matching the pickle's recorded
        # fraction against the config list (compared as ints to dodge float error).
        train_idx = np.where((np.array(self.yml['TrainingFraction'])*100
                              ).astype(int) == int(self.pkl['training set fraction'
                                                            ] * 100))[0][0]
        train_iter = int(self.pkl['Scorer'].split('_')[-1])

        # Summary of the model that produced these results.
        self.model = {'Scorer': self.pkl['Scorer'],
                      'Task': self.yml['Task'],
                      'date': self.yml['date'],
                      'iteration': self.pkl['iteration (active-learning)'],
                      'shuffle': int(re.search(r'shuffle(\d+)',
                                               self.pkl['Scorer']).groups()[0]),
                      'snapshotindex': self.yml['snapshotindex'],
                      'trainingsetindex': train_idx,
                      'training_iteration': train_iter}

        self.fps = self.pkl['fps']
        self.nframes = self.pkl['nframes']

        # Use the h5 file's modification time as the result creation time.
        self.creation_time = self.h5_path.stat().st_mtime

    @property
    def pkl(self):
        """Run metadata dict: the ``'data'`` entry of the meta .pickle file."""
        if self._pkl is None:
            with open(self.pkl_path, 'rb') as f:
                self._pkl = pickle.load(f)
        return self._pkl['data']

    @property
    def yml(self):
        """Parsed DLC project configuration (.yaml) as a dict."""
        if self._yml is None:
            with open(self.yml_path, 'rb') as f:
                self._yml = yaml.safe_load(f)
        return self._yml

    @property
    def rawdata(self):
        """Raw pose-estimation DataFrame loaded from the .h5 file
        (columns: scorer / body part / coordinate MultiIndex)."""
        if self._rawdata is None:
            self._rawdata = pd.read_hdf(self.h5_path)
        return self._rawdata

    @property
    def data(self):
        """Reformatted results: {body_part: {coordinate: ndarray}}."""
        if self._data is None:
            self._data = self.reformat_rawdata()
        return self._data

    @property
    def df(self):
        """``rawdata`` with the top-level (scorer) column level dropped."""
        top_level = self.rawdata.columns.levels[0][0]
        return self.rawdata.get(top_level)

    @property
    def body_parts(self):
        """Index of body-part names present in the results."""
        return self.df.columns.levels[0]

    def reformat_rawdata(self):
        """Convert the h5 DataFrame into {body_part: {coordinate: ndarray}}.

        :raises AssertionError: if the h5 frame count disagrees with the
            ``nframes`` recorded in the meta pickle.
        """
        error_message = (f'Total frames from .h5 file ({len(self.rawdata)}) differs '
                         + f'from .pickle ({self.pkl["nframes"]})')
        assert len(self.rawdata) == self.pkl['nframes'], error_message

        body_parts_position = {}
        for body_part in self.body_parts:
            body_parts_position[body_part] = {c: self.df.get(body_part).get(c).values
                                              for c in self.df.get(body_part).columns}

        return body_parts_position
133+
def do_pose_estimation(video_filepaths, dlc_model, project_path, output_dir,
                       videotype=None, gputouse=None, save_as_csv=False, batchsize=None,
                       cropping=None, TFGPUinference=True, dynamic=(False, 0.5, 10),
                       robust_nframes=False, allow_growth=False, use_shelve=False,
                       modelprefix="",  # need from paramset
                       ):
    """Launch DLC's analyze_videos within element-deeplabcut

    :param video_filepaths: list of videos to analyze
    :param dlc_model: element-deeplabcut dlc.Model dict; must provide
        'config_template', 'shuffle', and 'training_fract_idx'
    :param project_path: path to project config.yml
    :param output_dir: where to save output
    Remaining parameters are DLC's defaults, forwarded to analyze_videos.
    """
    from deeplabcut.pose_estimation_tensorflow import analyze_videos

    # ---- Build and save DLC configuration (yaml) file ----
    dlc_config = dlc_model['config_template']
    dlc_project_path = Path(project_path)
    assert dlc_project_path.exists(), (f'DLC project path ({dlc_project_path}) not '
                                       + 'found on this machine')
    dlc_config['project_path'] = dlc_project_path.as_posix()

    # ---- Write DLC and basefolder yaml (config) files ----

    # Write dlc config file to base (data) folder
    # This is important for parsing the DLC in datajoint imaging
    output_dir = Path(output_dir)  # accept str or Path
    output_dir.mkdir(parents=True, exist_ok=True)
    dlc_cfg_filepath = output_dir / 'dlc_config_file.yaml'
    with open(dlc_cfg_filepath, 'w') as f:
        yaml.dump(dlc_config, f)

    # ---- Trigger DLC prediction job ----
    # BUGFIX: forward the caller-supplied keyword arguments; previously DLC's
    # defaults were re-hard-coded here, silently ignoring every parameter.
    analyze_videos(config=dlc_cfg_filepath, videos=video_filepaths,
                   shuffle=dlc_model['shuffle'],
                   trainingsetindex=dlc_model['training_fract_idx'],
                   destfolder=output_dir,
                   videotype=videotype, gputouse=gputouse,
                   save_as_csv=save_as_csv, batchsize=batchsize,
                   cropping=cropping, TFGPUinference=TFGPUinference,
                   dynamic=dynamic, robust_nframes=robust_nframes,
                   allow_growth=allow_growth, use_shelve=use_shelve,
                   modelprefix=modelprefix)
File renamed without changes.

‎images/diagram_dlc.svg

+210-79
Loading

‎setup.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@
1616
setup(
1717
name=pkg_name.replace('_', '-'),
1818
version=__version__,
19-
description="DataJoint Element for Continuous Behavior Tracking",
19+
description="DataJoint Element for Continuous Behavior Tracking via DeepLabCut",
2020
long_description=long_description,
2121
long_description_content_type='text/markdown',
2222
author='DataJoint',

0 commit comments

Comments
 (0)
Please sign in to comment.